@ARTICLE{BANDINI_2026_ARTICLE_BJPV_571381,
AUTHOR = {Bandini, M. and Jama Musse, J. and Piccini, S. and Vilela Ruiz, G. E.},
TITLE = {The Language of Things: Agricultural, Culinary, and Musical Terms in Ugo Ferrandi’s (1851–1933) Somali Notebooks},
YEAR = {2026},
ABSTRACT = {This article offers a linguistic and ethnographic analysis of a set of indigenous terms recorded by the Italian explorer Ugo Ferrandi (1851-1933) during his two-year stay in the town of Lugh (Luuq), southern Somalia, where he served as commander of an Italian outpost during the second Bottego expedition (1895–1897). The study specifically focuses on terms related to agriculture, cooking, and music—three core domains of material culture. Despite limitations posed by the absence of a standardised orthography and Ferrandi’s lack of formal training in local languages, his notebooks provide rare lexical insights into pre-standard Somali and the multilingual environment of the Jubba region, where Somali (including the Maay variety), Oromo, Swahili, and other languages coexisted. Drawing on philological analysis, early bilingual dictionaries, contemporaneous travel accounts, and oral testimonies collected in Somalia during the 1980s, the study addresses issues of dialectal variation, orthographic practices, and semantic shifts. These findings contribute to a broader project aimed at developing a glossary of pre-standard Somali terminology, intended as a resource for linguists, anthropologists, and scholars of African material culture, and to facilitate the recovery and dissemination of this important yet understudied primary source},
KEYWORDS = {Ugo Ferrandi, Somali Language, Italian colonialism, Agricultural terminology, Culinary terminology, Musical terminology},
PAGES = {63--109},
VOLUME = {22},
JOURNAL = {ETHNORÊMA},
}
@ARTICLE{BELBACHIR_2026_ARTICLE_BMCN_579744,
AUTHOR = {Belbachir, S. and Mohajir, M. E. and Chahhou, M. and Nahli, O.},
TITLE = {Building a semantic resource for the Moroccan dialect: a hybrid approach with LeOnI and semantic similarity},
YEAR = {2026},
ABSTRACT = {The construction of lexical-semantic resources for low-resource languages is a crucial task in natural language processing, as it enables the development of linguistic technologies that are often unavailable for under-represented languages. In this study, we present a methodology for building a structured lexical-semantic resource for the Moroccan Arabic dialect (Darija) as a low-resource language. Our method consists of two steps. The first step involves mapping a lexico-semantic network for Darija to the Princeton WordNet and the Suggested Upper Merged Ontology (SUMO). We apply the Lexical Ontology Inference (LeOnI) framework to link Darija words using a bilingual resource and existing WordNet-SUMO mapping. Darija words are classified as monosemous or polysemous to guide the mapping process. The second step introduces a similarity-based refinement process, combining semantic similarity components with ontological-lexical adjustment factors. A scoring function reliably guides the automatic mapping and disambiguation of synsets and concepts. Our results demonstrate that the combination of symbolic and distributional semantics yields accurate and interpretable wordnet-like resources for dialects. We also analyze semantic coverage and translation gaps, highlighting concepts that are untranslatable or culturally specific to Darija. The proposed framework can be generalized to other low-resource languages, as the core mapping and refinement stages in our method are language-independent. Once the Darija lexical-semantic resource is finalized, the constructed dataset will be made publicly available to promote reproducibility and facilitate research into Arabic semantic processing and dialectal natural language processing},
KEYWORDS = {Moroccan Arabic (Darija),Lexical-semantic resources,Cross-lingual semantic mapping,Low-resource language processing,Semantic similarity,Word sense disambiguation},
URL = {https://iris.cnr.it/handle/20.500.14243/579744},
VOLUME = {60},
NUMBER = {2},
DOI = {10.1007/s10579-026-09920-0},
ISSN = {1574-020X},
JOURNAL = {LANGUAGE RESOURCES AND EVALUATION},
}
@ARTICLE{CRISTIANO_2026_ARTICLE_CG_575361,
AUTHOR = {Cristiano, F. and Giovannetti, E.},
TITLE = {Discorsi di potere e intelligenza artificiale},
YEAR = {2026},
ABSTRACT = {L’articolo riflette sul rapporto tra discorsi di potere e intelligenza artificiale, interrogando il ruolo dei modelli linguistici come strumenti di supporto all’analisi critica del discorso. Lontano da letture celebrative o allarmistiche, il contributo mostra come l’uso consapevole dell’AI possa aiutare a far emergere ricorrenze, cornici interpretative e asimmetrie discorsive, rafforzando (e non sostituendo) lo sguardo critico umano. Un invito a pensare l’intelligenza artificiale non come un soggetto neutro ma come una lente attraverso cui osservare il funzionamento del potere nel linguaggio},
KEYWORDS = {analisi critica del discorso, large language models, intelligenza artificiale},
PAGES = {116--119},
URL = {https://fondazionerut.org/erre/},
VOLUME = {6},
JOURNAL = {ERRE},
}
% NOTE(review): DOI looks truncated (nothing after "10.1016/j") -- confirm the full DOI against the publisher record.
@ARTICLE{DINI_2026_ARTICLE_DDBD_580564,
AUTHOR = {Dini, L. and Domenichelli, L. and Brunato, D. and Dell'Orletta, F.},
TITLE = {On the impact of pretraining data ordering in transformer encoder- and decoder-only language models},
YEAR = {2026},
ABSTRACT = {Pretraining large language models typically relies on randomly ordered corpora, implicitly assuming that data order has limited impact on learning. However, curriculum learning suggests that the sequence of training examples can influence optimization and representation dynamics. In this work, we systematically examine pretraining data ordering as an independent design variable for transformer-based language models, analyzing how curriculum-inspired strategies affect learning trajectories, representations, and transfer performance. We pretrain encoder-only and decoder-only models under controlled conditions, varying only the ordering of training data according to readability-based complexity proxies and their inverted variants, alongside multiple random baselines. Beyond final accuracy, we adopt a multi-dimensional evaluation framework combining intrinsic metrics, linguistic probing across training stages, downstream tasks, and geometric analyses of embedding spaces. Results indicate architecture-dependent tendencies in response to data ordering. Encoder models generally exhibit stronger sensitivity to curriculum strategies, with noticeable differences in optimization behavior, probing dynamics, and representation geometry. Decoder models appear comparatively more stable under forward curricula, with more pronounced effects emerging under inverted orderings. Probing analyses suggest that early improvements reflect differences in data exposure rather than accelerated linguistic acquisition, while later-stage effects selectively mirror properties emphasized by specific curricula. Geometric analyses show that data ordering reshapes global variance structure, often increasing anisotropy, without substantially altering nonlinear intrinsic dimensionality. Overall, data ordering functions as a selective inductive bias during pretraining, influencing learning dynamics and representational emphasis rather than consistently improving performance.
These findings clarify how curriculum design interacts with transformer architectures and delineate its practical impact on pretraining outcomes},
KEYWORDS = {Curriculum learning, Data ordering, Language model pretraining, Linguistic representations, Representation geometry},
VOLUME = {342},
DOI = {10.1016/j},
JOURNAL = {KNOWLEDGE-BASED SYSTEMS},
}
@ARTICLE{MARZI_2026_ARTICLE_MFNPTDSKK_574721,
AUTHOR = {Marzi, C. and Ferro, M. and Nadalini, A. and Pirrelli, V. and Todorova, M. and Dimitrova, T. and Stefanova, V. and Kukova, H. and Koeva, S.},
TITLE = {Comparable reading development in Bulgarian and Italian: cross-linguistic insights from a finger-tracking study},
YEAR = {2026},
ABSTRACT = {Transparent orthographies, such as Bulgarian and Italian, feature highly consistent grapheme-phoneme correspondences, enabling rapid acquisition of decoding skills. Despite belonging to different language families and using distinct scripts (i.e., Cyrillic vs. Latin), these languages provide an ideal framework to investigate whether orthographic transparency can outweigh script differences in shaping reading development. We conducted a cross-sectional study with primary school children from Grades 2 to 5 in Bulgaria and Italy. Reading performance was recorded using a novel finger-tracking technique, which allows the capture of temporal dynamics of reading in a portable, low-cost, and classroom-friendly format. Measures of reading time and text comprehension accuracy were compared across grades and languages. Developmental trajectories for both speed and comprehension accuracy showed remarkable similarity across Bulgarian and Italian, with both languages exhibiting steady improvement from grade 2 to grade 5. Our cross-linguistic results showed that reading development in primary school children follows both universal and language-specific trajectories. While broad developmental trajectories were similar, cross-linguistic differences emerged in the impact of morphological complexity, pointing to both universal and language-specific mechanisms. Our findings indicate that orthographic transparency may exert a stronger influence on early reading development than script type, even across languages from different families. The study also highlights the potential of finger-tracking for large-scale literacy research. Establishing comparable developmental benchmarks in transparent orthographies may inform cross-linguistic screening tools and early interventions},
KEYWORDS = {reading development, transparent orthographies, finger-tracking, cross-linguistic comparison, Bulgarian, Italian},
PAGES = {1--30},
URL = {https://www.mdpi.com/2226-471X/11/4/70},
VOLUME = {11},
NUMBER = {4},
DOI = {10.3390/languages11040070},
ISSN = {2226-471X},
JOURNAL = {LANGUAGES},
}
% NOTE(review): DOI looks truncated (nothing after "10.1111/ijal") -- confirm the full DOI against the publisher record.
% NOTE(review): no VOLUME or PAGES field is present; possibly an online-first article -- confirm.
@ARTICLE{NODARI_2026_ARTICLE_NSCC_571501,
AUTHOR = {Nodari, R. and Soria, C. and Calamai, S. and Carella, G.},
TITLE = {Student Attitudes Toward World Englishes in the Italian School Context},
YEAR = {2026},
ABSTRACT = {This study investigates Italian secondary school students’ attitudes toward different English varieties (American, African American, British, Chinese, Indian, Italian, Multicultural London, Nigerian, and Ukrainian) within a World Englishes framework. Combining a variety identification task and a Verbal Guise Technique, 194 students rated speakers on competence, warmth, and speech traits. Results show generally low recognition rates, with Italian English being the most accurately identified, and recognition positively influencing evaluations on all dimensions. Accent effects emerged clearly: American and British English received the highest competence ratings, while Italian English, followed by American and African American English, was rated highest for warmth; Ukrainian English was evaluated least favourably overall. Familiarity with English accents significantly improved evaluations of competence, while appreciation of linguistic diversity positively influenced warmth. Gender effects were also observed, with male voices generally rated more positively, especially for Inner Circle varieties. Overall, the findings highlight the role of recognition, experience, and social framing in shaping evaluations of English varieties, with implications for more inclusive approaches to English language teaching},
KEYWORDS = {language attitudes, English varieties, accents, sociolinguistics, sociophonetics, perceptual sociophonetics},
DOI = {10.1111/ijal},
JOURNAL = {INTERNATIONAL JOURNAL OF APPLIED LINGUISTICS},
}
% NOTE(review): PAGES holds a single value (14), presumably a page count rather than a page range -- confirm.
@ARTICLE{SRIVASTAVA_2026_ARTICLE_SFPC_561481,
AUTHOR = {Srivastava, M. and Ferro, M. and Pirrelli, V. and Coro, G.},
TITLE = {Enhancing token boundary detection in disfluent speech},
YEAR = {2026},
ABSTRACT = {This paper presents an open-source Automatic Speech Recognition (ASR) pipeline optimised for disfluent Italian read speech, designed to enhance both transcription accuracy and token boundary precision in low-resource settings. The study aims to address the difficulty that conventional ASR systems face in capturing the temporal irregularities of disfluent reading, which are crucial for psycholinguistic and clinical analyses of fluency. Building upon the WhisperX framework, the proposed system replaces the neural Voice Activity Detection module with an energy-based segmentation algorithm designed to preserve prosodic cues such as pauses and hesitations. A dual-alignment strategy integrates two complementary phoneme-level ASR models to correct onset–offset asymmetries, while a bias-compensation post-processing step mitigates systematic timing errors. Evaluation on the READLET (child read speech) and CLIPS (adult read speech) corpora shows consistent improvements over baseline systems, confirming enhanced robustness in boundary detection and transcription under disfluent conditions. The results demonstrate that the proposed architecture provides a general, language-independent framework for accurate alignment and disfluency-aware ASR. The approach can support downstream analyses of reading fluency and speech planning, contributing to both computational linguistics and clinical speech research},
KEYWORDS = {Automatic Speech Recognition, Statistical analysis, Disfluencies, Voice Activity Detection},
PAGES = {14},
URL = {https://www.sciencedirect.com/science/article/pii/S2667305325001401},
VOLUME = {29},
DOI = {10.1016/j.iswa.2025.200614},
ISSN = {2667-3053},
JOURNAL = {INTELLIGENT SYSTEMS WITH APPLICATIONS},
}
@ARTICLE{TODESCO_2026_ARTICLE_TRMM_580001,
AUTHOR = {Todesco, A. and Romagno, D. and Mancuso, M. and Marzi, C.},
TITLE = {Investigating language processing in stroke-affected brains: a pilot study on the key role of stimulus design to capture interface domains},
YEAR = {2026},
ABSTRACT = {Stroke represents one of the leading causes of acquired cognitive and communicative impairments, limiting the ability to use language appropriately and profoundly impacting quality of life and social participation. Post-stroke aphasia offers a crucial pathway for the understanding of the neuropsychological correlates of language processing and, despite advances in acute stroke management, linguistic deficits continue to represent a significant challenge for rehabilitation and long-term care. Additionally, one of the major challenges in investigating post-stroke language deficits lies in the marked variability across patients. In this pilot study, we investigated whether stimulus design may enhance the detection of linguistic processing deficits in stroke-affected individuals, targeting lexical class distinctions and morphosyntax/lexical semantics interface-level processing. Results from twelve Italian-speaking patients with unilateral stroke (6 left-hemisphere, 6 right-hemisphere) revealed differential effects of lesion lateralisation and lexical class on task performance. Task accuracy was shaped by individual and lesion-related factors, revealing task-specific dissociations between left- and right-hemisphere patients. These findings underscore the value of using targeted linguistic stimuli to detect subtle deficits that may go undetected by standard screening tools, contributing to a more comprehensive understanding of post-stroke aphasia},
KEYWORDS = {lexical-semantic processing, morphosyntax/lexical semantics interface processing, linguistic assessment, aphasia, post-stroke},
PAGES = {1--37},
URL = {https://www.jbe-platform.com/content/journals/10.1075/ml.25010.tod},
DOI = {10.1075/ml.25010.tod},
ISSN = {1871-1340},
JOURNAL = {THE MENTAL LEXICON},
}
@BOOK{CACCAVALE_2026_BOOK_CDDFLLLMMMNOPST_578881,
AUTHOR = {Caccavale, M. and Degl'Innocenti, E. and Dema, C. and Ferretti, R. and Lazzeri, E. and Licciulli, F. and Lo Giudice, C. and Manconi, A. and Miniello, G. and Modolo, I. and Natilli, M. and Oggioni, A. and Provost, L. and Spadi, A. and Tarallo, A.},
TITLE = {Raccolta dei contributi presentati dalla Comunità DS@CNR},
YEAR = {2026},
ABSTRACT = {Il presente documento raccoglie i contributi presentati nel corso della seconda giornata del primo incontro in presenza della comunità Data Steward del Consiglio Nazionale delle Ricerche (DS@CNR), svoltosi il 18–19 febbraio 2026 presso la Biblioteca Centrale del CNR a Roma. L’iniziativa si inserisce nel percorso avviato dal CNR per strutturare una rete istituzionale di competenze in materia di data stewardship, in linea con le politiche nazionali ed europee sulla Open Science e con l’obiettivo di promuovere una gestione responsabile, accessibile e FAIR dei dati e dei prodotti della ricerca. In questo contesto, la comunità DS@CNR rappresenta uno spazio di confronto e collaborazione tra professionalità eterogenee, chiamate a operare in un sistema complesso e distribuito come quello del CNR. La seconda giornata dell’incontro è stata interamente dedicata alla valorizzazione delle esperienze interne alla comunità, con l’obiettivo di condividere pratiche, strumenti e modelli operativi già attivi nei diversi ambiti disciplinari e infrastrutturali. Le presentazioni qui raccolte restituiscono un quadro articolato e multidisciplinare delle attività di data stewardship in corso, evidenziando al contempo sfide comuni e opportunità di sviluppo. I contributi spaziano dall’ambito delle infrastrutture di ricerca europee e nazionali — con esempi quali ELIXIR-IT, eLTER-RI, BBMRI.it, ACTRIS, LifeWatch Italy, SoBigData e NFFA — fino a iniziative strategiche come Cloud@CNR e il nodo marino IT-IOOS del progetto PNRR ITINERIS. Accanto a queste esperienze, trovano spazio riflessioni su temi trasversali e sempre più rilevanti, quali la gestione dei dati nelle discipline SSH (Social Sciences and Humanities), la sicurezza e governance del dato, la FAIRification, la definizione dei metadati e l’evoluzione dei Data Management Plan in contesti distribuiti.
Nel loro insieme, gli interventi affrontano alcune delle principali sfide aperte per la comunità DS@CNR: l’armonizzazione delle pratiche di gestione dei dati in contesti eterogenei, l’interoperabilità tra infrastrutture e domini disciplinari, la sostenibilità dei servizi, la sicurezza e la compliance normativa, nonché il rafforzamento delle competenze e dei modelli organizzativi a supporto della ricerca. Le presentazioni qui raccolte rappresentano un primo passo concreto verso il consolidamento di una comunità di pratica capace di sostenere, in modo coordinato e strategico, l’evoluzione della gestione dei dati della ricerca all’interno del CNR, contribuendo agli obiettivi strategici della comunità DS@CNR, già definiti nel documento di visione pubblicato a dicembre 2025},
KEYWORDS = {Elaborazione dei dati, Scienza degli elaboratori, Informatica - Attività di ricerca},
PAGES = {166},
URL = {http://eprints.bice.rm.cnr.it/id/eprint/24180},
DOI = {10.57665/BICE_Datasteward_02_2026},
PUBLISHER = {CNR},
}
% NOTE(review): DOI looks truncated (nothing after "10.1007/978") -- confirm the full chapter DOI against the publisher record.
% NOTE(review): no PUBLISHER field is present, although standard styles expect one for this entry type -- confirm and add.
@INCOLLECTION{FERRETTI_2026_INCOLLECTION_FCCC_584544,
AUTHOR = {Ferretti, M. and Chiarella, D. and Cutugno, P. and Cinini, A.},
TITLE = {Linguistic Coping Strategies in Online Forums for Multiple Sclerosis: Insights for Peer Support and Digital Wellbeing},
YEAR = {2026},
ABSTRACT = {This study investigates how people living with Multiple Sclerosis (MS) use language to articulate coping strategies in a large Italian online forum. Drawing on a corpus of nearly 15,000 messages authored by individuals with MS, we examine three distinct types of forum posts: initial messages that open a thread, self-replies written by the same user, and responses by other participants. Through a mixed-methods approach that combines linguistic profiling, readability metrics, and topic modeling, we identify structural, grammatical, and stylistic features that characterize different stages of online interaction. Our findings reveal a functional shift from autobiographical narration in initial posts to more dialogic, supportive, and emotionally expressive language in replies. We identify three recurring coping strategies emerging from forum discourse: (1) problem-focused coping, through detailed medical narratives and treatment decisions; (2) symptom-focused coping, involving bodily awareness and self-monitoring; and (3) emotion-focused coping, based on gratitude, reassurance, and social bonding. By highlighting the expressive and relational functions of language in peer communication, this study contributes to the understanding of digital coping mechanisms in chronic illness contexts. It also offers insights for the development of linguistically informed tools capable of detecting emotional distress, emerging needs, or social disengagement. In the context of Active and Assisted Living (AAL), our findings suggest that language can act as a “soft sensor”, supporting more sensitive and user-centered approaches to digital health technologies},
KEYWORDS = {Patient narratives, Peer support, Coping strategies, Digital health, Forum communication, NLP},
PAGES = {509--529},
DOI = {10.1007/978},
ISBN = {9783032110497},
BOOKTITLE = {Ambient Assisted Living. ForItAAL 2025},
}
@INPROCEEDINGS{BIFFI_2026_INPROCEEDINGS_BCFGMS_580341,
AUTHOR = {Biffi, M. and Cucurullo, S. and Favaro, M. and Guadagnini, E. and Montemagni, S. and Sassolini, E.},
TITLE = {From Print to Digital and Beyond: The Retrodigitization of a Historical Dictionary of Italian as a Hybrid Lexical Resource},
YEAR = {2026},
ABSTRACT = {This paper presents the retrodigitization project of the Grande Dizionario della Lingua Italiana (GDLI), the largest historical dictionary of the Italian language. The GDLI’s 23,000 pages—originally designed for human consultation—constitute an exceptional repository of linguistic and cultural-historical information, while posing significant challenges to large-scale digitization and data structuring. The project, still ongoing, will result in the development of a set of interoperable and interlinked resources: (i) a TEI-XML edition of the dictionary text, encoding its complex lexicographic structure; (ii) an annotated corpus of the quoted examples, enabling linguistic and historical research across centuries; and (iii) a database of quoted authors and works. Together, these components form a hybrid lexical resource that establishes the foundations for innovative and advanced modes of accessing and exploring the rich and multifaceted content of this historical dictionary},
KEYWORDS = {Historical Dictionary, Retro-digitization, Knowledge Organization, e-Lexicography},
PAGES = {770--777},
DOI = {10.63317/338howsz93sg},
PUBLISHER = {European Language Resources Association (ELRA)},
ISBN = {9782493814494},
BOOKTITLE = {Proceedings of the Fifteenth Language Resources and Evaluation Conference (LREC 2026)},
}
% NOTE(review): author surname "Sebastiaini" may be a misspelling (possibly "Sebastiani") -- confirm against the source record.
@INPROCEEDINGS{CAFISO_2026_INPROCEEDINGS_CCCCCDDDDGILLLMMMOPPPSTTV_585285,
AUTHOR = {Cafiso, M. and Carboni, A. and Caudai, C. and Colantonio, S. and Conti, F. and D'Acunto, M. and Daoudagh, S. and Del Corso, G. and Del Gratta, R. and Germanese, D. and Ignesti, G. and Lazzini, G. and Leone, G. R. and Leporini, B. and Magrini, M. and Martinelli, M. and Moroni, D. and Omrani, A. R. and Pardini, F. and Pascali, M. A. and Paradisi, P. and Sebastiaini, L. and Tampucci, M. and Tateo, V. and Volpini, F.},
TITLE = {Advancements in Artificial Intelligence and Computer Vision for Biomedical Applications @SI-Lab},
YEAR = {2026},
ABSTRACT = {This paper summarizes recent research at the Signals and Images Lab (ISTI-CNR) leveraging artificial intelligence, machine learning, and computer vision to address complex biomedical challenges. We highlight advancements in trustworthy, explainable algorithmic foundations alongside their practical clinical applications across diagnostic imaging, physiological signal analysis and neuromotor rehabilitation},
KEYWORDS = {Physiological signals, Neuromotor rehabilitation, Dance movement therapy, Artificial Intelligence, Machine Learning, Generative AI, Explainable AI, Uncertainty Quantification, Trustworthy AI},
URL = {https://iris.cnr.it/handle/20.500.14243/585285},
BOOKTITLE = {ITAL-IA 2026},
}
% NOTE(review): ISBN holds only the "978" prefix and looks truncated -- confirm the full ISBN against the publisher record.
@INPROCEEDINGS{DIDONATO_2026_INPROCEEDINGS_D_579324,
AUTHOR = {Di Donato, F.},
TITLE = {CoARA e la riforma della valutazione della ricerca},
YEAR = {2026},
ABSTRACT = {La Coalition for Advancing Research Assessment (CoARA), istituita nel 2022 su iniziativa della Commissione Europea, conta oggi quasi 800 istituzioni globali impegnate nella riforma della valutazione della ricerca, con l'Italia come secondo Paese più rappresentato. Fondata sull'accordo ARRA, la coalizione mira a superare l'uso improprio di indicatori bibliometrici quantitativi (come l'Impact Factor e l'h-index) a favore di una valutazione basata sul merito intrinseco e sulla qualità, supportata dalla peer-review. La riforma promuove la scienza aperta, la multidisciplinarità e il riconoscimento di una pluralità di contributi, dai software alla didattica, superando il modello centrato esclusivamente sulle pubblicazioni. Tuttavia, l'attuazione pratica in Italia incontra ostacoli: il caso del CNR evidenzia come i criteri di valutazione restino spesso legati a logiche tradizionali e quantitative. È dunque necessaria una trasformazione culturale profonda, supportata da formazione e un quadro normativo allineato agli standard internazionali, per evitare l'isolamento del sistema scientifico nazionale},
KEYWORDS = {Coara, Open science, CNR},
PAGES = {15--21},
PUBLISHER = {CNR edizioni (Roma, ITA)},
ISBN = {978},
CONFERENCE_NAME = {VALORIZZAZIONE DEL PERSONALE RICERCATORE E TECNOLOGO DEGLI ENTI PUBBLICI DI RICERCA},
CONFERENCE_PLACE = {Roma},
BOOKTITLE = {VALORIZZAZIONE DEL PERSONALE RICERCATORE E TECNOLOGO DEGLI ENTI PUBBLICI DI RICERCA},
}
@INPROCEEDINGS{DIDONATO_2026_INPROCEEDINGS_D_579326,
AUTHOR = {Di Donato, F.},
TITLE = {Open science, research assessment reform, and autonomy of research(ers). A critical discussion},
YEAR = {2026},
ABSTRACT = {This contribution examines the critical interrelationships between open science, research autonomy, and the ongoing reform of research assessment. Adopting a philosophical-political perspective, it analyzes current pressures on scientific freedom, including geopolitical shifts, technological changes, and the dominance of private platforms over research data. The study questions who determines research value and how evaluation systems can act as instruments of power. It explores the Agreement on Reforming Research Assessment (ARRA) and CoARA principles, which advocate for the direct involvement of scholars in defining qualitative criteria. To contextualize these issues, the paper revisits the 18th and 19th-century Prussian university theories of Immanuel Kant and Wilhelm von Humboldt. Kant's concept of "public reason" and Humboldt’s vision of open-ended science establish a paradigm where research is inherently collaborative and inclusive. Ultimately, this historical model offers a framework to address contemporary contradictions in the open science landscape},
KEYWORDS = {open science, research autonomy, research assessment reform},
PAGES = {14--16},
URL = {https://ressh2026.igsg.cnr.it/},
DOI = {10.32091/RESSH2026},
ISBN = {9788890576485},
CONFERENCE_NAME = {RESSH 2026-Research Evaluation in the Social Sciences and Humanities Conference},
BOOKTITLE = {RESEARCH EVALUATION AND SCIENTIFIC AUTONOMY UNDER PRESSURE. Conference Proceedings},
}
@INPROCEEDINGS{DIDONATO_2026_INPROCEEDINGS_D_582385,
AUTHOR = {Di Donato, F.},
TITLE = {From the Umbrella to the Forest. Exploring Open Science through Images},
YEAR = {2026},
ABSTRACT = {This contribution analyses the visual metaphors used to describe Open Science (OS) and shows how these reveal the values, priorities and cultural assumptions of the movement. The journey begins with the metaphor of the ‘umbrella’ (Fecher, Friesike, 2013). The umbrella brings together and shelters related concepts under a single term: it is a tool created by humans for a specific purpose. However, what lies beneath the umbrella varies significantly, reflecting the different priorities of the respective community. The 'mushroom' metaphor, introduced by Méndez (2017), marks a significant transition from an artefact to a natural organism, and represents a conceptual shift. In addition, the mushroom is not merely a vessel for observable practices. The idea of a hidden and foundational system represented by the roots is here introduced (Rafols et al., 2024). The next step in this evolution is the ‘wheel’ (Kramer, 2017), representing OS as a circular infinite research workflow. The image illustrates the various stages of the research process (from discovery and analysis to publication, dissemination and evaluation) as a continuous cycle, and evokes the hermeneutic circle. Through the wheel—among the most significant examples of human invention—OS is elevated from a collection of practices to a fundamental process for knowledge production, dissemination and assessment. The concept of a process is further elaborated on using the 'taxonomy' (Pontika and Knoth, 2015) and the 'tree' metaphors (YERUN, 2018; Méndez, 2022). By organising the components of OS into a hierarchical structure, the taxonomy/tree provides detail about the ecosystem. The final metaphor is the 'graph', used by UNESCO (2020). The image immediately evokes the topologies of the Internet and the World Wide Web. The graph describes OS as a dynamic, decentralised and distributed network of relationships.
This vision of a complex, living network serves as a bridge to my proposed synthesis to represent OS as a 'forest'. The forest is a natural organism like the mushroom, it includes the symbolism of the tree, and its vast system of interconnected roots functions as a living graph. In this contribution I will discuss how the metaphor embodies a number of OS principles and values (collaboration, inclusiveness and biodiversity, collective intelligence) but also its ability to represent the real tensions and inequalities that persist in our knowledge ecosystems (in terms of unequal distribution of resources, lack of equal opportunities, exclusion and competition, and efficiency without equity). A value of the forest metaphor, then, is that it makes these tensions visible, challenging the status quo and forcing us to confront the gap between our principles and our practices (Sepehri, 2025). But it also helps us to radically change the way we evaluate research quality and value, encouraging us to go beyond conventional parameters of efficiency and excellence and ask new and deeper questions about our work, such as: 'Is it sustainable? Is it inclusive? Is it creative? Is it alive?' (Mounier, 2022)},
KEYWORDS = {open science images, open science metaphors},
URL = {https://opensciencestudies.eu/for-2026-conference/for2026-book-of-abstracts/},
CONFERENCE_NAME = {FOR2026-The Future of Open Research: Reliable, Responsible, Equitable},
BOOKTITLE = {FOR2026 CONFERENCE The Future of Open Research: Reliable, Responsible, Equitable Munich, 4-6 May 2026 Book of Abstracts},
}
@INPROCEEDINGS{DIDONATO_2026_INPROCEEDINGS_D_582386,
AUTHOR = {Di Donato, F.},
TITLE = {From the Umbrella to the Forest. A Journey through the Visual Metaphors of Open Science},
YEAR = {2026},
ABSTRACT = {The poster provides a comprehensive overview of the visual metaphors used to represent Open Science, tracing their evolution from early man-made concepts to complex natural and networked models. Grounded in the methodological premise that metaphorical language possesses heuristic power in science, it analyzes the images of the umbrella, the mushroom, the wheel, the tree, and the graph. These metaphors are explored as tools that map the meanings of Open Science from the figurative and linguistic domains to the practices and values of specific research cultures. The analysis examines how early representations, such as the umbrella, focused on categorizing diverse practices under a single label, while later transitions to natural organisms like the mushroom introduced the vital concept of a "submerged" system of roots representing infrastructure, integrity and the rewarding system. The wheel and tree metaphors further emphasize Open Science as a circular process and a revolutionary, systemic change, respectively. Meanwhile, the graph metaphor reflects the decentralized, networked nature of modern knowledge production. The journey culminates in the proposal of a new metaphor: the forest. As a living "super-organism" the forest functions as a synthesis of previous metaphors, representing a collaborative, biodiverse, and inclusive ecosystem characterized by distributed intelligence and mutual aid. Beyond representing an ideal model, the forest metaphor is also used to highlight real systemic tensions, such as the unequal distribution of resources and institutional rivalries. Ultimately, it argues for an ecological and systemic shift in how the value of research is assessed, prioritizing sustainability, inclusivity, and collective intelligence},
KEYWORDS = {open science images, open science metaphors},
URL = {https://doi.org/10.5281/zenodo.19402630},
DOI = {10.5281/zenodo.19402630},
CONFERENCE_NAME = {FOR2026-MUNICH CONFERENCE The Future of Open Research: Reliable, Responsible, Equitable},
}
@INPROCEEDINGS{FAVARO_2026_INPROCEEDINGS_FGSBM_580324,
AUTHOR = {Favaro, M. and Guadagnini, E. and Sassolini, E. and Biffi, M. and Montemagni, S.},
TITLE = {When Lexicographic Quotations Become a Corpus: To Deduplicate or Not to Deduplicate?},
YEAR = {2026},
ABSTRACT = {Historical dictionaries are increasingly reused as sources for diachronic language corpora. In this context, lexicographic quotations represent a valuable yet challenging type of data, as they are both editorially curated and diachronically representative. A major issue in their computational reuse is the presence of duplicate and near-duplicate quotations. This paper addresses quotation deduplication in corpora derived from lexicographic resources. We introduce QRD (Quotation Reuse Detection), a multi-stage pipeline designed to identify, compare, and cluster quotations based on graded similarity rather than binary matching. The approach combines string-based similarity measures, iterative threshold analysis, and clustering, enabling both quantitative and qualitative investigation of quotation reuse. Our results show that deduplication in this context cannot be reduced to the automatic elimination of redundant data. The variability observed in the quotations-ranging from OCR-related noise to substantial editorial variation-reflects both technical and structural factors and calls for a more nuanced approach. QRD supports the identification of OCR-related errors and reveals patterns of textual reuse underlying the compilation of the dictionary. We argue that quotation deduplication should be conceived primarily as a task of identification and clustering. This perspective reframes deduplication from a data-cleaning operation into an analytical methodology for historically and editorially curated textual resources},
KEYWORDS = {Historical Corpora, Text Deduplication, Data Matching Process, Historical Lexicography},
PUBLISHER = {ELRA Language Resources Association},
ISBN = {9782493814586},
BOOKTITLE = {Fourth Workshop on Language Technologies for Historical and Ancient Languages (LT4HALA 2026) @ LREC 2026},
}
@INPROCEEDINGS{GIOVANNETTI_2026_INPROCEEDINGS_GBMP_579201,
AUTHOR = {Giovannetti, E. and Bellandi, A. and Marchi, S. and Papini, M.},
TITLE = {Extending the Semantic Layer of the CompL-it Italian Lexicon: Traits, Semantic Types, and Definitions},
YEAR = {2026},
ABSTRACT = {The growing impact of Large Language Models has highlighted the need for explicit, interpretable linguistic knowledge. Lexical resources respond to this need by offering structured representations that complement and constrain the implicit semantics of neural models. This paper presents an extension of CompL-it, currently the most comprehensive open computational lexicon of Italian. Building on the semantic layer inherited from LexicO—itself derived from the PAROLE-SIMPLE-CLIPS resource—the work enriches CompL-it with semantic traits and references to semantic types. Moreover, an experiment was conducted to generate missing definitions through an automatic process supported by LLMs. The resulting resource thus combines human-curated and machine-extended knowledge, ensuring both linguistic precision and scalability. This enriched semantic layer enhances CompL-it’s interoperability within the Linguistic Linked Data framework and strengthens its usability for NLP tasks such as word sense disambiguation, semantic role labelling, and knowledge grounding},
KEYWORDS = {computational lexicon, Linguistic Linked Open Data, OntoLex Lemon, Large Language Models, Word sense definitions, semantic enrichment},
PAGES = {7857-7866},
URL = {https://iris.cnr.it/handle/20.500.14243/579201},
DOI = {10.63317/3rvf2vbt4ier},
ISBN = {978-2-493814-49-4},
CONFERENCE_NAME = {Fifteenth Language Resources and Evaluation Conference (LREC 2026)},
BOOKTITLE = {Proceedings of the Fifteenth Language Resources and Evaluation Conference (LREC 2026)},
}
@INPROCEEDINGS{GIOVANNETTI_2026_INPROCEEDINGS_GC_582229,
AUTHOR = {Giovannetti, E. and Cristiano, F.},
TITLE = {Exploring the Use of Large Language Models in Critical Discourse Analysis: A Consensus-Based Pilot Study},
YEAR = {2026},
ABSTRACT = {Large Language Models (LLMs) are increasingly used in the social sciences and humanities (SSH) to support the analysis of complex textual data, raising methodological questions about evaluation and interpretive reliability. This paper explores the use of LLMs in Critical Discourse Analysis (CDA), considered here as a paradigmatic case of interpretive research in SSH, through a preliminary consensus-based evaluation framework. The study reports on a pilot experiment conducted on a small, theory-driven corpus of opinion articles addressing the October 7, 2023 attack and its aftermath. An LLM is asked to answer analytically motivated questions targeting different levels of discourse structure. Its responses are compared with annotations produced by multiple human analysts and aggregated through a consensus-based procedure. The results reveal an asymmetry in model performance: while LLMs align well with human consensus on macro- and superstructural features, they struggle with microstructural phenomena involving implicit meaning. These findings support the view of LLMs as epistemic support tools rather than replacements for human interpretation},
KEYWORDS = {critical discourse analysis, large language models, interpretive evaluation, consensus-based analysis, social sciences and humanities},
PAGES = {18-22},
URL = {http://lrec-conf.org/proceedings/lrec2026/workshops/llms4ssh/2026.llms4ssh-1.0.pdf},
PUBLISHER = {ELRA Language Resources Association (ELRA)},
ISBN = {978-2-493814-85-2},
CONFERENCE_NAME = {Shaping Multilingual, Multimodal AI for the Social Sciences and Humanities (LLMs4SSH) @ LREC 2026},
BOOKTITLE = {Proceedings of Shaping Multilingual, Multimodal AI for the Social Sciences and Humanities (LLMs4SSH) @ LREC 2026},
}
@INPROCEEDINGS{HASHOUSH_2026_INPROCEEDINGS_HCC_570982,
AUTHOR = {Hashoush, M. and Cadot, E. and Cardillo, F. A.},
TITLE = {Missing data imputation in epidemiology: a comparison between MICE and Machine Learning methods},
YEAR = {2026},
ABSTRACT = {Missing data represents a challenge in large-scale epidemiological studies as it can introduce a strong and negative bias in the final estimates when not handled appropriately. Addressing missing values is considered important for the correct assignment of cases from one hand and the characterisation of risk factors from another. In this study, we present a robust experimental comparison between MICE and several ML-based imputation approaches applied to the Ecuadorian birth data. We assess their performance and discuss the respective strengths and limitations within an epidemiological context},
KEYWORDS = {Missing data imputation, machine learning},
CONFERENCE_NAME = {EGU General Assembly 2026},
}
@INPROCEEDINGS{KHLIF_2026_INPROCEEDINGS_KMN_566042,
AUTHOR = {Khlif, N. and Mazroui, A. and Nahli, O.},
TITLE = {A Robust Morphological Analysis System for the Moroccan Dialect},
YEAR = {2026},
ABSTRACT = {This work presents DiMorph, a morphological engine for Moroccan Arabic (Darija), integrating custom pre- and post-processing techniques to address orthographic inconsistency and lack of standardization. A key feature of DiMorph is its multiword expression (MWE) recognition module, which enhances analysis by detecting and processing MWEs based on a predefined lexicon, leading to more accurate gloss generation. Tested on a Facebook corpus of 11,085 tokens, DiMorph achieved 97.84% in-vocabulary (INV) coverage, with an out-of-vocabulary (OOV) rate of 2.16%, mostly consisting of foreign terms, proper names and emerging words. In all, 40.48% of tokens had a single interpretation, while 59.52% exhibited ambiguity, largely due to homography (89.71%), polysemy (9.31%) and morphological syncretism (0.98%). By providing robust morphological analysis and MWE handling, DiMorph significantly enhances Darija text processing. Its linguistic resources will be released as open-source, fostering further advancements in Arabic dialect natural language processing (NLP)},
KEYWORDS = {Morphological engine, DiMorph, Moroccan dialect, Multiword expressions, Darija, Text processing},
URL = {https://doi.org/10.1201/9781003671602},
DOI = {10.1201/9781003671602},
PUBLISHER = {CRC Press – Taylor \& Francis Group (Boca Raton, USA)},
ISBN = {9781003671602},
CONFERENCE_PLACE = {Boca Raton},
BOOKTITLE = {Smart Technologies for a Sustainable Environment},
}
@INPROCEEDINGS{MARZI_2026_INPROCEEDINGS_MBTNADBFTGP_580325,
AUTHOR = {Marzi, C. and Boni, N. and Todesco, A. and Nadalini, A. and Albertin, G. and Dolciotti, C. and Bongioanni, P. and Ferro, M. and Tamburini, F. and Gagliardi, G. and Pirrelli, V.},
TITLE = {Reading Dynamics and Comprehension in Cognitive Aging: A Multimodal Language Resource},
YEAR = {2026},
ABSTRACT = {We introduce a novel Italian language resource for the study of reading and comprehension in aging populations, combining behavioural and linguistic data from healthy controls (HC), individuals with subjective cognitive decline (SCI), participants with Mild Cognitive Impairment (MCI), and patients with mild dementia (CDR1). Reading performance was recorded through a finger-tracking based application during both silent and oral reading, enabling fine-grained temporal analyses at the text, token and character level. Comprehension was assessed via multiple question types (wh-, inferential, referential, and lexical). Descriptive and non-linear regression analyses informed a feature selection process, yielding temporal and comprehension-based measures that capture individual reading dynamics. These features were explored through unsupervised clustering and supervised classification to investigate their discriminative and predictive potential across cognitive profiles. The resource supports research on reading and cognitive decline, offers a reproducible protocol for large-scale data collection, and provides a foundation for developing early cognitive screening and monitoring tools for aging populations},
KEYWORDS = {reading behaviour, cognitive aging, finger-tracking, language resources for assistive technologies, cluster analysis, automatic classification},
PAGES = {2608-2618},
URL = {http://www.lrec-conf.org/proceedings/lrec2026/},
VOLUME = {15},
DOI = {10.63317/3wjy3a8cwnw8},
PUBLISHER = {ELRA (Paris, FRA)},
ISBN = {978-2-493814-49-4},
CONFERENCE_NAME = {Language Resources and Evaluation Conference (LREC 2026)},
CONFERENCE_PLACE = {Paris},
BOOKTITLE = {Proceedings of the Fifteenth Language Resources and Evaluation Conference (LREC 2026)},
}
@INPROCEEDINGS{ORSINI_2026_INPROCEEDINGS_OB_580582,
AUTHOR = {Orsini, M. and Brunato, D.},
TITLE = {Steering Pragmatic Interpretation in LLMs: A Diagnostic Evaluation of Few-Shot and Reasoning-Based Prompting for Indirect Speech Acts},
YEAR = {2026},
ABSTRACT = {Pragmatic competence presents a persistent challenge for Large Language Models (LLMs), as it requires context-dependent inference beyond literal meaning. This study examines whether few-shot prompting can reliably steer LLMs toward appropriate interpretations of indirect speech acts under small-data conditions. Focusing on Italian, we evaluate three LLMs on a small dataset that captures pragmatic ambiguity through graded plausibility judgments. We compare a zero-shot baseline with multiple few-shot prompting configurations that vary in the number and composition of demonstrations, as well as in the presence of explicit pragmatic guidance. Results show that few-shot prompting does not yield robust or monotonic improvements overall. While performance improves substantially for conventionalized indirect speech acts, gains for non-conventionalized indirect speech acts are unstable and limited. In contrast, introducing explicit pragmatic reasoning along with demonstrations through guided chain-of-thought prompting appears more promising. Overall, these findings highlight the limits of example-based steering for pragmatic inference and suggest that explicitly modeling pragmatic reasoning may be a more effective direction in small-data settings},
KEYWORDS = {Italian, Indirect Speech Acts, Few-shot Prompting, Large Language Models Evaluation},
PAGES = {12-20},
ISBN = {978-2-493814-80-7},
CONFERENCE_NAME = {Workshop on Learning Non-Literal Expressions with Small Data @ LREC 2026},
BOOKTITLE = {Proceedings of the Workshop on Learning Non-Literal Expressions with Small Data, LREC 2026},
}
@INPROCEEDINGS{PAPUCCI_2026_INPROCEEDINGS_PVD_580421,
AUTHOR = {Papucci, M. and Venturi, G. and Dell'Orletta, F.},
TITLE = {Controllable Sentence Simplification in Italian: Fine-Tuning Large Language Models on Automatically Generated Resources},
YEAR = {2026},
ABSTRACT = {This paper presents a study on readability-controlled Sentence Simplification for Italian, addressing the scarcity of annotated resources for low-resource languages. We introduce IMPaCTS (Italian Multilevel Parallel Corpus for Text Simplification), the first fully automatically created corpus of 1,444,160 original–simple sentence pairs automatically annotated with readability levels and linguistic features. It was generated using an Italian LLM prompted in zero-shot to produce multiple simplifications per input sentence. Increasing portions of the resource are used to fine-tune mono- and multilingual open-weight LLMs, conditioning them to generate simplifications at a target readability level. Results from automatic and human evaluations show that fine-tuning on IMPaCTS improves performance both in terms of task completion and adherence to the targeted readability levels compared to few-shot baselines},
KEYWORDS = {Controlled Sentence Simplification, Readability Assessment, Large Language Models},
PAGES = {7178-7191},
URL = {http://www.lrec-conf.org/proceedings/lrec2026/pdf/2026.lrec2026-1.570},
DOI = {10.63317/5fgm358dfxt5},
ISBN = {978-2-493814-49-4},
CONFERENCE_NAME = {15th Language Resources and Evaluation Conference (LREC 2026)},
BOOKTITLE = {Proceedings of the 15th Language Resources and Evaluation Conference (LREC 2026)},
}
@INPROCEEDINGS{RUBIN_2026_INPROCEEDINGS_RBDD_564781,
AUTHOR = {Rubin, G. and Bardi, A. and Del Gratta, R. and Del Grosso, A. M.},
TITLE = {Enhancing interoperability of SPARQL endpoints: RESTful and OAI-PMH API for the DH-ATLAS project},
YEAR = {2026},
ABSTRACT = {Digital repositories leveraging RDF and Linked Data for Cultural Heritage metadata face a critical challenge: their native SPARQL endpoints often create silos because major aggregators rely on the OAI-PMH protocol for harvesting, and developers prefer RESTful APIs. This divergence undermines the visibility and FAIRness (Findable, Accessible, Interoperable, Reusable) of scholarly resources. This paper details the unified access strategy implemented for the DH-ATLAS project, which generated an Ontology and Knowledge Graph focused on Italian Digital Cultural Heritage research. To ensure broad dissemination and resource reuse without duplicating data, DH-ATLAS developed two configurable and modular software components to implement compatibility with the OpenAIRE guidelines and REST clients. Together, these components establish a cohesive and reusable solution for integrating semantic repositories with diverse metadata consumers, promoting the long-term sustainability and broader accessibility of the DH-ATLAS Knowledge Graph and serving as a model for other RDF infrastructures},
KEYWORDS = {Interoperability, Knowledge Graph, API, OpenAIRE, OAI-PMH, Digital Humanities and Cultural Heritage},
PAGES = {14},
URL = {https://ircdl2026.unimore.it/},
CONFERENCE_NAME = {IRCDL 2026-22nd Conference on Information and Research Science Connecting to Digital and Library Science},
BOOKTITLE = {IRCDL 2026},
}
@INPROCEEDINGS{CARDILLO_2026_INPROCEEDINGS_CADDFPSV_570943,
AUTHOR = {Cardillo, F. A. and Andrigo, A. and De Biasio, F. and Debole, F. and Favaro, M. and Papa, A. and Straccia, U. and Vignudelli, S.},
TITLE = {A preliminary analysis of high water events in Venice based on multi-decadal observations and clustering},
YEAR = {2026},
ABSTRACT = {High water events in Venice are a recurrent phenomenon, as the city is located only slightly above mean sea level and is directly influenced by water-level variations within the lagoon. Repeated flooding has significant economic and social impacts, limits pedestrian and naval traffic and contributes to the degradation of buildings and cultural heritage. Current forecasting systems primarily estimate water levels and peak values, and these are typically estimated at a limited number of locations. Data-driven approaches, in particular Machine Learning (ML) methods, analyze historical data without relying on predefined, human-designed model structures. We present a preliminary analysis based on several clustering approaches, including k-means, DBSCAN, and deep learning–based methods, applied to a multi-decadal atmospheric dataset and to the longest available reconstructed hourly sea-level records for the northern Adriatic Sea, specifically developed for this study},
KEYWORDS = {Machine learning, Clustering},
PAGES = {1},
URL = {https://iris.cnr.it/handle/20.500.14243/570943},
VOLUME = {(17357)},
CONFERENCE_NAME = {EGU General Assembly 2026},
BOOKTITLE = {Proceedings of the EGU General Assembly 2026},
}
@INPROCEEDINGS{PROVOST_2026_INPROCEEDINGS_PDMP_579341,
AUTHOR = {Provost, L. M. and Di Donato, F. and Mannocci, A. and Pecoraro, F.},
TITLE = {From Commitment to Practice: Implementing ARRA Commitment 2 in Career Progression Procedures at the National Research Council of Italy},
YEAR = {2026},
ABSTRACT = {The global transition toward responsible research assessment (RRA), formalized by the Agreement on Reforming Research Assessment (ARRA), emphasizes qualitative evaluation over quantitative metrics. Despite broad international support, a significant gap persists between high-level policy commitments and their practical implementation. This study examines the operationalization of ARRA Commitment 2—balancing qualitative judgment with the responsible use of indicators—within career progression procedures at the National Research Council of Italy (CNR). Following its 2022 signature of the ARRA, CNR launched four competitive calls in 2023 that introduced Narrative CVs and a framework focused on qualitative merit. Through a qualitative content analysis of 4,090 criteria defined by 90 evaluation committees, the research reveals a partial and uneven implementation of these principles. While research outputs are increasingly subject to qualitative assessment, mechanical scoring remains dominant for other contributions, such as teaching and evaluation. The findings highlight heterogeneous interpretations of qualitative assessment across disciplinary clusters and varying levels of guidance provided to committees. Ultimately, the study underscores the challenges of translating reform principles into consistent practice and encourages research organizations to "Evaluate your Evaluation" to better align assessment processes with career development goals},
KEYWORDS = {Coara, ARRA, CNR},
PAGES = {58-61},
URL = {https://ressh2026.igsg.cnr.it/},
DOI = {10.32091/RESSH2026},
ISBN = {9788890576485},
CONFERENCE_NAME = {RESSH 2026-Research Evaluation in the Social Sciences and Humanities Conference},
BOOKTITLE = {RESEARCH EVALUATION AND SCIENTIFIC AUTONOMY UNDER PRESSURE. Conference Proceedings},
}
@TECHREPORT{CARLINO_2026_TECHREPORT_C_571481,
AUTHOR = {Carlino, M.},
TITLE = {Analisi dei dati del profilo LinkedIn istituzionale di CNR-ILC relativi al periodo dicembre 2024-dicembre 2025},
YEAR = {2026},
ABSTRACT = {Analysis of CNR-ILC LinkedIn profile data for the period December 2024-December 2025},
KEYWORDS = {social media, analytics, LinkedIn, comunicazione, disseminazione},
PAGES = {1-28},
URL = {https://iris.cnr.it/handle/20.500.14243/571481},
}
@TECHREPORT{DELGRATTA_2026_TECHREPORT_DM_573024,
AUTHOR = {Del Gratta, R. and Mallia, M.},
TITLE = {Installing and configuring CLARIN-DSPACE 7},
YEAR = {2026},
ABSTRACT = {This work provides a comprehensive and systematic description of the installation, configuration, and deployment of the CLARIN-DSpace 7 platform, carried out in the context of upgrading the ILC4CLARIN repository to its latest version. CLARIN-DSpace 7 is a customized distribution of DSpace tailored to the needs of the European CLARIN infrastructure for managing language resources and technologies. The document presents a detailed technical guide covering the entire process, from system environment preparation to the configuration of core components, including the Spring Boot backend, Angular frontend, PostgreSQL database, Solr indexing engine, Tomcat application server, and Shibboleth-based federated authentication services. It also addresses key aspects such as SSL certificate management, Apache web server configuration, integration with AAI systems, and user interface customization. Particular attention is given to migration procedures from previous DSpace versions (5.x), highlighting challenges and solutions to ensure data integrity and service continuity. The work serves as a practical and replicable reference for the implementation of interoperable institutional repositories compliant with CLARIN standards and FAIR principles, supporting the management and dissemination of linguistic data and NLP tools in the scientific domain},
KEYWORDS = {DSpace 7, CLARIN, ILC4CLARIN, CLARIN-DSpace, Research Infrastructures, Repository Migration, Institutional Repository},
URL = {https://iris.cnr.it/handle/20.500.14243/573024},
}
@TECHREPORT{GIOVANNETTI_2026_TECHREPORT_GAMP_579246,
AUTHOR = {Giovannetti, E. and Albanesi, D. and Marchi, S. and Papini, M.},
TITLE = {Traduco: l'Applicazione Web Linguistico-Computazionale per il Progetto di Traduzione del Talmud Babilonese-Rapporto tecnico 29},
YEAR = {2026},
ABSTRACT = {La presente relazione tecnico-scientifica descrive l’attività svolta da CNR-ILC nel contesto del Progetto Traduzione Talmud Babilonese nel periodo novembre 2025-aprile 2026. Le principali attività tecniche svolte sul sistema Traduco attualmente in produzione hanno riguardato l’aggiornamento di alcune funzionalità. Inoltre, sul fronte della ricerca, è proseguito il lavoro di sperimentazione di approcci di supporto alla traduzione attraverso l’uso di Large Language Models},
KEYWORDS = {Lessici elettronici, rappresentazione della conoscenza, Linguistica Computazionale, traduzione di testi religiosi, traduzione assistita dal calcolatore, Large Language Models, Intelligenza Artificiale},
URL = {https://iris.cnr.it/handle/20.500.14243/579246},
}
@TECHREPORT{LUZIETTI_2026_TECHREPORT_LO_577981,
AUTHOR = {Luzietti, R. B. and Ottaviani, R.},
TITLE = {Il trattamento dei dati personali nella ricerca: evento di formazione H2IOSC ai giovani ricercatori del settore SSH},
YEAR = {2026},
ABSTRACT = {Rapporto Tecnico relativo agli output emergenti da una formazione a giovani ricercatori erogata nell'ambito del Progetto H2IOSC (PNRR IR)},
KEYWORDS = {IR, SSH, Data Management Plan, Dati personali nella ricerca},
URL = {https://iris.cnr.it/handle/20.500.14243/577981},
}
@MISC{BURGASSI_2026_MISC_BPR_580082,
AUTHOR = {Burgassi, C. and Papini, M. and Ricotta, V.},
TITLE = {Il VocaBO: Vocabolario di Boccaccio online. Teoria e prassi lessicografica digitale},
YEAR = {2026},
ABSTRACT = {La lezione presentata nel corso del seminario "Etimologia, lessicologia e lessicografia italiana: metodi, ricerche e progetti in corso" rivolto ai dottorandi dell'Università per Stranieri di Siena, analizza l'esperienza maturata nel corso del progetto VocaBO. Viene presentato il progetto con il suo ciclo di lavoro, nonché gli strumenti utilizzati al suo interno, con le relative scelte metodologiche},
KEYWORDS = {Boccaccio, Lessicografia digitale, Maia},
URL = {https://iris.cnr.it/handle/20.500.14243/580082},
}
@MISC{CALAMAI_2026_MISC_CNS_571521,
AUTHOR = {Calamai, S. and Nodari, R. and Soria, C.},
TITLE = {Linguistic Discrimination in Education: Linguistic Autobiographies of Secondary School Students in Italy},
YEAR = {2026},
ABSTRACT = {This archive contains linguistic autobiographies collected within the Erasmus CIRCE project (Counteracting accent dIscrimination pRactiCes in Education, grant agreement no. 2022-1-IT02-KA220-SCH-000087602). The autobiographies were collected in Italy and focus on personal experiences, reflections, and attitudes related to linguistic and accent-based discrimination in educational contexts and everyday life. The dataset consists of 56 written autobiographical texts produced in Italian by secondary school students between 2023 and 2025. Written informed consent forms are securely stored in the institutional archive of the CIRCE project at University of Siena and are available for verification by authorised bodies. The linguistic autobiographies have been anonymised and are primarily intended for educational and research use by secondary school teachers and students, as well as by university students and educators, particularly in the fields of language education, sociolinguistics, and teacher training},
KEYWORDS = {linguistic autobiographies, language attitudes, language diversity, multilingualism, sociolinguistics},
DOI = {10.5281/zenodo},
}
@MISC{CALAMAI_2026_MISC_CNS_571511,
AUTHOR = {Calamai, S. and Nodari, R. and Soria, C.},
TITLE = {CIRCE Accented Italian Speech Stimuli Corpus},
YEAR = {2026},
ABSTRACT = {This dataset contains a corpus of audio accented speech stimuli in Italian, developed within the CIRCE project for use in perceptual experiments on accent perception and discrimination. The corpus includes 25 recordings from both male and female speakers who are native speakers of Italian (L1) as well as speakers who acquired Italian as a second language (L2). 8 accents of Italian as L1 and 3 accents of Italian as L2 are represented. All speakers read the same standardized text; individual recordings have an approximate duration of 23 seconds and are organized by speakers’ linguistic background (L1/L2). The dataset is designed to support matched-guise and verbal-guise experiments, as well as research and educational activities addressing accent perception, linguistic diversity, and accent discrimination},
KEYWORDS = {accent discrimination, accent perception, speech stimuli, verbal guise test, sociolinguistics, perceptual sociophonetics},
DOI = {10.5281/zenodo},
}
@MISC{CALAMAI_2026_MISC_CNSC_571522,
AUTHOR = {Calamai, S. and Nodari, R. and Soria, C. and Carella, G.},
TITLE = {CIRCE Experimental Results on Italian and English Accent Perception},
YEAR = {2026},
ABSTRACT = {This dataset contains the results of perceptual experiments (verbal-guise) conducted within the CIRCE project to investigate accent perception and accent-based discrimination in Italy. The dataset includes anonymized experimental data collected from participants exposed to the CIRCE experimental speech stimuli. The data document participants’ evaluations and responses to different L1 and L2 accents of Italian and English and are organized according to the specific experimental settings used. No personally identifiable information is included. The dataset is intended to support transparency, replicability, and secondary analysis in educational and social research contexts and is part of the CIRCE Zenodo community},
KEYWORDS = {language attitudes, English varieties, Italian varieties, accents, sociolinguistics, sociophonetics, perceptual sociophonetics},
DOI = {10.5281/zenodo},
}
@MISC{CALAMAI_2026_MISC_CSAMFGCBD_571622,
AUTHOR = {Calamai, S. and Soria, C. and Angiolini, C. S. and Meer, P. and Fuchs, R. and Guerra, L. and Cavalheiro, L. and Brdarević Čeljo, A. and Dubravac, V.},
TITLE = {Ethical and Legal guidelines for research data management: The CIRCE Experience as a Transferable Model},
YEAR = {2026},
ABSTRACT = {This document presents the Ethical and Legal Guidelines for Research Data Management developed within the Erasmus CIRCE project (Counteracting accent dIscrimination pRactiCes in Education). Drawing on the concrete experience of an international research consortium involving multiple European countries and human participants in educational settings, the guidelines outline the measures adopted to ensure lawful, fair, and ethically sound data management in compliance with the EU General Data Protection Regulation (GDPR). While grounded in the specific practices of the CIRCE project, the guidelines are intentionally designed as a transferable and adaptable model for other research projects, particularly those involving international collaboration, fieldwork in schools, and the processing of personal and sensitive data},
KEYWORDS = {Research Data Management, Research Ethics, Data Protection and GDPR Compliance, International Collaborative Research, Accent Discrimination in Education},
DOI = {10.5281/zenodo},
}
@MISC{CARELLA_2026_MISC_CGSC_571523,
AUTHOR = {Carella, G. and Galilei, G. and Soria, C. and Calamai, S.},
TITLE = {Linguistic Discrimination in Education: Audio Interviews with Secondary School Students and Teachers in Italy},
YEAR = {2026},
ABSTRACT = {This archive contains audio-recorded interviews collected within the Erasmus CIRCE project (Counteracting accent dIscrimination pRactiCes in Education, grant agreement no. 2022-1-IT02-KA220-SCH-000087602). The interviews were conducted in Italy between February and October 2024 and focus on experiences and perceptions of linguistic and accent-based discrimination in secondary education and everyday life. The dataset includes 20 interviews in total: 10 interviews with secondary school students and 10 interviews with teachers. Written informed consent forms are securely stored in the institutional archive of the CIRCE project at the University of Siena, Italy, and are available for verification by authorized bodies. The recordings are primarily intended for educational and research use by secondary school teachers and students, as well as by university students and educators, particularly in the fields of language education, sociolinguistics, and teacher training},
KEYWORDS = {linguistic discrimination, accent discrimination, interview, sociolinguistics, language diversity, multilingualism},
DOI = {10.5281/zenodo},
}
@MISC{DATTILO_2026_MISC_DGPS_572202,
  AUTHOR   = {Dattilo, D. and Giovannetti, E. and Papini, M. and Saponaro, D.},
  TITLE    = {Traduzione e intelligenza artificiale. Il software TRADUCO},
  YEAR     = {2026},
  ABSTRACT = {La lezione per il Dottorato in Studi di Traduzione dell’Università per Stranieri di Siena analizza l'esperienza metodologica e tecnologica maturata nell'ambito del Progetto Talmud. L'intervento non si limiterà all'analisi dell'attività traduttiva e filologica, ma approfondirà l'architettura degli strumenti informatici sviluppati ad hoc per supportare il lavoro collaborativo. Particolare attenzione sarà dedicata alle recenti integrazioni di Intelligenza Artificiale, analizzando come l'approccio computazionale possa coadiuvare la traduzione di testi caratterizzati da elevata complessità linguistica e stratificazione interpretativa},
  KEYWORDS = {Babylonian Talmud, Computer Assisted Translation, Large Language Models, Artificial Intelligence},
  URL      = {https://iris.cnr.it/handle/20.500.14243/572202},
}
@MISC{IACHELLO_2026_MISC_ISPMDC_576623,
AUTHOR = {Iachello, S. and Spinelli, F. and Pedonese, G. and Melaccio, D. and Degl'Innocenti, E. and Colautti, V.},
TITLE = {H2IOSC Booklet: Strengthening Research Infrastructures Consolidating the Federation},
YEAR = {2026},
ABSTRACT = {This booklet presents the H2IOSC (Humanities and Cultural Heritage Italian Open Science Cloud) initiative, focusing on its role in strengthening research infrastructures and consolidating a national federation within the Social Sciences and Humanities domain. Coordinated by the Italian National Research Council (CNR), H2IOSC brings together leading European Research Infrastructures to create an integrated, collaborative ecosystem for digital research. By federating distributed resources, services, and expertise, H2IOSC enhances the accessibility, interoperability, and sustainability of research infrastructures, enabling coordinated access to tools, datasets, and advanced technologies. The booklet illustrates how this federated approach supports diverse user communities—including researchers, cultural institutions, and industry stakeholders—through a unified entry point and a comprehensive portfolio of digital, enabling, and training services. Particular attention is given to the processes that underpin infrastructure strengthening, including service validation, technological maturity assessment, and user-driven evaluation activities. These mechanisms contribute to improving service quality, aligning technological development with user needs, and ensuring long-term impact. The publication also outlines the Cluster’s strategic vision for consolidating the federation, expanding its user base, and fostering partnerships across research, culture, and the private sector, reinforcing its role within the European Open Science ecosystem},
KEYWORDS = {Humanities and Cultural Heritage, Social Sciences and Humanities (SSH), Research Infrastructures, Open Science Cloud},
PAGES = {8},
URL = {https://doi.org/10.5281/zenodo.19628513},
DOI = {10.5281/zenodo.19628512},
}
@ARTICLE{ALZETTA_2025_ARTICLE_AMDVM_570443,
AUTHOR = {Alzetta, C. and Miaschi, A. and Dell'Orletta, F. and Venturi, G. and Montemagni, S.},
TITLE = {Parallel Trees: a novel resource with aligned dependency and constituency syntactic representations},
YEAR = {2025},
ABSTRACT = {The paper introduces Parallel Trees, a novel multilingual treebank collection that includes 20 treebanks for 10 languages. The distinguishing property of this resource is that the sentences of each language are annotated using two syntactic representation paradigms (SRPs), respectively based on the notions of dependency and constituency. By aligning the annotations of existing resources, Parallel Trees represents an example of exploiting pre-existing treebanks to adapt them to novel applications. To illustrate its potential, we present a case study where the resource is employed as a benchmark to investigate whether and how BERT, one of the first prominent neural language models (NLMs), is sensitive to the dependency- and constituency-based approaches for representing the syntactic structure of a sentence. The case study results indicate that the model's sensitivity fluctuates across languages and experimental settings. The unique nature of the Parallel Trees resource creates the prerequisites for innovative studies comparing dependency and phrase-structure trees, allowing for more focused investigations without the interference of lexical variation},
KEYWORDS = {Parallel treebanks, Syntactic representation, Diagnostic probing paradigm, Neural language model},
PAGES = {3445--3485},
URL = {https://iris.cnr.it/handle/20.500.14243/570443},
VOLUME = {59},
NUMBER = {4},
DOI = {10.1007/s10579-025-09826-3},
ISSN = {1574-020X},
JOURNAL = {LANGUAGE RESOURCES AND EVALUATION},
}
@ARTICLE{ALZETTA_2025_ARTICLE_AT_545881,
AUTHOR = {Alzetta, C. and Torre, I.},
TITLE = {Prerequisite Relations Annotation Tool: Annotation and analysis of educational relations in texts},
YEAR = {2025},
ABSTRACT = {Relations between terms in texts have long been studied in linguistics and specialized knowledge domains, especially when occurring in educational materials like textbooks, where they play a crucial role in guiding instructional design and learning. Prerequisite relations (PR), which determine the sequence of presentation of domain terms, are particularly crucial for effective learning. Therefore, the authors consider them carefully when writing instructional texts. The reverse process of identifying PR within texts aims to extract the inherent knowledge structure they are based on and is a key task in the field of corpora annotation for educational knowledge modeling. Although there are tools for manual annotation, there is a need for specialized tools tailored to the unique properties of PR, enabling easy creation, analysis, and sharing of annotated datasets. In this paper, we introduce Prerequisite Relations Annotation Tool (PRAT), a novel tool designed for annotating PR based on a validated protocol. PRAT simplifies the process of capturing, analyzing, and visualizing prerequisite structures in educational texts. We outline PRAT's architecture and functionalities, emphasizing its unique features compared to existing corpora annotation tools. Through a user study involving users with diverse backgrounds, we show PRAT's effectiveness in real-world scenarios},
KEYWORDS = {Annotation, Annotation Tool, Prerequisite Relations, User Evaluation, Usability},
PAGES = {1--22},
URL = {https://asistdl.onlinelibrary.wiley.com/doi/10.1002/asi.24992?af=R},
DOI = {10.1002/asi.24992},
ISSN = {2330-1643},
JOURNAL = {JOURNAL OF THE ASSOCIATION FOR INFORMATION SCIENCE AND TECHNOLOGY},
}
@ARTICLE{BANDINI_2025_ARTICLE_BQ_557403,
AUTHOR = {Bandini, M. and Quochi, V.},
TITLE = {A Systematic Literature Review on the Representation of Texts as Linguistic Linked Open Data},
YEAR = {2025},
ABSTRACT = {Despite the growing interest in publishing linguistic data as Linked Open Data (LOD), the representation of ancient language corpora within the Semantic Web remains challenging. While LOD principles have been successfully applied to linguistic resources such as dictionaries, lexicons, and terminologies, their use for textual corpora — particularly those related to ancient languages — is still limited. Through a systematic literature review, we investigate how textual data has been represented as Linguistic Linked Open Data (LLOD), evaluating the potential and limitations of existing approaches and methodologies for enhancing data integration and interoperability in the Digital Humanities. This systematic literature review follows a rigorous methodology encompassing literature identification, screening for inclusion, and quality assessment. By classifying and analysing relevant studies, we provide a comprehensive overview of current practices and offer insights into their benefits and limitations},
KEYWORDS = {Ancient languages, Ancient texts, DigitAnt, Linguistic Linked Open Data, Semantic Web, Systematic literature review},
PAGES = {289--315},
URL = {http://doi.org/10.6092/issn.2532-8816/21195},
VOLUME = {2025},
NUMBER = {20},
DOI = {10.6092/issn.2532-8816/21195},
ISSN = {2532-8816},
JOURNAL = {UMANISTICA DIGITALE},
}
@ARTICLE{BELLANDI_2025_ARTICLE_B_570747,
AUTHOR = {Bellandi, A.},
TITLE = {Lexicographic Resources in the Semantic Web: Models, Tools, and Case Studies},
YEAR = {2025},
ABSTRACT = {Dictionaries are essential tools for documenting and transmitting the linguistic and cultural heritage of a society. With the advent of Semantic Web technologies and the Linked Data paradigm, digital lexicography has undergone a significant transformation, evolving from the mere digitization of printed dictionaries to more advanced forms of linguistic data representation and interconnection. Within this context, the Lexicography Module (Lexicog) emerges as a data model developed by the W3C OntoLex community group, designed to support the modeling of interoperable lexicographic resources in accordance with the FAIR principles. This paper provides a review of the Lexicog model, assessing its suitability for the practical needs of lexicographers in dictionary compilation and demonstrating its application through three real-world case studies involving different types of dictionaries. Furthermore, it presents a suite of open-source software tools developed to facilitate the construction and use of computational dictionaries. The goal is to promote open, sustainable digital lexicographic practices aligned with Semantic Web standards},
KEYWORDS = {E-Lexicography, Dictionary, Linguistic Resources, Linguistic Linked Data, Lexicog, LexO-server},
PAGES = {107--140},
URL = {https://umanisticadigitale.unibo.it/article/download/22199/20177/99682},
VOLUME = {21},
DOI = {10.60923/issn.2532-8816/22199},
ISSN = {2532-8816},
JOURNAL = {UMANISTICA DIGITALE},
}
@ARTICLE{BELLANDI_2025_ARTICLE_BMP_570843,
AUTHOR = {Bellandi, A. and Masbah, A. and Piccini, S.},
TITLE = {DEC Facile: Bringing Combinatory Explanatory Dictionaries to the Semantic Web},
YEAR = {2025},
ABSTRACT = {This paper presents DEC Facile, a tool specifically developed for the construction of computational Explanatory Combinatorial Dictionaries (ECDs). Unlike existing dictionary editors, DEC Facile combines the theoretical rigor of Explanatory Combinatorial Lexicology with Semantic Web standards, being powered by LexO-server and extended with Ontolex-Lemon modules. By natively integrating Linked Data principles, it ensures that lexical and terminology resources are interoperable, reusable, and easily connected to other datasets. The platform provides a user-friendly interface supporting core lexicographic and terminological tasks such as dictionary search, sense editing, and the encoding of lexical functions. DEC Facile thus represents a novel environment for lexicography, terminography, and computational linguistics, bridging the gap between ECL-based resources and the Semantic Web ecosystem. The system is currently being applied within the PRIN project Old Words for a New World. Translating Christianity to Baltic Pagans, where it supports the construction of an ECD for the earliest Baltic catechisms (Old Lithuanian, Old Latvian and Old Prussian)},
KEYWORDS = {Explanatory Combinatorial Dictionary, Ontolex-Lemon, Semantic Web, Linked Data},
PAGES = {81--98},
VOLUME = {1},
NUMBER = {2},
DOI = {10.25430/pupj},
JOURNAL = {JOURNAL OF DIGITAL TERMINOLOGY AND LEXICOGRAPHY},
}
@ARTICLE{BOLOGNESI_2025_ARTICLE_BCCFC_552644,
AUTHOR = {Bolognesi, C. and Cinini, A. and Cutugno, P. and Ferretti, M. and Chiarella, D.},
TITLE = {Towards a preschooler corpus of Italian: an experimental journey},
YEAR = {2025},
ABSTRACT = {The paper surveys the process and reasonings behind the written sources section of the Corpus of Italian for Preschoolers (CIP), a corpus collecting child-directed speech targeted at Italian children aged 3–6. Beginning from an overview of the available child-speech and child-directed speech corpora, the article underlines the need for an Italian Corpus focusing on children's passive vocabulary and how such a tool would be useful for future comparative studies on children's own production and as a tool for professionals in children's needs. The CIP aims at collecting 250,000 linguistic tokens across a selection of different sources (Written, Spoken, Signed) gathered with the help of schools and families. This paper focuses specifically on the selection criteria for the written sources and the first steps of their linguistic processing, explaining through a set of three experiments how three different linguistic annotation tools performed on the tasks of tokenizing, lemmatizing and POS-tagging three different children's literature texts. The last part presents the results of the experiments with insight on the NLP tools’ performances, as well as the reasons for our choice of tool for the large-scale annotation process and the still-ongoing challenges for the finalization of our corpus},
KEYWORDS = {Child-directed speech, Children's literature, Corpus linguistics, Natural language processing, Preschool children language acquisition, Written Italian},
URL = {https://www.sciencedirect.com/science/article/pii/S2772766125000734},
VOLUME = {4},
NUMBER = {3},
DOI = {10.1016/j.rmal.2025.100252},
ISSN = {2772-7661},
JOURNAL = {RESEARCH METHODS IN APPLIED LINGUISTICS},
}
@ARTICLE{BONFIGLI_2025_ARTICLE_BBPMD_570501,
AUTHOR = {Bonfigli, A. and Bacco, L. and Pecchia, L. and Merone, M. and Dell'Orletta, F.},
TITLE = {Efficient multi-task learning with instance selection for biomedical NLP},
YEAR = {2025},
ABSTRACT = {Background: Biomedical natural language processing (NLP) increasingly relies on large language models and extensive datasets, presenting significant computational challenges. Methods: We propose Blue5, a multi-task model based on SciFive that incorporates instance selection (IS) to enable efficient, multi-task learning (MTL) on biomedical data. We adapt the E2SC-IS framework for the biomedical domain, integrating a calibrated SVM classifier to reduce computational costs. Results: Our approach achieves an average data reduction of 26.6\% across the several tasks of the BLUE (Biomedical Language Understanding Evaluation) Benchmark, while maintaining performance comparable with state-of-the-art models. The multi-task SVM configuration emerges as the most effective, demonstrating the power of combining IS with MTL for biomedical NLP. As a result of the unified framework, Blue5 effectively selects the most informative instances across tasks, ensuring model generalization while efficiently handling multiple NLP tasks. Conclusion: Our work offers a practical solution to address growing computational demands, enabling more scalable and accessible applications of advanced NLP techniques in biomedical research and healthcare},
KEYWORDS = {Biomedical NLP, BLUE benchmark, Computational efficiency, Instance selection, Multi-task learning},
URL = {https://iris.cnr.it/handle/20.500.14243/570501},
VOLUME = {190},
DOI = {10.1016/j.compbiomed.2025.110050},
ISSN = {0010-4825},
JOURNAL = {COMPUTERS IN BIOLOGY AND MEDICINE},
}
@ARTICLE{BURGASSI_2025_ARTICLE_B_572712,
AUTHOR = {Burgassi, C.},
TITLE = {‘Leggere’ nel Decameron},
YEAR = {2025},
ABSTRACT = {Il contributo è dedicato all'uso delle parole afferenti alla famiglia lessicale di leggere nel Decameron di Giovanni Boccaccio, nel quadro del progetto di lessicografia digitale VocaBo (Vocabolario di Giovanni Boccaccio Online)},
KEYWORDS = {Giovanni Boccaccio, Decameron, lessicografia digitale, leggere},
PAGES = {113--118},
VOLUME = {SPECIALE GIOVANNI BOCCACCIO},
JOURNAL = {BIBLIOTECA DI VIA SENATO, MILANO},
}
@ARTICLE{CRISTOFARO_2025_ARTICLE_CDMSS_518038,
AUTHOR = {Cristofaro, S. and Del Grosso, A. M. and Mazzagufo, L. and Sichera, P. and Spampinato, D.},
TITLE = {Implementing Collaborative Digital Scholarly Editions: Insights from Bellini Digital Correspondence},
YEAR = {2025},
ABSTRACT = {Digital Correspondence project. Specifically, it outlines the activities aimed at improving the harmonization process, regarding the production of collaborative digital scholarly editions. The study proposes a preliminary semantic approach to the harmonization process, exploiting an ontology-based mapping perspective. The article also illustrates the functionalities and practicalities of the NormaTEI tool, designed to streamline harmonization processes within the Bellini Digital Correspondence project and applicable to similar initiatives},
KEYWORDS = {Cooperative Digital Scholarly Edition, Schema matching, Harmonization, NormaTEI, Bellini Digital Correspondence},
PAGES = {42--53},
URL = {https://www.innove.org/ijist/index.php/ijist/article/view/297},
VOLUME = {9},
NUMBER = {1},
DOI = {10.57675/IMIST.PRSM/ijist-v9i1.297},
ISSN = {2550-5114},
JOURNAL = {INTERNATIONAL JOURNAL OF INFORMATION SCIENCE AND TECHNOLOGY},
}
@ARTICLE{DANKOVA_2025_ARTICLE_DFKM_579261,
AUTHOR = {Dankova, K. and Frontini, F. and Khan, A. F. and Monachini, M.},
TITLE = {La représentation et la diffusion des données terminologiques plurilingues: la collection REALITER – OTPL (CLARIN-IT)},
YEAR = {2025},
ABSTRACT = {In today’s increasingly interconnected world, plurilingual and pluricultural competences are essential for participation in economic, scientific, and cultural exchanges. In this context, the creation and dissemination of plurilingual terminological resources play an important role in ensuring clear and effective communication in scientific and professional fields. The Pan-Latin Terminology Network REALITER recognizes the benefits of plurilingual communication in specialized domains and therefore carries out activities aimed at promoting linguistic diversity in the area of Romance languages. Since its creation (1993), several plurilingual lexicons covering a wide range of sectors, such as the environment, digital technologies, education, and fashion, have been produced. Thanks to the collaboration between CLARIN-IT (the Italian national node of CLARIN ERIC, the European infrastructure for language resources and technologies) and OTPL (Osservatorio di Terminologie e Politiche Linguistiche, Università Cattolica del Sacro Cuore, Milan), these terminological data are indexed in the REALITER – OTPL collection and published on the ILC4CLARIN-SKOSMOS Service platform. After presenting the REALITER projects, with particular attention to terminological variation and cultural aspects, the paper aims to describe the methodological choices made for the representation and dissemination of these plurilingual lexicons in compliance with FAIR principles. This will highlight the crucial role of infrastructures such as CLARIN ERIC in supporting the representation, sharing, and preservation of this rich linguistic and cultural heritage},
KEYWORDS = {plurilingualism, lexicon, terminological variation, FAIR principles, infrastructure, plurilinguisme, lexique, variation terminologique, principes FAIR, infrastructure},
PAGES = {209--236},
URL = {https://id.erudit.org/iderudit/1124416ar},
VOLUME = {XXXVIII},
NUMBER = {2},
DOI = {10.7202/1124416ar},
JOURNAL = {TTR},
}
@ARTICLE{DELGRATTA_2025_ARTICLE_DZDB_560703,
AUTHOR = {Del Gratta, R. and Zenzaro, S. and Del Grosso, A. M. and Boschetti, F.},
TITLE = {Category theory, Document Analysis, and Philological Operations. A formal approach: limitations, and challenges},
YEAR = {2025},
ABSTRACT = {Starting with a formal definition of the process of scholarly editing, we further formalize it by exploiting Category Theory. We then apply this formal model to automated Natural Language Processing tools, highlighting the parallelism between composition and associativity and linguistic tool pipelines. We then discuss the notion of interoperability between tools},
KEYWORDS = {Interoperability, NLP, Linguistic and philological operations, Category Theory, Formal Models},
PAGES = {11--20},
URL = {https://www.innove.org/ijist/index.php/ijist/article/view/288/217},
VOLUME = {9},
NUMBER = {1},
ISSN = {2550-5114},
JOURNAL = {INTERNATIONAL JOURNAL OF INFORMATION SCIENCE AND TECHNOLOGY},
}
@ARTICLE{DELGROSSO_2025_ARTICLE_DS_571201,
AUTHOR = {Del Grosso, A. M. and Siciliano, A.},
TITLE = {“Voce dei Margini”: le postille di Giorgio Bassani in un’edizione scientifica digitale},
YEAR = {2025},
ABSTRACT = {L’articolo presenta il lavoro di edizione scientifica digitale che è in corso di svolgimento sulle postille di Giorgio Bassani ai libri della sua biblioteca personale. Dopo aver esposto le ragioni per cui l’edizione digitale rappresenta la soluzione più adatta a rappresentare la complessa e strutturata testualità della postilla, si illustrano i criteri adottati nella codifica XML-TEI delle postille di Bassani al volume La scuola dell’uomo di Guido Calogero, centrale nella sua formazione umana e culturale. Infine, si descrivono le funzionalità di fruizione implementate dall’applicazione web tramite l’utilizzo del framework HTML templating della piattaforma eXist-db},
KEYWORDS = {XML-TEI, marginalia, Giorgio Bassani, eXist-db, digital archives, XML-TEI, postille, Giorgio Bassani, eXist-db, archivi digitali},
PAGES = {125--152},
URL = {https://edizioni.libreriauniversitaria.it/libro/limina-intorno-al-testo-2025-i/},
VOLUME = {2},
NUMBER = {1},
JOURNAL = {LIMINA},
}
@ARTICLE{DELGROSSO_2025_ARTICLE_DZBR_571221,
AUTHOR = {Del Grosso, A. M. and Zenzaro, S. and Boschetti, F. and Ranocchia, G.},
TITLE = {Co-designing Digital Papyrology},
YEAR = {2025},
ABSTRACT = {Traditional papyrology has established effective methods for producing diplomatic editions of papyri and publishing critical editions of their textual content. Digital papyrology strives to bridge the gap with the digital age. Achieving the balance between familiarity for traditional scholars and the potential for computational analysis remains a challenge. This paper proposes an innovative co-design approach for developing digital papyrology tools, leveraging both Domain-Driven Design (DDD) and Domain-Specific Languages (DSLs). DDD emphasizes a collaborative understanding of the problem domain, while DSLs are formal languages tailored to specific domains like papyrology. The co-design process involves close collaboration with a team of papyrologists, philologists, linguists, and other humanities scholars. This ensures that the resulting tools are user-friendly and cater to the needs of traditional scholars. DSLs encode domain-specific knowledge, facilitating the creation of machine-actionable Digital Scholarly Editions (DSEs) that remain user-friendly. CophiEditor, a modular web environment designed within a micro-services architecture, implements the complete workflow for creating DSL-based DSEs. The co-design approach, the DSL definition, and the DDD paradigm guarantee that CophiEditor is familiar and produces interoperable and extensible data. The development of CophiEditor, within the ERC GreekSchools project, showcases the potential of this approach. It offers greater accessibility of digital tools for traditional philologists and opens doors for new possibilities in computational analysis of ancient texts},
KEYWORDS = {Computational Philology, Digital Humanities, Digital Papyrology, Digital Scholarly Editing, TEI/EpiDoc},
PAGES = {31--41},
URL = {https://www.innove.org/ijist/index.php/ijist/article/view/294},
VOLUME = {9},
NUMBER = {1},
ISSN = {2550-5114},
JOURNAL = {INTERNATIONAL JOURNAL OF INFORMATION SCIENCE AND TECHNOLOGY},
}
@ARTICLE{DIDONATO_2025_ARTICLE_DP_545335,
AUTHOR = {Di Donato, F. and Provost, L.},
TITLE = {Why isn’t FAIR enough? Bringing together methods and values for Open Science uptake},
YEAR = {2025},
ABSTRACT = {The FAIR principles have emerged as a global standard for Research Data Management but their application has not had the expected impact, especially considering the considerable amount of funding which has been put into FAIR policies. In fact, open research methods have not become the norm, FAIR is still perceived as just another mechanical task for researchers, and quality is still not ensured by the application of the principles. The CARE principles were proposed to complement the FAIR framework, arguing that people and purpose, rather than data and technology, should be at the centre of RDM frameworks. In practice, they have been applied in certain contexts, which we will examine, but their impact has been rather limited. In this article, we will therefore analyse the definition of the Open Science values and principles provided in the UNESCO Recommendation. By doing so, we aim to see if they overlap with the CARE values and principles, and to understand if the latter are useful, and for what. Finally, we note that the UNESCO definition of Open Science already encompasses the values and principles of CARE, while also being broader and more comprehensive. The implementation and practical translation of the FAIR principles into research practices must address an underlying cultural challenge, and this is where the CARE principles can provide meaningful insight, emphasising the importance of starting with context, communities, and their genuine needs. However, these principles are not indispensable, as these considerations are already embedded within the UNESCO Recommendation and, by extension, within the definition of Open Science itself—an ecosystem of practices in which Research Data Management is a foundational pillar},
KEYWORDS = {FAIR principles, CARE principles, Open Science, Research Data Management, Research on Research},
PAGES = {17--46},
URL = {https://umanisticadigitale.unibo.it/article/view/20976},
VOLUME = {19},
ISSN = {2532-8816},
JOURNAL = {UMANISTICA DIGITALE},
}
@ARTICLE{DIGIOVANNANTONIO_2025_ARTICLE_DP_572163,
AUTHOR = {Di Giovannantonio, S. and Papini, M.},
TITLE = {Il VocaBO-Vocabolario di Boccaccio online. Questioni di metodo tra lessicografia e annotazione digitale},
YEAR = {2025},
ABSTRACT = {The Vocabolario di Boccaccio Online (VocaBO) is the first native digital repertory entirely dedicated to the lexicon of the Certaldese. In line with the latest philological findings, this contribution first presents the text adopted for lexical indexing. Secondly, within the scope of domestic architecture and furnishings, it discusses several lemmatization issues related to linguistic traits characteristic of Decameron prose. The second part of the contribution is dedicated to demonstrating the impact of the two tools that constitute the digital core of the project: Maia, a platform that supports the drafting of entries and text annotation, and the tool through which users can access the vocabulary as it is compiled, as well as the annotated corpus itself},
KEYWORDS = {Boccaccio, Decameron, digital lexicography, text annotation, lexical linking, Boccaccio, Decameron, Lessicografia Digitale, annotazione testuale, lexical linking},
PAGES = {63--73},
URL = {https://www.ellisseonline.net/xx-2-2025/},
DOI = {10.48255/2240-9688.LELLIS.20.II.2025.04},
ISSN = {1826-0187},
JOURNAL = {L’ELLISSE},
}
@ARTICLE{DINI_2025_ARTICLE_DMBD_570447,
AUTHOR = {Dini, L. and Moroni, L. and Brunato, D. and Dell'Orletta, F.},
TITLE = {In the eyes of a language model: A comprehensive examination through eye-tracking data},
YEAR = {2025},
ABSTRACT = {Cognitive signals, particularly eye-tracking data, offer a unique lens for understanding human sentence processing. Leveraging eye-gaze data from the English and Italian section of the Multilingual Eye-Movement Corpus (MECO), we designed a series of experiments aiming at exploring whether pre-trained neural language models (NLMs) encode patterns representative of human reading behavior and if directly incorporating this information through a fine-tuning process influences the cognitive plausibility of the model. Additionally, we sought to determine if such an impact persists through a downstream task. Our findings reveal that transformers encode eye-gaze-related information during pretraining and that explicitly integrating eye-tracking features increases model alignment with human attention. When investigating the effect of intermediate fine-tuning on eye-tracking data on the model's performance on a downstream task, we observe that this intermediate step does not result in catastrophic forgetting, despite the very different nature of the considered downstream task. In addition, the attention mechanism of models undergoing intermediate fine-tuning remains closely aligned with human attention. In conclusion, our comprehensive evaluation of NLMs informed by human attention patterns offers great potential for advancing the growing field of eXplainable Artificial Intelligence (XAI). Grounding language models in real-world cognitive processes enables the creation of systems that not only replicate human language output but also align with the cognitive mechanisms behind reading and comprehension. This alignment with human behavior enhances model adaptability, interpretability, and effectiveness, fostering more human-centric, transparent, and reliable AI applications across various domains},
KEYWORDS = {Cognitive plausibility, Eye-tracking, Interpretability, Neural attention, Neural Language Models},
URL = {https://iris.cnr.it/handle/20.500.14243/570447},
VOLUME = {650},
DOI = {10.1016/j.neucom.2025.130617},
ISSN = {0925-2312},
JOURNAL = {NEUROCOMPUTING},
}
@ARTICLE{DOLCIOTTI_2025_ARTICLE_DRGTMMD_544166,
AUTHOR = {Dolciotti, C. and Righi, M. and Grecu, E. and Trucas, M. and Maxia, C. and Murtas, D. and Diana, A.},
TITLE = {The translational power of Alzheimer's-based organoid models in personalized medicine: an integrated biological and digital approach embodying patient clinical history},
YEAR = {2025},
ABSTRACT = {Alzheimer’s disease (AD) is a complex neurodegenerative condition characterized by a multifaceted interplay of genetic, environmental, and pathological factors. Traditional diagnostic and research methods, including neuropsychological assessments, imaging, and cerebrospinal fluid (CSF) biomarkers, have advanced our understanding but remain limited by late-stage detection and challenges in modeling disease progression. The emergence of three-dimensional (3D) brain organoids (BOs) offers a transformative platform for bridging these gaps. BOs derived from patient-specific induced pluripotent stem cells (iPSCs) mimic the structural and functional complexities of the human brain. This advancement offers an alternative or complementary approach for studying AD pathology, including β-amyloid and tau protein aggregation, neuroinflammation, and aging processes. By integrating biological complexity with cutting-edge technological tools such as organ-on-a-chip systems, microelectrode arrays, and artificial intelligence-driven digital twins (DTs), it is hoped that BOs will facilitate real-time modeling of AD progression and response to interventions. These models capture central nervous system biomarkers and establish correlations with peripheral markers, fostering a holistic understanding of disease mechanisms. Furthermore, BOs provide a scalable and ethically sound alternative to animal models, advancing drug discovery and personalized therapeutic strategies. The convergence of BOs and DTs potentially represents a significant shift in AD research, enhancing predictive and preventive capacities through precise in vitro simulations of individual disease trajectories. This approach underscores the potential for personalized medicine, reducing the reliance on invasive diagnostics while promoting early intervention. As research progresses, integrating sporadic and familial AD models within this framework promises to refine our understanding of disease heterogeneity and drive innovations in treatment and care},
KEYWORDS = {Alzheimer’s disease, neurodegeneration, personalized medicine, brain organoids, early diagnosis biomarker, neuroinflammation, digital twins},
URL = {https://www.frontiersin.org/journals/cellular-neuroscience/articles/10.3389/fncel.2025.1553642/abstract},
VOLUME = {19},
DOI = {10.3389/fncel.2025.1553642},
ISSN = {1662-5102},
JOURNAL = {FRONTIERS IN CELLULAR NEUROSCIENCE},
}
@ARTICLE{DOOWY_2025_ARTICLE_DS_571028,
AUTHOR = {Dołowy, N. and Soria, C.},
TITLE = {Contested Languages and Perception of Multilingualism: A Sociolinguistic Study of {Poland} and {Italy}},
YEAR = {2025},
ABSTRACT = {Most European states, including Poland and Italy, have diverse linguistic composition, yet only a fraction of their language varieties receive official recognition and support. While the EU promotes linguistic diversity, unrecognised forms – such as immigrant languages, some minority languages, and dialects – often lack protection and public awareness. This study, framed within folk linguistics, examines perceptions of multilingualism in Poland and Italy through an online questionnaire. By analysing how respondents classify and name language varieties such as ‘dialects’ and ‘minority languages’, we assess the impact of official recognition on social perception. Our findings reveal that ‘contested languages’ contribute to the perceived multilingualism of Poland and Italy and explore how lack of recognition may lead to marginalisation, reducing chances for legal protection and support. Understanding these perceptions helps sociolinguists and policymakers grasp dominant language ideologies and their implications for language planning},
KEYWORDS = {multilingualism, folk linguistics, dialects, minority languages, contested languages, Poland, Italy},
NUMBER = {25},
DOI = {10.11649/cs},
JOURNAL = {COGNITIVE STUDIES},
}
@ARTICLE{KHLIF_2025_ARTICLE_KMN_563230,
AUTHOR = {Khlif, N. and Mazroui, A. and Nahli, O.},
TITLE = {Enhancing {Arabic} Dialect Analysis: Introducing {DiMorph} for {Darija}},
YEAR = {2025},
ABSTRACT = {While Modern Standard Arabic (MSA) is well-studied, dialectal Arabic texts, such as Moroccan dialect (Darija), pose unique challenges due to their informal structure and lack of a standardized grammar. In this paper, we provide an in-depth study of Darija detailing its morphological and syntactic features, and we introduce DiMorph (Dialectal Morphological Analyzer), a specialized morphological engine, which is designed to address these complexities automatically. In detail, we focus on DiMorph’s multi-phase approach, involving both pre- and post-processing phases. Such approach effectively manages dialectal variability and achieves high accuracy in token recognition and analysis, particularly in social media contexts. Finally, we underscore the importance of developing tools that respect the linguistic diversity of Arabic dialects, laying a strong foundation for advanced computational research in Arabic dialectology},
KEYWORDS = {DiMorph, Moroccan dialect, morphological analyzer},
PAGES = {363--390},
URL = {https://iris.cnr.it/handle/20.500.14243/563230},
VOLUME = {24},
NUMBER = {2},
DOI = {10.1418/116951},
ISSN = {1720-9331},
JOURNAL = {LINGUE E LINGUAGGIO},
}
@ARTICLE{LAMELI_2025_ARTICLE_LMN_571148,
AUTHOR = {Lameli, A. and Montemagni, S. and Nerbonne, J.},
TITLE = {Dialectal Dynamics—An Introduction},
YEAR = {2025},
ABSTRACT = {The study of dialects leads very naturally to the study of their geographic distribution and the nature of the distribution, e. g., by examining whether the distribution is based simply on geographic distance or on relatively distinct dialect regions. Dialectal dynamics poses the further question of why the distribution takes the form it does. Does variation arise through migration, i. e., due to the relative lack of communication among people who live far from one another? Sociolinguists have shown convincingly that variation is often employed to indicate identification with others, leading to the adoption of speech habits and changes in the distribution of variation. Purely linguistic processes may push some varieties toward change while others are more resistant, and contact with other languages and dialects, including particularly standard languages, almost inevitably results in changes. This volume examines studies in the area of dialectal dynamics, including studies focused on methods that promise to illuminate this complex field},
KEYWORDS = {dialectology, dialectometry, language change, language contact, historical linguistics},
PAGES = {15},
URL = {https://www.mdpi.com/2226-471X/10/10/265},
VOLUME = {10},
NUMBER = {10},
DOI = {10.3390/languages10100265},
ISSN = {2226-471X},
JOURNAL = {LANGUAGES},
}
@ARTICLE{LOMI_2025_ARTICLE_LGDDDB_568861,
AUTHOR = {Lomi, M. and Geraci, F. and Del Seppia, C. and Dolciotti, C. and Del Carratore, M. R. and Bongioanni, P.},
TITLE = {Biomarkers profile in peripheral blood cells related to {Alzheimer's} disease},
YEAR = {2025},
ABSTRACT = {In a healthy brain, neuroinflammation, controlled by the main intermediary for the immune response microglia and astrocytes, contributes to maintain physiological functions such as secretion of neurotrophic factors, removal of cell tau and amyloid-β (Aβ) debris and local homeostasis. When the immune response becomes chronic, it can become pathological and fuel neuroinflammation, causing glial cells to malfunction and not perform their function of clearing debris, resulting in further damage to neurons. Multiple studies highlight that an intense crosstalk is activated between peripheral blood white cells (PBWC) and central nervous system (CNS). Nevertheless, how PBWC can be carriers of biomarkers of the CNS neuropathological states it is still far to be completely known. In this work we aimed to observe how PBWC content could be related to moderate-severity of DAT in order to have early signals from of pathological neurodegeneration brain initiate. Protein analysis have been performed in PBWC of Mild Cognitive Impairment (MCI) and DAT patients respect to those of healthy controls and differently expressed proteins have been investigated. Our data showed a deregulation of pathways involved in neurodegeneration since from MCI level and deregulated proteins that can be considered markers for DAT onset and progression},
KEYWORDS = {PBWC, biomarkers, proteomic, Alzheimer’s disease},
PAGES = {8949--8964},
URL = {https://iris.cnr.it/handle/20.500.14243/568861},
VOLUME = {62},
DOI = {10.1007/s12035-025-04767-y},
ISSN = {1559-1182},
JOURNAL = {MOLECULAR NEUROBIOLOGY},
}
@ARTICLE{LUZIETTI_2025_ARTICLE_LSGMCDCMQMD_550741,
AUTHOR = {Luzietti, R. B. and Spadi, A. and Giampietro, N. and Mancuso, G. and Caravale, A. and D'Eredità, A. and Caradonna, M. and Moscati, P. and Quochi, V. and Monachini, M. and Degl'Innocenti, E.},
TITLE = {Digital Humanities and Heritage Science: moving from landscaping to a dynamic research observatory in an {Open Science Cloud}},
YEAR = {2025},
ABSTRACT = {This contribution presents the work conducted within the second work package of the Humanities and Heritage Italian Science Cloud (H2IOSC) infrastructural project, dedicated to "Landscaping and Building Communities", with the aim of defining a methodology for mapping the current status and availability of resources and technologies and enhancing their utilization in the Humanities and Cultural Heritage sectors. The mapping activity involved a comprehensive investigation encompassing language technologies, digital humanities, and heritage science disciplines in Italy. The aim of the landscaping activity is to collect information on the latest and most prevalent resources, tools, communities, best practices, standards, and projects developed within the Heritage, Social Sciences, and Digital Humanities communities. In this project, the four partnering infrastructures-CLARIN, DARIAH, E-RIHS, and OPERAS-collaborate closely to develop the best strategies for engaging and meeting the needs of their target research communities as well as to identify the set of priority items (resources, tools, and services) to FAIRify and onboard them into the national MarketPlace},
KEYWORDS = {digital humanities, heritage science, infrastructural survey, infrastrutture di ricerca},
PAGES = {419--439},
URL = {https://iris.cnr.it/handle/20.500.14243/550741},
VOLUME = {2025},
NUMBER = {20},
DOI = {10.6092/issn.2532-8816/21226},
ISSN = {2532-8816},
JOURNAL = {UMANISTICA DIGITALE},
}
@ARTICLE{MARESCA_2025_ARTICLE_MLRASWRRCKRFTJCITE_562294,
AUTHOR = {Maresca, D. C. and La Civita, E. and Romano, B. and Ambrosio, M. R. and Somma, F. and Wyss, T. and Rocco, B. and Rubino, V. and Cari, L. and Krebs, P. and Rodriguez Calero, A. and Ferro, M. and Trabanelli, S. and Jandus, C. and Crocetto, F. and Ianaro, A. and Terracciano, D. and Ercolano, G.},
TITLE = {Circulating innate lymphoid cells are dysregulated in patients with prostate cancer},
YEAR = {2025},
ABSTRACT = {Background: Prostate cancer (PCa) is the second most common cancer affecting men globally, especially those aged 50 years and above. Despite substantial progress in terms of both prognosis and therapy, PCa remains a significant health concern, necessitating the identification of novel therapeutic targets. Innate lymphoid cells (ILCs) have emerged as critical modulators of tumor immunity, exhibiting both pro- and antitumoral effects. However, little is known yet about their contribution in PCa. This study investigated the phenotypic and functional profiles of ILC subsets in the peripheral blood mononuclear cells (PBMCs) of patients with PCa stratified by Gleason score. Methods: PBMCs were isolated by Lymphoprep. ILC frequency and activity were evaluated by flow cytometry. The levels of ILC-activating cytokines were analyzed by multiplex assay in the serum of healthy donors (HDs) and patients with PCa. To evaluate the crosstalk between ILC2s and cancer cells, PC3 and DU145 human PCa cell lines were used. Results: We found a stage-dependent increase in the protumoral ILC2 frequency and a concurrent decrease in antitumoral ILC1s in patients with PCa compared with healthy controls. Interestingly, the frequency of ILC2s was higher in patients with elevated prostate-specific antigen (PSA) values, suggesting their potential as molecular predictor for defining the risk category of patients with PCa at diagnosis. Importantly, patients with PCa exhibited hyperactivated ILC2s, characterized by elevated interleukin (IL)-13 and IL-5 production, while ILC1s displayed reduced tumor necrosis factor (TNF)-alpha and interferon (IFN)-gamma secretion. Furthermore, serum levels of ILC2-activating cytokines IL-33, IL-18, and prostaglandin D2 (PGD2) were elevated in patients with PCa. In vitro co-culture experiments demonstrated that PCa cell lines, capable of secreting these cytokines, could directly enhance ILC2 activity. Likewise, ILC2-derived IL-13 promoted PCa cell migration and invasion. Conclusions: Collectively, our findings highlight a dysregulated ILC profile in PCa, characterized by ILC2 dominance and heightened activity at the expense of ILC1s, suggesting both ILC1s and ILC2s as potential therapeutic targets for PCa treatment},
KEYWORDS = {IL-13, IL-18, IL-33, ILC1s, ILC2s, Innate lymphoid cells, Prostate cancer},
URL = {https://iris.cnr.it/handle/20.500.14243/562294},
VOLUME = {30},
NUMBER = {1},
DOI = {10.1186/s11658-025-00725-7},
ISSN = {1689-1392},
JOURNAL = {CELLULAR AND MOLECULAR BIOLOGY LETTERS},
}
@ARTICLE{MARZI_2025_ARTICLE_MNLSTPF_549321,
AUTHOR = {Marzi, C. and Nadalini, A. and Lento, A. and Srivastava, M. and Todesco, A. and Pirrelli, V. and Ferro, M.},
TITLE = {Oral text reading as a multi-sensory task},
YEAR = {2025},
ABSTRACT = {Reading aloud involves the complex interplay of visual, motor and lexical processes. While eye movements have been extensively investigated in the reading literature, less is known about the coordination of voice, eye and finger movements in oral and finger-point reading. Here we propose a multimodal perspective on these dynamics, emphasising the contribution of integrating eye-tracking, finger-tracking, and voice recording to a more comprehensive understanding of reading proficiency. Our results show that finger and eye movements are strongly coupled in early readers. Conversely, skilled readers show a more flexible coordination of sensorimotor signals and a more adaptive sensitivity to prosodic structures, with voice articulation slowing at key structural points, such as chunk heads and sentence-final boundaries. These findings provide novel insights into how multimodal coordination evolves with reading expertise, contributing to a more fine-grained understanding of reading fluency},
KEYWORDS = {reading development, multimodal integration, eye-voice span, finger-voice span, adaptive reading},
PAGES = {141--156},
URL = {https://www.rivisteweb.it/doi/10.1418/117447},
VOLUME = {24},
NUMBER = {1},
DOI = {10.1418/117447},
ISSN = {1720-9331},
JOURNAL = {LINGUE E LINGUAGGIO},
}
@ARTICLE{MERCATANTI_2025_ARTICLE_MDR_571241,
AUTHOR = {Mercatanti, E. and Del Grosso, A. M. and Riccucci, M.},
TITLE = {{Voci dall’Inferno}: {Dante} per esprimere l’indicibile},
YEAR = {2025},
ABSTRACT = {This paper presents the ongoing developments of the project Voci dall’Inferno, which is structured around two integrated objectives: (a) the digitization and encoding of the first digital corpus of non-literary testimonies by Lager survivors; (b) the identification, quantification, and analysis of Dante’s lexicon and imagery within those testimonies. On the one hand, the creation of the digital corpus aims to collect, preserve, and enhance of non-literary testimonies; on the other, the project documents the use of computational tools and methods for analyzing the digitized materials. Among the project’s most significant outcomes is the web application Voci dall’Inferno, designed to catalogue, browse, and analyze the archived testimonies, as well as to systematically detect and study the presence of Dante’s vocabulary in the corpus. The contribution is structured in three sections. The first investigates, from a historical-literary and humanistic perspective, the reasons why Dante became a privileged reference for many survivors to express the experience of the Lager. The second and third sections address the project’s technical components: the second focuses on the XML/TEI encoding of the testimonies, while the third outlines the current state of development of the Voci dall’Inferno web platform. The contribution also incorporates results from Elvira Mercatanti’s master’s thesis in Digital Humanities [13]},
KEYWORDS = {Dante’s allusions, Dante’s lexicon, Digital Archives, eXist-db, Holocaust Testimonies, Web Application, XML-TEI, XQuery},
PAGES = {527--562},
VOLUME = {2025},
NUMBER = {20},
DOI = {10.6092/issn},
ISSN = {2532-8816},
JOURNAL = {UMANISTICA DIGITALE},
}
@ARTICLE{MONTEMAGNI_2025_ARTICLE_M_571146,
AUTHOR = {Montemagni, S.},
TITLE = {Bridging Linguistics and Computational Linguistics: Insights into Synergies and Challenges from a Case Study},
YEAR = {2025},
ABSTRACT = {This paper outlines the evolving interplay between Linguistics and Computational Linguistics, aiming to map the current state of their interactions and to identify areas where deeper integration could drive significant advancements in both areas. Since the early days of Computational Linguistics as an autonomous discipline, the synergy has developed in parallel with progress in both computational methods and linguistic theory. Computational modeling of language offers a powerful framework to investigate core questions of linguistics, from how language works and is acquired, to how it changes across time, space, communicative situations, and domains. Despite this potential, the capabilities of state-of-the-art computational methods remain only partially exploited within linguistic research, leaving a gap between advances in Natural Language Processing and the needs of linguistics. This paper seeks to examine the current landscape of this synergy, its scientific and practical implications, and the challenges that must be addressed to fully harness its potential. A pilot study is presented to illustrate how linguistic resources and computational modeling can provide answers to long-standing research questions and, at the same time, open up new avenues for investigating open issues in language typology},
KEYWORDS = {Linguistics, computational linguistics, linguistic typology, computational modelling of language},
PAGES = {9--33},
URL = {https://www.aaccademia.it/customized/downloadfile.php?tipo=estratto&formato=pdf&id=3108},
VOLUME = {11},
NUMBER = {2},
DOI = {10.17454/IJCOL112},
JOURNAL = {IJCOL},
}
@ARTICLE{MOTGER_2025_ARTICLE_MMDFM_570522,
AUTHOR = {Motger, Q. and Miaschi, A. and Dell'Orletta, F. and Franch, X. and Marco, J.},
TITLE = {Leveraging encoder-only large language models for mobile app review feature extraction},
YEAR = {2025},
ABSTRACT = {Mobile app review analysis presents unique challenges due to the low quality, subjective bias, and noisy content of user-generated documents. Extracting features from these reviews is essential for tasks such as feature prioritization and sentiment analysis, but it remains a challenging task. Meanwhile, encoder-only models based on the Transformer architecture have shown promising results for classification and information extraction tasks for multiple software engineering processes. This study explores the hypothesis that encoder-only large language models can enhance feature extraction from mobile app reviews. By leveraging crowdsourced annotations from an industrial context, we redefine feature extraction as a supervised token classification task. Our approach includes extending the pre-training of these models with a large corpus of user reviews to improve contextual understanding and employing instance selection techniques to optimize model fine-tuning. Empirical evaluations demonstrate that these methods improve the precision and recall of extracted features and enhance performance efficiency. Key contributions include a novel approach to feature extraction, annotated datasets, extended pre-trained models, and an instance selection mechanism for cost-effective fine-tuning. This research provides practical methods and empirical evidence in applying large language models to natural language processing tasks within mobile app reviews, offering improved performance in feature extraction},
KEYWORDS = {Extended pre-training, Feature extraction, Instance selection, Large language models, Mobile app reviews, Named-entity recognition},
URL = {https://iris.cnr.it/handle/20.500.14243/570522},
VOLUME = {30},
NUMBER = {3},
DOI = {10.1007/s10664-025-10660-y},
ISSN = {1382-3256},
JOURNAL = {EMPIRICAL SOFTWARE ENGINEERING},
}
@ARTICLE{NADALINI_2025_ARTICLE_NMFCCC_548023,
AUTHOR = {Nadalini, A. and Marzi, C. and Ferro, M. and Cinini, A. and Cutugno, P. and Chiarella, D.},
TITLE = {Inferential Reading Skills in High School: A Study on Comprehension Profiles},
YEAR = {2025},
ABSTRACT = {Reading comprehension of connected texts is a key skill in high school education, yet students exhibit varying proficiency levels, particularly in inferential reasoning. This study investigates reading behavior by means of finger-tracking technique and question answering among Italian 10th, 11th, and 12th year high school students, analyzing their performance on different types of questions: synonymy and reference vs. inference-based questions. Despite similar reading times and lexical effects across grades, students’ accuracy in answering inferential questions reveals significant variability. Subsequently, we identify three comprehension profiles—poor, medium, and good comprehenders—with the first two groups showing markedly lower performance on inference-based questions. These findings suggest that schooling alone may not be sufficient for all students to develop strong inferential skills, and some may benefit from targeted instructional support},
KEYWORDS = {reading strategies, comprehension profiles, inferential processing, finger-tracking, cognitive reading processes},
URL = {https://www.mdpi.com/2227-7102/15/6/654},
VOLUME = {15},
NUMBER = {6},
DOI = {10.3390/educsci15060654},
ISSN = {2227-7102},
JOURNAL = {EDUCATION SCIENCES},
}
@ARTICLE{OKOYE_2025_ARTICLE_OCPFNCCCDFFGPRRSSZMBFNAAABBBBBBCCCCCCCCCCDDDDFGGGGILLLLLMMMMMMNOPPPPQRRSSSSSSTTTTVVZ_564586,
AUTHOR = {Okoye, C. and Cuffaro, L. and Pozzi, F. E. and Ferrara, M. C. and Noale, M. and Calciolari, S. and Chicco, D. and Cincotti, F. and Daini, R. and Finazzi, A. and Francioso, L. and Gasparini, F. and Pagan, E. and Ribino, P. and Romeo, Z. and Sala, G. and Solfrizzi, V. and Zambon, A. and Maggi, S. and Bellelli, G. and Ferrarese, C. and Airoldi, C. and Aloisi, A. and Appollonio, I. and Bazzini, C. and Bochicchio, M. A. and Bologna, M. and Brattico, E. and Bruno, G. and Bulgari, M. and Canevelli, M. and Capone, S. and Ceolin, C. and Chiaradonna, F. and Colamarino, E. and Conti, E. and Corsonello, A. and Cortelessa, G. and Crudele, L. and Custodero, C. and De Luca, A. and Delussi, M. and Di Napoli, C. and Dibello, V. and Franchi, M. and Ganora, D. and Gesualdo, L. and Goldin, E. and Grossi, A. and Isella, V. and Lenti, R. and Leone, A. and Locati, S. and Logrieco, A. and Logroscino, G. and Macchia, E. and Mantuano, P. and Massimi, A. and Matteini, P. and Messina, G. and Moretti, L. and Natalello, A. and Orlandi, I. and Paragliola, G. and Paparella, G. and Pegoraro, S. and Pirrelli, V. and Quaranta, N. A. A. and Riccardi, G. and Romano, D. and Saibene, A. and Sala, A. and Sciurti, E. and Serino, L. and Siciliano, P. and Silanos, F. and Tamburrano, A. and Tosi, G. and Tratsevich, A. and Tremolizzo, L. and Villari, P. and Vezzoso, A. and Zoia, C. P.},
TITLE = {Multicomponent interventions and technologies to reduce the burden of frailty, functional, and cognitive decline: insights from the {Age-It Research Program}},
YEAR = {2025},
ABSTRACT = {Objectives Preventing age-related complications is a critical priority for health systems. Within the Age-It program, Spoke 8 aims to evaluate scalable, multicomponent, technology-assisted interventions to prevent frailty and mitigate functional and cognitive decline in older adults across different care settings. Methods Spoke 8 includes three clinical studies conducted in community, hospital, and long-term care settings, supported by cross-cutting work packages on digital infrastructure, technology development, and economic evaluation. The intervention model integrates physical, cognitive, nutritional, and psychosocial components, supported by digital tools, biomarkers of aging, and a centralized data platform. Results The project is expected to generate evidence on the effectiveness, feasibility, and cost-effectiveness of multidomain interventions implemented across diverse real-world settings, including community, hospital, and long-term care. Technology-assisted strategies-such as wearable sensors and digital cognitive tools-may enhance adherence and enable remote monitoring, while also supporting more personalized care delivery. The integration of artificial intelligence will facilitate the interpretation of complex clinical and biological data, improving risk stratification and the early identification of individuals most likely to benefit from targeted interventions. Together, these approaches may help reduce hospitalizations, delay functional decline, and promote aging in place. Discussion This initiative supports the transition toward more integrated and equitable care models for older adults. Through the implementation of scalable, person-centered interventions within routine services, the project offers policy-relevant strategies to address frailty and functional decline-contributing to the redesign of aging care in Italy and providing insights applicable across diverse health systems facing the challenges of population aging countries},
KEYWORDS = {Dementia, Frailty, Multidomain intervention, Prevention, Technology},
URL = {https://iris.cnr.it/handle/20.500.14243/564586},
VOLUME = {80},
NUMBER = {Supplement 2},
DOI = {10.1093/geronb/gbaf186},
ISSN = {1079-5014},
JOURNAL = {JOURNALS OF GERONTOLOGY SERIES B-PSYCHOLOGICAL SCIENCES AND SOCIAL SCIENCES},
}
@ARTICLE{PAPINI_2025_ARTICLE_PG_557903,
AUTHOR = {Papini, M. and Giovannetti, E.},
TITLE = {The Challenge of the {Talmud} in {Italian}: Tools and Computational Linguistics in the Service of Translation},
YEAR = {2025},
ABSTRACT = {The translation of the Babylonian Talmud into Italian constitutes a true challenge. To address the numerous issues posed by translating such a vast and complex text, the Traduco system was developed to support translators through collaborative features, a translation memory, distributional semantics, glossary management, and annotation tools. Additionally, recent experiments have explored the integration of large language models to assist in the translation and the construction of a Talmud Knowledge Base designed to provide a formal representation of the terminological and conceptual data identified in the Talmud},
KEYWORDS = {Computer-Assisted Translation, Translation Memory, Babylonian Talmud, Traduco, Large Language Models},
PAGES = {135--154},
URL = {http://doi.org/10.30687/TranScript/5876-7987},
VOLUME = {4},
DOI = {10.30687/TranScript},
ISSN = {2785-5708},
JOURNAL = {TRANSCRIPT},
}
@ARTICLE{PEDONESE_2025_ARTICLE_PFOBSFSRCSB_552963,
AUTHOR = {Pedonese, G. and Frontini, F. and Ottaviani, R. and Boschetti, F. and Spadi, A. and Francalanci, L. and Scognamiglio, A. and Restaneo, P. and Chaban, A. and Striova, J. and Benassi, L.},
TITLE = {Materiali didattici come oggetti digitali {FAIR}: una metodologia condivisa per la formazione in {H2IOSC}},
YEAR = {2025},
ABSTRACT = {Il presente lavoro dettaglia la strategia per lo sviluppo di iniziative di formazione nell’ambito del progetto PNRR sviluppato dal CNR Humanities and cultural Heritage Italian Open Science Cloud (H2IOSC) e mira ad aprire alla comunità italiana di riferimento il processo di applicazione delle linee guida di design e di fruizione di moduli didattici che integrino l’uso delle Infrastrutture di Ricerca. In particolare, il contributo si sofferma sugli standard condivisi per la descrizione dei materiali didattici come oggetti digitali FAIR al fine di massimizzarne il riutilizzo in un’ottica train the trainers e sulla descrizione dei requisiti per l’implementazione dell’infrastruttura di training. Dopo aver descritto la strategia didattica (Sezione 2) e l’applicazione della metodologia FAIR-by-Design di Skills4EOSC ai materiali didattici preesistenti (Sezione 3), il lavoro descrive il processo di ideazione di due piattaforme con funzionalità coerenti ai requisiti degli oggetti didattici prendendo ad esempio il corso CLARIN Introduction to Language Data: Standards and Repositories tradotto e adattato in H2IOSC (Sezione 4)},
KEYWORDS = {formazione, gestione dei dati, infrastrutture di ricerca, H2IOSC, principi FAIR},
PAGES = {361--380},
URL = {https://iris.cnr.it/handle/20.500.14243/552963},
VOLUME = {2025},
NUMBER = {20},
DOI = {10.6092/issn.2532-8816/21190},
ISSN = {2532-8816},
JOURNAL = {UMANISTICA DIGITALE},
}
@article{PIPERNO_2025_ARTICLE_PBDMP_570481,
  author   = {Piperno, R. and Bacco, L. and Dell'Orletta, F. and Merone, M. and Pecchia, L.},
  title    = {Cross-lingual distillation for domain knowledge transfer with sentence transformers},
  journal  = {KNOWLEDGE-BASED SYSTEMS},
  year     = {2025},
  volume   = {311},
  doi      = {10.1016/j.knosys.2025.113079},
  issn     = {0950-7051},
  url      = {https://iris.cnr.it/handle/20.500.14243/570481},
  keywords = {Biomedical domain, Cross-lingual learning, Domain adaptation, Knowledge distillation, Sentence transformers},
  abstract = {Recent advancements in Natural Language Processing (NLP) have substantially enhanced language understanding. However, non-English languages, especially in specialized and low-resource domains like biomedicine, remain largely underrepresented. Bridging this gap is essential for promoting inclusivity and expanding the global applicability of NLP technologies. This study presents a cross-lingual knowledge distillation framework that utilizes sentence transformers to improve domain-specific NLP capabilities in non-English languages. Specifically, the framework focuses on biomedical text classification tasks. By aligning sentence embeddings between a teacher model trained on English biomedical corpora and a multilingual student model, the proposed method effectively transfers both domain-specific and task-specific knowledge. This alignment allows the student model to efficiently process and adapt to biomedical texts in Spanish, French, and German, particularly in low-resource settings with limited tuning data. Extensive experiments with domain-adapted models like BioBERT and multilingual BERT with machine-translated text pairs demonstrate substantial performance improvements in downstream biomedical NLP tasks. The proposed framework proves highly effective in scenarios characterized by limited training data availability. The results highlight the scalability and effectiveness of this approach, facilitating the development of robust multilingual models tailored to the biomedical domain, thus advancing global accessibility and impact in biomedical NLP applications},
}
@ARTICLE{PROIETTI_2025_ARTICLE_PCDLLY_582203,
AUTHOR = {Proietti, C. and Chesñevar, C. I. and Dix, J. and Liao, B. and Luo, J. and Yuste Ginel, A.},
TITLE = {Formal Argumentation and Modal Logic},
YEAR = {2025},
ABSTRACT = {The interrelationship between defeasible argumentation and modal logic is rooted in their shared goal of capturing and modelling reasoning under uncertainty and changing conditions. In the last years, researchers have explored different ways to combine these two formalizations to create more robust systems for handling complex reasoning tasks, in which modal operators can be incorporated into argumentation systems. In this article we analyse three different lines of work to combine modal logic and argumentation: a) a logic-based framework that combines dynamic logic and argumentation for value-based planning; b) alternating-time temporal logic extended with coalitional argumentation; c) different combined approaches for integrating epistemic logics and argumentation. These three alternatives will help the reader to understand different interplays that can take place when combining argumentation and modal logic. On the one hand, we show that argumentation systems can be combined with very different readings of modal operators (i. e., dynamic, temporal and epistemic). On the other hand, modal logic and argumentation can be used in different relative positions. When representing and reasoning about plans, modal logic is applied for the reasoning on the object level and a structured argumentation framework is built on the meta-level over modal logic. When epistemically reasoning about opponents’ argumentative information, modal logic can be built over argumentation. For checking the strategic properties of coalitions of agents, argumentation is put inside modal logic so that the coalition can enlarge according to the theory of coalitional argumentation},
KEYWORDS = {Formal Argumentation, Modal Logic, Abstract Argumentation},
PAGES = {825--892},
VOLUME = {12},
NUMBER = {3},
JOURNAL = {JOURNAL OF APPLIED LOGICS},
}
@ARTICLE{ROMANO_2025_ARTICLE_RV_560370,
AUTHOR = {Romano, F. and Venturi, G.},
TITLE = {Metodi e strumenti per la modernizzazione della lingua delle istituzioni},
YEAR = {2025},
ABSTRACT = {The paper provides a methodology for the guided drafting of administrative documents that meet criteria of clarity and simplicity in both content and language},
KEYWORDS = {plain language, legal design, natural language processing, inclusione sociale, linguaggio giuridico, semplificazione linguaggio giuridico},
PAGES = {105--121},
URL = {https://calumet-review.com/index.php/it/category/numeri/22-s-sem-2025-it/},
NUMBER = {22},
ISSUETITLE = {Migranti leggi contratti verso la chiarezza},
EDITOR = {Miglietta, Annarita},
ISSN = {2465-0145},
JOURNAL = {CALUMET},
}
@ARTICLE{SOLASALES_2025_ARTICLE_SAMD_570482,
AUTHOR = {Sola Sales, S. and Alzetta, C. and Moret Tatay, C. and Dell'Orletta, F.},
TITLE = {When Time Matters: Exploring the Impact of Recall Techniques and Educational Levels on Witness Testimony Quality},
YEAR = {2025},
ABSTRACT = {Mental reconstruction (MRC) and Free Recall (FR) have been recognized for enhancing the quality of witness statements. However, the mechanisms underlying this association remain insufficiently understood. This study explores how the time allocated to MRC and FR and variations in educational level influence the quality of eyewitness testimonies. Testimony quality is evaluated based on manually annotated content information provided by experts in testimony assessment, which measures adherence to the events. This is further complemented by fine-grained linguistic features, automatically extracted using linguistic analysis tools, to capture stylistic aspects. As a proof of concept, the analysis is performed on a corpus of 96 testimonies in Spanish describing two robbery cases. The results suggest that both mental reconstruction and narration times positively impact the accuracy of testimonies, as inaccuracies predominantly involve peripheral details. Furthermore, while the study confirms that educational level affects testimony quality, no significant differences were observed in the frequency of erroneous reports. This study contributes to the understanding of the relationship between cognitive strategies and the accuracy of witness statements, proposing an analysis approach applicable to forensic psychology for witness assessment},
KEYWORDS = {automatic linguistic analysis, content analysis, eyewitness testimonies, free recall, mental reinstatement of context},
URL = {https://iris.cnr.it/handle/20.500.14243/570482},
VOLUME = {16},
NUMBER = {2},
DOI = {10.3390/info16020122},
ISSN = {2078-2489},
JOURNAL = {INFORMATION},
}
% NOTE(review): the DOI below has no article-level suffix and may be truncated -- confirm against the publisher record.
@ARTICLE{SORIA_2025_ARTICLE_SNC_571034,
AUTHOR = {Soria, C. and Nodari, R. and Calamai, S.},
TITLE = {Assessing Smartphone Speech Recognition Across Diverse {English} Accents: A Preliminary Study},
YEAR = {2025},
ABSTRACT = {This study examines the performance of a smartphone-based automatic speech recognition (ASR) system when processing diverse English accents. With the increasing reliance on voice-activated artificial intelligence in daily tasks, ensuring equitable ASR performance across linguistic varieties is critical. Using audio data from the CIRCE project corpus, we assess recognition accuracy for eleven English accents selected according to Kachru’s three-circle model (Inner, Outer, and Expanding Circle varieties). Findings highlight disparities in recognition performance and suggest that ASR models exhibit a bias favoring American English (AmE). The study underscores the need for enhanced ASR inclusivity and diversification of training data},
KEYWORDS = {Automatic Speech Recognition, Smartphone, English Accents, Sociophonetics},
VOLUME = {33},
NUMBER = {3},
DOI = {10.69117/ALL},
JOURNAL = {L'ANALISI LINGUISTICA E LETTERARIA},
}
% NOTE(review): the exported DOI was the unresolvable fragment 10.1016/j and has been dropped;
% restore the full DOI from the publisher page referenced in URL.
@ARTICLE{VINCI_2025_ARTICLE_VPVV_570782,
AUTHOR = {Vinci, A. and Pirrotta, L. and Venturi, G. and Vainieri, M.},
TITLE = {From clicks to care: Exploring the digital strategies of {Italian} health authorities in communicating ‘{General Practitioner Selection}’ service},
YEAR = {2025},
ABSTRACT = {The prioritization of digitalization is crucial to the agendas of nations worldwide. While substantial funds have been allocated to foster it, there remains a scarcity of tools dedicated to systematically monitoring the performance of the digital transformation. This work describes the level of digitalization and information of a fundamental primary care service: the “General Practitioner (GP) selection”. The analysis was conducted by consulting websites of Italian Local Health Authorities (LHAs). First, we explored the digitalization levels of 105 websites through the Primary Care Digital Information (PCDI) composite index. It comprises four dimensions: informativeness, accessibility, inclusiveness, and adaptability, scoring on a five-point scale (low-high digitalization). Second, we conducted a readability analysis, employing three validated measures. We found an average level of digitalization and information, although dimensions perform differently. The best-performing dimension was adaptability, while the worst was inclusiveness. Half of the LHAs provided several digital alternatives to GP selection, while the remaining provided limited or no options. Regarding readability, just 29% of the LHA's websites were found easy to read. Overall, our findings depict that Italian LHAs have different approaches. This study highlights that, despite best practices, several areas require monitoring and intervention. Moreover, some barriers characterize Italian health communication strategies, notably the variability of information across and within regions and on average low website readability},
KEYWORDS = {Online information, Readability, Evaluation, Digital transformation, Public services},
PAGES = {9},
URL = {https://www.sciencedirect.com/science/article/pii/S0168851025001034},
VOLUME = {157},
JOURNAL = {HEALTH POLICY},
}
@ARTICLE{ZENZARO_2025_ARTICLE_ZDBR_548541,
AUTHOR = {Zenzaro, S. and Del Grosso, A. M. and Boschetti, F. and Ranocchia, G.},
TITLE = {{CoPhiEditor}: The {DSL}-Based {DSE} Methodology within the {ERC} Advanced Grant 885222-{GreekSchools}},
YEAR = {2025},
ABSTRACT = {This paper explores the integration of traditional philological methods with computational approaches, aiming to establish a more effective and rigorous framework for textual studies. To this end, we propose a preliminary set of evaluation criteria—familiarity, transparency, completeness, compactness, consistency, and actionability—for analyzing text editing tools. Using this framework, we suggest the use of Domain-Specific Languages (DSLs) for the digital papyrological editions of the ERC-885222 GreekSchools project that is our case study. We introduce CoPhiEditor, a software platform designed to support the creation of Digital Scholarly Editions through the use of DSLs. This approach enables scholars to retain familiar workflows while benefiting from machine-actionable data representations and computational functionalities. Key features of CoPhiEditor include its recursive data model, automatic error-checking and suggestions, automatic TEI-conformant serialization, and advanced collaboration capabilities that streamline teamwork on shared projects. Furthermore, its extensible and domain-agnostic architecture broadens its applicability across various scholarly editing contexts. The aim of CoPhiEditor allows philologists to incorporate digital tools without sacrificing their established editorial practices},
KEYWORDS = {Domain-Specific Languages, Computational Philology, Digital Philology, DSE tools, AIUCD2023, AIUCD2024},
PAGES = {31--56},
URL = {https://umanisticadigitale.unibo.it/article/view/21231},
VOLUME = {20},
DOI = {10.6092/issn.2532-8816/21231},
ISSN = {2532-8816},
JOURNAL = {UMANISTICA DIGITALE},
}
@BOOK{FERRETTI_2025_BOOK_FLPTL_563268,
AUTHOR = {Ferretti, R. and Licciulli, F. and Provost, L. and Tarallo, A. and Lazzeri, E.},
TITLE = {Documento di visione dei {Data Steward} del {CNR}},
YEAR = {2025},
ABSTRACT = {Documento di visione dei Data Steward del CNR: Verso una rete strutturata per la gestione dei dati e dei risultati della ricerca},
KEYWORDS = {Data Steward, gestione dati e prodotti},
PAGES = {5},
URL = {http://eprints.bice.rm.cnr.it/id/eprint/23964},
DOI = {10.57665/BICE_Data2025},
PUBLISHER = {CNR},
}
@INCOLLECTION{BOSCHETTI_2025_INCOLLECTION_B_547481,
AUTHOR = {Boschetti, F.},
TITLE = {Forme e sostanze dell’ipallage},
YEAR = {2025},
ABSTRACT = {L’articolo discute la struttura dell’ipallage, la storia del termine, le realizzazioni letterarie e non letterarie},
KEYWORDS = {figure retoriche, cinque sensi, strutture sintattiche},
PAGES = {809--828},
URL = {https://www.ledizioni.it/download/77360/},
PUBLISHER = {Ledizioni (Milano, ITA)},
ISBN = {9791256004300},
CONFERENCE_PLACE = {Milano},
BOOKTITLE = {Figure retoriche: Tradizioni, discipline, contesti},
}
% The exported VOLUME field only repeated BOOKTITLE in capitals (not a volume number), so it is omitted.
@INCOLLECTION{BURGASSI_2025_INCOLLECTION_B_572706,
AUTHOR = {Burgassi, C.},
TITLE = {Da {Bezzecca} a {Bianciardi}: le memorie garibaldine di {Eugenio Checchi}},
YEAR = {2025},
ABSTRACT = {Il contributo è dedicato alle Memorie di un garibaldino di Eugenio Checchi (I ed. 1866). Si tratteggia il profilo dell'autore, si ricostruisce il contesto storico-culturale e politico entro cui il libro è nato, se ne legge il contenuto alla luce in particolare del riuso fattone da Luciano Bianciardi},
KEYWORDS = {Memorialistica garibaldina, Eugenio Checchi, Luciano Bianciardi},
PAGES = {41--56},
PUBLISHER = {Ronzani (Dueville (VI), ITA)},
ISBN = {9791259971548},
CONFERENCE_PLACE = {Dueville (VI)},
BOOKTITLE = {«Qui si conviene usare un poco d’arte». Studi e testimonianze degli amici per Domenico De Martino},
}
% The exported VOLUME field only repeated the chapter title in capitals (not a volume number), so it is omitted.
@INCOLLECTION{BURGASSI_2025_INCOLLECTION_BG_559670,
AUTHOR = {Burgassi, C. and Guadagnini, E.},
TITLE = {Il vocabolario del "{Decameron}": le componenti principali},
YEAR = {2025},
ABSTRACT = {Il contributo analizza alcune tipologie di parole, ritenute rilevanti per la caratterizzazione lessicale del "Decameron": latinismi, dantismi, regionalismi, forestierismi},
KEYWORDS = {Lessicologia storica, Boccaccio},
PAGES = {45--65},
URL = {https://iris.cnr.it/handle/20.500.14243/559670},
PUBLISHER = {Carocci (Roma, ITA)},
ISBN = {9788829033225},
CONFERENCE_PLACE = {Roma},
BOOKTITLE = {Il lessico del Decameron. Un universo di parole},
}
% The exported VOLUME field only repeated the chapter title in capitals (not a volume number), so it is omitted.
@INCOLLECTION{BURGASSI_2025_INCOLLECTION_BG_559669,
AUTHOR = {Burgassi, C. and Guadagnini, E.},
TITLE = {Il vocabolario del "{Decameron}": uno sguardo d’insieme},
YEAR = {2025},
ABSTRACT = {Il contributo propone una valutazione complessiva del lessico del "Decameron", analizzato contrastivamente rispetto al vocabolario italiano antico},
KEYWORDS = {Lessicologia storica, Boccaccio},
PAGES = {21--44},
URL = {https://iris.cnr.it/handle/20.500.14243/559669},
PUBLISHER = {Carocci (Roma, ITA)},
ISBN = {9788829033225},
CONFERENCE_PLACE = {Roma},
BOOKTITLE = {Il lessico del Decameron. Un universo di parole},
}
% The exported VOLUME field only repeated BOOKTITLE in capitals (not a volume number), so it is omitted.
% NOTE(review): the exported ISBN was truncated to the bare prefix 978 and has been dropped -- restore the full ISBN from the publisher record.
@INCOLLECTION{BURGASSI_2025_INCOLLECTION_BR_572711,
AUTHOR = {Burgassi, C. and Ricotta, V.},
TITLE = {Un nuovo progetto per il lessico di {Boccaccio}: il {VocaBO} – {Vocabolario di Boccaccio Online}. Primi appunti},
YEAR = {2025},
ABSTRACT = {«Una descrizione realistica della rete che è il lessico dovrebb’essere a sua volta anzitutto reticolare. Un dizionario reticolare permette una navigazione in tutte le direzioni. Insomma, una volta sistemata la questione dei formati (tanto quelli delle entrate quanto quelli semantici), il dizionario del futuro – quale lo permette sin d’ora l’informatica – fonde le tre anime che ho illustrato all’inizio: quella del “vocabolario”, quella del dizionario dei sinonimi, quella dell’analogico, e li unisce in una rete di reti. Ci sarà qualcuno, ricercatore o editore, che avrà il coraggio di mettersi in un’impresa di questo genere?». Così Raffaele Simone (2016: 31-32) chiude il suo saggio di interesse lessicografico dal titolo quanto mai significativo, Il dizionario del futuro. Ci pare che il tema posto da questa citazione, e l’auspicio interrogativo che la conclude, possano ben introdurre l’impianto e i contenuti del nuovo progetto di lessicografia digitale in corso di svolgimento che riguarda il vocabolario delle opere di Giovanni Boccaccio (PANI 2023). Si tratta del VocaBO – Vocabolario di Boccaccio online, diretto da Giovanna Frosini, promosso dall’Università per Stranieri di Siena e dall’Ente Nazionale Giovanni Boccaccio, con la collaborazione del Cnr-Istituto di Linguistica Computazionale “Antonio Zampolli” di Pisa (CNR-ILC) e dall’Accademia della Crusca. Il progetto VocaBO intende descrivere il lessico delle opere di Boccaccio a partire dal Decameron: esso mira, quindi, a mettere in piena luce il sistema delle parole – delle unità monoparola o monorematiche e delle unità multiparola o polirematiche – impiegate dal padre della prosa italiana.
A questo scopo è stato criticamente pensato e predisposto un modello di voce lessicografica che raccoglie informazioni lessicali su più piani: relativamente agli scritti di Boccaccio: le forme attestate di un lemma (ossia, in genere, dell’entrata), le sue occorrenze nel Decameron e nelle altre opere volgari, la struttura sintagmatica nel caso delle polirematiche e le eventuali relazioni sintagmatiche (collocazioni), la strutturazione gerarchica del significato in accezioni (ed eventuali sottoaccezioni); relativamente alla storia linguistica e agli strumenti a disposizione per studiarla: l’etimo del lemma, la sua prima attestazione in Boccaccio confrontata con la prima attestazione conosciuta, la “fortuna” della parola nella tradizione letteraria (indagata principalmente attraverso il Vocabolario degli Accademici della Crusca nelle varie impressioni). Alle esigenze specifiche del VocaBO, per inquadrare e supportare la ricerca linguistico-lessicale di questo tipo, è appositamente adattato lo strumento informatico sviluppato dall’ILC-CNR nel campo della lessicografia digitale (per una sua presentazione e una rassegna dei progetti lessicografici che lo adottano, cfr. BELLANDI 2022). Si tratta di uno strumento Web collaborativo che opera in pieno accordo con le tecnologie del Web Semantico, col paradigma dei Linked Data e con i principi FAIR (Findable, Accessible, Interoperable, Reusable) della “Scienza Aperta”. Tale strumento permette di costruire una «rete di reti» per lo studio del lessico (come quella invocata da Raffaele Simone), in quanto rende possibile l’interconnessione tra i diversi livelli dell’analisi (del corpus, delle voci, dell’ontologia), ciascuno dei quali è raggiungibile a partire dagli altri.
Il livello delle voci del vocabolario è infatti integrato con quello del corpus testuale annotato ed è congiunto tanto con il piano delle relazioni di significato (reti onomasiologiche) quanto con il piano dei campi concettuali extralinguistici denotati (ontologia). La strutturazione dei tre livelli interrelati ha notevoli ricadute sulla modalità di accesso ai dati: si possono – per esempio – effettuare ricerche a partire dal livello ontologico che reperiscono i dati associati agli altri due livelli (cercando “arti e mestieri” nell’ontologia, si reperiranno, così, tutte le voci relative sul piano del vocabolario e tutte le attestazioni corrispondenti sul piano del corpus testuale)},
KEYWORDS = {Lessicografia digitale, Giovanni Boccaccio, Decameron},
PAGES = {265--293},
PUBLISHER = {Olschki (Firenze)},
CONFERENCE_PLACE = {Firenze},
BOOKTITLE = {La tradizione delle opere di Boccaccio. Cantieri aperti e prospettive di ricerca},
}
@INCOLLECTION{BUSCEMI_2025_INCOLLECTION_BF_549328,
AUTHOR = {Buscemi, F. and Frontini, F.},
TITLE = {Scienza aperta, dati e infrastrutture},
YEAR = {2025},
ABSTRACT = {Scienza Aperta, Dati e Infrastrutture. Impatto, impegno e prospettive degli Istituti del DSU rispetto a questi grandi temi, nel contesto nazionale ed europeo},
KEYWORDS = {Scienza aperta, infrastrutture di ricerca, open publishing},
PAGES = {34--44},
URL = {https://iris.cnr.it/handle/20.500.14243/549328},
PUBLISHER = {CNR Edizioni (Roma, ITA)},
ISBN = {9788880807322},
CONFERENCE_PLACE = {Roma},
BOOKTITLE = {Le scienze umane e sociali nel XXI secolo: comprendere e trasformare la società},
EDITOR = {Filippetti, A. and Sfameni, C. and Antonini, G.},
}
@INCOLLECTION{DELGROSSO_2025_INCOLLECTION_DZBR_523028,
AUTHOR = {Del Grosso, A. M. and Zenzaro, S. and Boschetti, F. and Ranocchia, G.},
TITLE = {Bridging Traditional and Digital Papyrology with Domain-Specific Languages},
YEAR = {2025},
ABSTRACT = {In this chapter, we propose a method to bridge the divide between traditional and digital papyrology by harnessing the capabilities of Domain Specific Languages (DSLs). Our approach, namely DSL-based Digital Scholarly Editing (DSL-based DSE), seeks to pave the way for harmonious integration. We believe that it is possible to bridge the gap between traditional and digital papyrology leveraging Domain Specific Languages by following the DSL-based DSE methodology. Throughout this chapter, we describe the GreekSchools project that is our testing ground for our methodology. Additionally, we offer a succinct theoretical foundation for our novel approach, elucidating the underlying principles guiding its design. Then we define DSL-based DSE and illustrate its practical implications through concrete examples, showcasing the dynamic interplay between our methodology and EpiDoc. Finally, we introduce CoPhi Editor, a collaborative and cooperative Web-based platform that implements the DSL-based DSE methodology for the GreekSchools project, but it aims to position itself among the useful tools for collaborative editing of digital scholarly editions, like SoSOL, Perseids, TextualCommunities, and others},
KEYWORDS = {Digital Papyrology, Digital Humanities, Digital Scholarly Editing, TEI/EpiDoc, Computational Philology},
PAGES = {125--152},
URL = {https://www.degruyter.com/document/doi/10.1515/9783111070162/html},
VOLUME = {3},
DOI = {10.1515/9783111070162-009},
PUBLISHER = {De Gruyter (Berlin/Boston, DEU)},
ISBN = {9783111070162},
CONFERENCE_PLACE = {Berlin/Boston},
BOOKTITLE = {Digital Papyrology},
EDITOR = {Reggiani, N.},
}
% DOI is the chapter-level identifier carried by the URL field (suffix _1); the export had only the book-level DOI.
@INCOLLECTION{DIDONATO_2025_INCOLLECTION_D_560015,
AUTHOR = {Di Donato, F.},
TITLE = {Open Science and the Role of Social Sciences Research Infrastructures and Data},
YEAR = {2025},
ABSTRACT = {The first chapter delves into Open Science, exploring the origins of foundational approaches, concepts, and principles that advocate for inclusion, quality, transparency and collaboration in research. The chapter emphasises key principles such as collaboration and sharing, which are crucial for advancing Open Science. In the OS landscape, Research Infrastructures are a crucial axis. The role of research infrastructures is here highlighted, considering their enabling and facilitating function for the adoption of Open Science practices. RIs are fundamental for defining the European Open Science Cloud, the large overarching framework within which the European Commission has been building the European Research Area for the past 10 years. In particular, Social Sciences data and open panel data can play a crucial role in conducting the multidisciplinary, multilingual and inclusive research needed to respond to today’s challenges},
KEYWORDS = {open science, research infrastructures, SSH},
PAGES = {3--17},
URL = {https://link.springer.com/chapter/10.1007/978-3-032-07005-0_1},
DOI = {10.1007/978-3-032-07005-0_1},
PUBLISHER = {Springer},
ISBN = {978-3-032-07004-3},
BOOKTITLE = {Longitudinal Data Infrastructures in Europe. Tools for Open Science in Social Science Research},
}
@INCOLLECTION{GUADAGNINI_2025_INCOLLECTION_GM_543921,
AUTHOR = {Guadagnini, E. and Mabboux, C.},
TITLE = {Una nuova edizione della "{Rettorica}" di {Brunetto Latini}},
YEAR = {2025},
ABSTRACT = {Presentazione della nuova edizione critica della "Rettorica" di Brunetto Latini},
KEYWORDS = {Brunetto Latini, retorica},
PAGES = {51--67},
URL = {https://www.isime.it/product/brunetto-latini-intellettuale-medievale/},
PUBLISHER = {Istituto Storico Italiano per il Medioevo (Roma, ITA)},
ISBN = {9788831445443},
CONFERENCE_PLACE = {Roma},
BOOKTITLE = {Brunetto Latini. Intellettuale medievale},
}
@INCOLLECTION{ZENZARO_2025_INCOLLECTION_ZBD_543101,
AUTHOR = {Zenzaro, S. and Boschetti, F. and Del Grosso, A. M.},
TITLE = {Making digital scholarly editions based on Domain Specific Languages},
YEAR = {2025},
ABSTRACT = {Define a methodology for using domain-specific languages to create digital scholarly editions},
KEYWORDS = {Digital Scholarly Editions, Domain Specific Languages},
PAGES = {141--164},
URL = {https://books.sup.ac.uk/sup/catalog/book/4},
DOI = {10.62637/sup.GHST9020},
PUBLISHER = {Scottish University Press (Edinburgh, GBR)},
ISBN = {9781917341073},
CONFERENCE_PLACE = {Edinburgh},
BOOKTITLE = {Digital editing and publishing in the twenty-first century},
EDITOR = {O'Sullivan, J. and Pidd, M. and Wessels, B. and Murphy, O. and Kurzmeier, M. and Whittle, S.},
}
% NOTE(review): the title's suspended hyphen (Low- vs High-level) was restored from the collapsed export form "Low-vs" -- confirm against the proceedings.
@INPROCEEDINGS{ALZETTA_2025_INPROCEEDINGS_AM_571223,
AUTHOR = {Alzetta, C. and Montemagni, S.},
TITLE = {Low- vs High-level Lemmatization for Historical Languages. A Case study on {Italian}},
YEAR = {2025},
ABSTRACT = {Lemmatization remains a foundational yet challenging task in the processing of historical Italian texts, due to the complex interplay of orthographic, morphological, and diatopic variation. A crucial, yet often overlooked, aspect is the degree of normalization applied during lemmatization. A conservative approach preserves attested historical forms, ensuring greater linguistic fidelity but increasing data sparsity. Conversely, an abstract normalization strategy aligns historical variants with standardized contemporary lemmas, improving generalization but potentially introducing inaccurate mappings. In this paper, we present a comparative evaluation of conservative and normalized lemmatization strategies for historical Italian. To our knowledge, this is the first study to explicitly assess the impact of lemmatization strategies in the context of historical languages, particularly those that are morphologically rich. Our results indicate that high-level normalization offers a promising trade-off between precision and generalization},
KEYWORDS = {Data-driven Lemmatization, Historical Italian, Universal Dependencies, Normalization},
PAGES = {10},
URL = {https://aclanthology.org/2025.clicit-1.4.pdf},
PUBLISHER = {CEUR Workshop Proceedings},
ISBN = {979-12-243-0587-3},
CONFERENCE_NAME = {Eleventh Italian Conference on Computational Linguistics (CLiC-it 2025)},
BOOKTITLE = {Proceedings of the Eleventh Italian Conference on Computational Linguistics (CLiC-it 2025)},
}
@INPROCEEDINGS{BARDI_2025_INPROCEEDINGS_BBDDDFGMRRT_557642,
AUTHOR = {Bardi, A. and Buzzoni, M. and Daquino, M. and Del Gratta, R. and Del Grosso, A. M. and Fischer, F. and Giacomini, S. and Martignano, C. and Rosselli Del Turco, R. and Rubin, G. and Tomasi, F.},
TITLE = {{FAIR} {Digital Humanities} scholarly metadata. The {ATLAS} project},
YEAR = {2025},
ABSTRACT = {This paper was presented at the Workshop on Open Citations and Open Scholarly Metadata (WOOC 2025), held in Bologna on 28–29 May 2025. It is included in the official workshop proceedings and contributes to ongoing discussions around open infrastructures, citation data, and scholarly metadata interoperability},
KEYWORDS = {Digital Humanities, FAIR principles},
PAGES = {4},
URL = {https://zenodo.org/records/16366693},
DOI = {10.5281/zenodo.16366692},
PUBLISHER = {Zenodo},
CONFERENCE_NAME = {WOOC 2025 - Workshop on Open Citations and Open Scholarly Metadata},
BOOKTITLE = {WOOC 2025 proceedings},
}
% BOOKTITLE uses \textsuperscript because a bare ^ is an error in LaTeX text mode.
% NOTE(review): the dash before "Project Report" in TITLE was restored from the collapsed export form -- confirm against the proceedings.
@INPROCEEDINGS{BARONI_2025_INPROCEEDINGS_BBFFFFGPPRSTV_582243,
AUTHOR = {Baroni, P. and Bistarelli, S. and Fazzinga, B. and Fellin, G. and Flesca, S. and Furfaro, F. and Giacomin, M. and Parisi, F. and Proietti, C. and Russo, I. and Santini, F. and Taticchi, C. and Vernillo, P.},
TITLE = {Empowering Public Interest Communication with Argumentation – Project Report},
YEAR = {2025},
ABSTRACT = {The EPICA (Empowering Public Interest Communication with Argumentation) project aims to improve Public Interest Communication (PIC) through the use of advanced Computational Argumentation (CA) techniques. This paper provides a summary of the technical results of the project and discusses future research direction},
KEYWORDS = {Automated Reasoning, Computational Argumentation, Public Interest Communication},
PAGES = {37--42},
URL = {https://iris.cnr.it/handle/20.500.14243/582243},
VOLUME = {4025},
PUBLISHER = {CEUR WS},
CONFERENCE_NAME = {9th Workshop on Advances in Argumentation in Artificial Intelligence, AI^3 2025},
BOOKTITLE = {AI\textsuperscript{3} 2025, Advances in Argumentation in Artificial Intelligence},
}
% BOOKTITLE uses \textsuperscript because a bare ^ is an error in LaTeX text mode.
@INPROCEEDINGS{BARONI_2025_INPROCEEDINGS_BFGP_582225,
AUTHOR = {Baroni, P. and Fellin, G. and Giacomin, M. and Proietti, C.},
TITLE = {A {NetLogo} Tool for Exploring Value-Based Argumentation in Public Interest Communication},
YEAR = {2025},
ABSTRACT = {We present a NetLogo-based tool for simulating how public interest arguments influence diverse audiences over time. Extending a previous theoretical model, agents are assigned profiles represented by value vectors that evolve through interaction with neighbours, capturing social influence dynamics. The tool computes the variation over time of the persuasive impact of arguments on the population on the basis of these evolving profiles. While the model simplifies argument exposure as continuous and uniform, it offers a foundation for more realistic simulations incorporating multiple arguments and competing campaigns in future work},
KEYWORDS = {Computational Argumentation, NetLogo, Public Interest Communication, Value-Based Argumentation, Vector-Based Model, Voting Models},
PAGES = {84--89},
VOLUME = {4025},
PUBLISHER = {CEUR WS},
CONFERENCE_NAME = {9th Workshop on Advances in Argumentation in Artificial Intelligence, AI^3 2025},
BOOKTITLE = {AI\textsuperscript{3} 2025, Advances in Argumentation in Artificial Intelligence},
}
% BOOKTITLE uses \textsuperscript because a bare ^ is an error in LaTeX text mode.
% PUBLISHER added to match the other entries of this file that cite the same proceedings volume (4025).
@INPROCEEDINGS{BARONI_2025_INPROCEEDINGS_BFGP_582221,
AUTHOR = {Baroni, P. and Fellin, G. and Giacomin, M. and Proietti, C.},
TITLE = {On Monotonic and Nonmonotonic Effects of Arguments in Public Interest Communication},
YEAR = {2025},
ABSTRACT = {In a previous work we introduced a vector-based extension of value-based argumentation for public interest communication aimed to provide an articulated model of the impact of a communication campaign on a set of target audiences. The proposed model was monotonic, intuitively meaning that adding arguments to a campaign and enlarging the set of the values they cover cannot decrease the effectiveness of the campaign itself. As this property does not always hold in practice, in this paper we extend the model in order to encompass nonmonotonic effects both at the level of quantitative measures of campaign impact and of the acceptability of the campaign arguments with respect to a standard argumentation semantics. In both cases, we identify some sufficient conditions for monotonicity and provide a preliminary discussion about their relevance and applicability in practice},
KEYWORDS = {Computational argumentation, Public interest communication, Value-based argumentation},
PAGES = {71--83},
VOLUME = {4025},
PUBLISHER = {CEUR WS},
CONFERENCE_NAME = {9th Workshop on Advances in Argumentation in Artificial Intelligence, AI^3 2025},
BOOKTITLE = {AI\textsuperscript{3} 2025, Advances in Argumentation in Artificial Intelligence},
}
% The exported BOOKTITLE repeated the paper title; it now names the proceedings, as given by the
% other entry in this file with the same DOI prefix (10.1109/CiSt65886.2025).
% NOTE(review): confirm the proceedings name against the publisher record.
@INPROCEEDINGS{BELBACHIR_2025_INPROCEEDINGS_BKCEMN_563028,
AUTHOR = {Belbachir, S. and Khlif, N. and Chahhou, M. and El Mohajir, M. and Mazroui, A. and Nahli, O.},
TITLE = {A Proposed Approach for Extracting Semantic and Lexical Relations for Low-Resource Languages: A Case Study of {Darija}},
YEAR = {2025},
ABSTRACT = {Extracting semantic relations between words is crucial for the development and enrichment of lexical resources, especially for under-resourced languages like Moroccan Darija. This paper presents an automated methodology for identifying synonyms, antonyms, hypernyms, and hyponyms by leveraging bilingual Darija-English resources, Princeton WordNet (PWN), the Suggested Upper Merged Ontology (SUMO), and the NLTK toolkit. Experimental evaluation was conducted on a dataset of 361 Darija nouns, selected as a preliminary testbed to validate the methodology before scaling it to the full lexicon. The results show that 83.10% were successfully aligned with PWN synsets, resulting in the extraction of 14,201 semantic relations, of which 5,475 (38.55%) were validated through back-translation. These findings confirm the potential of transferring semantic knowledge from English into Darija, despite cultural and lexical mismatches. The proposed pipeline substantially enriches Darija's lexical coverage and offers a scalable and replicable approach for developing semantic resources in other low-resource dialects},
KEYWORDS = {Darija, NLP, NLTK, Ontology, semantic relation, sumo, Wordnet},
PAGES = {153--160},
URL = {https://iris.cnr.it/handle/20.500.14243/563028},
DOI = {10.1109/CiSt65886.2025.11224229},
BOOKTITLE = {8th IEEE Congress on Information Science and Technology},
}
@INPROCEEDINGS{BELBACHIR_2025_INPROCEEDINGS_BNEC_566029,
AUTHOR = {Belbachir, S. and Nahli, O. and El Mohajir, M. and Chahhou, M.},
TITLE = {Building a Machine Learning Classifier for Synonyms Validation in {Moroccan Darija}},
YEAR = {2025},
ABSTRACT = {Building lexical resources for low-resource languages, such as Arabic dialects, remains a challenging yet essential endeavor. One major difficulty lies in the reliable identification of appropriate synonyms, which requires both rich lexical data and robust machine learning techniques. This study presents a synset classification framework for Darija (Moroccan Arabic), leveraging contextual embeddings derived from multiple Transformer-based language models to capture the semantic richness of the dialect. In addition to contextual similarity, we automatically extract lexical and ontological similarity features. These features are combined and used as input to supervised classification algorithms. Several classifiers were evaluated, including Logistic Regression, Random Forest, Decision Tree, and Gradient Boosting. The models were trained to predict the most appropriate WordNet synset for each Darija word, with performance assessed through k-fold cross-validation. Experimental results confirm the effectiveness of the proposed approach, with the best-performing model achieving an accuracy of 73.28% and an F1-score of 84.81%, underscoring the potential of Transformer-based embeddings in advancing lexical resource development for under-resourced languages},
KEYWORDS = {Princeton WordNet (PWN), Darija, Natural Language Processing (NLP), Logistic Regression (LR), SUMO, Semantic Similarity, Cosine Similarity, Machine Learning},
PAGES = {80--87},
URL = {https://iris.cnr.it/handle/20.500.14243/566029},
DOI = {10.1109/CiSt65886.2025.11224302},
BOOKTITLE = {8th IEEE Congress on Information Science and Technology},
}
@INPROCEEDINGS{BONFIGLI_2025_INPROCEEDINGS_BPBDBCPRVPMP_570763,
AUTHOR = {Bonfigli, A. and Piperno, R. and Bacco, L. and Dell'Orletta, F. and Brunato, D. and Crispino, F. and Papalia, G. F. and Russo, F. and Vadalà, G. and Papalia, R. and Merone, M. and Pecchia, L.},
TITLE = {A Novel Real-World Dataset of {Italian} Clinical Notes for {NLP}-based Decision Support in Low Back Pain Treatment},
YEAR = {2025},
ABSTRACT = {Low back pain represents a leading source of disability worldwide and poses a significant challenge for evidence-based clinical decision support. In contexts where Italian-language resources for diversified therapeutic pathways are lacking, we have assembled a novel, annotated dataset comprising up to three pre-treatment documents per patient (MRI report, X-ray report, and patient visit notes), alongside demographic information (age and sex). The cohort consists of 176 patient records, stratified into three therapeutic groups: 50 conservative, 92 regenerative, and 34 surgical. The primary aim is to investigate whether the collected dataset can be harnessed to predict which of the three treatment modalities is most appropriate. To this end, six document-combination scenarios were defined, evaluating each single-report modality as well as all possible pairings. For each scenario, two modeling strategies were contrasted: a traditional Support Vector Machine classifier leveraging TF–IDF features based on unigrams, bigrams, and trigrams, and a fine-tuned Italian BERT model adapted to our corpus. Experimental results indicate that classic n-gram–based approaches achieve the highest performance (macro–F1 up to 71.3%). The BERT model, while outperforming the baseline, encounters limitations in this low-resource scenario. These findings suggest that the present dataset has the potential to catalyze the development of Italian-language clinical decision support systems that account for the distinct signatures of treatment pathways},
KEYWORDS = {NLP in healthcare, Large Language Models (LLMs), Italian Medical Corpus},
URL = {https://iris.cnr.it/handle/20.500.14243/570763},
BOOKTITLE = {Proceedings of the Eleventh Italian Conference on Computational Linguistics (CLiC-it 2025)},
}
@INPROCEEDINGS{BRUNATO_2025_INPROCEEDINGS_B_532162,
  AUTHOR          = {Brunato, D.},
  TITLE           = {Learning from Impairment: Leveraging Insights from Clinical Linguistics in Language Modelling Research},
  BOOKTITLE       = {Proceedings of the 31st International Conference on Computational Linguistics},
  CONFERENCE_NAME = {31st International Conference on Computational Linguistics},
  YEAR            = {2025},
  PAGES           = {4167-4174},
  ISBN            = {979-8-89176-196-4},
  URL             = {https://aclanthology.org/2025.coling-main.281/},
  KEYWORDS        = {language modelling, clinical linguistics, syntactic complexity},
  ABSTRACT        = {This position paper investigates the potential of integrating insights from language impairment research and its clinical treatment to develop human-inspired learning strategies and evaluation frameworks for language models (LMs). We inspect the theoretical underpinnings underlying some influential linguistically motivated training approaches derived from neurolinguistics and, particularly, aphasiology, aimed at enhancing the recovery and generalization of linguistic skills in aphasia treatment, with a primary focus on those targeting the syntactic domain. We highlight how these insights can inform the design of rigorous assessments for LMs, specifically in their handling of complex syntactic phenomena, as well as their implications for developing human-like learning strategies, aligning with efforts to create more sustainable and cognitively plausible natural language processing (NLP) models},
}
@INPROCEEDINGS{CALDERARO_2025_INPROCEEDINGS_CMD_570746,
AUTHOR = {Calderaro, S. and Miaschi, A. and Dell'Orletta, F.},
TITLE = {The OuLiBench Benchmark: Formal Constraints as a Lens into LLM Linguistic Competence},
YEAR = {2025},
ABSTRACT = {Recent progress in Large Language Models (LLMs) has led to impressive capabilities in Natural Language Generation (NLG). However, standard evaluation benchmarks often focus on surface-level performance and are predominantly English-centric, limiting insights into models’ deeper linguistic competences, especially in other languages. In this paper, we introduce OuLiBench, a novel benchmark inspired by the literary movement OuLiPo, designed to evaluate LLMs’ ability to generate Italian text under explicit linguistic constraints, ranging from morpho-syntactic requirements to creative and structural challenges. Our goal is to assess the extent to which LLMs can understand and manipulate language when guided by specific, sometimes artificial constraints. We evaluate a range of state-of-the-art models in both zero- and few-shot settings, comparing performance across constraint types and difficulty levels. Our results highlight significant variability across models and tasks, shedding light on the limits of controllable text generation and offering a new lens for probing LLMs’ generative and linguistic competence beyond traditional benchmarks},
KEYWORDS = {Large Language Models, Benchmark, Evaluation, Controllable Text Generation},
URL = {https://iris.cnr.it/handle/20.500.14243/570746},
BOOKTITLE = {Proceedings of the Eleventh Italian Conference on Computational Linguistics (CLiC-it 2025)},
}
@INPROCEEDINGS{CARDILLO_2025_INPROCEEDINGS_CDFACC_562981,
AUTHOR = {Cardillo, F. A. and Debole, F. and Frontini, F. and Aelami, M. and Chahinian, N. and Conrad, S.},
TITLE = {Novel benchmark for NER in the wastewater and stormwater domain},
YEAR = {2025},
ABSTRACT = {Efficient wastewater and stormwater management is mandatory for sustainable cities. Extracting structured knowledge from reports and regulations is challenging due to domain-specific terminology and multilingual contexts. This work focuses on domain-specific Named Entity Recognition (NER) as a first step towards effective relation and information extraction to support decision making. A multilingual benchmark is crucial for evaluating these methods. This study develops a French-Italian domain-specific text corpus for wastewater management. It evaluates state-of-the-art NER methods, including LLM-based approaches, to provide a reliable baseline for future strategies and explores automated annotation projection in view of an extension of the corpus to new languages},
KEYWORDS = {Annotation projection, Domain-specific corpus, LLMs for NER, Multilingual NLP, Named Entity Recognition},
PAGES = {226-231},
URL = {https://ieeexplore.ieee.org/document/11224095},
DOI = {10.1109/cist65886.2025.11224095},
PUBLISHER = {Institute of Electrical and Electronics Engineers (USA)},
ISBN = {979-8-3315-4384-6},
CONFERENCE_NAME = {Cist 2025-8th IEEE International Congress on Information Science and Technology},
CONFERENCE_PLACE = {MAR},
BOOKTITLE = {Cist 2025 proceedings},
}
@INPROCEEDINGS{CHABAN_2025_INPROCEEDINGS_CBPFOBSFSRS_571121,
AUTHOR = {Chaban, A. and Benassi, L. and Pedonese, G. and Frontini, F. and Ottaviani, R. and Boschetti, F. and Spadi, A. and Francalanci, L. and Scognamiglio, A. and Restaneo, P. and Striova, J.},
TITLE = {Bridging Disciplines for Heritage Professionals: The H2IOSC Digital Training Platform (by CLARIN, DARIAH, E-RIHS and OPERAS)},
YEAR = {2025},
ABSTRACT = {The complexity of the contemporary heritage field requires professionals to develop interdisciplinary skills and to collaborate across diverse disciplines, from social sciences and digital humanities to preservation of cultural heritage, archaeology and beyond. As digital and interactive tools become increasingly integrated into heritage studies, the training in the field is undergoing a significant transformation. The H2IOSC (Heritage and Humanities Italian Open Science Cloud) project has developed an innovative digital training infrastructure aimed at providing access to FAIR (Findable, Accessible, Interoperable and Reusable) courses and training materials. In this abstract we focus on the H2IOSC training platform, aimed to address the evolving training needs of our disciplinary communities. Created by H2IOSC WP8 (Work Package 8: Training, Engagement and Capacity Building) in collaboration with the E.T.T. S.p.A., it is maintained and hosted by CNR-ILC (Institute of Computational Linguistics “A. Zampolli”), host institution of CLARIN-IT, with the participation of the national nodes of DARIAH, E-RIHS, and OPERAS. The platform provides a flexible, customizable learning environment designed to support interdisciplinary education and continuous professional development in the Social Sciences, Digital Humanities and Cultural Heritage sectors. The platform features a comprehensive course catalogue containing training courses and modules developed or adapted by the four infrastructures within the H2IOSC project as FAIR training materials, designed for various target knowledge levels, from beginners to advanced learners in heritage and humanities fields. An intuitive dashboard allows users to access materials, track progress and use collaborative tools, including forums, chats, and virtual working groups for networking and communication.
The platform incorporates quizzes, simulations, hands-on exercises, and gamification tools, making learning more interactive. Designed for accessibility and inclusivity, it is fully compatible with both desktop and mobile devices, enabling individual learning without geographical or temporal constraints. This paper outlines the development process of the platform, addressing the challenges encountered, the key achievements, and its potential to transform training within the Social Sciences, Digital Humanities and Heritage Sector. We highlight how the design of specialized digital heritage training materials has influenced the development of the Digital Asset Management (DAM) system, particularly its ability to support effective cataloguing, metadata management, and archival of multimedia data. Ultimately, we emphasize the importance of adopting best practices for interdisciplinary learning and explore how digital tools can foster greater collaboration and knowledge exchange across heritage and humanities disciplines},
KEYWORDS = {heritage, digital humanities, training, FAIR},
URL = {https://iris.cnr.it/handle/20.500.14243/571121},
DOI = {10.2312/dh.20253036},
BOOKTITLE = {Digital Heritage 2025},
}
@INPROCEEDINGS{CIACCIO_2025_INPROCEEDINGS_CMD_570462,
AUTHOR = {Ciaccio, C. and Miaschi, A. and Dell'Orletta, F.},
TITLE = {Evaluating Lexical Proficiency in Neural Language Models},
YEAR = {2025},
ABSTRACT = {We present a novel evaluation framework designed to assess the lexical proficiency and linguistic creativity of Transformer-based Language Models (LMs). We validate the framework by analyzing the performance of a set of LMs of different sizes, in both mono- and multilingual configuration, across tasks involving the generation, definition, and contextual usage of lexicalized words, neologisms, and nonce words. To support these evaluations, we developed a novel dataset of lexical entries for the Italian language, including curated definitions and usage examples sourced from various online platforms. The results highlight the robustness and effectiveness of our framework in evaluating multiple dimensions of LMs' linguistic understanding and offer an insight, through the assessment of their linguistic creativity, on the lexical generalization abilities of LMs},
KEYWORDS = {Large Language Models (LLMs), Interpretability},
PAGES = {1267-1286},
URL = {https://iris.cnr.it/handle/20.500.14243/570462},
VOLUME = {1},
DOI = {10.18653/v1/2025.acl-long.64},
PUBLISHER = {Association for Computational Linguistics (ACL)},
CONFERENCE_NAME = {63rd Annual Meeting of the Association for Computational Linguistics, ACL 2025},
BOOKTITLE = {Proceedings of the Annual Meeting of the Association for Computational Linguistics},
}
@INPROCEEDINGS{CIACCIO_2025_INPROCEEDINGS_CSMD_570745,
  AUTHOR    = {Ciaccio, C. and Sarti, G. and Miaschi, A. and Dell'Orletta, F.},
  TITLE     = {Crossword Space: Latent Manifold Learning for Italian Crosswords and Beyond},
  BOOKTITLE = {Proceedings of the Eleventh Italian Conference on Computational Linguistics (CLiC-it 2025)},
  YEAR      = {2025},
  URL       = {https://iris.cnr.it/handle/20.500.14243/570745},
  KEYWORDS  = {Language Games, Crosswords, Semantic Similarity, Embeddings, Natural Language Processing, Information Retrieval},
  ABSTRACT  = {Answering crossword puzzle clues presents a challenging retrieval task that requires matching linguistically rich and often ambiguous clues with appropriate solutions. While traditional retrieval-based strategies can commonly be used to address this issue, wordplays and other lateral thinking strategies limit the effectiveness of conventional lexical and semantic approaches. In this work, we address the clue answering task as an information retrieval problem exploiting the potential of encoder-based Transformer models to learn a shared latent space between clues and solutions. In particular, we propose for the first time a collection of siamese and asymmetric dual encoder architectures trained to capture the complex properties and relation characterizing crossword clues and their solutions for the Italian language. After comparing various architectures for this task, we show that the strong retrieval capabilities of these systems extend to neologisms and dictionary terms, suggesting their potential use in linguistic analyses beyond the scope of language games},
}
@INPROCEEDINGS{CIACCIO_2025_INPROCEEDINGS_CSMD_570461,
  AUTHOR          = {Ciaccio, C. and Sartor, M. and Miaschi, A. and Dell'Orletta, F.},
  TITLE           = {Beyond the Spelling Miracle: Investigating Substring Awareness in Character-Blind Language Models},
  BOOKTITLE       = {Proceedings of the Annual Meeting of the Association for Computational Linguistics},
  CONFERENCE_NAME = {63rd Annual Meeting of the Association for Computational Linguistics, ACL 2025},
  PUBLISHER       = {Association for Computational Linguistics (ACL)},
  YEAR            = {2025},
  PAGES           = {11361-11372},
  DOI             = {10.18653/v1/2025.findings-acl.593},
  URL             = {https://iris.cnr.it/handle/20.500.14243/570461},
  KEYWORDS        = {Large Language Models (LLMs), Interpretability},
  ABSTRACT        = {Correctly identifying characters and substrings of words should be a basic but essential ability of any Language Model that aims to proficiently understand and produce language. Despite so, the majority of Pre-trained Language Models (PLMs) are "character-blind" and struggle in spelling tasks, although they still seem to acquire some character knowledge during pre-training, a phenomenon dubbed Spelling Miracle. To shed light on this phenomenon, we systematically evaluate a range of PLMs with different parameter sizes using a controlled binary substring identification task. Through a series of experiments, we propose the first comprehensive investigation on where, when, and how PLMs develop awareness of characters and substrings, with a particular linguistic focus on morphemic units such as prefixes, suffixes, and roots},
}
@INPROCEEDINGS{CIMA_2025_INPROCEEDINGS_CMTADC_570444,
AUTHOR = {Cima, L. and Miaschi, A. and Trujillo, A. and Avvenuti, M. and Dell'Orletta, F. and Cresci, S.},
TITLE = {Contextualized Counterspeech: Strategies for Adaptation, Personalization, and Evaluation},
YEAR = {2025},
ABSTRACT = {AI-generated counterspeech offers a promising and scalable strategy to curb online toxicity through direct replies that promote civil discourse. However, current counterspeech is one-size-fits-all, lacking adaptation to the moderation context and the users involved. We propose and evaluate multiple strategies for generating tailored counterspeech that is adapted to the moderation context and personalized for the moderated user. We instruct a LLaMA2-13B model to generate counterspeech, experimenting with various configurations based on different contextual information and fine-tuning strategies. We identify the configurations that generate persuasive counterspeech through a combination of quantitative indicators and human evaluations collected via a pre-registered mixed-design crowdsourcing experiment. Results show that contextualized counterspeech can significantly outperform state-of-the-art generic counterspeech in adequacy and persuasiveness, without compromising other characteristics. Our findings also reveal a poor correlation between quantitative indicators and human evaluations, suggesting that these methods assess different aspects and highlighting the need for nuanced evaluation methodologies. The effectiveness of contextualized AI-generated counterspeech and the divergence between human and algorithmic evaluations underscore the importance of increased human-AI collaboration in content moderation},
KEYWORDS = {content moderation, Counterspeech, generative AI, online toxicity, personalization},
PAGES = {5022-5033},
URL = {https://iris.cnr.it/handle/20.500.14243/570444},
DOI = {10.1145/3696410.3714507},
PUBLISHER = {Association for Computing Machinery (USA)},
CONFERENCE_NAME = {34th ACM Web Conference, WWW 2025},
CONFERENCE_PLACE = {AUS},
BOOKTITLE = {WWW 2025-Proceedings of the ACM Web Conference},
}
@INPROCEEDINGS{CININI_2025_INPROCEEDINGS_CMSM_579507,
AUTHOR = {Cinini, A. and Marongiu, P. and Sassolini, E. and Monachini, M.},
TITLE = {Preserving and enhancing cultural heritage: the Digest project},
YEAR = {2025},
ABSTRACT = {Valorizzare e custodire il patrimonio culturale: alla scoperta del progetto Digesto. Il contributo vuole discutere delle attività connesse alla salvaguardia e alla valorizzazione di corpora testuali di valore storico-culturale prodotti in un lungo arco temporale. Analizzeremo le problematiche legate al progresso delle tecnologie utilizzate per la creazione/elaborazione dei dati che sono mutate nel tempo, nonché l'arduo passaggio dai formati proprietari a quelli standard per una migliore condivisione e interoperabilità dei dati. Infine, descriveremo la non facile transizione verso paradigmi di dati aperti e i passaggi necessari per migrare i dati verso infrastrutture di ricerca internazionali. In particolare, descriveremo le fasi del progetto di traduzione del Digesto di Giustiniano che hanno richiesto il supporto tecnologico del nostro gruppo di ricerca, e come questo contributo è cambiato di pari passo con il progresso tecnologico. Vogliamo offrire alla comunità DH un punto di vista reale sull'evoluzione della digitalizzazione/informatizzazione di grandi risorse testuali. Nel caso specifico, discuteremo del supporto alla traduzione specializzata dal latino all'italiano con strumenti di analisi testuale, e della trasformazione dei testi originali e tradotti in un corpus bilingue parallelo; di come questo è stato convertito in formato XML TEI; infine, delle operazioni necessarie al deposito dei dati all'interno dell'infrastruttura di ricerca CLARIN},
KEYWORDS = {texts corpora, standard TEI format, digital preservation, corpora testuali, standard TEI, preservazione digitale},
PAGES = {600-607},
URL = {https://amsacta.unibo.it/id/eprint/8380/},
DOI = {10.6092/unibo/amsacta/8380},
PUBLISHER = {AIUCD (ITA)},
ISBN = {978-88-942535-9-7},
CONFERENCE_NAME = {Diversità, Equità e Inclusione: Sfide e Opportunità per l’Informatica Umanistica nell’Era dell’Intelligenza Artificiale},
CONFERENCE_PLACE = {ITA},
BOOKTITLE = {Diversità, Equità e Inclusione: Sfide e Opportunità per l’Informatica Umanistica nell’Era dell’Intelligenza Artificiale, Proceedings del XIV Convegno Annuale AIUCD, Verona 11-13 giugno 2025, Università di Verona},
EDITOR = {Rebora, S. and Rospocher, M. and Bazzaco, S.},
}
@INPROCEEDINGS{CONGIU_2025_INPROCEEDINGS_CDR_571301,
AUTHOR = {Congiu, C. and Del Grosso, A. M. and Riccucci, M.},
TITLE = {Verso l’implementazione di un sistema di riconoscimento di allusioni al lessico dantesco nelle testimonianze del Lager: il caso d’uso in Voci dall’Inferno},
YEAR = {2025},
ABSTRACT = {Voci dall’Inferno è un progetto di ricerca dell’Università di Pisa, sviluppato con il supporto dell’Istituto di Linguistica Computazionale “A. Zampolli”. L’iniziativa ha due principali obiettivi scientifici: a) digitalizzare il primo corpus di testimonianze non letterarie di deportati sopravvissuti ai campi di concentramento e b) identificare al suo interno la presenza di citazioni e/o allusioni al lessico di Dante (Del Grosso et al., 2024). Al fine di raggiungere questo secondo obiettivo è stato sviluppato un prototipo di applicazione web denominata Voci dall’Inferno Verse Similarity Search. Il sistema è progettato per individuare citazioni e allusioni al lessico dantesco mediante approcci computazionali alla ricerca di frasi presenti nelle testimonianze e il confronto di essi con i versi presenti nella Divina Commedia di Dante Alighieri. L’applicazione, realizzata in Python, utilizza tecnologie avanzate come Weaviate, una piattaforma opensource per la ricerca vettoriale, e Streamlit, un framework per lo sviluppo di applicazioni web. Basandosi su metriche di Sentence Similarity, l’applicazione sfrutta modelli di machine learning per trasformare i testi in rappresentazioni di embeddings e in seguito misurarne la similarità. Attualmente l’applicazione non è ancora disponibile per l’uso da parte del pubblico, ciononostante l’infrastruttura di ricerca CLARIN-IT (H2IOSC) è stata contattata per ospitare l’applicazione garantendone accesso e sostenibilità. Una demo sarà predisposta per la conferenza qualora il contributo venisse accettato},
KEYWORDS = {Voci dall’Inferno, Sentence Similarity, Sentence Transformers, vector database, embeddings},
PAGES = {270-275},
URL = {https://amsacta.unibo.it/id/eprint/8380/},
DOI = {10.6092/unibo/amsacta/8380},
PUBLISHER = {AIUCD},
ISBN = {978-88-942535-9-7},
CONFERENCE_NAME = {Diversity, Equity, and Inclusion: Challenges and Opportunities for Digital Humanities in the Age of Artificial Intelligence},
BOOKTITLE = {Diversità, Equità e Inclusione: Sfide e Opportunità per l’Informatica Umanistica nell’Era dell’Intelligenza Artificiale, Proceedings del XIV Convegno Annuale AIUCD, Verona 11-13 giugno 2025, Università di Verona},
EDITOR = {Rebora, S. and Rospocher, M. and Bazzaco, S.},
}
@INPROCEEDINGS{COSTA_2025_INPROCEEDINGS_CZ_571261,
AUTHOR = {Costa, G. and Zenzaro, S.},
TITLE = {Un modello integrato per il Roman d’Alexandre del codice Correr 1493: annotazione linguistica e edizione critica digitale},
YEAR = {2025},
ABSTRACT = {L’obiettivo di questa proposta è di presentare alcune riflessioni, a livello sia pratico sia teorico, su di un nuovo modello di edizione critica digitale in cui i metadati derivati dall’annotazione linguistica di un testo possano essere assimilati e consultati. Lo scopo è di superare la divisione che spesso intercorre tra il piano ecdotico-filologico e quello dei corpora linguistici, proponendo, pertanto, lo sviluppo di un sistema integrato in cui il metadato linguistico possa essere interrogato in tutte le sue parti direttamente dall’interfaccia dedicata all’edizione critica digitale del testo oggetto di annotazione. L’oggetto di indagine di questo progetto sono testi che presentano particolarità linguistiche, in particolar modo legati a fenomeni di ibridismo tra diverse varietà e code-mixing. La proof of concept è in fase di sviluppo su di un testo medioevale appartenente al corpus del cosiddetto francese d’Italia, ovvero l’insieme di testi composti o trascritti in francese da autori della Penisola, tra il XIII e il XV secolo, nei quali i volgari medioevali italiani hanno trovato punti di contatto e di fusione con le varietà del francese antico},
KEYWORDS = {edizioni critiche digitali, annotazione linguistica automatica, corpora linguistici, Francese d’Italia (XIII-XV secolo)},
PAGES = {228-231},
URL = {https://aiucd2025.dlls.univr.it/proceedings/},
DOI = {10.6092/unibo/amsacta/8380},
ISBN = {978-88-942535-9-7},
CONFERENCE_NAME = {AIUCD2025-Diversità, Equità e Inclusione: Sfide e Opportunità per l’Informatica Umanistica nell’Era dell’Intelligenza Artificiale},
BOOKTITLE = {Proceedings del XIV Convegno Annuale AIUCD2025},
}
@INPROCEEDINGS{CUCURULLO_2025_INPROCEEDINGS_CMSS_571181,
AUTHOR = {Cucurullo, S. and Montemagni, S. and Saccoccio, R. and Sassolini, E.},
TITLE = {The Challenge of Obsolescence of Digital Archives in Cultural Heritage. A Case Study},
YEAR = {2025},
ABSTRACT = {This paper addresses the challenges of format, font, and software obsolescence, with a particular emphasis on cultural heritage archives. While technological impermanence is intrinsic to the digital domain, it poses serious risks to the accessibility and long-term preservation of humanities data. Focusing on intangible cultural heritage—specifically, dialect data—we explore both the problems and opportunities associated with the FAIRification of legacy resources. A case study of the Atlante Lessicale Toscano (ALT), a dialectal lexical atlas of Tuscany originally published as a digital archive in 2000, illustrates how painstakingly collected linguistic data can be transformed into sustainable, interoperable formats that ensure long-term usability and scholarly value},
KEYWORDS = {Humanities, Technological innovation, Relational databases, Linguistics, Cultural differences, Usability, Interoperability, Representation Standards, dialectal resources, digital obsolescence, FAIR data, heritage preservation},
PAGES = {506-512},
URL = {https://ieeexplore.ieee.org/document/11224142},
DOI = {10.1109/CiSt65886.2025.11224142},
PUBLISHER = {IEEE (MAR)},
ISBN = {979-8-3315-4384-6},
CONFERENCE_NAME = {2025 IEEE 8th Congress on Information Science and Technology (CiSt)},
CONFERENCE_PLACE = {MAR},
BOOKTITLE = {Proceedings of the IEEE 8th Congress on Information Science and Technology (CiSt) 2025},
}
@INPROCEEDINGS{DELGRATTA_2025_INPROCEEDINGS_D_560724,
AUTHOR = {Del Gratta, R.},
TITLE = {Extending the Abrams-Strogatz Model with a Varying Population},
YEAR = {2025},
ABSTRACT = {This paper extends the Abrams-Strogatz model of language competition by considering population variation over time and the probability of an individual being born as a speaker of one of the two languages. The model is used to analyze Mexican census data, considering the proportion of Bilingual (Spanish and Indigenous) speakers within the Indigenous community. The binomial probability distribution is chosen to measure the likelihood that out of n new Indigenous speakers, k, are born into Bilingual families. This addition complicates the fixed-point analysis of the Abrams-Strogatz model but better reflects the country’s social characteristics},
KEYWORDS = {Language Dynamics, Binomial Probability, Fixed Points Trajectories, Phase Space},
PAGES = {439-444},
URL = {https://ieeexplore.ieee.org/document/11224184},
DOI = {10.1109/cist65886.2025.11224184},
BOOKTITLE = {8th IEEE Congress on Information Science and Technology (CiSt)},
}
@INPROCEEDINGS{DELGRATTA_2025_INPROCEEDINGS_DD_560722,
AUTHOR = {Del Gratta, R. and Del Grosso, A. M.},
TITLE = {Using Functors as Format Converters},
YEAR = {2025},
ABSTRACT = {Format differences present a significant challenge to the interoperability of Text Analysis tools. It is essential to consider format conversions within a robust theoretical framework that can effectively manage these conversions while ensuring that they adhere to specific properties. This paper presents an approach based on “functors” to address format conversion for electronic textual documents. This method ensures that the properties of text and tools are preserved during the process. Functors are key concepts in Category Theory as they enable us to reformulate problems from a category where they are complicated to solve to another category where solutions are more easily attainable. The main concept of this paper is to model a specific scenario. Within the category of documents that conform to a particular format f, there arises a need to parse a document D using a Text Analysis (TA) tool t that cannot interpret the format f. The challenge can be solved with the help of format conversion from f to f′, where f′ fits with t. However, we propose and discuss a method that uses functors to “transform” D and t so that the transformed t can read D with f′},
KEYWORDS = {Format Conversion, Interoperability, Functors, Category Theory},
PAGES = {488-493},
URL = {https://ieeexplore.ieee.org/document/11224237},
VOLUME = {6},
DOI = {10.1109/cist65886.2025.11224237},
ISBN = {979-8-3315-4384-6},
BOOKTITLE = {8th IEEE Congress on Information Science and Technology (CiSt)},
}
@INPROCEEDINGS{DELGRATTA_2025_INPROCEEDINGS_DD_571361,
AUTHOR = {Del Gratta, R. and Del Grosso, A. M.},
TITLE = {Functors and format conversion},
YEAR = {2025},
ABSTRACT = {This contribution highlights the potential of functorial format conversion in applications such as digital philology and structured text analysis, where the heterogeneity of document formats often interferes with interoperability among text analysis tools},
KEYWORDS = {Interoperability, Category Theory, Text Analysis, Computational Linguistics, Linked Open Data},
PAGES = {106-108},
DOI = {10.5281/zenodo},
ISBN = {978-83-977695-0-2},
CONFERENCE_NAME = {“New Territories”. Text Encoding Initiative Conference and Members' Meeting 2025},
BOOKTITLE = {“New Territories”. Text Encoding Initiative Conference and Members' Meeting 2025},
}
@INPROCEEDINGS{DINI_2025_INPROCEEDINGS_DBDC_570521,
AUTHOR = {Dini, L. and Brunato, D. and Dell'Orletta, F. and Caselli, T.},
TITLE = {TEXT-CAKE: Challenging Language Models on Local Text Coherence},
YEAR = {2025},
ABSTRACT = {We present a deep investigation of encoder-based Language Models (LMs) on their abilities to detect text coherence across four languages and four text genres using a new evaluation benchmark, TEXT-CAKE. We analyze both multilingual and monolingual LMs with varying architectures and parameters in different finetuning settings. Our findings demonstrate that identifying subtle perturbations that disrupt local coherence is still a challenging task. Furthermore, our results underline the importance of using diverse text genres during pre-training and of an optimal pre-training objective and large vocabulary size. When controlling for other parameters, deep LMs (i.e., higher number of layers) have an advantage over shallow ones, even when the total number of parameters is smaller},
KEYWORDS = {Large Language Models (LLMs), Text Coherence},
PAGES = {4384-4398},
URL = {https://iris.cnr.it/handle/20.500.14243/570521},
PUBLISHER = {Association for Computational Linguistics (ACL)},
CONFERENCE_NAME = {31st International Conference on Computational Linguistics, COLING 2025},
BOOKTITLE = {Proceedings-International Conference on Computational Linguistics, COLING},
}
@INPROCEEDINGS{DINI_2025_INPROCEEDINGS_DDBD_570446,
AUTHOR = {Dini, L. and Domenichelli, L. and Brunato, D. and Dell'Orletta, F.},
TITLE = {From Human Reading to NLM Understanding: Evaluating the Role of Eye-Tracking Data in Encoder-Based Models},
YEAR = {2025},
ABSTRACT = {Cognitive signals, particularly eye-tracking data, offer valuable insights into human language processing. Leveraging eye-gaze data from the Ghent Eye-Tracking Corpus, we conducted a series of experiments to examine how integrating knowledge of human reading behavior impacts Neural Language Models (NLMs) across multiple dimensions: task performance, attention mechanisms, and the geometry of their embedding space. We explored several fine-tuning methodologies to inject eye-tracking features into the models. Our results reveal that incorporating these features does not degrade downstream task performance, enhances alignment between model attention and human attention patterns, and compresses the geometry of the embedding space},
KEYWORDS = {Large Language Models (LLMs), Eye-tracking, Interpretability},
PAGES = {17796-17813},
URL = {https://iris.cnr.it/handle/20.500.14243/570446},
VOLUME = {1},
DOI = {10.18653/v1/2025.acl-long.870},
PUBLISHER = {Association for Computational Linguistics (ACL)},
CONFERENCE_NAME = {63rd Annual Meeting of the Association for Computational Linguistics, ACL 2025},
BOOKTITLE = {Proceedings of the Annual Meeting of the Association for Computational Linguistics},
}
@INPROCEEDINGS{DOMENICHELLI_2025_INPROCEEDINGS_DDBD_570463,
  AUTHOR    = {Domenichelli, L. and Dini, L. and Brunato, D. and Dell'Orletta, F.},
  TITLE     = {The Role of Eye-Tracking Data in Encoder-Based Models: an In-depth Linguistic Analysis},
  BOOKTITLE = {Proceedings of the Eleventh Italian Conference on Computational Linguistics (CLiC-it 2025), 24-26 September 2025, Cagliari, Italy},
  YEAR      = {2025},
  URL       = {https://iris.cnr.it/handle/20.500.14243/570463},
  KEYWORDS  = {Eye-tracking, Neural Attention, Multilingual models, Embedding space, Interpretability},
  ABSTRACT  = {This paper falls within ongoing research aimed at enhancing the human interpretability of neural language models by incorporating physiological data. Specifically, we leverage eye-tracking data collected during reading to explore how such information can guide model behavior. We train a multilingual encoder model to predict eye-tracking features from the Multilingual Eye-tracking Corpus (MECO) and analyze the resulting shifts in model attention patterns, focusing on how attention redistributes across linguistically informed categories such as part of speech, word position, word length, and distance from the syntactic head after fine-tuning. Moreover, we test how this attention shift impacts the representation of the interested words in the embedding space. The study covers both Italian and English, enabling a cross-linguistic perspective on attention and representation shifts in multilingual encoders grounded in human reading behavior},
}
@INPROCEEDINGS{FRANCALANCI_2025_INPROCEEDINGS_FSFRP_552964,
AUTHOR = {Francalanci, L. and Scognamiglio, A. and Falini, I. and Restaneo, P. and Pedonese, G.},
TITLE = {Il Glossario delle Infrastrutture di Ricerca (GIR)},
YEAR = {2025},
ABSTRACT = {Il Glossario delle Infrastrutture di Ricerca (GIR) è un’iniziativa che si inserisce nell’ambito del progetto PNRR “H2IOSC-Humanities and Cultural Heritage Italian Open Science Cloud” del CNR, che mira a creare una federazione di Infrastrutture di Ricerca (IR) coinvolgendo i nodi italiani di quattro infrastrutture che fanno parte della roadmap dell’European Strategy Forum on Research Infrastructure nel settore dell’innovazione sociale e culturale: CLARIN-IT, DARIAH-IT, E-RIHS.it, OPERAS.it. Il GIR nasce dall’esigenza di avere una terminologia di riferimento all’interno del progetto H2IOSC. Nella redazione dei documenti legati al progetto è emersa la difficoltà legata alla mancanza di una terminologia univoca, condivisa e non ambigua, anche nell’ottica di una piena interoperabilità dei risultati della ricerca. Da qui la necessità di definire i termini che appartengono all’ambito della progettazione e implementazione delle IR, sciogliere i numerosi acronimi presenti, e documentare questo particolare linguaggio tecnico e specialistico. A partire da una rassegna critica sui più recenti studi teorici e applicati nel campo della terminologia della lingua italiana, del lessico delle IR, del PNRR e della progettazione europea, è stata individuata una metodologia per la costruzione del Glossario che prevede l’identificazione di un corpus di riferimento poi usato per la redazione delle voci. La struttura delle voci è stata progettata prendendo come riferimento alcuni vocabolari nati direttamente in rete e prevede, per ciascun lemma, l’indicazione della categoria grammaticale, la marca d’uso, le accezioni che il termine assume nel contesto delle IR, un campo “note” per eventuali integrazioni e le voci correlate, se presenti. Il GIR rappresenta un’iniziativa preziosa per promuovere la condivisione della conoscenza e la collaborazione tra le Infrastrutture di Ricerca in Italia},
KEYWORDS = {glossario, Infrastrutture di Ricerca, terminologia, lessico specialistico},
PAGES = {24--28},
URL = {https://iris.cnr.it/handle/20.500.14243/552964},
DOI = {10.6092/unibo/amsacta/8380},
ISBN = {978-88-942535-9-7},
CONFERENCE_NAME = {XIV Convegno Annuale AIUCD 2025},
BOOKTITLE = {Diversità, Equità e Inclusione: Sfide e Opportunità per l’Informatica Umanistica nell’Era dell’Intelligenza Artificiale, Proceedings del XIV Convegno Annuale AIUCD2025},
}
@INPROCEEDINGS{GALIERO_2025_INPROCEEDINGS_GBDGM_560725,
AUTHOR = {Galiero, L. and Boschetti, F. and Del Gratta, R. and Grosso, A. M. D. and Monachini, M.},
TITLE = {Enhancing Lexical Resources: Synset Expansion and Cross-Linking Between ItalWordNet and MariTerm},
YEAR = {2025},
ABSTRACT = {This paper outlines the first operation towards a full update of MariTerm, a WordNet-like resource on maritime terminology developed and maintained by CNR-ILC, in preparation for future compliance with FAIR principles (Wilkinson et al., 2016). The project focused on expanding and linking synsets between ItalWordNet (IWN), a general lexical database for Italian, and MariTerm to enrich IWN with maritime concepts. A semi-automatic pipeline was developed to facilitate this process, prioritizing critical semantic relations and automatic evaluation. Key outcomes include an enriched ItalWordNet with links to MariTerm concepts and a revised MariTerm with connections to IWN synsets. While further refinement is needed, this work marks a significant step toward integrating maritime terminology into ItalWordNet},
KEYWORDS = {ItalWordNet, MariTerm},
PAGES = {105--111},
URL = {https://iris.cnr.it/handle/20.500.14243/560725},
DOI = {10.18653/v1/2025.gwc-1.13},
BOOKTITLE = {Proceedings of the 13th Global Wordnet Conference},
}
@INPROCEEDINGS{GIACOMINI_2025_INPROCEEDINGS_GBBDDDFMRRT_540480,
AUTHOR = {Giacomini, S. and Bardi, A. and Buzzoni, M. and Daquino, M. and Del Gratta, R. and Del Grosso, A. M. and Fischer, F. and Martignano, C. and Rosselli Del Turco, R. and Rubin, G. and Tomasi, F.},
TITLE = {ATLAS: Towards a knowledge graph of international scholarly research on the Italian digital cultural heritage},
YEAR = {2025},
ABSTRACT = {In recent years, the abundance of available scholarly information has requested constant development and revision of standardized models and shared guidelines. Based on these frameworks, the Digital Humanities (DH) landscape features a variety of aggregators expected to enhance research data findability while promoting use and reuse. However, current semantic models fail to capture the specificity of DH research products, hindering data discovery and hampering the valorisation of Cultural Heritage. The ATLAS project addresses these key challenges by developing a unified framework for describing and aggregating scholarly outputs, particularly in the Italian Digital Cultural Heritage domain. This paper presents the initial versions of the ATLAS Ontology and Knowledge Graph, designed to model DH outcomes such as Digital Scholarly Editions, text collections, Linked Open Data, ontologies, and software. In so doing, ATLAS aims to enhance resource findability and reuse, paving the way for improved interoperability and future advancements in the field},
KEYWORDS = {Digital Humanities, Knowledge Graph, Semantic Web, Research Infrastructures, Italian Cultural Heritage},
PAGES = {13},
URL = {https://ceur-ws.org/Vol-3937/paper4.pdf},
VOLUME = {3937},
PUBLISHER = {CEUR-WS.org},
CONFERENCE_NAME = {IRCDL 2025: 21st Conference on Information and Research Science Connecting to Digital and Library Science},
BOOKTITLE = {IRCDL 2025 proceedings},
}
@INPROCEEDINGS{GUADAGNINI_2025_INPROCEEDINGS_G_550502,
AUTHOR = {Guadagnini, E.},
TITLE = {Una parola “marginale” dell’epopea francese (d’Italia): travache},
YEAR = {2025},
ABSTRACT = {This study focuses on the word travache (or trevache), a French adaptation of the Italian word trabacca, found within the Franco-Italian epic discursive tradition. Additionally, it considers the possibility of associating this lexical type with the reading travacles in the Ystoire de li Normant},
KEYWORDS = {Italianism, French of Italy, Travache, Trabacca},
PAGES = {263--277},
URL = {https://phaidra.cab.unipd.it/o:546755},
DOI = {10.25430/2724-0975/5},
PUBLISHER = {Dipartimento di Studi Linguistici e Letterari dell'Università degli Studi di Padova (Padova, ITA)},
ISSN = {2724-0975},
ISBN = {9788886326056},
CONFERENCE_PLACE = {Genova},
BOOKTITLE = {Entre France et Italie: marginalità nelle chansons de geste, Atti del I convegno della sezione italiana della Società Rencesvals (Genova, 19-20 ottobre 2024)},
}
@INPROCEEDINGS{HOHENEGGER_2025_INPROCEEDINGS_HMCDBDM_571341,
AUTHOR = {Hohenegger, H. and Mancinelli, T. and Ciotti, F. and De Longis, E. and Boschetti, F. and Del Grosso, A. M. and Meschini, F.},
TITLE = {Developing a Platform for Aligned Translations in Digital Scholarly Editions},
YEAR = {2025},
ABSTRACT = {The DiScEPT platform offers an innovative solution for creating digital scholarly editions with aligned translations. By integrating open-source, modular tools, it facilitates the alignment of multilingual texts, supporting comparative studies and in-depth analysis of translation processes. Adhering to FAIR principles and leveraging advanced NLP technologies for automatic text alignment},
KEYWORDS = {DiScEPT, Alignment, Translation, DSE},
CONFERENCE_NAME = {Building Access and Accessibility, Open Science to all Citizens},
BOOKTITLE = {Building Access and Accessibility, Open Science to all Citizens},
}
@INPROCEEDINGS{HOMOLA_2025_INPROCEEDINGS_HABKMVBCDSKGDGBTA_570881,
AUTHOR = {Homola, M. and Anthony, P. and Bečková, I. and Kľuka, J. and Mojžiš, J. and Švec, P. and Balogh, S. and Cardillo, F. A. and Debole, F. and Straccia, U. and Kenyeres, M. and Giannini, F. and Diligenti, M. and Gori, M. and Bisták, T. and Trizna, D. and Adams, Z.},
TITLE = {A note on methods for explainable malware analysis},
YEAR = {2025},
ABSTRACT = {The inevitable rise of machine learning in malware analysis puts forward the need for human-understandable explanations of the learned results. We point out how the ontological representation of malware data provides a suitable language for the construction of such explanations. We then focus on possible methods that enable producing such explanations and we reflect on our experience with them in the context of the EMBER dataset},
KEYWORDS = {Malware analysis, explainable AI, ontology, EMBER dataset},
PAGES = {14},
URL = {https://ceur-ws.org/Vol-4176/shields-3.pdf},
VOLUME = {4176},
PUBLISHER = {CEUR-WS.org},
CONFERENCE_NAME = {JOWO 2025-Joint Ontology Workshops},
BOOKTITLE = {Episode XI: The Sicilian Summer under the Etna},
}
@INPROCEEDINGS{KHAN_2025_INPROCEEDINGS_KMQPFS_570784,
AUTHOR = {Khan, A. F. and Mallia, M. and Quochi, V. and Pedonese, G. and Frontini, F. and Squadrito, E.},
TITLE = {A Pilot Project for Promoting Linguistic Linked Open Data},
YEAR = {2025},
ABSTRACT = {This paper presents a pilot initiative, part of the H2IOSC infrastructure, that strives to support and promote the creation, publication, and sharing of Linguistic Linked Open Data (LLOD) in Italy and beyond. We describe the different parts of the pilot project: those related to vocabulary hosting, RDF data publication, training development, and use case promotion. Key contributions include the publication and hosting of the REALITER series of lexicons, the PLLOD triple store platform, and LLOD-focused training initiatives. We also describe a series of use-cases taking place within the pilot},
KEYWORDS = {Training, Linguistic Linked Open Data, H2IOSC, CLARIN},
PAGES = {1--6},
URL = {https://iris.cnr.it/handle/20.500.14243/570784},
DOI = {10.1109/ieee-ch65308.2025.11279386},
CONFERENCE_NAME = {2025 IEEE International Conference on Cyber Humanities (IEEE-CH)},
BOOKTITLE = {2025 IEEE International Conference on Cyber Humanities (IEEE-CH)},
}
@INPROCEEDINGS{KZADRI_2025_INPROCEEDINGS_KCCDHR_570922,
AUTHOR = {Kzadri, M. and Cardillo, F. A. and Chahinian, N. and Delenne, C. and Hostache, R. and Riffi, J.},
TITLE = {U-NetMN and SegNetMN: Modified U-Net and SegNet models for bimodal SAR image segmentation},
YEAR = {2025},
ABSTRACT = {Segmenting Synthetic Aperture Radar (SAR) images is crucial for many remote sensing applications, particularly water body detection. However, deep learning-based segmentation models often face challenges related to convergence speed and stability, mainly due to the complex statistical distribution of this type of data. In this study, we evaluate the impact of mode normalization on two widely used semantic segmentation models, U-Net and SegNet. Specifically, we integrate mode normalization, to reduce convergence time while maintaining the performance of the baseline models. Experimental results demonstrate that mode normalization significantly accelerates convergence. Furthermore, cross-validation results indicate that normalized models exhibit increased stability in different zones. These findings highlight the effectiveness of normalization in improving computational efficiency and generalization in SAR image segmentation},
KEYWORDS = {SAR image segmentation, deep learning, mode normalization, U-Net, SegNet},
PAGES = {6},
URL = {https://ieeexplore.ieee.org/document/11135135},
DOI = {10.1109/ICCSC66714.2025.11135135},
ISBN = {979-8-3315-6529-9},
CONFERENCE_NAME = {2025 International Conference on Circuit, Systems and Communication (ICCSC)},
BOOKTITLE = {Proceedings of the 2025 International Conference on Circuit, Systems and Communication (ICCSC)},
}
@INPROCEEDINGS{LITTA_2025_INPROCEEDINGS_LPMBMBBDDGMBS_555245,
AUTHOR = {Litta, E. and Passarotti, M. and Moretti, G. and Brasolin, P. and Mambrini, F. and Basile, V. and Bosco, C. and Di Fabio, A. and Di Palma, E. and Giovannetti, E. and Marchi, S. and Bellandi, A. and Sciolette, F.},
TITLE = {Linking CompL-it to the LiITA Knowledge Base},
YEAR = {2025},
ABSTRACT = {This paper presents the integration of CompL-it, a Linked Open Data (LOD) computational lexicon for contemporary Italian, into LiITA (Linking Italian), a Knowledge Base (KB) designed for linguistic interoperability. CompL-it contains over 101k lexical entries enriched with detailed morphological and semantic information, derived from multiple authoritative sources and modelled using the OntoLex-Lemon vocabulary. The linking process involved aligning lexical entries with lemmas in the LiITA’s Lemma Bank (LB), addressing both exact and ambiguous matches through systematic and semantically informed strategies. Moreover, 12,739 new lemmas were added to the LiITA LB. This integration enhances the expressiveness and interoperability of LiITA, enabling complex SPARQL queries that exploit the semantic network encoded in CompL-it. Examples are provided to demonstrate the advantages of querying interlinked resources},
KEYWORDS = {Linked Open Data, Italian, language resources},
URL = {https://aclanthology.org/2025.clicit-1.57.pdf},
PUBLISHER = {CEUR Workshop Proceedings},
CONFERENCE_NAME = {CLiC-it 2025 Italian Conference on Computational Linguistics},
BOOKTITLE = {Proceedings of the Eleventh Italian Conference on Computational Linguistics (CLiC-it 2025)},
}
@INPROCEEDINGS{MANCINELLI_2025_INPROCEEDINGS_MHBDDM_571321,
AUTHOR = {Mancinelli, T. and Hohenegger, H. and Boschetti, F. and Del Grosso, A. M. and De Longis, E. and Mugelli, G.},
TITLE = {Modellazione, interoperabilità e riuso in DiScEPT},
YEAR = {2025},
ABSTRACT = {Il progetto DiScEPT (Digital Scholarly Editions and Parallel Translations Platform) ha l'obiettivo di creare un ambiente per la produzione e la pubblicazione di edizioni digitali. Il multilinguismo è il punctum saliens di questo progetto per una scelta scientifica, ma anche perché si propone di favorire l’accessibilità, l’inclusione e il dialogo interculturale almeno nell’ambito della comunità inerente alla filologia digitale nonché della traduttologia. Le traduzioni non sono solo il superamento delle barriere linguistiche, ma strumenti di arricchimento critico, opportunità per lo studio semantico, storico e culturale dei testi. Integrando strumenti avanzati, come il riconoscimento automatico dei caratteri (HTR e OCR) e l’allineamento linguistico basato su BERT-Align, DiScEPT propone flussi di lavoro dinamici per la creazione di edizioni digitali con traduzioni allineate. La metodologia si fonda su modelli multipli che considerano la materialità dei documenti, la critica testuale e soprattutto l’analisi dei corpora paralleli. Superando l’idea di una piattaforma monoblocco, il progetto adotta un ambiente distribuito, basato sull’integrazione di piattaforme esistenti tramite API},
KEYWORDS = {digital scholarly editing, linked open data, corpora alignment, TEI-XML, edizione scientifica digitale, Allineamento di corpora},
PAGES = {314--318},
URL = {https://amsacta.unibo.it/id/eprint/8380/},
DOI = {10.6092/unibo/amsacta/8380},
PUBLISHER = {AIUCD},
ISBN = {978-88-942535-9-7},
CONFERENCE_NAME = {Diversity, Equity, and Inclusion: Challenges and Opportunities for Digital Humanities in the Age of Artificial Intelligence},
BOOKTITLE = {Diversity, Equity, and Inclusion: Challenges and Opportunities for Digital Humanities in the Age of Artificial Intelligence, Proceedings del XIV Convegno Annuale AIUCD, Verona 11-13 giugno 2025, Università di Verona},
EDITOR = {Rebora, S. and Rospocher, M. and Bazzaco, S.},
}
@INPROCEEDINGS{MARTIGNANO_2025_INPROCEEDINGS_MRGBBDDDFRT_557641,
AUTHOR = {Martignano, C. and Rubin, G. and Giacomini, S. and Bardi, A. and Buzzoni, M. and Daquino, M. and Del Gratta, R. and Del Grosso, A. M. and Fischer, F. and Rosselli Del Turco, R. and Tomasi, F.},
TITLE = {ATLAS: a data model for describing FAIR Digital Humanities research outcomes},
YEAR = {2025},
ABSTRACT = {This paper addresses the challenges of cataloguing and representing Digital Humanities (DH) research outputs within the framework of FAIR principles. Despite advancements in Semantic Web technologies and data aggregators, the scholarly community still lacks unified frameworks and domain-specific models to describe heterogeneous outputs such as digital editions, textual collections, and other scholarly resources published as Linked Open Data. The ATLAS project proposes an ontology and a knowledge graph to bridge these gaps. The methodology includes metadata modeling based on existing frameworks and novel extensions, supported by pilot studies on the Italian cultural heritage. The project, currently in its initial version, aims to enhance metadata interoperability and data accessibility, contributing to the optimization of cataloguing practices and the development of guidelines for the discovery and reuse of DH resources while providing a model applicable beyond the Italian context},
KEYWORDS = {Metadata modeling, Research infrastructure, Scholarly outcome, Linked open data, FAIR principles},
PAGES = {440--447},
URL = {https://amsacta.unibo.it/id/eprint/8380/},
DOI = {10.6092/unibo/amsacta/8380},
PUBLISHER = {AlmaDL, University of Bologna Digital Library (Bologna, ITA)},
ISBN = {978-88-942535-9-7},
CONFERENCE_NAME = {AIUCD 2025-XIV Convegno Annuale},
CONFERENCE_PLACE = {Verona},
BOOKTITLE = {Diversità, Equità e Inclusione: Sfide e Opportunità per l’Informatica Umanistica nell’Era dell’Intelligenza Artificiale},
}
@INPROCEEDINGS{MAZZAGUFO_2025_INPROCEEDINGS_MSBCDS_559506,
AUTHOR = {Mazzagufo, L. and Sichera, P. and Bruno, D. and Cristofaro, S. and Del Grosso, A. M. and Spampinato, D.},
TITLE = {An Infrastructural Solution for Digital Publication starting from Automatic Layout and Text Recognition: Insights from Italian Literary Journals},
YEAR = {2025},
ABSTRACT = {The creation, preservation, processing, publication, and querying of complex textual resources require adopting a methodological framework that is both universally applicable and tailored to specific domains. Its broad design promotes a widespread (re)usability, while domain-specific features ensure effective implementation. This work describes (the refinement of) an integrated environment for automatic text and layout recognition that relies on the use of the tools ZoneRW, Kraken and eScriptorium. Previous experiments have been undertaken within the framework of the COVerLeSS, a historical-philological and linguistic investigation project of the literary magazines of the late 19th century of Italian Verismo. The publication of the text transcriptions in TEI Publisher together with the collections of related digital images makes the digitization process reusable and interoperable},
KEYWORDS = {ATR, eScriptorium, ZoneRW, Kraken, TEI Publisher, Digital Humanities},
PAGES = {494--499},
URL = {https://iris.cnr.it/handle/20.500.14243/559506},
DOI = {10.1109/cist65886.2025.11224217},
PUBLISHER = {IEEE (Piscataway, USA)},
ISBN = {979-8-3315-4384-6},
CONFERENCE_NAME = {CiSt2025},
CONFERENCE_PLACE = {Piscataway},
BOOKTITLE = {The 8th IEEE Congress on Information Science and Technology (CiSt2025) Proceedings},
}
@INPROCEEDINGS{MELACCIO_2025_INPROCEEDINGS_MBM_555308,
AUTHOR = {Melaccio, D. and Boschetti, F. and Monachini, M.},
TITLE = {Interfacing CLARIN with H2IOSC: Metadata Interoperability through Ontology-based Mediation},
YEAR = {2025},
ABSTRACT = {We present an ontology-based approach for integrating CLARIN language resources into the H2IOSC semantic framework, promoting interoperability across the Social Sciences and Humanities. Building on CMDI and the CLARIN Concept Registry, our work extends CMD2RDF beyond syntactic conversion to formal semantic integration. CMDI metadata is mapped to CIDOC CRM and SSHOCro, with extensions for CLARIN-specific needs. This ontology-first strategy keeps CMDI fully operational while ensuring theoretical consistency and long-term sustainability. The resulting semantic layer enhances discoverability, enables cross-disciplinary integration, and contributes to a scalable knowledge graph aligned with FAIR principles and the EOSC vision},
KEYWORDS = {Metadata interoperability, Ontology-based mediation, Semantic integration, Cross-infrastructure interoperability, FAIR principles},
PAGES = {35--39},
URL = {https://www.clarin.eu/sites/default/files/CLARIN2025_ConferenceProceedings.pdf},
CONFERENCE_NAME = {CLARIN Annual Conference 2025},
BOOKTITLE = {CLARIN Annual Conference Proceedings, 2025},
}
@INPROCEEDINGS{MERCATANTI_2025_INPROCEEDINGS_MRD_571362,
AUTHOR = {Mercatanti, E. and Riccucci, M. and Del Grosso, A. M.},
TITLE = {Voci dall’Inferno: a TEI-Based Digital Archive for finding Dante in Concentration Camp Testimonies},
YEAR = {2025},
ABSTRACT = {Voci dall’Inferno is a digital humanities project that brings together a multidisciplinary team of scholars and Digital Humanities students. The project pursues two interconnected objectives: (a) the creation of the first digital corpus of non-literary testimonies of concentration camp survivors – mostly unpublished – encoded in XML-TEI, including both written and oral sources (Burnard, 2014); (b) the systematic identification and analysis, within the testimonies, of lexical items and allusions to Dante’s Divine Comedy, particularly the Inferno},
KEYWORDS = {XML-TEI, digital archives, eXist-db, XQuery, web application},
PAGES = {201--204},
DOI = {10.5281/zenodo},
ISBN = {978-83-977695-0-2},
CONFERENCE_NAME = {“New Territories”. Text Encoding Initiative Conference and Members' Meeting 2025},
BOOKTITLE = {“New Territories”. Text Encoding Initiative Conference and Members' Meeting 2025},
INTERNAL-NOTE = {NOTE(review): the DOI value looks truncated (Zenodo record number missing) and the colon in the title was restored by inference; verify both against the published record},
}
@INPROCEEDINGS{MIRABELLA_2025_INPROCEEDINGS_MB_570561,
AUTHOR = {Mirabella, A. and Brunato, D. P.},
TITLE = {Exploring LLM-Based Assessment of Italian Middle School Writing: A Pilot Study},
YEAR = {2025},
ABSTRACT = {This study investigates the use of ChatGPT for Automated Essay Scoring (AES) in assessing Italian middle school students’ written texts. Using rubrics targeting grammar, coherence and argumentation, we compare AI-generated feedback with that of a human teacher on a newly collected corpus of students’ essays. Despite some differences, ChatGPT provided detailed and timely feedback that complements the teacher’s role. These findings underscore the potential of generative AI to improve the assessment of writing, providing useful insights for educators and supporting students in developing their writing skills},
KEYWORDS = {automated essay scoring, LLM, Italian learners, argumentative essays},
PAGES = {708--715},
URL = {https://aclanthology.org/2025.bea-1.51/},
DOI = {10.18653/v1/2025.bea-1.51},
PUBLISHER = {Association for Computational Linguistics},
BOOKTITLE = {Proceedings of the 20th Workshop on Innovative Use of NLP for Building Educational Applications (BEA 2025)},
}
@INPROCEEDINGS{MORONI_2025_INPROCEEDINGS_MPHBBMDEN_552066,
AUTHOR = {Moroni, L. and Puccetti, G. and Huguet Cabot, P. L. and Bejgu, A. S. and Barba, E. and Miaschi, A. and Dell'Orletta, F. and Esuli, A. and Navigli, R.},
TITLE = {Optimizing LLMs for Italian: reducing token fertility and enhancing efficiency through vocabulary adaptation},
YEAR = {2025},
ABSTRACT = {The number of pretrained Large Language Models (LLMs) is increasing steadily, though the majority are designed predominantly for the English language. While state-of-the-art LLMs can handle other languages, due to language contamination or some degree of multilingual pretraining data, they are not optimized for non-English languages, leading to inefficient encoding (high token ``fertility'') and slower inference speed. In this work, we thoroughly compare a variety of vocabulary adaptation techniques for optimizing English LLMs for the Italian language, and put forward Semantic Alignment Vocabulary Adaptation (SAVA), a novel method that leverages neural mapping for vocabulary substitution. SAVA achieves competitive performance across multiple downstream tasks, enhancing grounded alignment strategies. We adapt two LLMs: Mistral-7B-v0.1, reducing token fertility by 25\%, and Llama-3.1-8B, optimizing the vocabulary and reducing the number of parameters by 1 billion. We show that, following the adaptation of the vocabulary, these models can recover their performance with a relatively limited stage of continual training on the target language. Finally, we test the capabilities of the adapted models on various multi-choice and generative tasks},
KEYWORDS = {Large Language Models, Italia LLM, Vocabulary Adaptation},
PAGES = {6646--6660},
URL = {https://aclanthology.org/2025.findings-naacl.371/},
DOI = {10.18653/v1/2025.findings-naacl.371},
PUBLISHER = {Association for Computational Linguistics},
ISBN = {979-8-89176-195-7},
CONFERENCE_NAME = {NAACL 2025-Annual Conference of the Nations of the Americas Chapter. Findings of the Association for Computational Linguistics},
BOOKTITLE = {NAACL 2025 Findings proceedings},
}
@INPROCEEDINGS{MUGELLI_2025_INPROCEEDINGS_MMHDDB_571262,
AUTHOR = {Mugelli, G. and Mancinelli, T. and Hohenegger, H. and De Longis, E. and Del Grosso, A. M. and Boschetti, F.},
TITLE = {DiScEPT: a distributed environment for digital scholarly editions},
YEAR = {2025},
ABSTRACT = {The DiScEPT project aims to create an environment for the production and publication of digital editions. Its methodology is grounded in multiple models that take into account document materiality, textual criticism, and, in particular, the analysis of parallel corpora. The project adopts a distributed environment that relies on a range of open-source software components, integrated through APIs. Each step of the digital edition process can thus be performed using highly specialized platforms that offer optimal solutions for specific tasks, minimizing the need for customization and ensuring interoperability. This paper presents the approach adopted for the implementation of the distributed environment, highlighting the role of CLARIN’s tools and services in supporting the development of the DiScEPT project and ensuring the long-term preservation of its data within a sustainable framework},
KEYWORDS = {Humanities, Analytical models, Distributed databases, Production, Sustainable development, Open source software, Interoperability, digital editions, htr, data sustainability, digital philology},
PAGES = {443--448},
URL = {https://ieeexplore.ieee.org/document/11279340},
DOI = {10.1109/IEEE-CH65308.2025.11279340},
PUBLISHER = {IEEE},
ISBN = {979-8-3315-1435-8},
CONFERENCE_NAME = {2025 IEEE International Conference on Cyber Humanities (IEEE-CH)},
BOOKTITLE = {2025 IEEE International Conference on Cyber Humanities (IEEE-CH)},
EDITOR = {Bellini, E. and Degl'Innocenti, E.},
}
@INPROCEEDINGS{ORSINI_2025_INPROCEEDINGS_OB_570603,
AUTHOR = {Orsini, M. and Brunato, D.},
TITLE = {Direct and indirect interpretations of speech acts: evidence from human judgments and large language models},
YEAR = {2025},
ABSTRACT = {This paper introduces INDIR-IT (Indirectness for the Italian language), a linguistically informed, manually curated benchmark for evaluating large language models’ (LLMs) understanding of indirect speech acts (ISAs) in Italian. By systematically contrasting conventionalized and non-conventionalized ISAs with literal interpretations, the corpus enables fine-grained assessment of pragmatic competence, an area still relatively underexplored compared to lexical and syntactic understanding. Preliminary results show that LLMs handle conventionalized ISAs relatively well, while performance on non-conventionalized ISAs remains more sensitive to model size and capacity. INDIR-IT offers a foundation for advancing research on pragmatic inference in both humans and LLMs},
KEYWORDS = {Indirectness, Speech acts, Italian benchmark, Large Language Models, Human evaluation},
PAGES = {837--848},
URL = {https://aclanthology.org/2025.clicit-1.79},
PUBLISHER = {CEUR Workshop Proceedings},
ISBN = {979-12-243-0587-3},
CONFERENCE_NAME = {Eleventh Italian Conference on Computational Linguistics (CLiC-it 2025), Cagliari, Italy, September 2025},
BOOKTITLE = {Proceedings of the Eleventh Italian Conference on Computational Linguistics (CLiC-it 2025)},
}
@INPROCEEDINGS{PAPINI_2025_INPROCEEDINGS_P_544744,
AUTHOR = {Papini, M.},
TITLE = {MAIA. Uno strumento per la lessicografia digitale al servizio del Vocabolario di Boccaccio Online (VocaBO)},
YEAR = {2025},
ABSTRACT = {Il progetto di ricerca Vocabolario di Boccaccio Online-VocaBO mira a realizzare il primo vocabolario in formato digitale e liberamente accessibile in rete delle opere in volgare di Giovanni Boccaccio, a partire dal Decameron. Il progetto si fonda sulla stretta sinergia di due domini del sapere: da una parte quello linguistico, che presiede alla redazione delle voci lessicografiche; dall’altra quello computazionale, che rende disponibili risorse tecnologiche e standard a supporto dell’attività di redazione. In occasione del Seminario, abbiamo illustrato il contributo computazionale del CNR-ILC nell’ambito del VocaBO, descrivendo sinteticamente Maia, un nuovo strumento web per la lessicografia digitale che permette, oltre alla creazione di voci lessicografiche, l’annotazione multilivello di testi e la possibilità di collegare direttamente testo e voci. Questo strumento, realizzato dal gruppo di ricerca KLAB (Knowledge, Lexica \& Applications Bridging), ha l’obiettivo di offrire un ambiente di lavoro integrato, incorporando molteplici funzionalità che tradizionalmente sono affidate a software diversi e separati. Maia (già adottato anche in altri progetti di ricerca) per le esigenze specifiche del VocaBO è stato arricchito con un insieme di funzionalità espressamente mirate alla fruizione delle opere di Boccaccio e alla redazione delle voci lessicografiche. Per il VocaBO è stato creato, per esempio, un apposito pannello di ricerca sul testo, con visualizzazione in formato KWIC delle occorrenze (token) in contesti di ampiezza modulabile e con la possibilità di accedere, da qui, al testo completo dell’opera in oggetto. Quest’ultimo, leggibile con scorrimento continuo (dunque senza alcuna interruzione), può essere annotato in modo completamente personalizzabile in termini di livelli e granularità, consentendo anche il collegamento tra i token di una voce e i relativi significati. Per quanto riguarda poi la gestione del lessico, alcuni pannelli permettono la registrazione delle forme e delle accezioni dei lessemi, nonché la formalizzazione delle loro relazioni semantiche; altri pannelli supportano invece la creazione e la descrizione delle voci (piene o di rinvio) secondo il set di informazioni ritenute sensibili per lo studio del vocabolario di Boccaccio. Così, è possibile registrare in quale delle opere boccacciane compaia una voce per la prima volta, il numero delle sue occorrenze nel Decameron e nelle altre opere, la sua etimologia e altri dati notevoli},
KEYWORDS = {Text Annotation, E-Lexicography, Lexical Linking, Computational Lexicons, Linguistic Resources, Linguistic Linked Open Data, OntoLex-Lemon, Maia, VocaBO, Annotazione del testo, lessicografia digitale, lessici computazionali, risorse linguistiche},
URL = {https://iris.cnr.it/handle/20.500.14243/544744},
PUBLISHER = {Pacini Editore (Ospedaletto (Pisa), ITA)},
ISBN = {979-12-5486-582-8},
CONFERENCE_NAME = {Seminario internazionale, XI edizione “Intorno a Boccaccio / Boccaccio e dintorni 2024”},
CONFERENCE_PLACE = {Certaldo Alta},
BOOKTITLE = {Intorno a Boccaccio / Boccaccio e dintorni 2024. Atti del Seminario internazionale di studi (Certaldo Alta, Casa di Giovanni Boccaccio, 18-19 ottobre 2024)},
}
@INPROCEEDINGS{PAPINI_2025_INPROCEEDINGS_PADGM_544703,
AUTHOR = {Papini, M. and Albanesi, D. and Dattilo, D. and Giovannetti, E. and Marchi, S.},
TITLE = {Experiments on the Use of LLMs for the Translation of the Babylonian Talmud},
YEAR = {2025},
ABSTRACT = {In this paper, we present an experiment on the use of Large Language Models (LLMs) in the translation of the Babylonian Talmud into Italian. The experiment focuses on translation and demonstrates how the combined use of LLMs and Translation Memory can improve the quality of suggested translations in a Computer-Assisted Translation context. The initial results highlight both the positive contribution of this hybrid technique and the limitations posed by the nature of complex texts like the Babylonian Talmud, whose translation can only be interpretative},
KEYWORDS = {Babylonian Talmud, Computer Assisted Translation, Large Language Models, Artificial Intelligence, Talmud Babilonese, Traduzione Assistita dal Computer, Modelli di Linguaggio di Grandi Dimensioni, Intelligenza Artificiale},
PAGES = {363-367},
URL = {https://aiucd2025.dlls.univr.it/assets/pdf/papers/58.pdf},
DOI = {10.6092/unibo/amsacta/8380},
ISBN = {978-88-942535-9-7},
CONFERENCE_NAME = {Diversità, Equità e Inclusione: Sfide e Opportunità per l’Informatica Umanistica nell’Era dell’Intelligenza Artificiale. XIV Convegno Annuale AIUCD2025},
BOOKTITLE = {Diversità, Equità e Inclusione: Sfide e Opportunità per l’Informatica Umanistica nell’Era dell’Intelligenza Artificiale, Proceedings del XIV Convegno Annuale AIUCD2025},
}
@INPROCEEDINGS{PAPUCCI_2025_INPROCEEDINGS_PVD_570801,
AUTHOR = {Papucci, M. and Venturi, G. and Dell'Orletta, F.},
TITLE = {Generating and Evaluating Multi-Level Text Simplification: A Case Study on Italian},
YEAR = {2025},
ABSTRACT = {Recent advances in Generative AI and Large Language Models (LLMs) have enabled the creation of highly realistic synthetic content, yet controlling model outputs remains a challenge. In this study, we explore the use of LLMs to generate high-quality synthetic data for Automatic Text Simplification (ATS), evaluating the ability of models fine-tuned on Italian to produce multiple simplified versions of the same original sentence that vary in readability and in their lexical and (morpho-)syntactic characteristics. The approach is tested across two domains, Wikipedia and Public Administration, allowing us to explore domain sensitivity. Additionally, we compare the linguistic phenomena observed in the generated data with those found in ATS resources previously created through manual or semi-automatic methods. Our results suggest that the best-performing LLM can generate linguistically diverse simplifications that align with known simplification patterns, offering a promising direction for building reliable ATS resources, including simplifications suited to varying levels of reader proficiency},
KEYWORDS = {Automatic Text Simplification, Large Language Models, Synthetic Data, Linguistic Complexity, Sentence Readability},
PAGES = {870-885},
URL = {https://aclanthology.org/2025.clicit-1.82/},
PUBLISHER = {CEUR Workshop Proceedings},
ISBN = {979-12-243-0587-3},
CONFERENCE_NAME = {Eleventh Italian Conference on Computational Linguistics (CLiC-it 2025)},
BOOKTITLE = {Proceedings of the Eleventh Italian Conference on Computational Linguistics (CLiC-it 2025)},
}
@INPROCEEDINGS{PEDONESE_2025_INPROCEEDINGS_PFDF_564161,
AUTHOR = {Pedonese, G. and Frontini, F. and Del Fante, D. and Federici, E.},
TITLE = {Adapting UPSKILLS Learning Modules to the University Curricula. Best Practices and Lessons Learnt from the H2IOSC Training Experience at the University of Ferrara},
YEAR = {2025},
ABSTRACT = {This paper details the steps taken to adapt and integrate the training materials developed by CLARIN ERIC in two bachelor’s degree courses and one master’s degree course at the University of Ferrara. The workflow applies the shared methodology developed within the Humanities and Heritage Italian Open Science Cloud project. It modifies the training materials of the UPSKILLS course “Introduction to Language Data: Standards and Repositories” according to the needs of three target courses focusing on English to Italian translation: English Language Course for Tourism, English Language for Translation and English Language and Linguistics for Humanities, Arts and Archaeology. The result of this pilot is a documented example of how CLARIN services can be integrated into university teaching, including initial teacher training, and providing an opportunity to discuss the topic and a use case for trainers who intend to include CLARIN in their courses},
KEYWORDS = {Training, Learning Resources, Language Data, FAIR principles, Research Infrastructures},
PAGES = {37-47},
URL = {https://ecp.ep.liu.se/index.php/clarin/article/view/1236},
DOI = {10.3384/ecp216.04},
PUBLISHER = {Linköping University Electronic press' conference series (SWE)},
ISBN = {978-91-8118-188-3},
CONFERENCE_PLACE = {SWE},
BOOKTITLE = {Selected papers from the CLARIN Annual Conference 2024},
EDITOR = {Vandeghinste, V. and Kontino, T.},
}
@INPROCEEDINGS{PEDONESE_2025_INPROCEEDINGS_PFOBSFSRCSB_552965,
AUTHOR = {Pedonese, G. and Frontini, F. and Ottaviani, R. and Boschetti, F. and Spadi, A. and Francalanci, L. and Scognamiglio, A. and Restaneo, P. and Chaban, A. and Striova, J. and Benassi, L.},
TITLE = {Dai Materiali Didattici alle Piattaforme FAIR: Costruire un’Infrastruttura di Training in H2IOSC},
YEAR = {2025},
ABSTRACT = {Questo contributo si propone di illustrare la progettazione e lo sviluppo di un’infrastruttura di formazione innovativa per le Scienze Umane e Sociali, basata sui principi FAIR e sulla promozione della Scienza Aperta, nell’ambito del progetto Humanities and cultural Heritage Italian Open Science Cloud (H2IOSC). L’obiettivo principale è la creazione di un ecosistema integrato che renda i materiali didattici facilmente reperibili, accessibili, interoperabili e riutilizzabili. A tal fine, sono state implementate due piattaforme: H2IOSC Virtual Environment, dedicata all’erogazione di corsi e risorse per studenti, e H2IOSC Training Library, un deposito per la conservazione e la condivisione di materiali didattici modulari. Entrambe le piattaforme si basano sulla metodologia "FAIR-by-Design" raccomandata dal progetto Skills4EOSC, che struttura il processo educativo in sei fasi, garantendo standard elevati di metadatazione e l’uso di formati aperti. Con l’implementazione di queste piattaforme, i cui servizi saranno resi disponibili a un livello di aggregazione più alto nel Marketplace di H2IOSC, il progetto intende favorire un approccio scalabile e sostenibile alla formazione, promuovendo al contempo la collaborazione tra docenti e studenti},
KEYWORDS = {formazione, gestione dei dati, infrastrutture di ricerca, principi FAIR, Scienza Aperta},
PAGES = {473-477},
URL = {https://iris.cnr.it/handle/20.500.14243/552965},
DOI = {10.6092/unibo/amsacta/8380},
ISBN = {978-88-942535-9-7},
CONFERENCE_NAME = {XIV Convegno Annuale AIUCD 2025},
BOOKTITLE = {Diversità, Equità e Inclusione: Sfide e Opportunità per l’Informatica Umanistica nell’Era dell’Intelligenza Artificiale, Proceedings del XIV Convegno Annuale AIUCD2025},
}
@INPROCEEDINGS{PEDROTTI_2025_INPROCEEDINGS_PPCMPDE_554367,
AUTHOR = {Pedrotti, A. and Papucci, M. and Ciaccio, C. and Miaschi, A. and Puccetti, G. and Dell'Orletta, F. and Esuli, A.},
TITLE = {Stress-testing machine generated text detection: shifting language models writing style to fool detectors},
YEAR = {2025},
ABSTRACT = {Recent advancements in Generative AI and Large Language Models (LLMs) have enabled the creation of highly realistic synthetic content, raising concerns about the potential for malicious use, such as misinformation and manipulation. Moreover, detecting Machine-Generated Text (MGT) remains challenging due to the lack of robust benchmarks that assess generalization to real-world scenarios. In this work, we evaluate the resilience of state-of-the-art MGT detectors (e.g., Mage, Radar, LLM-DetectAIve) to linguistically informed adversarial attacks. We develop a pipeline that fine-tunes language models using Direct Preference Optimization (DPO) to shift the MGT style toward human-written text (HWT), obtaining generations more challenging to detect by current models. Additionally, we analyze the linguistic shifts induced by the alignment and how detectors rely on “linguistic shortcuts” to detect texts. Our results show that detectors can be easily fooled with relatively few examples, resulting in a significant drop in detecting performances. This highlights the importance of improving detection methods and making them robust to unseen in-domain texts. We release code, models, and data to support future research on more robust MGT detection benchmarks},
KEYWORDS = {machine-generated text detection, synthetic content detection},
PAGES = {3010-3031},
URL = {https://aclanthology.org/2025.findings-acl.156/},
DOI = {10.18653/v1/2025.findings-acl.156},
PUBLISHER = {Association for Computational Linguistics},
ISBN = {979-8-89176-256-5},
CONFERENCE_NAME = {ACL 2025-63rd Annual Meeting of the Association for Computational Linguistics. Findings},
BOOKTITLE = {Findings of the Association for Computational Linguistics: ACL 2025},
}
@INPROCEEDINGS{PICCINI_2025_INPROCEEDINGS_PBCD_570921,
AUTHOR = {Piccini, S. and Bellandi, A. and Calvi, S. and Dankova, K.},
TITLE = {Représentation computationnelle des données terminologiques en diachronie: le cas des fibres artificielles},
YEAR = {2025},
ABSTRACT = {L’article porte sur la création d’une base de données diachronique des fibres textiles (FR-IT-EN) selon les principes du web sémantique – un projet né de la collaboration entre l’Istituto di Linguistica Computazionale « Antonio Zampolli » (ILC-CNR) et l’Osservatorio di Terminologie e Politiche Linguistiche (OTPL – Università Cattolica del Sacro Cuore). L’accent est mis sur la représentation formelle des données du sous-domaine des fibres artificielles. Après avoir introduit les caractéristiques spécifiques de ce type de fibres textiles, notamment leur impact sur l’environnement, la nature des données formalisées jusqu’à présent est illustrée. Dans l’étape suivante, les principes du modèle DIATERM, adopté dans ce projet, sont expliqués, suivis d’une description détaillée de la modélisation de la ressource des fibres textiles, qui repose sur deux niveaux d’analyse: linguistique et conceptuel. Enfin, sa capacité à donner des réponses précises à des requêtes formelles est démontrée au moyen d’une série d’interrogations diachroniques},
KEYWORDS = {terminologie diachronique, web sémantique, DIATERM, fibres textiles},
BOOKTITLE = {Proceedings of the TOTh 2024 Conference},
}
@INPROCEEDINGS{PICCINI_2025_INPROCEEDINGS_PJBM_570845,
AUTHOR = {Piccini, S. and Jama, J. M. and Bellandi, A. and Marchi, S.},
TITLE = {A Journey into Somali Culture: The Terminology of the Ugo Ferrandi’s Notebooks},
YEAR = {2025},
ABSTRACT = {The purpose of this contribution is to present the early stages of the construction of a Somali-Italian termino-ontological resource dating back to the time of Italy’s colonialist expansion into Africa. Specifically, terminological data were taken from the notebooks written by the Italian explorer Ugo Ferrandi (1852-1928) and published by the Società Geografica in 1903 under the title “Lugh. Emporio Commerciale sul Giuba”. To build the Ferrandi’s onto-terminological resource the Semantic Web technologies (RDF, OWL, SPARQL) and the Linked Open Data paradigm were adopted to ensure the FAIRness of data and to allow our terminological resource to be published and shared in an open interconnected Web of Data, thus contributing to filling the absence of Somali in the Linguistic Linked Data cloud},
KEYWORDS = {Somali language, computational terminology, Semantic Web},
PAGES = {267-284},
PUBLISHER = {Presses Universitaires Savoie Mont Blanc},
BOOKTITLE = {Proceedings of the TOTh 2023 Conference},
}
@INPROCEEDINGS{PIPERNO_2025_INPROCEEDINGS_PBDPMB_570762,
AUTHOR = {Piperno, R. and Bonfigli, A. and Dell'Orletta, F. and Pecchia, L. and Merone, M. and Bacco, L.},
TITLE = {Doctor, Is That You? Evaluating Large Language Models on Italy’s Medical School Entrance Exams},
YEAR = {2025},
ABSTRACT = {In recent years, Large Language Models (LLMs) have demonstrated remarkable capabilities across a variety of linguistic and cognitive tasks. This study investigates whether such models can succeed in one of Europe’s most selective academic assessments: the Italian medical school entrance exam. We evaluate a wide selection of open-weights LLMs, ranging from natively Italian-pretrained models to multilingual and Italian-specialised variants, on a benchmark dataset comprising over 3,300 real-world exam questions across five knowledge domains. Our experiments systematically explore the impact of language-specific pretraining, model size, prompt formulation and instruction tuning on exam performance. Results show that large multilingual models, particularly the Gemma-2-9B family, consistently outperform all other systems, surpassing the official admission threshold under all prompting settings. In contrast, models trained exclusively on Italian data fail to reach this threshold, even with larger architectures or instruction tuning. Additional analyses reveal that high-performing models display lower positional bias and greater inter-model consistency. These findings suggest that cross-domain reasoning and multilingual pretraining are key to handling multi-disciplinary educational tasks},
KEYWORDS = {Large Language Models (LLMs), Italian Medical Admission Test, NLP in healthcare},
URL = {https://iris.cnr.it/handle/20.500.14243/570762},
BOOKTITLE = {Proceedings of the Eleventh Italian Conference on Computational Linguistics (CLiC-it 2025)},
}
@INPROCEEDINGS{SICHERA_2025_INPROCEEDINGS_SDMS_556607,
AUTHOR = {Sichera, P. and Del Grosso, A. M. and Mazzagufo, L. and Spampinato, D.},
TITLE = {ZoneRW: verso un’integrazione con Kraken ed eScriptorium per il riconoscimento e la gestione avanzata delle regioni di interesse},
YEAR = {2025},
ABSTRACT = {The detection of regions of interest (ROI) in facsimile documents is essential for a proper digitization process and for the study of both manuscript and printed texts. This contribution presents a feature extension of the ZoneRW software (created in the context of the Bellini Digital Correspondence digital scholarly edition), to integrate the Kraken tool, dedicated to automatic zone detection and automatic text recognition, and the eScriptorium digital environment for advanced management of the digitization process from image repositories of textual documents. The proposed workflow uses the XML-PAGE format to ensure interoperability and scalability, while simultaneously allowing regions of interest to be defined, edited, and exported to eScriptorium. In addition, the new ZoneRW capabilities allow image description documents to be linked via IIIF protocol (manifest IIIF). The paper highlights and discusses the differences between XML-PAGE and XML-ALTO formats as well as prospects for future developments of the ZoneRW tool in the Digital Humanities context},
KEYWORDS = {ZoneRW, Kraken, eScriptorium, regions of interest, digitization, regioni di interesse, digitalizzazione},
PAGES = {297-302},
URL = {https://amsacta.unibo.it/id/eprint/8380},
DOI = {10.6092/unibo/amsacta/8380},
ISBN = {978-88-942535-9-7},
CONFERENCE_NAME = {XIV Convegno Annuale AIUCD 2025, Diversità, Equità e Inclusione: Sfide e Opportunità per l’Informatica Umanistica nell’Era dell’Intelligenza Artificiale},
BOOKTITLE = {Diversità, Equità e Inclusione: Sfide e Opportunità per l’Informatica Umanistica nell’Era dell’Intelligenza Artificiale, Proceedings del XIV Convegno Annuale AIUCD2025},
}
@INPROCEEDINGS{SICHERA_2025_INPROCEEDINGS_SMQGFOL_562001,
AUTHOR = {Sichera, P. and Monachini, M. and Quochi, V. and Giampietro, N. and Fabiani, V. and Ottaviani, R. and Luzietti, R. B.},
TITLE = {Synergies between CLARIN-IT and OPERAS-IT within H2IOSC: monitoring communities and orchestrating digital services},
YEAR = {2025},
ABSTRACT = {This paper introduces the Humanities and Cultural Heritage Open Science Cloud (H2IOSC) Marketplace, a digital environment designed for the discovery, access, and integration of diverse digital resources, tools, and services in the fields of Language, Digital Humanities, and Cultural Heritage. The Marketplace is closely integrated with the H2IOSC Observatory—an analytical framework for monitoring the evolving landscape of digital resources—which provides insights into research infrastructure usage, allowing to align service offerings with user needs and expectations. Together, the Marketplace and Observatory promote interoperability and enhance collaboration between the CLARIN-IT and OPERAS-IT infrastructures},
KEYWORDS = {Marketplace, Workflow, Orchestration, Observatory, Osservatorio, Orchestrazione},
PAGES = {26-30},
URL = {https://www.clarin.eu/sites/default/files/CLARIN2025_ConferenceProceedings.pdf#page=35},
DOI = {10.5281/zenodo.17357825},
EDITOR = {Grisot, C. and Kontino, T.},
CONFERENCE_NAME = {CLARIN Annual Conference 2025},
CONFERENCE_PLACE = {Vienna},
BOOKTITLE = {CLARIN Annual Conference Proceedings 2025},
}
@INPROCEEDINGS{SORIA_2025_INPROCEEDINGS_S_571509,
AUTHOR = {Soria, C.},
TITLE = {Understanding the Unheard: Italian Students’ Recognition and Comprehensibility Ratings of English Accents},
YEAR = {2025},
ABSTRACT = {This study examines how Italian secondary school learners perceive and process different English accents, focusing on recognition accuracy and perceived comprehensibility. Students listened to recordings of nine English accents from Kachru’s Inner, Outer, and Expanding Circles and were asked to identify their geographical origin and rate their comprehensibility on a 5-point scale. The study investigates how accurately learners recognize different accents and whether perceived intelligibility correlates with correct identification. Preliminary expectations suggest that more familiar accents, such as British and American English, will be recognized more accurately and rated as more comprehensible, while less familiar varieties may be misidentified and perceived as less intelligible. The findings aim to shed light on sociolinguistic biases, language attitudes, and the impact of limited exposure to diverse Englishes in foreign language learning},
KEYWORDS = {World Englishes, language attitudes, sociolinguistics, accent recognition, accent attribution, perceptual sociophonetics},
DOI = {10.18778/8331-971-1},
ISBN = {978-83-8331-971-1},
CONFERENCE_NAME = {Accents 2025-18th International Conference on Native and Non-native Accents of English},
BOOKTITLE = {Accents 2025-18th International Conference on Native and Non-native Accents of English-Book of Abstracts},
}
@INPROCEEDINGS{SORIA_2025_INPROCEEDINGS_S_571506,
AUTHOR = {Soria, C.},
TITLE = {What Is the ‘Standard’ Accent? Italian Learners’ Views on English Norms and Varieties},
YEAR = {2025},
ABSTRACT = {This study examines how Italian secondary school learners conceptualize a “standard” English accent and the sociolinguistic biases shaping their evaluations. Using survey data, it investigates how students define “standard English,” whether perceptions vary by learner characteristics, and how these perceptions relate to judgments about speech traits (e.g., intelligibility, correctness) and speaker qualities (e.g., competence, friendliness). The study also explores potential preference for familiar “inner-circle” varieties such as British or American English and possible bias against less familiar varieties. The findings aim to reveal underlying language ideologies and contribute to discussions on language attitudes, World Englishes, and more inclusive approaches to English language teaching},
KEYWORDS = {standard English, world english, accents, language attitudes, accent perception, sociolinguistics, sociophonetics, perceptual sociophonetics},
DOI = {10.18778/8331-971-1},
ISBN = {978-83-8331-971-1},
CONFERENCE_NAME = {Accents 2025-18th International Conference on Native and Non-native Accents of English},
BOOKTITLE = {Accents 2025-18th International Conference on Native and Non-native Accents of English-Book of Abstracts},
}
@INPROCEEDINGS{TESTA_2025_INPROCEEDINGS_TBBBLMPM_570743,
AUTHOR = {Testa, D. and Bonetta, G. and Bernardi, R. and Bondielli, A. and Lenci, A. and Miaschi, A. and Passaro, L. and Magnini, B.},
TITLE = {All-in-one: Understanding and Generation in Multimodal Reasoning with the MAIA Benchmark},
YEAR = {2025},
ABSTRACT = {We introduce MAIA (Multimodal AI Assessment), a native-Italian benchmark designed for fine-grained investigation of the reasoning abilities of visual language models on videos. MAIA differs from other available video benchmarks for its design, its reasoning categories, the metric it uses, and the language and culture of the videos. MAIA evaluates Vision Language Models (VLMs) on two aligned tasks: a visual statement verification task, and an open-ended visual question-answering task, both on the same set of video-related questions. It considers twelve reasoning categories that aim to disentangle language and vision relations by highlighting the role of the visual input. Thanks to its carefully taught design, it evaluates VLMs’ consistency and visually grounded natural language comprehension and generation simultaneously through an aggregated metric revealing low results that highlight models’ fragility. Last but not least, the video collection has been carefully selected to reflect the Italian culture, and the language data are produced by native-speakers},
KEYWORDS = {multimodal, vllm, multimodal reasoning},
PAGES = {20030-20050},
URL = {https://iris.cnr.it/handle/20.500.14243/570743},
DOI = {10.18653/v1/2025.findings-emnlp.1091},
BOOKTITLE = {Findings of the Association for Computational Linguistics: EMNLP 2025},
}
@INPROCEEDINGS{TESTA_2025_INPROCEEDINGS_TBBBLMPM_570744,
AUTHOR = {Testa, D. and Bonetta, G. and Bernardi, R. and Bondielli, A. and Lenci, A. and Miaschi, A. and Passaro, L. and Magnini, B.},
TITLE = {MAIA: a Benchmark for Multimodal AI Assessment},
YEAR = {2025},
ABSTRACT = {We introduce MAIA (Multimodal AI Assessment), a multimodal dataset developed as a core component of a competence-oriented benchmark designed for fine-grained investigation of the reasoning abilities of Visual Language Models (VLMs) on videos. The MAIA benchmark is characterized by several distinctive features. To the best of our knowledge, MAIA is the first Italian-native benchmark addressing video understanding: videos were carefully selected to reflect Italian culture, and the language data (i.e., questions and reference answers) were produced by native-Italian speakers. Second, MAIA explicitly includes twelve reasoning categories that are specifically designed to assess the reasoning abilities of VLMs on videos. Third, we structured the dataset to support two aligned tasks (i.e., a statement verification and an open-ended visual question answering) built on the same datapoints, this way allowing to assess VLM coherence across task formats. Finally MAIA integrates, by design, state-of-the-art LLMs in the development process of the benchmark, taking advantage of their linguistic and reasoning capabilities both for data augmentation and for assessing and improving the overall quality of the data. In the paper we focus on the design principles and the data collection methodology, highlighting how MAIA provides a significant advancement with respect to other available dataset for VLM benchmarking. Data available at GitHub},
KEYWORDS = {multimodal, vllm, evaluation},
URL = {https://iris.cnr.it/handle/20.500.14243/570744},
BOOKTITLE = {Proceedings of the Eleventh Italian Conference on Computational Linguistics (CLiC-it 2025)},
}
@INPROCEEDINGS{VANDENHEUVEL_2025_INPROCEEDINGS_VDPFV_571001,
AUTHOR = {Van Den Heuvel, H. and Draxler, C. and Pedonese, G. and Frontini, F. and Van Der Lek, I.},
TITLE = {From Collection to Transcription: A Workflow for Managing Speech Data by the CLARIN Trainers’ Network},
YEAR = {2025},
ABSTRACT = {This proposal shares the experience of members of the CLARIN Trainers’ Network in reusing, adapting and localizing existing learning content related to speech and oral data management to meet the learning needs of the CLARIN-IT research community in the context of the Humanities and Cultural Heritage Italian Open Science Cloud (H2IOSC) project},
KEYWORDS = {training, FAIR data, Speech data, transcription chain},
PAGES = {437-442},
URL = {https://ieeexplore.ieee.org/servlet/opac?punumber=11278902},
DOI = {10.1109/IEEE},
PUBLISHER = {IEEE},
ISBN = {979-8-3315-1435-8},
CONFERENCE_NAME = {IEEE International Conference on Cyber Humanities (IEEE-CH)},
BOOKTITLE = {Proceedings of the 2025 IEEE International Conference on Cyber Humanities (IEEE-CH) 8-10 September, Florence, Italy},
}
@INPROCEEDINGS{ZENZARO_2025_INPROCEEDINGS_ZDBR_571322,
AUTHOR = {Zenzaro, S. and Del Grosso, A. M. and Boschetti, F. and Ranocchia, G.},
TITLE = {Integrity in Digital Scholarly Editing: The GreekSchools Case},
YEAR = {2025},
ABSTRACT = {Textual scholarship aims to reconstruct and publish texts through critical apparatuses. The DSL-based Digital Scholarly Editions (DSE) method merges traditional editing with computational techniques, enhancing workflows and adhering to open science principles. The GreekSchools project exemplifies this approach, and the CoPhiEditor implements it as a software solution},
KEYWORDS = {DSL-based DSE, GreekSchools, Digital Papyrology},
CONFERENCE_NAME = {Building Access and Accessibility, Open Science to all Citizens},
BOOKTITLE = {Building Access and Accessibility, Open Science to all Citizens},
}
@INPROCEEDINGS{ZENZARO_2025_INPROCEEDINGS_ZGLNPTDNL_563623,
AUTHOR = {Zenzaro, S. and Giostrella, C. and Lorenzetti, G. and Nodari, L. and Palleschi, V. and Tomasin, P. and Del Grosso, A. M. and Nahli, O. and Legnaioli, S.},
TITLE = {A multidisciplinary approach to valorising ancient manuscripts},
YEAR = {2025},
ABSTRACT = {This work responds to the objective of recovering, preserving and valorising ancient documents, with particular reference to those in Arabic, both manuscripts and small objects with Arabic inscriptions of significant historical-cultural interest, preserved in libraries and historical archives. The proposed approach aims to scientifically analyse both the form and content of the selected material in order to provide input for its conservation, digitisation, archiving, annotation and large-scale exploitation. To this end, the most advanced diagnostic and digital technologies will be adopted, integrated and tested with the aim of valorising and translating the uniqueness of the material objects into a format suitable for management and manipulation in innovative digital environments, while preserving all their complexity as objects of scientific analysis in the field of historical-cultural studies. The study presented here concerns the preliminary analysis of a copy of sacred texts in Arabic, Ms 566, dating from around the 15th century and currently held at the Biblioteca Nazionale of Pisa. The manuscript was chosen because it is representative of the material typology, state of preservation and content of the ancient manuscript, epigraphic and book heritage of the Arab world},
KEYWORDS = {ancient manuscript, Arabic, spectroscopy, multispectral imaging, computational philology, digital scholarly editions, DSL-based DSE, CoPhiEditor},
URL = {https://ieeexplore.ieee.org/document/11224170},
DOI = {10.1109/CiSt65886.2025.11224170},
ISBN = {979-8-3315-4384-6},
BOOKTITLE = {2025 IEEE 8th Congress on Information Science and Technology (CiSt)},
}
@INPROCEEDINGS{DIDONATO_2025_INPROCEEDINGS_D_554330,
AUTHOR = {Di Donato, F.},
TITLE = {What about research quality? A discussion on qualitative judgement and quantitative criteria in research assessment},
YEAR = {2025},
ABSTRACT = {The reform of research assessment since the San Francisco Declaration on Research Assessment (2012) and the Agreement on Reforming Research Assessment (ARRA) (2022) has focused on the contrast between quantity and quality. The Coalition for Advancing Research Assessment (CoARA) was set up to promote the principles and commitments contained therein. The actions of ARRA signatories are set out in the four core commitments that constitute the heart of the reform and its guiding framework. In particular, the second commitment states to "base research assessment primarily on qualitative evaluation for which peer review is central, supported by the responsible use of quantitative indicators" when meaningful and relevant. The ARRA identifies peer review as "the most robust known method for assessing research quality" and has the advantage of being in the hands of the research community. CoARA and the ARRA thus place qualitative judgement—as opposed to quantitative indicators—at the centre, implying the existence of an opposition between 'quality' and 'quantity'. This calls for a cultural change based on the principle that it is necessary to publish less (abandoning the 'publish or perish' logic) and publish better (making results, data and processes transparent, accessible and reproducible, and paying more attention to the integrity of research). The aim of this change is to produce research that is more robust, more rigorous, more responsible. In short, of higher quality. This approach has been criticised. One criticism, in the many debates following presentations on the reform that I attended, is that quantitative indicators are objective and qualitative judgement is subjective and arbitrary. This paper aims to refute both objections starting from the second. To do this, it draws on the definition of quality—and qualitative—by R. M. Pirsig, who devoted his entire life to defining a Metaphysics of Quality},
KEYWORDS = {Qualitative assessment, Research Evaluation},
PAGES = {4},
URL = {https://vastuullinentiede.fi/sites/default/files/2025-05/RESSH2025_Conference_Book_of_Abstracts.pdf},
DOI = {10.5281/zenodo.15403245},
CONFERENCE_NAME = {RESSH2025-Reforming Research Assessment},
BOOKTITLE = {RESSH2025 Book of Abstracts},
}
@INPROCEEDINGS{MAZZAGUFO_2025_INPROCEEDINGS_MCDDSSS_571342,
AUTHOR = {Mazzagufo, L. and Cristofaro, S. and D'Agata, C. and Del Grosso, A. M. and Sichera, P. and Sichera, A. and Spampinato, D.},
TITLE = {Moving towards a semantic archival edition: the PAVES-e project},
YEAR = {2025},
ABSTRACT = {This paper presents the open-access semantic edition-archive of Cesare Pavese’s literary and documentary heritage, developed within the PAVES-e project. It employs the CHROMA model, incorporating XML-TEI encoding, ontology-driven semantic organization, and interactive visualization tools to facilitate enhanced accessibility and semantic and lexicographic analysis of Pavese’s works},
KEYWORDS = {Pavese, DSU, XML-TEI},
URL = {https://iris.cnr.it/handle/20.500.14243/571342},
CONFERENCE_NAME = {Building Access and Accessibility, Open Science to all Citizens},
BOOKTITLE = {Building Access and Accessibility, Open Science to all Citizens},
}
@INPROCEEDINGS{MERCATANTI_2025_INPROCEEDINGS_MCDR_564801,
AUTHOR = {Mercatanti, E. and Congiu, C. and Del Grosso, A. M. and Riccucci, M.},
TITLE = {Voci dall'Inferno: a Web application to study and analyze the Lager testimonies},
YEAR = {2025},
ABSTRACT = {This contribution presents the ongoing development of the Voci dall'Inferno project. This research initiative aims to create a digital corpus of non-literary testimonies from Lager survivors and analyze it to identify expressions from Dante's Commedia that witnesses use to describe their harrowing experiences},
KEYWORDS = {dante alighieri, XML-TEI, digital archive, Lager, web application},
URL = {https://iris.cnr.it/handle/20.500.14243/564801},
DOI = {10.5281/ZENODO.15947430},
CONFERENCE_NAME = {DH2025-Building Access and Accessibility, Open Science to all Citizens},
CONFERENCE_PLACE = {ITA},
BOOKTITLE = {DH2025-Building Access and Accessibility, Open Science to all Citizens},
}
@INPROCEEDINGS{SICHERA_2025_INPROCEEDINGS_SCDDGMS_559735,
AUTHOR = {Sichera, P. and Cristofaro, S. and D'Agata, C. and Del Grosso, A. M. and Grasso, M. and Mazzagufo, L. and Spampinato, D.},
TITLE = {Streamlining TEI Workflows: Collaborative Editing with NormaTEI},
YEAR = {2025},
ABSTRACT = {In digital philology, the production of scholarly editions is increasingly recognized as a collaborative endeavour, involving multidisciplinary teams and both synchronous and asynchronous workflows. This shift affects not only the publication of individual critical texts but also the construction of large-scale digital archives. While adopting formal protocols like those of the TEI is essential, it alone cannot guarantee consistency and coherence of the outcomes. A robust system is needed to support the entire editorial process, facilitating both the harmonization and quantitative analysis of texts},
KEYWORDS = {Cooperative Digital Scholarly Edition, Harmonization, Encoding, Interoperability, NormaTEI, Digital Humanities},
PAGES = {177--182},
URL = {https://iris.cnr.it/handle/20.500.14243/559735},
DOI = {10.5281/zenodo.17312233},
ISBN = {978-83-977695-0-2},
CONFERENCE_NAME = {"New Territories" TEI 2025},
BOOKTITLE = {"New Territories". Text Encoding Initiative Conference and Members' Meeting 2025. Book of Abstracts},
}
@TECHREPORT{ALBANESI_2025_TECHREPORT_AGMPS_544743,
AUTHOR = {Albanesi, D. and Giovannetti, E. and Marchi, S. and Papini, M. and Sciolette, F.},
TITLE = {Traduco: l'Applicazione Web Linguistico-Computazionale per il Progetto di Traduzione del Talmud Babilonese-Rapporto tecnico 27},
YEAR = {2025},
ABSTRACT = {La presente relazione tecnico-scientifica descrive l’attività svolta da CNR-ILC nel contesto del Progetto Traduzione Talmud Babilonese nel periodo gennaio 2025-maggio 2025. Le principali attività tecniche svolte sul sistema Traduco attualmente in produzione hanno riguardato l’aggiornamento di alcune funzionalità. Sul fronte della ricerca è proseguito il lavoro sulla terminologia talmudica finalizzato all’integrazione delle voci terminologiche con il lessico della lingua italiana. Infine, sono proseguite le attività sperimentali di Intelligenza Artificiale con l’uso dei Large Language Models, in particolare sul fronte del supporto alla traduzione},
KEYWORDS = {Lessici elettronici, rappresentazione della conoscenza, Linguistica Computazionale, traduzione di testi religiosi, traduzione assistita dal calcolatore, Large Language Models, Intelligenza Artificiale},
URL = {https://iris.cnr.it/handle/20.500.14243/544743},
}
@TECHREPORT{BARDI_2025_TECHREPORT_BBDDDFGRMRT_564761,
AUTHOR = {Bardi, A. and Buzzoni, M. and Daquino, M. and Del Gratta, R. and Del Grosso, A. M. and Fischer, F. and Giacomini, S. and Rosselli Del Turco, R. and Martignano, C. and Rubin, G. and Tomasi, F.},
TITLE = {DH ATLAS: White book v1.2},
YEAR = {2025},
ABSTRACT = {The DH ATLAS whitebook presents the ATLAS catalogue and its underlying data model and provides guidelines and best practices for producing "FAIR" (Findable, Accessible, Interoperable, and Reusable) scholarly outputs in Digital Humanities and enhancing Italian digital cultural heritage},
KEYWORDS = {Digital Humanities Data FAIRness},
PAGES = {113},
URL = {https://zenodo.org/records/14925266},
DOI = {10.5281/zenodo.14925266},
}
@TECHREPORT{BENASSI_2025_TECHREPORT_BBCCDDFMOPRSSS_573982,
AUTHOR = {Benassi, L. and Boschetti, F. and Canova, L. and Chaban, A. and Degl'Innocenti, E. and Di Meo, C. and Frontini, F. and Monachini, M. and Ottaviani, R. and Pedonese, G. and Restaneo, P. and Scognamiglio, A. and Spadi, A. and Striova, J.},
TITLE = {H2IOSC-D8.1 Training Strategy},
YEAR = {2025},
ABSTRACT = {In this document we describe the state of the art of the four participating infrastructures in terms of training and define the training strategy of the project H2IOSC in terms of overall vision, and along the following 3 lines: (1) building the H2IOSC training infrastructure with a training portal and a depositing service for training materials (technical and functional requirements are described for both); (2) creating an offer of common H2IOSC training materials, aimed at facilitating the use of the H2IOSC marketplace and pilots; (3) strengthening the disciplinary offer for the four participating infrastructures. This is a living document, evolving during the life of the project with the natural upgrade of the awareness of the needs expressed by the various groups interested (users already in the community and identified potential users)},
KEYWORDS = {Training, Capacity building},
PAGES = {49},
URL = {https://zenodo.org/records/14680109},
DOI = {10.5281/zenodo.14680108},
}
@TECHREPORT{CARDILLO_2025_TECHREPORT_CKS_571029,
AUTHOR = {Cardillo, F. A. and Khyari, H. and Straccia, U.},
TITLE = {MILP-SAT-GNN: yet another neural SAT solver},
YEAR = {2025},
ABSTRACT = {We propose a novel method that enables Graph Neural Networks (GNNs) to solve SAT problems by leveraging a technique developed for applying GNNs to Mixed Integer Linear Programming (MILP). Specifically, k-CNF formulae are mapped into MILP problems, which are then encoded as weighted bipartite graphs and subsequently fed into a GNN for training and testing. From a theoretical perspective: (i) we establish permutation and equivalence invariance results, demonstrating that the method produces outputs that are stable under reordering of clauses and variables; (ii) we identify a theoretical limitation, showing that for a class of formulae called foldable formulae, standard GNNs cannot always distinguish satisfiable from unsatisfiable instances; (iii) we prove a universal approximation theorem, establishing that with Random Node Initialization (RNI), the method can approximate SAT solving to arbitrary precision on finite datasets, that is, the GNN becomes approximately sound and complete on such datasets. Furthermore, we show that for unfoldable formulae, the same approximation guarantee can be achieved without the need for RNI. Finally, we conduct an experimental evaluation of our approach, which shows that, despite the simplicity of the neural architecture, the method achieves promising results},
KEYWORDS = {Computer Science - Learning, Computer Science - Artificial Intelligence},
PAGES = {19},
URL = {http://arxiv.org/abs/2507.01825v1},
DOI = {10.48550/arXiv.2507.01825},
}
@TECHREPORT{GIOVANNETTI_2025_TECHREPORT_GABMP_567709,
AUTHOR = {Giovannetti, E. and Albanesi, D. and Bellandi, A. and Marchi, S. and Papini, M.},
TITLE = {Traduco: l'Applicazione Web Linguistico-Computazionale per il Progetto di Traduzione del Talmud Babilonese-Rapporto tecnico 28},
YEAR = {2025},
ABSTRACT = {La presente relazione tecnico-scientifica descrive l’attività svolta da CNR-ILC nel contesto del Progetto Traduzione Talmud Babilonese nel periodo giugno 2025-ottobre 2025. Le principali attività tecniche svolte sul sistema Traduco attualmente in produzione hanno riguardato l’aggiornamento di alcune funzionalità. Inoltre, è stato sviluppato un sistema per la conversione del contenuto del database di Traduco in un formato conforme al backend “TextO”, sviluppato presso il CNR-ILC. Sul fronte della ricerca si è lavorato all’estensione del lessico computazionale CompL-it della lingua italiana al fine di collegarvi semanticamente la risorsa terminologica del Talmud e consentire così di effettuare ricerche linguistico-semantiche sulla traduzione in italiano},
KEYWORDS = {Lessici elettronici, rappresentazione della conoscenza, Linguistica Computazionale, traduzione di testi religiosi, traduzione assistita dal calcolatore, Large Language Models, Intelligenza Artificiale},
URL = {https://iris.cnr.it/handle/20.500.14243/567709},
}
@TECHREPORT{MALLIA_2025_TECHREPORT_M_543561,
AUTHOR = {Mallia, M.},
TITLE = {Installing and configuring a Proxy with SimpleSAMLphp on ILC4CLARIN Infrastructure for SSO with CLARIN SPF},
YEAR = {2025},
ABSTRACT = {This technical report provides a detailed guide for the installation, configuration, and integration of a Service Provider (SP) to enable federated authentication within the ILC4CLARIN infrastructure. Aimed at technical personnel, the document outlines all necessary steps to connect the SP to the DFN-AAI federation, ensuring secure and reliable access to services through a federated identity model. At the core of the solution is SimpleSAMLphp, an open-source software that supports SAML-based identity federation, operating as both an Identity Provider (IdP) and Service Provider (SP). Its modular architecture allows for seamless integration with research and academic federations such as CLARIN, DFN-AAI, and eduGAIN. The configuration is metadata-driven, facilitating compatibility with a broad range of identity systems. The report also introduces key concepts of federated authentication, where trust relationships between IdPs and SPs allow users to access multiple services using a single set of credentials. Authentication is routed through a discovery service that enables users to select their home institution, improving user experience and security. The work is motivated by the need to integrate CLARIN's Single Sign-On (SSO) system into INCEpTION, a web-based platform for linguistic and semantic annotation developed at Technische Universität Darmstadt. Due to the complexity of direct integration with CLARIN’s discovery interface, a proxy-based authentication architecture was adopted. This approach, supported by Keycloak, consolidates multiple IdPs into a single authentication endpoint, streamlining the user login process while ensuring compatibility with the CLARIN federation. This report focuses on configuring the Service Provider component. A companion document will provide further details on the complete proxy architecture. 
The activity is part of the H2IOSC – Humanities and Heritage Italian Open Science Cloud project, funded under Italy’s National Recovery and Resilience Plan (PNRR). The initiative promotes open science in the humanities by providing federated access to distributed infrastructures and services. Within this framework, CLARIN-IT, the Italian node of the CLARIN ERIC infrastructure, plays a key role in enabling secure, interoperable access to digital linguistic resources for researchers},
KEYWORDS = {single sign on, clarin service provider federation, simplesamlphp, authentication},
URL = {https://zenodo.org/records/15544532},
DOI = {10.5281/zenodo.15544532},
}
@TECHREPORT{MALLIA_2025_TECHREPORT_MGGPE_546041,
AUTHOR = {Mallia, M. and Galanis, D. and Gkoumas, D. and Piperidis, S. and Eckart De Castilho, R.},
TITLE = {Integrating CLARIN SSO Authentication into INCEpTION: A Technical Report},
YEAR = {2025},
ABSTRACT = {This technical report documents the integration of a Single Sign-On (SSO) authentication system within the INCEpTION platform, designed to interoperate with the CLARIN Service Provider Federation. INCEpTION is a semantic annotation and knowledge management tool developed by the Technical University of Darmstadt and hosted within the CLARIN-EL research infrastructure. The report offers a detailed overview of the implementation process, presenting configuration steps, architectural decisions, and protocol-level considerations necessary for enabling secure, federated user access},
KEYWORDS = {Single Sign On, Authentication, Infrastructures},
URL = {https://iris.cnr.it/handle/20.500.14243/546041},
DOI = {10.5281/zenodo.15607127},
}
@TECHREPORT{MONACHINI_2025_TECHREPORT_MQLMCCDSCGM_557398,
AUTHOR = {Monachini, M. and Quochi, V. and Luzietti, R. B. and Moscati, P. and Caravale, A. and Chirivi, A. and Degl'Innocenti, E. and Spadi, A. and Caradonna, M. and Giampietro, N. and Mancuso, G.},
TITLE = {D2.1 Landscaping and building communities},
YEAR = {2025},
ABSTRACT = {The Humanities and Heritage Italian Open Science Cloud (H2IOSC) project involves four Italian nodes of research infrastructures (RIs)-CLARIN, DARIAH, E-RIHS, and OPERAS. Within this project, the second work package focuses on establishing, mapping, and monitoring strategies for assessing the national and international operation contexts for the four RIs, the characteristics of their user communities, and the specific data resources, services, and tools that are most needed, used and newly created. The main objective of this work package is to conduct a comprehensive survey of the landscape of language technologies, humanities, and heritage science in Italy. This survey takes into account existing projects, resources, tools, communities, best practices, and standards that need to be integrated into the national Marketplace as well as the repositories of the four RIs. Collaboration within the work package was directed at structuring shared procedures for developing, managing, and adapting the survey's main objectives. Priority was on identifying and engaging key stakeholders within various communities. The surveying activity was organized around a set of shared activities, in parallel with others conducted by each infrastructure. The initial coordination activity focused on defining dimensions and criteria to guide the survey. It resulted in the creation of a structured questionnaire, which was designed to gather information about user needs, engage with stakeholders, identify communities of reference, evaluate relevant projects, and assess the FAIRness of data. The questionnaire was employed to gather insights on a wide range of topics, including data resources, software, tools, projects, training needs, prior knowledge of RIs, publications, and feedback. Such a questionnaire has been distributed among the relevant disciplinary communities and sub-communities of the four RIs. 
Respondents included students, researchers, professors, and subject matter experts in social science, digital humanities, and cultural heritage research fields. Preliminary results from the control group gave insights into the challenges and opportunities of the survey. Respondents have shared valuable information about data resources, technologies, software, and their training needs. The results highlight the need for clearer communication, dissemination activities, and better engagement strategies to encourage participation from the wider community. Addressing the lack of},
KEYWORDS = {Italian research infrastructures, Digital Humanities, Heritage science, Open Science},
URL = {https://iris.cnr.it/handle/20.500.14243/557398},
DOI = {10.5281/zenodo.14680021},
}
@TECHREPORT{MONACHINI_2025_TECHREPORT_MQLSMDCGCM_572705,
AUTHOR = {Monachini, M. and Quochi, V. and Luzietti, R. B. and Spadi, A. and Mancuso, G. and D'Eredità, A. and Caravale, A. and Giampietro, N. and Caradonna, M. and Melaccio, D.},
TITLE = {D2.2 Updated Report on the H2IOSC Landscapes},
YEAR = {2025},
ABSTRACT = {This deliverable presents the updated results of the Landscaping and Building Communities activities carried out within WP2 of the H2IOSC project. Through a mixed-methods approach—combining questionnaires, interviews, focus groups, and internal and external scouting—the report provides a systematic overview of the research landscape in the Humanities, Linguistics, and Heritage Science domains in Italy. It maps existing digital resources, tools, services, community practices, FAIRness levels, training needs, and infrastructural gaps across the communities served by the four participating Research Infrastructures (CLARIN, DARIAH, E-RIHS, OPERAS). The findings feed directly into key components of the project, including the DHeLO landscaping platform and the H2IOSC Observatory, supporting resource integration, FAIRification, service development, capacity-building, and pilot innovation activities. Overall, the deliverable offers the strategic evidence base necessary for guiding the technical and community-oriented work of subsequent WPs},
KEYWORDS = {H2IOSC, Research Infrastructures},
URL = {https://iris.cnr.it/handle/20.500.14243/572705},
DOI = {10.5281/ZENODO.17737100},
}
@TECHREPORT{OTTAVIANI_2025_TECHREPORT_O_563841,
AUTHOR = {Ottaviani, R.},
TITLE = {Progettazione di un “piano strategico di consolidamento e sviluppo” per l’infrastruttura di ricerca di tipo Data Center realizzata dall’Istituto di Linguistica computazionale “A. Zampolli” di Pisa per il progetto “Humanities and cultural Heritage Italian Open Science Cloud – H2IOSC”},
YEAR = {2025},
ABSTRACT = {Report che ripercorre la strada per l'elaborazione di un “piano strategico di consolidamento e sviluppo” per l’infrastruttura di ricerca creata all'interno del progetto PNRR H2IOSC},
KEYWORDS = {H2IOSC, IR, Piano di sviluppo, Potenziamento Data center},
PAGES = {20},
URL = {https://iris.cnr.it/handle/20.500.14243/563841},
DOI = {10.32079/ISTI-TR-2025/018},
}
@TECHREPORT{PROVOST_2025_TECHREPORT_PDMXR_560076,
AUTHOR = {Provost, L. and Di Donato, F. and Malaguarnera, G. and Xenou, Z. and Reyes Elizondo, A.},
TITLE = {GraspOS Deliverable 6.2: Dissemination, Exploitation, Communication Plan},
YEAR = {2025},
ABSTRACT = {Deliverable 6.2 of the GraspOS project: Dissemination, Exploitation, Communication Plan. This Dissemination, Exploitation, and Communication Plan provides a framework that guides the daily activities within the GraspOS project. It outlines how these activities contribute to the visibility and uptake of project results, and ensures engagement with external stakeholders and ongoing initiatives in Open Science and Responsible Research Assessment. The Plan has guided the daily operations of the project, and is monitored continuously, to support both the current activities of the project and post-project sustainability. The document reports on activities carried out since the start of the project, including the use of digital platforms, events, publications, and community engagement, and assesses their effectiveness through key performance indicators. It also describes updates made to the original plan to optimise outreach and alignment with related initiatives. In addition, the DECP sets out the final exploitation strategy, including the identification of key exploitable results, value propositions, sustainability pathways, and alignment with European Open Science and Responsible Research Assessment initiatives},
KEYWORDS = {GraspOS, Dissemination, Exploitation, Communication Plan},
URL = {https://iris.cnr.it/handle/20.500.14243/560076},
DOI = {10.5281/zenodo.16981002},
}
@TECHREPORT{PROVOST_2025_TECHREPORT_PDRXM_560075,
AUTHOR = {Provost, L. and Di Donato, F. and Reyes Elizondo, A. and Xenou, Z. and Malaguarnera, G.},
TITLE = {GraspOS Deliverable 6.5: Report on C/D/E, community engagement, and training activities},
YEAR = {2025},
ABSTRACT = {Deliverable 6.5 of the GraspOS project: Report on C/D/E, community engagement, and training activities. This report outlines the communication, dissemination, exploitation, community engagement, and training activities undertaken by the GraspOS project up to September 2025 (M33). The document provides an analysis of the project's digital presence, and its stakeholder engagement strategy. It also reports on exploitation of project outputs, and details the work of the GraspOS Community of Practice (CoP) and the content of its training program, which includes both training sessions and webinars. The primary objective of these activities was to support the project's mission of advancing an Open Science-aware Responsible Research Assessment (RRA) system},
KEYWORDS = {GraspOS, Dissemination, communication, community engagement},
URL = {https://iris.cnr.it/handle/20.500.14243/560075},
}
@MISC{CALDONI_2025_MISC_CCFGKMMOPPPPSSST_556501,
AUTHOR = {Caldoni, G. and Coppini, S. and Ferretti, R. and Gualandi, B. and Kis, N. I. and Maltese, V. and Marchegiani, F. and Osmenaj, E. and Paschetta, M. and Pasquale, V. and Pavone, G. and Pedonese, G. and Sacchi, S. and Solieri, A. and Spadi, A. and Tarallo, A.},
TITLE = {Manifesto della Comunità Italiana Data Steward (CIDS)},
YEAR = {2025},
ABSTRACT = {Manifesto della comunità italiana data steward},
KEYWORDS = {CIDS - Comunità Italiana Data Stewards},
PAGES = {3},
URL = {https://zenodo.org/records/15129936},
DOI = {10.5281/zenodo.15129936},
}
@MISC{LAMELI_2025_MISC_LMN_571224,
AUTHOR = {Lameli, A. and Montemagni, S. and Nerbonne, J.},
TITLE = {Dialectal Dynamics},
YEAR = {2025},
ABSTRACT = {The quantitative work in dialectology in the last quarter century enables us to document, analyze and map the distribution of dialectal language variation in unprecedented detail. However, usually we do not know why distributions of variation have taken the form they have. We suspect that progress in this aspect of dialectology is likely to arise in reflection about social and geographical factors together and indeed there is work that points in this direction. The Languages special issue we propose to edit would like to extend and build on this work in two ways. First, we wish to stimulate dialectological theory based on the progress attained in quantitative work. A special focus will therefore be on work that deals with the combination of linguistic and, for example, social, cultural or economic influences in examining the distribution of linguistic variation. Second, we are also excited about the methodologically solid work being done on lesser studied languages and varieties, often in conjunction with language documentation. By encouraging and including research on a broader range of languages and varieties, we hope to avoid the myopia lurking when research is focused too narrowly on well-studied languages and areas},
KEYWORDS = {dialectology, social dialectology, dialectological theory, language documentation},
URL = {https://www.mdpi.com/journal/languages/special_issues/GZUP691XE0#Special_Issue_Information},
VOLUME = {10},
PUBLISHER = {MDPI},
}
@MISC{LAURIA_2025_MISC_LG_546862,
AUTHOR = {Lauria, F. M. and Gebrehiwot, A.},
TITLE = {Assessment Citrix NetScaler ADC sull'infrastruttura dell'Area della Ricerca di Pisa},
YEAR = {2025},
ABSTRACT = {La documentazione riporta l'esito e le procedure relative ad un assessment internamente condotto al fine di identificare la potenziale esposizione verso Internet del software Citrix NetScaler ADC (Application Delivery Controller) dalle infrastrutture di rete degli istituti CNR ubicati presso l'Area della Ricerca di Pisa},
KEYWORDS = {cybersecurity, network security, network assessment},
URL = {https://iris.cnr.it/handle/20.500.14243/546862},
}
@MISC{MAGRINI_2025_MISC_MCDDIMMB_559511,
AUTHOR = {Magrini, M. and Curzio, O. and Dolciotti, C. and Donzelli, G. and Imiotti, M. C. and Minichilli, F. and Moroni, D. and Bongioanni, P.},
TITLE = {Virtual, augmented and mixed reality for motor neurorehabilitation: scoping review focused on the role of body representation},
YEAR = {2025},
ABSTRACT = {Background: In neurorehabilitation, virtual reality (VR) applications cover a wide range of areas, including the rehabilitation of patients with various types of brain and spinal cord injuries. VR provides the subject multisensory feedback, enhancing neuronal plasticity within the sensorimotor cortex. Objective: The systematic review critically analyses the existing literature on VR applications related to motor problems and somatic representation to propose new tools and experiments. Methods: The Protocol was registered in the international database for systematic reviews PROSPERO (ID: 481092-22 November 2023). The review followed the Preferred Reporting Items for Systematic Reviews and Meta-Analyses (PRISMA) Guidelines. To implement the search string, a broad overview of previous literature reviews in the field was developed. The databases PubMed, Embase, Scopus, and Web of Science (7 December 2023) were explored, and data regarding study design, methodology, participant characteristics, specific devices and instruments used and tested, body representation, and virtual somatic embodiment were collected. The Newcastle-Ottawa Scale was used to assess the methodological quality of the studies; for case report studies, a dedicated scale was used. Results: The review included 26 studies, mainly clinical trials on neurological patients. Internationally, VR technologies in the period 2008-2023 have evolved significantly; the emergence of inexpensive devices such as Oculus Rift and HTC Vive has stimulated research in this area. The best results have been achieved for patients with sensorimotor deficits. In VR systems, users experience a first-or third-person view (where their avatar is present) of the synthetic world around them. All included studies used the first-person perspective, which was found to be most effective. 
Five studies incorporated EEG for recording brain responses during experiments, while two studies used transcranial stimulators to enhance the effect of the VR intervention. A couple of studies employed other kinds of devices, such as eye trackers. Regarding the 3D engine used, Unity 3D remains the preferred choice for the development of VR applications in research due to its ease of learning and seamless integration with devices. Conclusions: The review of the selected studies shows that the use of VR devices enhances reinforcement learning, thereby improving motor and cognitive recovery. The emerging operational proposition supports the use of tailor-made techniques in the rehabilitation setting-aimed at improving and evaluating the outcomes of therapeutic interventions in the treatment of neurological patients. Clinical Trial: International database for systematic reviews PROSPERO, ID: 481092-22 November 2023},
KEYWORDS = {Body Representation, Embodiment Cognition, Virtual Reality, Augmented Reality, Neurorehabilitation},
PAGES = {19},
URL = {https://doi.org/10.2196/63487},
VOLUME = {2},
DOI = {10.2196/63487},
ISSN = {2818-3045},
}
@MISC{MANNOCCI_2025_MISC_MDPP_560074,
AUTHOR = {Mannocci, A. and Di Donato, F. and Pecoraro, F. and Provost, L.},
TITLE = {Implementing the Agreement on Reforming Research Assessment in RPOs: Lessons from the CNR Pilot},
YEAR = {2025},
ABSTRACT = {Poster presented at the final conference of the GraspOS project},
KEYWORDS = {Coara, Research assessment, open science},
URL = {https://iris.cnr.it/handle/20.500.14243/560074},
}
@MISC{PAPINI_2025_MISC_PMG_562386,
AUTHOR = {Papini, M. and Marchi, S. and Giovannetti, E.},
TITLE = {LLM and Talmud: an evaluation of early results of assisted translation and question answering},
YEAR = {2025},
ABSTRACT = {In this presentation, we will discuss two experiments applying Large Language Models (LLMs) within the framework of the Translation Project of the Babylonian Talmud into Italian. Two distinct tasks have been identified where large language models can contribute: translation support through suggestions and question answering (QA). For the first task, we applied a methodology inspired by Retrieval-Augmented Generation (RAG) techniques and few-shot prompting, which, by leveraging the translation memory of the “Traduco” CAT system, enabled the LLMs to generate translation suggestions that are linguistically correct and stylistically consistent with what translators have produced so far. For the second task, on the other hand, two prototypes also based on the RAG technique were developed in which the contexts provided to the model came from either the already published text alone or a combination of the published text and its accompanying glossaries. In both prototypes, prompts included instructions for the system to cite the sources used in its responses. Early results are promising. In the first task, our methodology produced a better translation in 79% of cases compared to the text translated directly by the generative model. The remaining 21% highlighted the LLM's inability to produce essential explanatory expansions crucial for understanding the Talmud and characteristic of the edition. The QA task also provided promising feedback, particularly in the indication of sources to support its answers, although it did not show substantial improvements in quality compared to direct queries to the models. These results underscore the need for further investigations to overcome the limitations of LLMs in processing highly complex texts},
KEYWORDS = {LLM, Talmud, question answering, assisted translation, traduzione assistita, RAG},
URL = {https://iris.cnr.it/handle/20.500.14243/562386},
CONFERENCE_NAME = {AI and Digital Humanities – Methodological Approaches, Theories and Methods},
}
@MISC{PEDONESE_2025_MISC_P_561729,
AUTHOR = {Pedonese, G.},
TITLE = {From Collection to Transcription: a Workflow for Managing Speech Data by the CLARIN Trainers' Network},
YEAR = {2025},
ABSTRACT = {This presentation shares the experience of members of the CLARIN Trainers’ Network in reusing, adapting and localising existing learning content related to speech and oral data management to meet the learning needs of the CLARIN-IT research community in the context of the Humanities and Cultural Heritage Italian Open Science Cloud (H2IOSC) project. Following a brief introduction to the H2IOSC project and its training strategy, the article describes the transcription workshop and an accompanying workflow for managing speech and oral data, including data collection, privacy considerations, and the transcription chain. Furthermore, the authors show how they used the Skills4EOSC FAIR-by-Design methodology to convert the workshop into reusable training material, which other trainers can take and adapt to meet the needs of researchers in other communities working with oral history data. Progetto H2IOSC - Humanities and cultural Heritage Italian Open Science Cloud finanziato dall’Unione Europea NextGenerationEU – PNRR M4C2 – Codice progetto IR0000029 – CUP B63C22000730005},
KEYWORDS = {transcription chain, Linguistics},
URL = {https://iris.cnr.it/handle/20.500.14243/561729},
DOI = {10.5281/zenodo.17191109},
CONFERENCE_NAME = {IEEE International Conference on Cyber Humanities (IEEE-CH), Florence, 8-10 September 2025},
}
@MISC{VANDENHEUVEL_2025_MISC_VDFPV_561742,
AUTHOR = {Van Den Heuvel, H. and Draxler, C. and Frontini, F. and Pedonese, G. and Van Der Lek, I.},
TITLE = {Introduzione alla Gestione dei Dati Orali},
YEAR = {2025},
ABSTRACT = {Il corso affronta le tematiche legate alla gestione dei dati linguistici orali. Dopo un'introduzione generale alle possibilità offerte dall'infrastruttura CLARIN ERIC in fase di scoperta, raccolta e deposito di dati orali, si approfondiranno le questioni etico-legali connesse alla raccolta, gestione e conservazione dei dati e il procedimento di trascrizione automatica, con ulteriori possibilità di annotazione attraverso strumenti di trattamento automatico del linguaggio. Il corso è stato sviluppato con la collaborazione dei docenti della CLARIN Trainers' Network nell'ambito della partecipazione di CLARIN-IT al Progetto H2IOSC-Humanities and cultural Heritage Italian Open Science Cloud finanziato dall’Unione Europea NextGenerationEU – PNRR M4C2 – Codice progetto IR0000029 – CUP B63C22000730005. Il materiale si compone di tre unità: Unità 1 - I Dati Linguistici Orali in CLARIN. Questa unità fornisce una panoramica delle risorse e dei servizi offerti dall'Infrastruttura di Ricerca CLARIN ERIC a supporto della scoperta, dell'annotazione e del deposito dei dati linguistici orali in accordo con i principi FAIR e le buone pratiche della Scienza Aperta. Unità 2 - Raccolta e Gestione dei Dati Orali. L'unità propone un'introduzione alle problematiche legate alla gestione dei dati orali dal punto di vista etico e legale. Gli aspetti legati al GDPR e alla normativa italiana di riferimento sono approfonditi in un gioco di ruolo interattivo. Unità 3 - Laboratorio di Trascrizione Automatica. In questa unità interattiva, saranno affrontate le questioni relative ad alcuni strumenti e i software utili per la trascrizione dei dati. Si ringraziano le ricercatrici e i ricercatori impegnate/i nel progetto PRIN Corpus SIM (Senecta Ipsa Morbus)-Spontaneous speech in healthy ageing per aver attivamente partecipato alle sessioni di didattica del 16 e 17 settembre 2024 presso l'Università di Firenze, da cui è stato tratto il materiale del corso},
KEYWORDS = {Dati orali, Archivi orali, Trascrizione automatica},
URL = {https://iris.cnr.it/handle/20.500.14243/561742},
DOI = {10.5281/zenodo.17183051},
}
@ARTICLE{ALZETTA_2024_ARTICLE_A_493660,
AUTHOR = {Alzetta, C.},
TITLE = {Investigating the Interplay between Text Difficulty and Prerequisite Relation Identification in Educational Texts},
YEAR = {2024},
ABSTRACT = {Prerequisite relations (PR) are fundamental in knowledge acquisition and the applications of Artificial Intelligence to distance learning, particularly with regard to personalized learning plans. The role of these relations is to specify the sequence of information acquisition necessary for understanding a target concept. Despite their significance, identifying PRs in educational texts is challenging, mainly due to the lack of systematic procedures for their identification on educational texts. This paper contributes to the ongoing research on PR identification by exploring the relationship between text difficulty, assessed across various linguistic properties and target audiences, and prerequisite relations. We conducted a crowd-based study on the novel task of prerequisite concept ordering. The study yielded preliminary yet valuable insights into the impact of text difficulty on the task. Such evidence sheds light on the need to account for the linguistic properties of texts when identifying PRs, thus advancing the field’s comprehension of PRs within the educational landscape. Ultimately, we hope that this work could foster novel linguistically-aware research on PR},
KEYWORDS = {Prerequisite relations, Text difficulty, Educational texts},
PAGES = {39--64},
URL = {https://journals.openedition.org/ijcol/1362},
VOLUME = {10},
NUMBER = {1},
DOI = {10.4000/125nn},
ISSN = {2499-4553},
JOURNAL = {IJCOL},
}
@ARTICLE{ALZETTA_2024_ARTICLE_AMSV_484441,
AUTHOR = {Alzetta, C. and Montemagni, S. and Sartor, M. and Venturi, G.},
TITLE = {Parlamint-it: an 18-karat {UD} treebank of {Italian} parliamentary speeches},
YEAR = {2024},
ABSTRACT = {The paper presents ParlaMint-It, a new treebank of Italian parliamentary debates, linguistically annotated based on the Universal Dependencies (UD) framework. The resource comprises 20,460 tokens and represents a hybrid language variety that is underrepresented in the UD initiative. ParlaMint-It results from a manual revision process that relies on a semi-automatic methodology able to identify sentences that are most likely to contain inconsistencies and recurrent error patterns generated by the automatic annotation. Such a method made the revision process faster and more efficient than revising the entire treebank. In addition, it allowed the identification and correction of annotation errors resulting from linguistic constructions inconsistently represented in UD treebanks and from characteristics specific to parliamentary speeches. Hence, the treebank is deemed as an 18-karat resource, since, although not fully manually revised, it is a valuable resource for researchers working on Italian language processing tasks},
KEYWORDS = {Universal dependencies treebanks, Annotation revision, Italian parliamentary debates, Linguistic annotation},
PAGES = {25},
URL = {https://link.springer.com/content/pdf/10.1007/s10579-024-09748-6.pdf},
DOI = {10.1007/s10579-024-09748-6},
ISSN = {1574-020X},
JOURNAL = {LANGUAGE RESOURCES AND EVALUATION},
}
@ARTICLE{BELLANDI_2024_ARTICLE_BDPV_505724,
AUTHOR = {Bellandi, A. and Di Nunzio, G. M. and Piccini, S. and Vezzani, F.},
TITLE = {{LemonizeTBX}: Design and Implementation of a New Converter from {TBX} to {OntoLex-Lemon}},
YEAR = {2024},
ABSTRACT = {In this paper, we introduce LemonizeTBX, a converter that enhances interoperability between terminological and lexicographical frameworks, acknowledging their divergent data modelling approaches. First, we present the theoretical implications of a conversion from the TermBase eXchange (TBX) concept-oriented framework to the OntoLex-Lemon sense-centred standpoint within Semantic Web technologies. Then, we illustrate the prototype version of the converter, designed as an interactive tool engaging terminologists in the conversion process},
KEYWORDS = {data serialisation, lexicography, OntoLex-Lemon, TermBase eXchange, terminography},
PAGES = {1--18},
URL = {https://iris.cnr.it/handle/20.500.14243/505724},
VOLUME = {18},
NUMBER = {2},
ISSN = {1938-4122},
JOURNAL = {DIGITAL HUMANITIES QUARTERLY},
}
@ARTICLE{BIFFI_2024_ARTICLE_BGMS_550304,
AUTHOR = {Biffi, M. and Guadagnini, E. and Montemagni, S. and Sassolini, E.},
TITLE = {La stampa periodica citata nel {GDLI}: il rapporto tra voci e indice bibliografico e le prospettive per il dizionario strutturato},
YEAR = {2024},
ABSTRACT = {L’elemento caratterizzante del Grande dizionario della lingua italiana (GDLI) è il ricchissimo apparato degli esempi, allegati per documentare gli impieghi di ogni voce nel corso dei secoli: ne fanno parte anche passi estratti dalla stampa periodica, in una quantità che tende ad aumentare sensibilmente nella seconda metà del vocabolario. Questo contributo si articola in due parti: da un lato, saranno discussi metodi, risultati e prospettive per il collegamento – nella versione informatizzata del GDLI – tra gli esempi citati nelle voci e l’Indice degli autori citati e per il trattamento dei citati non indicizzati; d’altro canto, saranno presentati i primi risultati dell’analisi delle stringhe bibliografiche che occorrono nella sezione degli esempi (che sono state estratte automaticamente dalla prima versione digitale strutturata del dizionario), con riferimento alla stampa periodica},
KEYWORDS = {Lessicografia, Digital Humanities},
PAGES = {267--294},
URL = {https://iris.cnr.it/handle/20.500.14243/550304},
VOLUME = {41},
ISSN = {0392-5218},
JOURNAL = {STUDI DI LESSICOGRAFIA ITALIANA},
}
@ARTICLE{BONFIGLI_2024_ARTICLE_BBMD_518430,
AUTHOR = {Bonfigli, A. and Bacco, L. and Merone, M. and Dell'Orletta, F.},
TITLE = {From pre-training to fine-tuning: An in-depth analysis of Large Language Models in the biomedical domain},
YEAR = {2024},
ABSTRACT = {In this study, we delve into the adaptation and effectiveness of Transformer-based, pre-trained Large Language Models (LLMs) within the biomedical domain, a field that poses unique challenges due to its complexity and the specialized nature of its data. Building on the foundation laid by the transformative architecture of Transformers, we investigate the nuanced dynamics of LLMs through a multifaceted lens, focusing on two domain-specific tasks, i.e., Natural Language Inference (NLI) and Named Entity Recognition (NER). Our objective is to bridge the knowledge gap regarding how these models’ downstream performances correlate with their capacity to encapsulate task-relevant information. To achieve this goal, we probed and analyzed the inner encoding and attention mechanisms in LLMs, both encoder- and decoder-based, tailored for either general or biomedical-specific applications. This examination occurs before and after the models are fine-tuned across various data volumes. Our findings reveal that the models’ downstream effectiveness is intricately linked to specific patterns within their internal mechanisms, shedding light on the nuanced ways in which LLMs process and apply knowledge in the biomedical context. The source code for this paper is available at https://github.com/agnesebonfigli99/LLMs-in-the-Biomedical-Domain},
KEYWORDS = {Biomedical domain, Domain adaptation, Large Language Models},
URL = {https://iris.cnr.it/handle/20.500.14243/518430},
VOLUME = {157},
DOI = {10.1016/j.artmed.2024.103003},
ISSN = {0933-3657},
JOURNAL = {ARTIFICIAL INTELLIGENCE IN MEDICINE},
}
@ARTICLE{CARDILLO_2024_ARTICLE_CDS_476401,
AUTHOR = {Cardillo, F. A. and Debole, F. and Straccia, U.},
TITLE = {{PN-OWL}: a two-stage algorithm to learn fuzzy concept inclusions from {OWL} 2 ontologies},
YEAR = {2024},
ABSTRACT = {Given a target class T of an OWL 2 ontology, positive (and possibly negative) examples of T, we address the problem of learning, viz. inducing, from the examples, fuzzy class inclusion rules that aim to describe conditions for being an individual classified as an instance of the class T. To do so, we present PN-OWL which is a two-stage learning algorithm consisting of a P-stage and an N-stage. In the P-stage, the algorithm learns fuzzy class inclusion rules (the P-rules). These rules aim to cover as many positive examples as possible, increasing recall, without compromising too much precision. In the N-stage, the algorithm learns fuzzy class inclusion rules (the N-rules), that try to rule out as many false positives, covered by the rules learnt at the P-stage, as possible. Roughly, the P-rules tell why an individual should be classified as an instance of T, while the N-rules tell why it should not. PN-OWL then aggregates the P-rules and the N-rules by combining them via an aggregation function to allow for a final decision on whether an individual is an instance of T or not. We also illustrate the effectiveness of PN-OWL through extensive experimentation},
KEYWORDS = {OWL 2 ontologies, Machine learning, Fuzzy logic, Concept/class inclusion rules},
PAGES = {19},
URL = {https://www.sciencedirect.com/science/article/pii/S0165011424001945},
VOLUME = {490},
EID = {109048},
DOI = {10.1016/j.fss.2024.109048},
ISSN = {0165-0114},
JOURNAL = {FUZZY SETS AND SYSTEMS},
}
@ARTICLE{DIDONATO_2024_ARTICLE_D_465464,
AUTHOR = {Di Donato, F.},
TITLE = {What we talk about when we talk about research quality. A discussion on responsible research assessment and Open Science},
YEAR = {2024},
ABSTRACT = {The crisis of the current research assessment system has been at the centre of academic debate for many years but it is only recently that the issue has been brought to the forefront of the agendas of public institutions financing research. In fact, the existing evaluation criteria are believed to place excessive emphasis on quantity and on productivity, leaving aside research quality, collaborative open research methods, and the wider impact of research on society. The article starts from this consideration (section 1) and focuses on the ongoing reform coordinated by the Coalition for Advancing Research Assessment (CoARA), analysing in particular the Agreement on Reforming Research Assessment (ARRA) (section 2), which proposes a vision that relies on qualitative judgement based on peer reviewing, and places research quality at the centre of the reform. The definition of quality which emerges in the ARRA is closely linked to that of Open Science, and in particular that given by the UNESCO recommendation of 2021, to which section 3 is dedicated. Sections 4, 5 and 6 aim to provide the philosophical foundations of the definitions of quality and of Open Science which emerge in the previous sections. In particular, section 4 focuses on the definition of quality starting from the reflection of Robert Maynard Pirsig who, like in the Agreement, identifies quality with a procedural definition, namely the integrity of the scientific method. This connection leads us to the nexus between science and truth, which is addressed in Immanuel Kant's reflection on the purpose of science and on the conditions that make research possible in The Conflict of the Faculties (section 5). The analysis of Kant's considerations leads to defining what the philosopher means by the term Streit (conflict), i.e. a scientific debate between peers, a category that Kant understands in a broad sense. The space for such debate is based on collaboration, which is an essential character of the scientific method itself, as shown in section 6. In the conclusions, the definition of quality and qualitative judgement proposed by the ARRA is analysed again, and an enriched interpretation is proposed},
KEYWORDS = {Coara, Research assessment, open science, Qualitative judgement, Research quality},
PAGES = {35},
URL = {https://commentbfp.sp.unipi.it/quality-fdd/},
DOI = {10.5281/zenodo.10650139},
ISSN = {1591-4305},
JOURNAL = {BOLLETTINO TELEMATICO DI FILOSOFIA POLITICA},
}
@ARTICLE{DIDONATO_2024_ARTICLE_D_516012,
AUTHOR = {Di Donato, F.},
TITLE = {Verso una valutazione qualitativa della ricerca. Principi e modelli},
YEAR = {2024},
ABSTRACT = {Nel quadro della riforma della valutazione promossa dalla Coalition for Advancing Research Assessment (CoARA), il contributo si propone di analizzare alcune iniziative che hanno anticipato e che, allo stesso tempo, rappresentano esempi pratici di traduzione dei principi e degli impegni alla base dell’Agreement on Reforming Research Assessment (ARRA) e di CoARA. In particolare, si prendono in considerazione le esperienze olandese e norvegese, che hanno definito modelli che aspirano a realizzare esercizi di valutazione che conciliano una valutazione qualitativa e responsabile con l’utilizzo di indicatori quantitativi. L’articolo inoltre presenta modelli di curriculum vitae narrativo, un formato che negli ultimi anni è impiegato da un numero crescente di enti valutatori per la valutazione individuale. Nelle conclusioni si discutono brevemente alcune criticità e i possibili sviluppi di tali strumenti},
KEYWORDS = {Coara, riforma della valutazione della ricerca, giudizio qualitativo, curriculum narrativo},
PAGES = {99--124},
URL = {https://iris.cnr.it/handle/20.500.14243/516012},
VOLUME = {2/2024 (95)},
ISSN = {2421-5848},
JOURNAL = {QUADERNI DI SOCIOLOGIA},
}
@ARTICLE{ERJAVEC_2024_ARTICLE_EKLKROOLKMSRAABBBPDDGHIKKLMMNSTTVVWYF_483041,
AUTHOR = {Erjavec, T. and Kopp, M. and Ljubešić, N. and Kuzman, T. and Rayson, P. and Osenova, P. and Ogrodniczuk, M. and Çöltekin, Ç. and Koržinek, D. and Meden, K. and Skubic, J. and Rupnik, P. and Agnoloni, T. and Aires, J. and Barkarson, S. and Bartolini, R. and Bel, N. and Calzada Pérez, M. and Darģis, R. and Diwersy, S. and Gavriilidou, M. and van Heusden, R. and Iruskieta, M. and Kahusk, N. and Kryvenko, A. and Ligeti Nagy, N. and Magariños, C. and Mölder, M. and Navarretta, C. and Simov, K. and Tungland, L. M. and Tuominen, J. and Vidler, J. and Vladu, A. I. and Wissik, T. and Yrjänäinen, V. and Fišer, D.},
TITLE = {{ParlaMint} {II}: Advancing Comparable Parliamentary Corpora Across {Europe}},
YEAR = {2024},
ABSTRACT = {The paper presents the results of the ParlaMint II project, which comprise comparable corpora of parliamentary debates of 29 European countries and autonomous regions, covering at least the period from 2015 to 2022, and containing over 1 billion words. The corpora are uniformly encoded, contain rich metadata about their 24 thousand speakers, and are linguistically annotated up to the level of Universal Dependencies syntax and named entities. The paper focuses on the enhancement made since the ParlaMint I project and presents the compilation of the corpora, including the encoding infrastructure, use of GitHub, the production of individual corpora, the common pipeline for producing their distribution, and use of CLARIN services for dissemination. It then gives a quantitative overview of the produced corpora, followed by the qualitative additions made within the ParlaMint II project, namely metadata localisation, the addition of new metadata, such as the political orientation of political parties, the machine translation of the corpora to English and its tagging with semantic classes, and the production of pilot speech corpora. Finally, outreach activities and further work are discussed},
KEYWORDS = {Parliamentary proceedings, TEI, Comparable corpora},
URL = {https://iris.cnr.it/handle/20.500.14243/483041},
DOI = {10.21203/rs.3.rs-4176128/v1},
ISSN = {1574-020X},
JOURNAL = {LANGUAGE RESOURCES AND EVALUATION},
}
@ARTICLE{GAMBINO_2024_ARTICLE_GBBCCFFFGGPR_520173,
AUTHOR = {Gambino, F. and Beretta, A. and Barillari, S. and Ceresato, F. and Costa, G. and Fassanelli, R. and Favaro, M. and Fois, J. and Guadagnini, E. and Guariglia, F. and Parodi, M. and Rettore, C.},
TITLE = {Il “francese {d’Italia}” e il progetto {FrIngE}. Panoramica generale e casi di studio},
YEAR = {2024},
ABSTRACT = {The contribution presents the first results of the project "FrIngE-The French in/of Italy: Code-MixiNG in Medieval Europe" (2023-2025, PRIN 2022XRFSXR), which aims to create an annotated corpus of French texts written in Italy},
KEYWORDS = {French of Italy, franco-italian, Linguistic Annotation, Pyrrha, Digital Humanities, Francese d’Italia, franco-italiano, annotazione linguistica},
PAGES = {285--340},
URL = {https://www.francigena-unipd.com/index.php/francigena/article/view/100/107},
VOLUME = {10},
ISSN = {2420-9767},
JOURNAL = {FRANCIGENA},
}
@ARTICLE{GIOVANNETTI_2024_ARTICLE_GABMPS_506221,
AUTHOR = {Giovannetti, E. and Albanesi, D. and Bellandi, A. and Marchi, S. and Papini, M. and Sciolette, F.},
TITLE = {Maia: an Open Collaborative Platform for Text Annotation, E-Lexicography, and Lexical Linking},
YEAR = {2024},
ABSTRACT = {Although open tools for manual text annotation and the creation of lexical resources have been available for some years, there is currently no integrated tool that allows, within the same environment, annotating a text corpus, building a computational lexicon, and linking linguistic annotations to lexical elements. For this reason, we have developed Maia, an open and collaborative web tool based on semantic web and linked open data technologies for text annotation, e-lexicography, and lexical linking, primarily designed and developed for use by digital humanists. This article presents the first version of Maia, describing its functionality, and outlining its software architecture and development prospects},
KEYWORDS = {Text Annotation, E-Lexicography, Lexical Linking, Computational Lexicons, Linguistic Resources, Linguistic Linked Open Data, OntoLex-Lemon, Maia, Annotazione del testo, lessicografia digitale, lessici computazionali, risorse linguistiche},
PAGES = {27--52},
URL = {https://umanisticadigitale.unibo.it/article/view/19705},
VOLUME = {18},
ISSN = {2532-8816},
JOURNAL = {UMANISTICA DIGITALE},
}
@ARTICLE{HASENCKER_2024_ARTICLE_HNC_512795,
AUTHOR = {Hasenäcker, J. and Nadalini, A. and Crepaldi, D.},
TITLE = {Sub-word orthographic processing and semantic activation as revealed by {ERPs}},
YEAR = {2024},
ABSTRACT = {The present study investigated ERP signatures of processing sub-word orthography, that is, shorter words embedded within longer words, in a non-priming task that pushes for semantics. Participants performed a semantic categorisation task on pseudosuffixed and nonsuffixed words, like corner and peace, that contained embedded words (corn, pea) either congruent or not with the probe category (e.g. FOOD vs. ANIMAL). While the task required semantic activation of the whole-word, sub-word orthography and semantics were activated. Results indicate stronger negativity from as early as ∼230 ms after word onset when the embedded word did not fit the category, but only for pseudosuffixed words. The observed neural dynamics point to rapid extraction of sub-word orthography and prompt activation of meaning thereupon. We discuss the results with respect to literature on morphological processing, context-dependency of the mechanisms, and interpretations of the N250 and N400 components},
KEYWORDS = {Visual word identification, erp, eeg},
PAGES = {1--13},
URL = {https://www.tandfonline.com/doi/abs/10.1080/23273798.2024.2430275},
DOI = {10.1080/23273798.2024.2430275},
ISSN = {2327-3798},
JOURNAL = {LANGUAGE, COGNITION AND NEUROSCIENCE},
}
@ARTICLE{IAVARONE_2024_ARTICLE_ISBGPVDG_501741,
AUTHOR = {Iavarone, B. and Morelli, M. S. and Brunato, D. and Ghiasi, S. and Scilingo, E. P. and Vanello, N. and Dell'Orletta, F. and Greco, A.},
TITLE = {The linguistic structure of an emotional text influences the sympathetic activity and the speech prosody of the reader},
YEAR = {2024},
ABSTRACT = {In this study, we present an analysis of the relationship between the linguistic profile of a text and the physiological and acoustic characteristics of the reader to improve the emotion recognition systems. To this aim, we recorded the speech and electrodermal activity (EDA) signals from 33 healthy volunteers reading neutral and affective texts aloud. We used the BioVoice toolbox and cvxEDA algorithm to estimate some of the main speech and EDA features, respectively. The selected texts were analyzed to quantify their lexical, morpho-syntactic, and syntactic properties. Correlation and Support Vector Regression analyses between linguistic and speech and EDA features have shown a significant bidirectional association between the morpho-syntactic structure of the text and both sympathetic markers and voice acoustic properties. Specifically, significant relationships were observed between linguistic properties and certain EDA and speech features commonly used to evaluate human emotional state (e.g., edaSymp, mean tonic, F0). These findings suggest that lexical, morpho-syntactic, and syntactic properties may have a significant impact on an individual’s emotional dynamics},
KEYWORDS = {Speech analysis, Linguistic profile, Electrodermal activity, Support Vector Regressor},
PAGES = {8},
URL = {https://iris.cnr.it/handle/20.500.14243/501741},
VOLUME = {89},
DOI = {10.1016/j.bspc.2023.105776},
ISSN = {1746-8108},
JOURNAL = {BIOMEDICAL SIGNAL PROCESSING AND CONTROL (ONLINE)},
}
@ARTICLE{KHAN_2024_ARTICLE_KF_475881,
AUTHOR = {Khan, A. F. and Frontini, F.},
TITLE = {Toward a Representation of Semantic Change in Linked Data},
YEAR = {2024},
ABSTRACT = {In this article, we introduce a new framework, the Intensional–Ontological Model (IOM), for representing meaning, and especially for representing semantic change, in linguistic linked data resources. This framework, which makes use of previous work in the literature on lexical semantics and ontologies, is intended to help clarify what we mean when we model semantic change and to assist in elaborating different ontology patterns for doing so. In this work, we assume a simple architecture, one which is at the basis of the well-known OntoLex-Lemon vocabulary and which consists of one or more lexicons linked to an ontology. Our model, which is based on this architecture and informed by previous work on word senses and ontologies, is intended to provide a clear interpretation for the modelling of both onomasiological and semiasological changes, in both static and dynamic versions. This article describes how the IOM framework represents word meaning as the relationship between a word and an ontological concepts in the ’static’ case, demonstrating that the IOM is compatible with OntoLex-Lemon (while at the same time providing a greater level of detail as to the meaning of the ’sense’ and ’reference’ relationships). It then goes on to detail how the IOM can help us understand how to model semantic shifts in linked data lexical resources with a focus on conceptual change and the addition of temporal information to semantic shift data},
KEYWORDS = {linked data, semantic shift, ontologies, lexical semantics},
URL = {https://iris.cnr.it/handle/20.500.14243/475881},
VOLUME = {9},
NUMBER = {6},
DOI = {10.3390/languages9060215},
ISSN = {2226-471X},
JOURNAL = {LANGUAGES},
}
@ARTICLE{MALLIA_2024_ARTICLE_MBQ_459320,
AUTHOR = {Mallia, M. and Bandini, M. and Quochi, V.},
TITLE = {An interface for linking ancient languages},
YEAR = {2024},
ABSTRACT = {The paper focuses on the linking potentials offered by the EpiLexO web-based front-end for the creation and editing of an ecosystem of digital resources for ancient languages, developed in the context of a project on the languages of fragmentary attestation of ancient Italy. The focus is particularly on mechanisms introduced for linking lexical information to other information bits either internally or externally, e.g. for creating attestations by linking lexical forms to their variants in relevant inscriptions, as well as for linking lexical data to external independent LOD datasets available on a remote endpoint. Finally, in the conclusions, we briefly introduce some future planned or desired enhancements as well as the final platform component, a parallel interface that constitutes the fruition application, which will be open to anyone on the web and will allow for browsing, searching, cross-querying and visualising the created set of interlinked resources},
KEYWORDS = {eLexicography, Ancient languages, Linguistic Linked Open Data, Digital historical linguistics},
PAGES = {175--190},
URL = {https://sciendo.com/it/article/10.2478/cait-2024-0042},
VOLUME = {2024},
NUMBER = {4},
DOI = {10.2478/cait-2024-0042},
ISSN = {1314-4081},
JOURNAL = {CYBERNETICS AND INFORMATION TECHNOLOGIES},
}
@ARTICLE{MANTOVANI_2024_ARTICLE_MPKGCSMCRABMB_514338,
AUTHOR = {Mantovani, S. and Pintus, A. and Kovtun, A. and Gondolini, A. and Casadio, S. and Sanson, A. and Marforio, T. D. and Calvaresi, M. and Rancan, M. and Armelao, L. and Bertuzzi, G. and Melucci, M. and Bandini, M.},
TITLE = {Graphene Oxide-Arginine Composites: Efficient Dual Function Materials for Integrated {CO2} Capture and Conversion},
YEAR = {2024},
ABSTRACT = {The "on-demand" capture and utilization of CO2 is effectively realized with a readily accessible dual function organic composite. The covalent and controlled derivatization of graphene oxide (GO) surface with naturally occurring arginine led to a "smart" material capable of capturing (chemisorption) CO2 from high-purity flue-gas as well as low-concentration streams (i.e. direct air capture) and concomitant chemical activation toward the incorporation into cyclic carbonates. The overall integrated CO2 capture and conversion (ICCC) strategy has been fully elucidated mechanistically via dedicated computational, spectroscopic and thermal analyses},
KEYWORDS = {Carbon dioxide, Carbon-capture-conversion, Computational study, Graphene oxide, Spectroscopic investigation},
URL = {https://iris.cnr.it/handle/20.500.14243/514338},
VOLUME = {17},
NUMBER = {5},
DOI = {10.1002/cssc.202301673},
ISSN = {1864-564X},
JOURNAL = {CHEMSUSCHEM},
}
@ARTICLE{MARTELLI_2024_ARTICLE_MGPNSBEBTBPVDR_557121,
AUTHOR = {Martelli, G. and Gentilini, M. and Piperno, C. and Namdari, H. and Saponaro, D. and Bruck, E. and Elzir, I. and Bruni, L. and Trapanese, L. and Buscemi, R. and Picciano, G. and Vogelmann, S. and D'Esposito, F. and Rau, A.},
TITLE = {I fondamentalismi tra teologia e ideologismi},
YEAR = {2024},
ABSTRACT = {Articolo dedicato alla dimensione religiosa dei fondamentalismi all'interno del numero monografico dedicato al fenomeno dalla rivista Erre della Fondazione Rut},
KEYWORDS = {Fondamentalismi, Estremismo religioso},
PAGES = {8--14},
URL = {https://fondazionerut.org/wp-content/uploads/2024/05/ERRE-Numero1.pdf},
VOLUME = {1},
JOURNAL = {Erre},
}
@ARTICLE{MAZZAGUFO_2024_ARTICLE_MSSD_511742,
AUTHOR = {Mazzagufo, L. and Sichera, P. and Spampinato, D. and Del Grosso, A. M.},
TITLE = {Letters and Musical Sketches. Toward a Proper Integration of {Bellini’s} Writings},
YEAR = {2024},
ABSTRACT = {This article examines the use of XML-based technologies to encode verbal and musical texts in two publishing products featuring autograph material by Vincenzo Bellini (1801–1835), held at the Museo civico Belliniano in Catania, Italy. The first product is a digital scholarly edition (DSE) of Bellini’s autograph letters, encoded using the XML-TEI vocabulary. The second project involves the encoding of Bellini’s musical sketches, which often complement the letters by providing concrete examples of his compositional techniques. An experimental approach using the Music Encoding Initiative (MEI) vocabulary was adopted for these sketches: this encoding process required custom solutions to address the texts’ unique features, such as authorial interventions, the sketches’ embryonic nature, the copresence of musical notation and textual annotations, and the interrelations of different studies. This article therefore examines formal representational strategies and challenges encountered during the encoding process, particularly for musical texts, and presents an initial proposal aimed at properly integrating information from the TEI-encoded verbal texts and MEI-encoded musical texts, using an approach modeled after the Web Annotation Data Model (WADM) and its current implementation in TEI. We believe that the integration of these practices, technologies, and data is a means to unravel Bellini’s compositional process and his artistic sensibility, thereby enhancing both scholarly research and public engagement with his work},
KEYWORDS = {XML-MEI, encoding integration, Bellini Digital Correspondence, Digital scholarly edition, Vincenzo Bellini, musical sketches},
URL = {https://journals.openedition.org/jtei/5300},
VOLUME = {18},
DOI = {10.4000/12na6},
ISSN = {2162-5603},
JOURNAL = {JOURNAL OF THE TEXT ENCODING INITIATIVE},
}
@ARTICLE{PICCINI_2024_ARTICLE_PSV_532161,
AUTHOR = {Piccini, S. and Saponaro, D. and Vilela Ruiz, G. E.},
TITLE = {La connotation logique en terminologie. Le mariage dans {l’Israël} antique comme étude de cas},
YEAR = {2024},
ABSTRACT = {Cette étude vise à esquisser une réflexion sur la connotation logique en terminologie. En particulier, en utilisant un exemple issu de la langue hébraïque et portant sur la notion de mariage, elle met en avant l’importance de distinguer la connotation logique du concept et le sens du terme, tout en illustrant la pertinence de concevoir la connotation du concept comme une catégorisation fluide, structurée selon le principe wittgensteinien de l’air de famille},
KEYWORDS = {connotation logique, analyse sémique, concept polythétique, air de famille, mariage},
PAGES = {103--129},
URL = {https://iris.cnr.it/handle/20.500.14243/532161},
VOLUME = {125},
NUMBER = {2},
DOI = {10.48611/isbn.978-2-406-17959-7.p.0103},
ISSN = {0007-9871},
JOURNAL = {CAHIERS DE LEXICOLOGIE},
}
@ARTICLE{RUBEHN_2024_ARTICLE_RMJ_500421,
AUTHOR = {Rubehn, A. and Montemagni, S. and Nerbonne, J.},
TITLE = {Extracting {Tuscan} phonetic correspondences from dialect pronunciations automatically},
YEAR = {2024},
ABSTRACT = {We present a novel approach to identifying individual pairs of phonetic correspondences in a dataset of dialect pronunciations. This continues work identifying shibboleths (i.e., characteristic features of a given dialect), a category that has interested dialectology and that dialectometrical research has examined mostly in the form of categorical data or entire phonetic transcriptions. This article reaches into segmental sequences (phonetic transcriptions) to identify individual phonetic correspondences. We follow earlier work in examining how distinctive and how representative a given phonetic correspondence is for a selected group of varieties. We proceed from string alignments, and innovate in characterizing the important notions via information theory. Despite minor problems, the method improves on the generality of competing approaches and can be shown to be useful in detecting characteristic phonetic correspondences in Tuscan varieties. We argue that this facilitates deeper investigation into the relation between aggregating approaches to dialectology and approaches proceeding from features},
KEYWORDS = {sound correspondence, dialectology, information theory, alignment, Tuscan dialects},
PAGES = {1--33},
URL = {https://brill.com/view/journals/ldc/14/1/article-p1_1.xml?ebody=abstract/excerpt},
VOLUME = {14},
NUMBER = {1},
DOI = {10.1163/22105832-bja10034},
ISSN = {2210-5824},
JOURNAL = {LANGUAGE DYNAMICS AND CHANGE (PRINT)},
}
@ARTICLE{SCIOLETTE_2024_ARTICLE_SBGM_519970,
AUTHOR = {Sciolette, F. and Bellandi, A. and Giovannetti, E. and Marchi, S.},
TITLE = {CompL-it: a Computational Lexicon of Italian Language},
YEAR = {2024},
ABSTRACT = {This paper describes CompL-it, a new open computational lexicon for contemporary Italian. The resource was constructed from three sources: an already available Italian lexicon, a lemmatized list of inflected forms obtained from a morphological analyzer, and a set of treebanks. Integrating these resources required a standardisation process in accordance with the standards of the Linguistic Linked Open Data community, which was necessary for the subsequent conversion into the OntoLex-Lemon model. The resulting computational lexicon comprises approximately 100,000 lexical entries, 790,000 forms, 57,000 senses, and 86,000 semantic relations. The lexicon, thanks to its rich and articulated linguistic structure, can be used, as shown, to enhance information retrieval in the context of full-text search tasks},
KEYWORDS = {Computational Lexicon, Linguistic Resources, Linguistic Linked Open Data, OntoLex-Lemon, Information Retrieval},
PAGES = {119-148},
URL = {https://www.aidainformazioni.it/index.php/aidainformazioni/article/view/315},
VOLUME = {42},
NUMBER = {3-4},
ISSN = {1121-0095},
JOURNAL = {AIDA INFORMAZIONI},
}
@ARTICLE{SPAMPINATO_2024_ARTICLE_SCCDMS_558622,
  AUTHOR   = {Spampinato, D. and Capizzi, E. and Cristofaro, S. and Del Grosso, A. M. and Mazzagufo, L. and Sichera, P.},
  TITLE    = {Oltre la carta. Un modello di edizione digitale delle lettere di Vincenzo Bellini},
  JOURNAL  = {BOLLETTINO DI STUDI BELLINIANI},
  YEAR     = {2024},
  ISSN     = {2283-8716},
  DOI      = {10.17422/ISSN.2283-8716/1073},
  URL      = {https://www.bollettinostudibelliniani.eu/oltre-la-carta-un-modello-di-edizione-digitale-delle-lettere-di-vincenzo-bellini/},
  KEYWORDS = {Digital Scholarly Editing, XML-TEI, ZoneRW, NormaTEI, lettere autografe, Museo civico Belliniano},
  ABSTRACT = {The adoption of digital technologies in philology and the humanities has transformed editorial and textual analysis practices, fostering new methodological perspectives. In this context, Bellini Digital Correspondence (BDC) presents a model of digital scholarly edition applied to the autograph letters of Vincenzo Bellini, preserved at the Museo civico Belliniano in Catania. By integrating innovative computational tools – some developed specifically for this edition – BDC provides enhanced access to primary sources, facilitating their interdisciplinary study and analysis. The project is based on a collaborative and distributed approach, adhering to interoperability standards to ensure that the edition is fully open source and open access. This not only enables its reuse in similar contexts but also encourages further methodological reflections on digital scholarly editing},
}
@ARTICLE{ZENZARO_2024_ARTICLE_Z_475305,
AUTHOR = {Zenzaro, S.},
TITLE = {Models for Digital Humanities Tools: Coping with Technological Changes and Obsolescence},
YEAR = {2024},
ABSTRACT = {This article highlights the importance of defining models and using modular software for digital humanities tools. We emphasize the need for these tools to adapt to the rapidly changing technology landscape, which has led to many tools having short lifespans. We propose an approach to address software obsolescence by using modular models. This involves designing tools to be easily integrated, scalable, and adaptable to changing technology and user requirements. To illustrate the usefulness of models, we present their application to a real-world use case: the CoPhi Editor web platform},
KEYWORDS = {digital humanities, models, modularity, tools, obsolescence},
PAGES = {1-10},
URL = {https://iris.cnr.it/handle/20.500.14243/475305},
VOLUME = {8},
NUMBER = {2},
DOI = {10.57675/imist.prsm/ijist-v8i2.283},
ISSN = {2550-5114},
JOURNAL = {INTERNATIONAL JOURNAL OF INFORMATION SCIENCE AND TECHNOLOGY},
}
@BOOK{ALZETTA_2024_BOOK_A_493657,
  AUTHOR           = {Alzetta, C.},
  TITLE            = {Unlocking Knowledge in the Digital Age. A Guide to Modelling Propaedeutic Relations in Educational Texts},
  PUBLISHER        = {Edizioni ETS (Pisa, ITA)},
  CONFERENCE_PLACE = {Pisa},
  YEAR             = {2024},
  ISBN             = {9788846769237},
  URL              = {https://iris.cnr.it/handle/20.500.14243/493657},
  KEYWORDS         = {Prerequisite relations, Annotation, Modelling Framework, Educational application},
  ABSTRACT         = {This volume, intended for educational researchers and practitioners, discusses the pivotal role of prerequisite relations between educational contents in shaping learning paths and offers tools for exploring and analyzing teaching materials. It demonstrates how uncovering the structured representation of educational text content fosters its dynamic and adaptive navigation, all while tackling the complexities of identifying prerequisite relations within such texts. Through a multidisciplinary methodology integrating corpus annotation, knowledge modelling, and deep textual analysis, the volume illustrates the interplay between form and content in textual materials, underscoring the importance of employing level-appropriate language for fostering effective learning. The efficacy of this approach is demonstrated through case studies on content modelling and textbook exploration that illustrate its potential to enhance teaching and learning across diverse domains},
}
@BOOK{BIORCI_2024_BOOK_BMR_512958,
  AUTHOR           = {Biorci, G. and Marconi, L. and Ratti, D.},
  TITLE            = {Dizionario dei sinonimi e dei contrari. Compatto Sinonimi},
  PUBLISHER        = {Zanichelli editore (Bologna, ITA)},
  CONFERENCE_PLACE = {Bologna},
  YEAR             = {2024},
  PAGES            = {1-624},
  ISBN             = {9788808420848},
  URL              = {https://iris.cnr.it/handle/20.500.14243/512958},
  KEYWORDS         = {dizionario, sinonimi, contrari},
  ABSTRACT         = {Nuova edizione del Dizionario dei sinonimi con l'aggiunta di circa trecento neologismi},
}
@BOOK{DUVAL_2024_BOOK_DG_451672,
AUTHOR = {Duval, F. and Guadagnini, E.},
TITLE = {Le théâtre antique au Moyen Âge. Étude des mots et des concepts dans les textes en français et en italien},
YEAR = {2024},
ABSTRACT = {Longtemps s'est imposée l'idée d'une redécouverte tardive du théâtre antique après la longue parenthèse du Moyen Âge. Dans ce domaine, comme pour tant d'autres, l'« âge moyen » aurait représenté une coupure nette entre l'Antiquité, où le théâtre était une institution sociale répandue, et la Renaissance, qui aurait renoué avec les codes et pratiques antiques. Pour faire pièce à cette historiographie de la rupture, Frédéric Duval et Elisa Guadagnini ont recueilli et étudié les traces laissées par le théâtre antique dans l'encyclopédie et les langues vernaculaires du Moyen Âge. Le présent livre s'intéresse à l'histoire des langues et à l'histoire des idées, aux mots autant qu'aux concepts. Les auteurs partent toutefois de la représentation lexicale du théâtre antique. Sous cet angle, la documentation vernaculaire présente des avantages par rapport à la documentation latine. L'analyse porte à la fois sur la mise en place d'un lexique théâtral référant à l'Antiquité et sur le processus de conceptualisation du « théâtre antique » en France et en Italie entre le XIIe et le XVe siècle},
KEYWORDS = {Teatro, Linguistica romanza, Eredità dei classici, Letteratura medievale},
PAGES = {1-670},
URL = {https://iris.cnr.it/handle/20.500.14243/451672},
VOLUME = {CCLXXIV},
PUBLISHER = {Droz (Genève, CHE)},
ISBN = {978-2-600-06468-2},
CONFERENCE_PLACE = {Genève},
}
@INCOLLECTION{BURGASSI_2024_INCOLLECTION_BV_474454,
AUTHOR = {Burgassi, C. and Vaccaro, G.},
TITLE = {Aspetti linguistici intorno al caso Moro},
YEAR = {2024},
PAGES = {185-194},
URL = {https://www.francocesatieditore.com/catalogo/anni-settanta-la-grande-narrazione/},
PUBLISHER = {Franco Cesati (Firenze, ITA)},
ISBN = {979-12-5496-167-4},
CONFERENCE_PLACE = {Firenze},
BOOKTITLE = {Anni Settanta: la grande narrazione},
}
@INCOLLECTION{CHIARCOS_2024_INCOLLECTION_CIAGKKT_530981,
AUTHOR = {Chiarcos, C. and Ionov, M. and Apostol, E. S. and Gkirtzou, K. and Kabashi, B. and Khan, A. F. A. and Truică, C. O.},
TITLE = {Multiword expressions, collocations and the OntoLex vocabulary},
YEAR = {2024},
ABSTRACT = {We describe challenges in and approaches for modelling multiword expressions in machine-readable dictionaries. OntoLex is a widely used community standard for lexical resources on the web, and the predominant RDF vocabulary for the purpose. The current challenge is for OntoLex users to figure out the correct modelling strategy, as different use cases require the application of different OntoLex modules. This chapter serves as an orientation point for researchers and practitioners, and for a number of real-world use cases it will describe modelling strategies and compare their advantages and disadvantages},
KEYWORDS = {ontolex, linked data, multiword expressions},
URL = {https://iris.cnr.it/handle/20.500.14243/530981},
DOI = {10.5281/zenodo.10949960},
ISBN = {978-3-98554-099-0},
BOOKTITLE = {Multiword expressions in lexical resources: Linguistic, lexicographic, and computational perspectives},
}
@INCOLLECTION{CLRICE_2024_INCOLLECTION_CPVCCLBBFGBMGOHKVK_506902,
AUTHOR = {Clérice, T. and Pinche, A. and Vlachou Efstathiou, M. and Chagué, A. and Camps, J. B. and Levenson, M. G. and Brisville Fertin, O. and Boschetti, F. and Fischer, F. and Gervers, M. and Boutreux, A. and Manton, A. and Gabay, S. and O'Connor, P. and Haverals, W. and Kestemont, M. and Vandyck, C. and Kiessling, B.},
TITLE = {CATMuS Medieval: A Multilingual Large-Scale Cross-Century Dataset in Latin Script for Handwritten Text Recognition and Beyond},
YEAR = {2024},
ABSTRACT = {The surge in digitisation initiatives by Cultural Heritage institutions has facilitated online accessibility to numerous historical manuscripts. However, a substantial portion of these documents exists solely as images, lacking machine-readable text. Handwritten Text Recognition (HTR) has emerged as a crucial tool for converting these images into machine-readable formats, enabling researchers and scholars to analyse vast collections efficiently. Despite significant technological progress, establishing consistent ground truth across projects for HTR tasks, particularly for complex and heterogeneous historical sources like medieval manuscripts in Latin scripts (8th-15th century CE), remains nonetheless challenging},
KEYWORDS = {historical source, medieval manuscript, Latin script, benchmarking dataset, multilingual, handwritten text recognition},
PAGES = {174-194},
URL = {https://link.springer.com/book/10.1007/978-3-031-70543-4},
VOLUME = {14806},
SERIES = {Lecture Notes in Computer Science},
DOI = {10.1007/978-3-031-70543-4_11},
PUBLISHER = {Springer},
ISBN = {9783031705427},
BOOKTITLE = {Document Analysis and Recognition – ICDAR 2024},
}
@INCOLLECTION{FRONTINI_2024_INCOLLECTION_FRS_475984,
AUTHOR = {Frontini, F. and Roth Boll, A. and Seguin, M. S.},
TITLE = {Cartographie d’une aventure. Approche numérique du Journal d’un voyage fait aux Indes orientales de Robert Challe},
YEAR = {2024},
ABSTRACT = {L’article propose d’étudier le Journal d’un voyage de Robert Challe grâce aux outils des humanités numériques. Nous avons reconstitué la cartographie de l’aventure challienne et comparé les trajets ainsi restitués avec leur exploitation viatique. La rencontre des espaces réellement visités avec leur représentation textuelle fait ainsi émerger l’existence d’une forme de géographie mémorielle, affective et poétique, indispensable au travail littéraire de Robert Challe},
KEYWORDS = {Contextualisation, humanités numériques, identification, localisation, marquage, méthodologie, observation, référencement, spatialisation, technologie},
URL = {https://iris.cnr.it/handle/20.500.14243/475984},
DOI = {10.48611/isbn.978-2-406-16757-0.p.0247},
PUBLISHER = {Classiques Garnier},
ISBN = {978-2-406-16757-0},
BOOKTITLE = {Robert Challe et l’aventure},
}
@INCOLLECTION{PROIETTI_2024_INCOLLECTION_PT_582402,
AUTHOR = {Proietti, C. and Taticchi, C.},
TITLE = {Preface},
YEAR = {2024},
ABSTRACT = {This volume contains the papers presented at the 8th Workshop on Advances in Argumentation in Artificial Intelligence (AI3 2024), held in Bolzano, Italy, on November 28th 2024. AI3 2024 was the 8th edition of the Workshop on Advances in Argumentation in Artificial Intelligence series, a venue that provides opportunities for stakeholders from academia and industry to present their recent work in argumentation theory. The goal of the workshop is to stimulate discussions and promote scientific collaboration among researchers in computational argumentation and related fields, including nonmonotonic reasoning, logic programming, linguistics, natural language processing, philosophy and psychology, just to mention a few},
KEYWORDS = {abstract argumentation, formal argumentation, computational models of argument},
PAGES = {1-3},
URL = {https://ceur-ws.org/Vol-3871/},
VOLUME = {3871},
PUBLISHER = {CEUR-WS},
BOOKTITLE = {{AI$^3$} 2024 Advances in Argumentation in Artificial Intelligence 2024},
EDITOR = {Proietti, C. and Taticchi, C.},
}
@EDITORIAL{BOSCHETTI_2024_EDITORIAL_BLMN_506904,
  AUTHOR    = {Boschetti, F. and Lebani, G. E. and Magnini, B. and Novielli, N.},
  TITLE     = {Proceedings of the 9th Italian Conference on Computational Linguistics CLiC-it 2023 (Venezia, 30 novembre-2 dicembre 2023)},
  PUBLISHER = {Lexis Compagnia Editoriale in Torino srl},
  YEAR      = {2024},
  ISBN      = {9791255000846},
  URL       = {https://iris.cnr.it/handle/20.500.14243/506904},
  KEYWORDS  = {Computational Linguistics},
  ABSTRACT  = {The ninth edition of the Italian Conference on Computational Linguistics (CLiC-it 2023) was held from 30th November to 2nd December 2023 at Ca’ Foscari University of Venice, in the beautiful venue of the Auditorium Santa Margherita-Emanuele Severino. After the edition of 2020, which was organized in fully virtual mode due to the health emergency related to Covid-19, and CLiC-it 2021, which was held in hybrid mode, with CLiC-it 2023 we are back to a fully in-presence conference. Overall, almost 210 participants registered to the conference, confirming that the community is eager to meet in person and to enjoy both the scientific and social events together with the colleagues},
}
@EDITORIAL{MELERO_2024_EDITORIAL_MSS_520373,
  AUTHOR           = {Melero, M. and Sakti, S. and Soria, C.},
  TITLE            = {Proceedings of the 3rd Annual Meeting of the Special Interest Group on Under-resourced Languages @ LREC-COLING 2024},
  PUBLISHER        = {ELRA and ICCL (Paris, FRA)},
  CONFERENCE_PLACE = {Paris},
  YEAR             = {2024},
  ISBN             = {978-2-493814-29-6},
  URL              = {https://aclanthology.org/2024.sigul-1.0},
  KEYWORDS         = {under resourced languages, Linguistic diversity, Natural language processing},
  ABSTRACT         = {The Proceedings of the 3rd Annual Meeting of the Special Interest Group on Under-resourced Languages (SIGUL2024) at LREC-COLING 2024 serve as a testament to the growing awareness and commitment within the research community to address the challenges faced by these languages. This workshop aims at providing a platform for researchers, practitioners, and stakeholders to come together, share insights, and collaborate on innovative solutions to empower technological uptake for all languages equally},
}
@EDITORIAL{PROIETTI_2024_EDITORIAL_PT_530204,
AUTHOR = {Proietti, C. and Taticchi, C.},
TITLE = {Proceedings of the 8th Workshop on Advances in Argumentation in Artificial Intelligence 2024 co-located with the 23rd International Conference of the Italian Association for Artificial Intelligence (AIxIA 2024), Bozen, Italy, November 28, 2024},
YEAR = {2024},
ABSTRACT = {This volume contains the papers presented at the 8th Workshop on Advances in Argumentation in Artificial Intelligence (AI3 2024), held in Bolzano, Italy, on November 28th 2024. AI3 2024 was the 8th edition of the Workshop on Advances in Argumentation in Artificial Intelligence series, a venue that provides opportunities for stakeholders from academia and industry to present their recent work in argumentation theory. The goal of the workshop is to stimulate discussions and promote scientific collaboration among researchers in computational argumentation and related fields, including nonmonotonic reasoning, logic programming, linguistics, natural language processing, philosophy and psychology, just to mention a few. The workshop was co-located with the 23rd International Conference of the Italian Association for Artificial Intelligence, the yearly AI conference of researchers, students, and industry professionals dealing with various aspects of AI in Italy. AIxIA 2024 took place in Bolzano, from 25 to 29 November 2024. AI3 2024 was held in presence. We received 10 submissions out of which 5 papers were accepted as regular papers, and 4 as short papers and/or extended abstracts of project presentation. AI3 2024 offered an interesting and diverse program, which in addition to the technical papers, included an invited talk by Marco Guerini (FBK, Trento) on “NLP for CounterSpeech-Trends and Open Challenges”. We are very grateful to the Program Committee for their invaluable efforts in providing helpful and informative reviews for all submissions in a timely fashion. Finally, special thanks go to Gianvincenzo Alfano (University of Calabria) and Stefano Ferilli (University of Bari) for their support during the organisation of the event, and to the General and Local Chairs of AIxIA 2024, for their engagement in the local organisation and constant support during the co-location},
KEYWORDS = {Argumentation, Artificial Intelligence},
URL = {https://iris.cnr.it/handle/20.500.14243/530204},
VOLUME = {3871},
}
@INPROCEEDINGS{BANDINI_2024_INPROCEEDINGS_BQ_526227,
AUTHOR = {Bandini, M. and Quochi, V.},
TITLE = {Representing texts as LOD: a Systematic Literature Review},
YEAR = {2024},
ABSTRACT = {Despite the growing interest in publishing linguistic data as Linked Open Data, the publishing of ancient language corpora for the Semantic Web is still challenging. This contribution describes a systematic literature review on the representation of corpus data as Linguistic Linked Open Data, focusing especially on models and (data) granularity. Our goal is to gain insights into the advantages and disadvantages of the different approaches. Here we present our systematic review methodology and some initial results},
KEYWORDS = {Linked Open Data, Text corpora, ancient languages, systematic literature review},
PAGES = {455-461},
URL = {https://amsacta.unibo.it/id/eprint/7927/},
ISBN = {978-88-942535-8-0},
CONFERENCE_NAME = {Me.Te. Digitali. Mediterraneo in rete tra testi e contesti. XIII Convegno Annuale AIUCD2024},
BOOKTITLE = {Me.Te. Digitali. Mediterraneo in rete tra testi e contesti, Proceedings del XIII Convegno Annuale AIUCD2024},
}
@INPROCEEDINGS{BARONI_2024_INPROCEEDINGS_BBFFFFGPPRSTV_530552,
AUTHOR = {Baroni, P. and Bistarelli, S. and Fazzinga, B. and Fellin, G. and Flesca, S. and Furfaro, F. and Giacomin, M. and Parisi, F. and Proietti, C. and Russo, I. and Santini, F. and Taticchi, C. and Vernillo, P.},
TITLE = {Empowering Public Interest Communication with Argumentation – Project Overview (Extended Abstract)},
YEAR = {2024},
ABSTRACT = {The EPICA (Empowering Public Interest Communication with Argumentation) project aims to improve Public Interest Communication (PIC) through the use of advanced Computational Argumentation (CA) techniques. The project’s activities include exploring the potential of CA to address specific PIC needs, developing formal models for effective communication, and applying them to real case studies for validation. It also focuses on developing reasoning algorithms and innovative tools to support PIC strategies, enable the dissemination and practical application of the results, and improve institutional communication practices to address critical societal challenges},
KEYWORDS = {Argumentation, Artificial Intelligence, public interest communication},
PAGES = {1-3},
URL = {https://ceur-ws.org/Vol-3871/paper9.pdf},
VOLUME = {3871},
CONFERENCE_NAME = {23rd International Conference of the Italian Association for Artificial Intelligence (AIxIA 2024), Bozen, Italy, November 28, 2024},
BOOKTITLE = {Proceedings of the 8th Workshop on Advances in Argumentation in Artificial Intelligence 2024 co-located with the 23rd International Conference of the Italian Association for Artificial Intelligence (AIxIA 2024), Bozen, Italy, November 28, 2024},
}
@INPROCEEDINGS{BARONI_2024_INPROCEEDINGS_BFGP_530191,
  AUTHOR          = {Baroni, P. and Fellin, G. and Giacomin, M. and Proietti, C.},
  TITLE           = {A Vector-Based Extension of Value-Based Argumentation for Public Interest Communication},
  BOOKTITLE       = {Proceedings of the 8th Workshop on Advances in Argumentation in Artificial Intelligence 2024 co-located with the 23rd International Conference of the Italian Association for Artificial Intelligence (AIxIA 2024), Bozen, Italy, November 28, 2024},
  CONFERENCE_NAME = {23rd International Conference of the Italian Association for Artificial Intelligence (AIxIA 2024), Bozen, Italy, November 28, 2024},
  YEAR            = {2024},
  VOLUME          = {3871},
  PAGES           = {1-13},
  URL             = {https://iris.cnr.it/handle/20.500.14243/530191},
  KEYWORDS        = {Abstract Argumentation, Public Interest Communication, Value-based Argumentation},
  ABSTRACT        = {In this paper, we propose a mathematical model to quantify and analyse the impact of public interest communication on target audiences. Building on Bench-Capon’s value-based approach, our model introduces the concept of value vectors to represent a multi-dimensional spectrum of values influencing audience perception and response. By employing vectors, we aim to capture the nuanced interplay between diverse values and the effectiveness of communication strategies},
}
@INPROCEEDINGS{BOSCHETTI_2024_INPROCEEDINGS_BCKP_506921,
  AUTHOR           = {Boschetti, F. and Chilla, L. and Konstantinidou, M. and Pavlopoulos, J.},
  TITLE            = {Annotating Homeric Emotions by a Domain-Specific Language},
  BOOKTITLE        = {Proceedings of the 9th Italian Conference on Computational Linguistics-Venice, Italy, November 30-December 2, 2023},
  CONFERENCE_NAME  = {9th Italian Conference on Computational Linguistics (CLiC-it2023)},
  CONFERENCE_PLACE = {Torino},
  PUBLISHER        = {Lexis Compagnia Editoriale in Torino srl (Torino, ITA)},
  YEAR             = {2024},
  PAGES            = {489-493},
  ISBN             = {9791255000846},
  URL              = {https://www.aaccademia.it/ita/titolo?ref=1685},
  KEYWORDS         = {sentiment analysis, digital philology, collaborative annotation, domain-specific languages},
  ABSTRACT         = {In this study, we introduce a novel approach to understanding the emotive content present in ancient literature, specifically focusing on the first Book of Homer’s Iliad. Recognizing the challenges inherent in interpreting emotions from ancient texts, we developed a Domain-Specific Language (DSL) tailored for this purpose. This DSL not only allows for the annotation of basic sentiments such as positive, negative, neutral, or mixed but also facilitates the identification and categorization of specific emotions. To ensure the relevance and applicability of our annotations, we mapped the extracted emotions to some authoritative domain ontologies. This mapping process aids in bridging the gap between ancient emotional expressions and contemporary understanding. Our preliminary results, which we discuss in detail, highlight the potential of our approach in offering deeper insights into the emotional landscape of ancient texts. We believe that our methodology can serve as a foundation for future studies aiming to decode emotions in historical literature},
}
@INPROCEEDINGS{BOSCHETTI_2024_INPROCEEDINGS_BRQ_507141,
  AUTHOR          = {Boschetti, F. and Rigobianco, L. and Quochi, V.},
  TITLE           = {Domain-Specific Languages for Epigraphy: The Case of ItAnt},
  BOOKTITLE       = {Selected papers from the CLARIN Annual Conference 2023},
  CONFERENCE_NAME = {CLARIN Annual Conference 2023},
  YEAR            = {2024},
  VOLUME          = {210},
  PAGES           = {191-202},
  ISBN            = {978-91-8075-740-9},
  DOI             = {10.3384/ecp210007},
  URL             = {https://ecp.ep.liu.se/index.php/clarin/article/view/1023},
  KEYWORDS        = {Domain Specific Languages, Ancient Languages, Digital Scholarly Editions, Digital Humanities, Text Representation, TEI EpiDoc},
  ABSTRACT        = {This contribution illustrates how the definition of a Domain-Specific Language can support the activity of epigraphists and historical linguists. It presents and discusses a method and technological solution, based on Domain Specific Languages, for facilitating scholars in digitally representing the available knowledge of archaic languages and cultures, by increasing the human readability of the encoded data without sacrificing the compliance to standard models and formats. Such a work is framed in the context of an Italian National collaborative research project devoted to the study of the languages and cultures of ancient Italy, witnessed by a digital collection of inscriptions. The platform developed within this project offers an interesting use case and motivation for experimenting with DSLs for the creation of the needed digital critical editions. After explaining the DSL grammar definition process, we finally, test the applicability of the DSL grammar to 5 example inscriptions in the Faliscan language},
}
@INPROCEEDINGS{CARDILLO_2024_INPROCEEDINGS_CD_505144,
  AUTHOR          = {Cardillo, F. A. and Debole, F.},
  TITLE           = {Italian word embeddings for the medical domain},
  BOOKTITLE       = {Proceedings of the LREC-COLING 2024},
  CONFERENCE_NAME = {LREC-COLING 2024-24th Joint International Conference on Computational Linguistics, Language Resources and Evaluation},
  YEAR            = {2024},
  PAGES           = {9434-9440},
  ISBN            = {978-2-493814-10-4},
  URL             = {https://aclanthology.org/2024.lrec-main.824},
  KEYWORDS        = {NLP, Distributed Representations},
  ABSTRACT        = {Neural word embeddings have proven valuable in the development of medical applications. However, for the Italian language, there are no publicly available corpora, embeddings, or evaluation resources tailored to this domain. In this paper, we introduce an Italian corpus for the medical domain, that includes texts from Wikipedia, medical journals, drug leaflets, and specialized websites. Using this corpus, we generate neural word embeddings from scratch. These embeddings are then evaluated using standard evaluation resources, that we translated into Italian exploiting the concept graph in the UMLS Metathesaurus. Despite the relatively small size of the corpus, our experimental results indicate that the new embeddings correlate well with human judgments regarding the similarity and the relatedness of medical concepts. Moreover, these medical-specific embeddings outperform a baseline model trained on the full Wikipedia corpus, which includes the medical pages we used. We believe that our embeddings and the newly introduced textual resources will foster further advancements in the field of Italian medical Natural Language Processing},
}
@INPROCEEDINGS{DAGATA_2024_INPROCEEDINGS_DDNPSS_518968,
AUTHOR = {D'Agata, C. and Del Grosso, A. M. and Nay, L. and Palazzolo, G. and Sichera, A. and Spampinato, D.},
TITLE = {PAVES-e: Per una Hyperedizione dell’opera di Cesare Pavese},
YEAR = {2024},
ABSTRACT = {L’articolo presenta il progetto PAVES-e, finanziato con i fondi PRIN 2022, che intende creare un’edizione-archivio semantica open access, definita Hyperedizione, dell’opera di Cesare Pavese. Essa permetterà a un vasto pubblico di fruire dell’opera pavesiana attraverso un portale nel quale poter consultare le edizioni scientifiche digitali delle poesie e dei romanzi mettendole in relazione con collegamenti semantici all’epistolario e al diario (Mestiere di vivere), fruendo inoltre dei manoscritti, dei vocabolari d’autore e del commento multimediale. Il contributo, dopo aver presentato il progetto (distinguendo analiticamente tutte le sue fasi: DigitalPavese, OntoPavese, PaveseInImmagini, PaveseInTesto, PaveseInParole, AnnotaPavese, BiblioPavese), si sofferma in particolare su PaveseInTesto, discutendo alcune scelte di codifica e di modellizzazione delle edizioni, con alcune proposte sul workflow, sugli editor scelti e sulla interfaccia di visualizzazione},
KEYWORDS = {Edizioni scientifiche digitali semantiche, codifica XML TEI, archivi digitali d’autore, lessicografia, filologia computazionale},
PAGES = {6},
URL = {https://iris.cnr.it/handle/20.500.14243/518968},
ISBN = {9788894253580},
CONFERENCE_NAME = {AIUCD 2024 Me.Te. Digitali. Mediterraneo in rete tra testi e contesti},
BOOKTITLE = {AIUCD 2024 Me.Te. Digitali. Mediterraneo in rete tra testi e contesti, Proceedings},
}
@INPROCEEDINGS{DAQUINO_2024_INPROCEEDINGS_DBBDDFTR_532579,
AUTHOR = {Daquino, M. and Bardi, A. and Buzzoni, M. and Del Gratta, R. and Del Grosso, A. M. and Fischer, F. and Tomasi, F. and Rosselli Del Turco, R.},
TITLE = {The ATLAS: a knowledge graph of digital scholarly research on Italian Cultural Heritage},
YEAR = {2024},
ABSTRACT = {ATLAS is a research initiative that aims to improve the FAIRness and exploitation of Digital Humanities (DH) projects and scholarly data about Italian Cultural Heritage (CH). This contribution describes the main challenges and opportunities of DH projects related to discoverability, interoperability, and preservation. It also explains the methodology and objectives of ATLAS, which involves the integration and reengineering of metadata from selected sources and software solutions (referred to as pilots within the ATLAS context) into a knowledge graph using Semantic Web and Natural Language Processing technologies. The expected outcomes and impacts of ATLAS, are (i) the definition of guidelines and best practices for DH projects; (ii) the creation of a reference set of excellence initiatives; (iii) the reconciliation of data with authority records and open data sources; (iv) the publication and preservation of the knowledge graph; and (v) the development of a platform for exploration and discovery of DH projects and resources, in synergy with the European Research Infrastructures CLARIN and OpenAIRE},
KEYWORDS = {Knowledge graph, Ontologies, Italian Cultural Heritage},
PAGES = {588-592},
URL = {https://amsacta.unibo.it/id/eprint/7927/},
ISBN = {978-88-942535-8-0},
CONFERENCE_NAME = {AIUCD2024-Me.Te. Digitali. Mediterraneo in rete tra testi e contesti},
BOOKTITLE = {Me.Te. Digitali. Mediterraneo in rete tra testi e contesti. Atti del XIII Convegno Annuale AIUCD2024},
EDITOR = {Di Silvestro, A. and Spampinato, D.},
}
@INPROCEEDINGS{DELGROSSO_2024_INPROCEEDINGS_DRM_504941,
AUTHOR = {Del Grosso, A. M. and Riccucci, M. and Mercatanti, E.},
TITLE = {The Impact of Digital Editing on the Study of {Holocaust} Survivors’ Testimonies in the context of {Voci dall’Inferno} Project},
YEAR = {2024},
ABSTRACT = {In Nazi concentration camps, approximately 20 million people perished. This included young and old, men and women, Jews, dissidents, and homosexuals. Only 10% of those deported survived. This paper introduces “Voci dall’Inferno” project, which aims to achieve two key objectives: a) Create a comprehensive digital archive: by encoding a corpus of non-literary testimonies including both written and oral sources. b) Analyze the use of Dante’s language: by identifying the presence of Dante’s lexicon and allusions. Currently, the project holds 47 testimonies, with 29 transcribed in full text and 18 encoded using the XML-TEI format. This project is propelled by a multidisciplinary and educational context with experts in humanities and computer science. The project’s findings will be disseminated through a user-friendly web application built on an XML foundation. Though currently in its prototyping phase, the application boasts several features, including a search engine for testimonies, terms, or phrases within the corpus. Additionally, a browsing interface allows users to read and listen the original testimonies, while a visualization tool enables deeper exploration of the corpus’s content. Adhering to the Text Encoding Initiative (TEI) guidelines, the project ensures a structured digital archive, aligned with the FAIR principles for data accessibility and reusability},
KEYWORDS = {XML-TEI, Holocaust Testimonies, Digital Archives},
PAGES = {1--9},
URL = {https://aclanthology.org/2024.htres-1.1},
PUBLISHER = {ELRA and ICCL (Torino, ITA)},
ISBN = {978-2-493814-18-0},
CONFERENCE_NAME = {First Workshop on Holocaust Testimonies as Language Resources},
CONFERENCE_PLACE = {Torino},
BOOKTITLE = {Proceedings of the First Workshop on Holocaust Testimonies as Language Resources (HTRes) @ LREC-COLING 2024},
EDITOR = {Anuradha, I. and Wynne, M. and Frontini, F. and Plum, A.},
}
@INPROCEEDINGS{FERRO_2024_INPROCEEDINGS_FMNTLP_501843,
AUTHOR = {Ferro, M. and Marzi, C. and Nadalini, A. and Taxitari, L. and Lento, A. and Pirrelli, V.},
TITLE = {{ReadLet}: a Dataset for Oral, Visual and Tactile Text Reading Data of Early and Mature Readers},
YEAR = {2024},
ABSTRACT = {The paper presents the design and construction of a time-stamped multimodal dataset for reading research, including multiple time-aligned temporal signals elicited with four experimental trials of connected text reading by both child and adult readers. We present the experimental protocols, as well as the data acquisition process and the post-processing phase of data annotation/augmentation. To evaluate the potential and usefulness of a time-aligned multimodal dataset for reading research, we present a few statistical analyses showing the correlation and complementarity of multimodal time-series of reading data, as well as some results of modelling adults’ reading data by integrating different modalities. The total dataset size amounts to about 2.5 GByte in compressed format and is available through the CLARIN infrastructure},
KEYWORDS = {text reading, eye movements, finger movements, eye-finger span, synchronisation, parallel processing, multimodality},
PAGES = {13595--13609},
URL = {https://aclanthology.org/volumes/2024.lrec-main/},
PUBLISHER = {European Language Resources Association (ELRA) (Parigi, FRA)},
ISBN = {978-2-493814-10-4},
CONFERENCE_NAME = {2024 Joint International Conference on Computational Linguistics, Language Resources and Evaluation (LREC-COLING 2024)},
CONFERENCE_PLACE = {Torino},
BOOKTITLE = {Proceedings of the 2024 Joint International Conference on Computational Linguistics, Language Resources and Evaluation (LREC-COLING 2024)},
}
@INPROCEEDINGS{GROMANN_2024_INPROCEEDINGS_GGPABBCCFGGGKKLLPORRSSSSSSSTVZZ_475921,
AUTHOR = {Gromann, D. and Goncalo Oliveira, H. and Pitarch, L. and Apostol, E. S. and Bernad, J. and Bytyçi, E. and Cantone, C. and Carvalho, S. and Frontini, F. and Garabik, R. and Gracia, J. and Granata, L. and Khan, F. and Knez, T. and Labropoulou, P. and Liebeskind, C. and Di Buono, M. P. and Ostroški Anić, A. and Rackevičienė, S. and Rodrigues, R. and Sérasset, G. and Selmistraitis, L. and Sidibé, M. and Silvano, P. and Spahiu, B. and Sogutlu, E. and Stanković, R. and Truică, C. O. and Valunaite Oleskeviciene, G. and Zitnik, S. and Zdravkova, K.},
TITLE = {{MultiLexBATS}: Multilingual Dataset of Lexical Semantic Relations},
YEAR = {2024},
ABSTRACT = {Understanding the relation between the meanings of words is an important part of comprehending natural language. Prior work has either focused on analysing lexical semantic relations in word embeddings or probing pretrained language models (PLMs), with some exceptions. Given the rarity of highly multilingual benchmarks, it is unclear to what extent PLMs capture relational knowledge and are able to transfer it across languages. To start addressing this question, we propose MultiLexBATS, a multilingual parallel dataset of lexical semantic relations adapted from BATS in 15 languages including low-resource languages, such as Bambara, Lithuanian, and Albanian. As experiment on cross-lingual transfer of relational knowledge, we test the PLMs' ability to (1) capture analogies across languages, and (2) predict translation targets. We find considerable differences across relation types and languages with a clear preference for hypernymy and antonymy as well as romance languages},
KEYWORDS = {Lexical Semantic Relations, Multilingual Benchmark, BATS},
PAGES = {11783--11793},
URL = {https://aclanthology.org/2024.lrec-main.1029},
PUBLISHER = {ELRA and ICCL},
BOOKTITLE = {Proceedings of the 2024 Joint International Conference on Computational Linguistics, Language Resources and Evaluation (LREC-COLING 2024)},
}
@INPROCEEDINGS{KHAN_2024_INPROCEEDINGS_KSACLMORF_475941,
AUTHOR = {Khan, F. and Salgado, A. and Anuradha, I. and Costa, R. and Liyanage, C. and McCrae, J. P. and Ojha, A. K. and Rani, P. and Frontini, F.},
TITLE = {{CHAMUÇA}: Towards a Linked Data Language Resource of {Portuguese} Borrowings in {Asian} Languages},
YEAR = {2024},
ABSTRACT = {This paper presents the development of CHAMUÇA, a novel lexical resource designed to document the influence of the Portuguese language on various Asian languages, with an initial focus on the languages of South Asia. Through the utilization of linked open data and the OntoLex vocabulary, CHAMUÇA offers structured insights into the linguistic characteristics, and cultural ramifications of Portuguese borrowings across multiple languages. The article outlines CHAMUÇA’s potential contributions to the linguistic linked data community, emphasising its role in addressing the scarcity of resources for lesser-resourced languages and serving as a test case for organising etymological data in a queryable format. CHAMUÇA emerges as an initiative towards the comprehensive catalogization and analysis of Portuguese borrowings, offering valuable insights into language contact dynamics, historical evolution, and cultural exchange in Asia, one that is based on linked data technology},
KEYWORDS = {Portuguese, OntoLex, language contact, lexicon},
URL = {https://aclanthology.org/2024.ldl-1.6},
PUBLISHER = {ELRA and ICCL (Torino, Italia)},
CONFERENCE_PLACE = {Torino, Italia},
BOOKTITLE = {Proceedings of the 9th Workshop on Linked Data in Linguistics @ LREC-COLING 2024},
}
@INPROCEEDINGS{LENTO_2024_INPROCEEDINGS_LNFMPDKSTK_513008,
AUTHOR = {Lento, A. and Nadalini, A. and Ferro, M. and Marzi, C. and Pirrelli, V. and Dimitrova, T. and Kukova, H. and Stefanova, V. and Todorova, M. and Koeva, S.},
TITLE = {Assessing Reading Literacy of {Bulgarian} Pupils with Finger-tracking},
YEAR = {2024},
ABSTRACT = {The paper reports on the first steps in developing a time-stamped multimodal dataset of reading data by Bulgarian children. Data are being collected, structured and analysed by means of ReadLet, an innovative infrastructure for multimodal language data collection that uses a tablet as a reader’s front-end. The overall goal of the project is to quantitatively analyse the reading skills of a sample of early Bulgarian readers collected over a two-year period, and compare them with the reading data of early readers of Italian, collected using the same protocol. We illustrate design issues of the experimental protocol, as well as the data acquisition process and the post-processing phase of data annotation/augmentation. To evaluate the potential and usefulness of the Bulgarian dataset for reading research, we present some preliminary statistical analyses of our recently collected data. They show robust convergence trends between Bulgarian and Italian early reading development stages},
KEYWORDS = {Finger Tracking, Reading, Learning, Text Comprehension},
PAGES = {140--149},
URL = {https://dcl.bas.bg/clib/proceedings/},
CONFERENCE_NAME = {Sixth International Conference on Computational Linguistics in Bulgaria (CLIB 2024)},
CONFERENCE_PLACE = {BGR},
BOOKTITLE = {Proceedings of the Sixth International Conference on Computational Linguistics in Bulgaria (CLIB 2024)},
}
@COMMENT{Review note for LENTO_2024_INPROCEEDINGS_LNKPMF_519724: PAGES holds a single number (10), which looks like a page count rather than a page range. TODO confirm the real range against the CEUR volume listed in URL.}
@INPROCEEDINGS{LENTO_2024_INPROCEEDINGS_LNKPMF_519724,
AUTHOR = {Lento, A. and Nadalini, A. and Khlif, N. and Pirrelli, V. and Marzi, C. and Ferro, M.},
TITLE = {Comparative Evaluation of Computational Models Predicting Eye Fixation Patterns During Reading: Insights from Transformers and Simpler Architectures},
YEAR = {2024},
ABSTRACT = {Eye tracking records of natural text reading are known to provide significant insights into the cognitive processes underlying word processing and text comprehension, with gaze patterns, such as fixation duration and saccadic movements, being modulated by morphological, lexical, and higher-level structural properties of the text being read. Although some of these effects have been simulated with computational models, it is still not clear how accurately computational modelling can predict complex fixation patterns in connected text reading. State-of-the-art neural architectures have shown promising results, with pre-trained transformer-based classifiers having recently been claimed to outperform other competitors, achieving beyond 95% accuracy. However, transformer-based models have neither been compared with alternative architectures nor adequately evaluated for their sensitivity to the linguistic factors affecting human reading. Here we address these issues by evaluating the performance of a pool of neural networks in classifying eye-fixation English data as a function of both lexical and contextual factors. We show that i) accuracy of transformer-based models has largely been overestimated, ii) other simpler models make comparable or even better predictions, iii) most models are sensitive to some of the major lexical factors accounting for at least 50% of human fixation variance, iv) most models fail to capture some significant context-sensitive interactions, such as those accounting for spillover effects in reading. The work shows the benefits of combining accuracy-based evaluation metrics with non-linear regression modelling of fixed and random effects on both real and simulated eye-tracking data},
KEYWORDS = {eye-tracking, eye fixation time prediction, neural network, contextual word embeddings, lexical features},
PAGES = {10},
URL = {https://ceur-ws.org/Vol-3878/},
VOLUME = {3878},
SERIES = {CEUR Workshop Proceedings},
PUBLISHER = {CEUR (Aachen, DEU)},
ISBN = {979-12-210-7060-6},
CONFERENCE_NAME = {Italian Conference on Computational Linguistics (CLiC-it)},
CONFERENCE_PLACE = {Pisa},
BOOKTITLE = {Proceedings of the Tenth Italian Conference on Computational Linguistics (CLiC-it 2024)},
}
@comment{Review note for LUZIETTI_2024_INPROCEEDINGS_LCCDGMMQSMD_523843: the pages field holds a single number (5), which looks like a page count rather than a page range. TODO confirm against the proceedings volume.}
@inproceedings{LUZIETTI_2024_INPROCEEDINGS_LCCDGMMQSMD_523843,
  author          = {Luzietti, R. B. and Caradonna, M. and Caravale, A. and D'Eredita, A. and Giampietro, N. and Mancuso, G. and Moscati, P. and Quochi, V. and Spadi, A. and Monachini, M. and Degl'Innocenti, E.},
  title           = {Digital Humanities and Heritage Science: moving from landscaping to a dynamic research observatory in an Open Science Cloud},
  booktitle       = {Me. Te. Digitali. Mediterraneo in rete tra testi e contesti, Proceedings del XIII Convegno Annuale AIUCD2024},
  year            = {2024},
  pages           = {5},
  doi             = {10.6092/unibo/amsacta/7927},
  url             = {https://amsacta.unibo.it/id/eprint/7927/},
  isbn            = {978-88-942535-8-0},
  conference_name = {Me. Te. Digitali. Mediterraneo in rete tra testi e contesti. XIII Convegno Annuale AIUCD2024},
  keywords        = {Research infrastructures, Landscaping, Building Communities, Digital Humanities, Cultural Heritage Science},
  abstract        = {The paper describes work carried out in the context of an infrastructural project for the implementation of a comprehensive investigation on language technologies, digital humanities, and heritage science disciplines in Italy. The topic of this landscaping activity consists in an extended survey of all the existing projects, resources, tools, communities, best practices, and standards in use among the SSH communities. Within this project, the second work package focuses on establishing, mapping, and monitoring strategies for assessing the national and international contexts for the four RIs, the characteristics of their user communities, and the specific data resources, services, and tools that are most needed, used and newly created},
}
@INPROCEEDINGS{LUZIETTI_2024_INPROCEEDINGS_LQOCDM_572742,
AUTHOR = {Luzietti, R. B. and Quochi, V. and Ottaviani, R. and Carpita, D. and Del Gratta, R. and Monachini, M.},
TITLE = {{CLARIN} in the {Italian} Open Science Cloud: landscaping and community engagement},
YEAR = {2024},
ABSTRACT = {This contribution is part of the H2IOSC project, supported by the Italian PNRR European Fund, in which the Italian CLARIN node collaborates with DARIAH, E-RIHS, and OPERAS to build an Italian Open Science Cloud. The paper presents an overview of two key project activities aiming at landscaping the Italian resource panorama and increasing the Italian research community’s involvement. On the one hand, CLARIN-IT has benefited from CLARIN ERIC central services such as Virtual Language Observatory and Resource Families to gather information on the type and status of resources available that might be of interest of the Italian research community. On the other hand, through the H2IOSC activities CLARIN-IT is working to increase and strengthen the influence and use of CLARIN services within the Italian linguistics community},
KEYWORDS = {Research Infrastructures},
PAGES = {153--157},
URL = {https://www.clarin.eu/sites/default/files/CLARIN2024_ConferenceProceedings_final.pdf},
CONFERENCE_NAME = {CLARIN Annual Conference 2024},
BOOKTITLE = {CLARIN Annual Conference Proceedings},
}
@INPROCEEDINGS{MALLIA_2024_INPROCEEDINGS_MBBMPRTZZQ_479261,
AUTHOR = {Mallia, M. and Bandini, M. and Bellandi, A. and Murano, F. and Piccini, S. and Rigobianco, L. and Tommasi, A. and Zavattari, C. and Zinzi, M. and Quochi, V.},
TITLE = {{DigItAnt}: a platform for creating, linking and exploiting {LOD} lexica with heterogeneous resources},
YEAR = {2024},
ABSTRACT = {Over the past few years, the deployment of Linked Open Data (LOD) technologies has witnessed significant advancements across a myriad of sectors, linguistics included. This progression is characterized by an exponential increase in the conversion of resources to adhere to contemporary encoding standards. Such transformations are driven by the objectives outlined in “ecological” methodologies, notably the FAIR data principles, which advocate for the reuse and interoperability of resources. This paper presents the DigItAnt architecture, developed in the context of a national project funded by the Italian Ministry of Research and in the service of a recently started Italian endeavor to realize a federation of infrastructures for the humanities. It details its services, utilities and data types, and shows how it manages to produce, exploit and interlink LLOD and non-LLOD datasets in ways that are meaningful to its intended target disciplinary context, i.e. historical linguistics over epigraphy data. The paper also introduces how DigItAnt services and functionalities will contribute to the empowerment of the H2IOSC Italian infrastructures cluster project, which is devoted to the construction of a nationwide research infrastructure federation for the humanities, and it will possibly contribute to its pilot project towards an authoritative LLOD platform},
KEYWORDS = {Linguistic Linked Open Data, Ancient Languages, Digital Historical Linguistics, Language Technology for Digital Humanities},
PAGES = {55--65},
URL = {https://aclanthology.org/2024.ldl-1.8/},
PUBLISHER = {ELRA (Paris)},
ISBN = {978-2-493814-38-8},
CONFERENCE_NAME = {9th Workshop on Linked Data in Linguistics},
CONFERENCE_PLACE = {Torino},
BOOKTITLE = {Proceedings of the 9th Workshop on Linked Data in Linguistics @ LREC-COLING 2024},
}
@INPROCEEDINGS{MALLIA_2024_INPROCEEDINGS_MDQ_526230,
AUTHOR = {Mallia, M. and Del Gratta, R. and Quochi, V.},
TITLE = {Funzioni e sostenibilità di una piattaforma digitale per le lingue arcaiche},
YEAR = {2024},
ABSTRACT = {Questo contributo, basato sull'esperienza acquisita in un progetto di ricerca triennale dedicato allo sviluppo di tecnologie e risorse digitali nel campo degli studi linguistico-storici su lingue epigrafiche frammentarie, riflette sulla sostenibilità a lungo termine dei risultati digitali ottenuti da piccoli gruppi di ricerca nelle Digital Humanities (DH). In particolare, l'analisi si concentra sulla possibilità di integrare questi risultati nelle infrastrutture di ricerca virtuali, distribuite e federate, come CLARIN(-IT) e la recente iniziativa di federazione delle infrastrutture di ricerca italiane per le Scienze Umane e il Patrimonio Culturale, denominata 'Humanities and Heritage Italian Open Cloud' (H2IOSC)},
KEYWORDS = {Infrastrutture di ricerca, Sostenibilità tecnica, Epigrafia Digitale, Servizi web},
PAGES = {566--571},
URL = {https://amsacta.unibo.it/id/eprint/7927/},
DOI = {10.6092/unibo/amsacta/7927},
ISBN = {978-88-942535-8-0},
CONFERENCE_NAME = {Me. Te. Digitali. Mediterraneo in rete tra testi e contesti. XIII Convegno Annuale AIUCD2024},
BOOKTITLE = {Me. Te. Digitali. Mediterraneo in rete tra testi e contesti, Proceedings del XIII Convegno Annuale AIUCD2024},
}
@INPROCEEDINGS{MIASCHI_2024_INPROCEEDINGS_MDV_487005,
AUTHOR = {Miaschi, A. and Dell'Orletta, F. and Venturi, G.},
TITLE = {Linguistic Knowledge Can Enhance Encoder-Decoder Models (If You Let It)},
YEAR = {2024},
ABSTRACT = {In this paper, we explore the impact of augmenting pre-trained Encoder-Decoder models, specifically T5, with linguistic knowledge for the prediction of a target task. In particular, we investigate whether fine-tuning a T5 model on an intermediate task that predicts structural linguistic properties of sentences modifies its performance in the target task of predicting sentence-level complexity. Our study encompasses diverse experiments conducted on Italian and English datasets, employing both monolingual and multilingual T5 models at various sizes. Results obtained for both languages and in cross-lingual configurations show that linguistically motivated intermediate fine-tuning has generally a positive impact on target task performance, especially when applied to smaller models and in scenarios with limited data availability},
KEYWORDS = {encoder-decoder, intermediate fine-tuning, linguistic features, sentence complexity},
PAGES = {10539--10554},
URL = {https://aclanthology.org/2024.lrec-main.922/},
PUBLISHER = {ELRA and ICCL},
ISBN = {978-2-493814-10-4},
CONFERENCE_NAME = {Joint International Conference on Computational Linguistics, Language Resources and Evaluation (LREC-COLING 2024)},
BOOKTITLE = {Proceedings of the 2024 Joint International Conference on Computational Linguistics, Language Resources and Evaluation (LREC-COLING 2024)},
}
@INPROCEEDINGS{MIASCHI_2024_INPROCEEDINGS_MDV_518427,
AUTHOR = {Miaschi, A. and Dell'Orletta, F. and Venturi, G.},
TITLE = {Evaluating Large Language Models via Linguistic Profiling},
YEAR = {2024},
ABSTRACT = {Large Language Models (LLMs) undergo extensive evaluation against various benchmarks collected in established leaderboards to assess their performance across multiple tasks. However, to the best of our knowledge, there is a lack of comprehensive studies evaluating these models’ linguistic abilities independent of specific tasks. In this paper, we introduce a novel evaluation methodology designed to test LLMs’ sentence generation abilities under specific linguistic constraints. Drawing on the ‘linguistic profiling’ approach, we rigorously investigate the extent to which five LLMs of varying sizes, tested in both zero- and few-shot scenarios, effectively adhere to (morpho)syntactic constraints. Our findings shed light on the linguistic proficiency of LLMs, revealing both their capabilities and limitations in generating linguistically-constrained sentences},
KEYWORDS = {Large Language Models, Controllable Text Generation, Linguistic Profiling},
PAGES = {2835--2848},
URL = {https://aclanthology.org/2024.emnlp-main.166},
DOI = {10.18653/v1/2024.emnlp-main.166},
PUBLISHER = {Association for Computational Linguistics (USA)},
ISBN = {979-8-89176-164-3},
CONFERENCE_NAME = {Conference on Empirical Methods in Natural Language Processing (EMNLP)},
CONFERENCE_PLACE = {USA},
BOOKTITLE = {Proceedings of the 2024 Conference on Empirical Methods in Natural Language Processing},
}
@INPROCEEDINGS{MOTGER_2024_INPROCEEDINGS_MMDFM_519997,
AUTHOR = {Motger, Q. and Miaschi, A. and Dell'Orletta, F. and Franch, X. and Marco, J.},
TITLE = {{T-FREX}: A Transformer-based Feature Extraction Method from Mobile App Reviews},
YEAR = {2024},
ABSTRACT = {Mobile app reviews are a large-scale data source for software-related knowledge generation activities, including software maintenance, evolution and feedback analysis. Effective extraction of features (i.e., functionalities or characteristics) from these reviews is key to support analysis on the acceptance of these features, identification of relevant new feature requests and prioritization of feature development, among others. Traditional methods focus on syntactic pattern-based approaches, typically context-agnostic, evaluated on a closed set of apps, difficult to replicate and limited to a reduced set and domain of apps. Meanwhile, the pervasiveness of Large Language Models (LLMs) based on the Transformer architecture in software engineering tasks lays the groundwork for empirical evaluation of the performance of these models to support feature extraction. In this study, we present T-FREX, a Transformer-based, fully automatic approach for mobile app review feature extraction. First, we collect a set of ground truth features from users in a real crowdsourced software recommendation platform and transfer them automatically into a dataset of app reviews. Then, we use this newly created dataset to fine-tune multiple LLMs on a named entity recognition task under different data configurations. We assess the performance of T-FREX with respect to this ground truth, and we complement our analysis by comparing T-FREX with a baseline method from the field. Finally, we assess the quality of new features predicted by T-FREX through an external human evaluation. Results show that T-FREX outperforms on average the traditional syntactic-based method, especially when discovering new features from a domain for which the model has been fine-tuned},
KEYWORDS = {feature extraction, large language models, mobile apps, named entity recognition, reviews, token classification},
PAGES = {227--238},
URL = {https://iris.cnr.it/handle/20.500.14243/519997},
DOI = {10.1109/SANER60148.2024.00030},
PUBLISHER = {Institute of Electrical and Electronics Engineers Inc},
CONFERENCE_NAME = {31st IEEE International Conference on Software Analysis, Evolution and Reengineering, SANER 2024},
BOOKTITLE = {Proceedings - 2024 IEEE International Conference on Software Analysis, Evolution and Reengineering, SANER 2024},
}
@COMMENT{Review note for OCCHIPINTI_2024_INPROCEEDINGS_OMMLDNG_519999: (1) KEYWORDS match those of the PUCCETTI_2024_INPROCEEDINGS_PRADE_519993 entry apart from capitalisation and do not reflect this abstract (post-editing of dialogue data), so they look copied. TODO replace with the paper's own keywords. (2) CONFERENCE_NAME says Findings while BOOKTITLE names the generic ACL annual-meeting proceedings. TODO confirm which volume the paper appeared in.}
@INPROCEEDINGS{OCCHIPINTI_2024_INPROCEEDINGS_OMMLDNG_519999,
AUTHOR = {Occhipinti, D. and Marchi, M. and Mondella, I. and Lai, H. and Dell'Orletta, F. and Nissim, M. and Guerini, M.},
TITLE = {Fine-tuning with {HED-IT}: The impact of human post-editing for dialogical language models},
YEAR = {2024},
ABSTRACT = {Automatic methods for generating and gathering linguistic data have proven effective for fine-tuning Language Models (LMs) in languages less resourced than English. Still, while there has been emphasis on data quantity, less attention has been given to its quality. In this work, we investigate the impact of human intervention on machine-generated data when fine-tuning dialogical models. In particular, we study (1) whether post-edited dialogues exhibit higher perceived quality compared to the originals that were automatically generated; (2) whether fine-tuning with post-edited dialogues results in noticeable differences in the generated outputs; and (3) whether post-edited dialogues influence the outcomes when considering the parameter size of the LMs. To this end we created HED-IT, a large-scale dataset where machine-generated dialogues are paired with the version post-edited by humans. Using both the edited and unedited portions of HED-IT, we fine-tuned three different sizes of an LM. Results from both human and automatic evaluation show that the different quality of training data is clearly perceived and it has an impact also on the models trained on such data. Additionally, our findings indicate that larger models are less sensitive to data quality, whereas this has a crucial impact on smaller models. These results enhance our comprehension of the impact of human intervention on training data in the development of high-quality LMs},
KEYWORDS = {Large Language Models (LLMs), Detecting Synthetic Texts},
PAGES = {11892--11907},
URL = {https://iris.cnr.it/handle/20.500.14243/519999},
PUBLISHER = {Association for Computational Linguistics (ACL)},
CONFERENCE_NAME = {Findings of the 62nd Annual Meeting of the Association for Computational Linguistics, ACL 2024},
BOOKTITLE = {Proceedings of the Annual Meeting of the Association for Computational Linguistics},
}
@COMMENT{Review note for PAGLIARA_2024_INPROCEEDINGS_PBB_506802: BOOKTITLE was missing and has been filled in from the other entries in this file that carry the same ISBN (978-88-942535-8-0). PAGES is still missing. TODO confirm both against the proceedings volume.}
@INPROCEEDINGS{PAGLIARA_2024_INPROCEEDINGS_PBB_506802,
AUTHOR = {Pagliara, A. and Boschetti, F. and Baglioni, D.},
TITLE = {Testi allografici: contatti tra lingue e scritture del {Mediterraneo}},
YEAR = {2024},
ABSTRACT = {Questo contributo discute la creazione dell’edizione scientifica digitale e l’analisi linguistica di testi allografici italoromanzi, documenti unici scritti in volgari italiani ma con alfabeti non latini dell’area mediterranea quali il greco, l’ebraico, l’arabo e il siriaco. Nonostante sia un fenomeno noto, ha ricevuto scarsa attenzione nella ricerca storicolinguistica e filologica in Italia, principalmente a causa delle difficoltà interpretative. Il progetto MIA (Manuscripta Italica Allographica) e altre iniziative simili mirano a catalogare digitalmente questi testi, applicando i metodi della filologia digitale per trascriverli e interpretarli. L’analisi si concentra sulle peculiarità grafiche e fonologiche, evidenziando l’influenza dei sistemi grafici originali sulla lingua italiana scritta e offrendo nuove prospettive sulla competenza linguistica degli autori alloglotti. Questa ricerca apporta un contributo significativo alla comprensione della diversità grafica e linguistica dei testi allografici, proponendo metodologie innovative per il loro studio attraverso l’apporto delle Digital Humanities},
URL = {https://iris.cnr.it/handle/20.500.14243/506802},
ISBN = {978-88-942535-8-0},
BOOKTITLE = {Me. Te. Digitali. Mediterraneo in rete tra testi e contesti, Proceedings del XIII Convegno Annuale AIUCD2024},
}
@INPROCEEDINGS{PEDONESE_2024_INPROCEEDINGS_PFOBSFSRCSB_506821,
AUTHOR = {Pedonese, G. and Frontini, F. and Ottaviani, R. and Boschetti, F. and Spadi, A. and Francalanci, L. and Scognamiglio, A. and Restaneo, P. and Chaban, A. and Striova, J. and Benassi, L.},
TITLE = {Materiali didattici come oggetti digitali {FAIR}: una metodologia condivisa per la formazione in {H2IOSC}},
YEAR = {2024},
ABSTRACT = {Il presente lavoro dettaglia la strategia per lo sviluppo di iniziative di formazione nell’ambito del progetto H2IOSC e mira a coinvolgere la comunità italiana di riferimento sulle modalità di design e di fruizione di moduli didattici che integrino l’uso delle Infrastrutture di Ricerca. In particolare, il contributo si sofferma sulla descrizione dei requisiti per l’implementazione dell’infrastruttura di training e sugli standard condivisi per la descrizione dei materiali didattici come oggetti digitali FAIR al fine di massimizzarne il riutilizzo in un’ottica train the trainers},
KEYWORDS = {Formazione, training, infrastrutture di ricerca, H2IOSC, principi FAIR},
PAGES = {577--581},
URL = {https://amsacta.unibo.it/id/eprint/7927/},
DOI = {10.6092/unibo/amsacta/7927},
ISBN = {978-88-942535-8-0},
CONFERENCE_NAME = {XIII Convegno Annuale AIUCD2024},
BOOKTITLE = {Me. Te. Digitali. Mediterraneo in rete tra testi e contesti, Proceedings del XIII Convegno Annuale AIUCD2024},
}
@INPROCEEDINGS{PICCINI_2024_INPROCEEDINGS_PRBC_533336,
AUTHOR = {Piccini, S. and Vilela Ruiz, G. E. and Bellandi, A. and Carniani, E.},
TITLE = {Tracing Linguistic Heritage: Constructing a {Somali-Italian} Terminological Resource Through Explorers’ Notebooks and Contemporary Corpus Analysis},
YEAR = {2024},
ABSTRACT = {The aim of this contribution is to introduce the initial phases of constructing a Somali-Italian terminological resource that dates back to Italy’s colonial expansion into Africa. Specifically, the terminological data was extracted from the notebooks authored by the Italian explorer Ugo Ferrandi (1852-1928) and published by the Società Geografica in 1903 under the title “Lugh. Emporio Commerciale sul Giuba”. In order to develop Ferrandi’s terminological resource, we have employed Semantic Web technologies (RDF, OWL, and SPARQL) and embraced the Linked Open Data paradigm. This ensures the FAIRness of the data and enables the publication and sharing of our terminological resource within an open interconnected Web of Data, thus contributing to addressing the absence of Somali in the Linguistic Linked Data cloud. Whenever feasible, Ferrandi’s lexicon entries have been linked and enriched with information derived from a Somali lexicon included in a contemporary Somali Corpus. This approach allows the synchronic corpus-related Somali lexicon to acquire historical depth, thereby illuminating the linguistic dynamics that have transpired over time and would otherwise have remained obscure},
KEYWORDS = {Somali language, computational terminology, Semantic Web},
URL = {https://iris.cnr.it/handle/20.500.14243/533336},
BOOKTITLE = {Proceedings of the 3rd Annual Meeting of the Special Interest Group on Under-resourced Languages @ LREC-COLING 2024},
}
@INPROCEEDINGS{PUCCETTI_2024_INPROCEEDINGS_PRADE_519993,
AUTHOR = {Puccetti, G. and Rogers, A. and Alzetta, C. and Dell'Orletta, F. and Esuli, A.},
TITLE = {AI 'News' Content Farms Are Easy to Make and Hard to Detect: A Case Study in Italian},
YEAR = {2024},
ABSTRACT = {Large Language Models (LLMs) are increasingly used as 'content farm' models (CFMs), to generate synthetic text that could pass for real news articles. This is already happening even for languages that do not have high-quality monolingual LLMs. We show that fine-tuning Llama (v1), mostly trained on English, on as little as 40K Italian news articles, is sufficient for producing news-like texts that native speakers of Italian struggle to identify as synthetic. We investigate three LLMs and three methods of detecting synthetic texts (log-likelihood, DetectGPT, and supervised classification), finding that they all perform better than human raters, but they are all impractical in the real world (requiring either access to token likelihood information or a large dataset of CFM texts). We also explore the possibility of creating a proxy CFM: an LLM fine-tuned on a similar dataset to one used by the real 'content farm'. We find that even a small amount of fine-tuning data suffices for creating a successful detector, but we need to know which base LLM is used, which is a major challenge. Our results suggest that there are currently no practical methods for detecting synthetic news-like texts 'in the wild', while generating them is too easy. We highlight the urgency of more NLP research on this problem},
KEYWORDS = {Large Language Models (LLMs), Detecting synthetic texts},
PAGES = {15312--15338},
URL = {https://aclanthology.org/2024.acl-long.817/},
VOLUME = {1},
DOI = {10.18653/v1/2024.acl-long.817},
PUBLISHER = {Association for Computational Linguistics (ACL)},
CONFERENCE_NAME = {ACL 2024-62nd Annual Meeting of the Association for Computational Linguistics},
BOOKTITLE = {Proceedings of the Annual Meeting of the Association for Computational Linguistics},
}
@INPROCEEDINGS{SICHERA_2024_INPROCEEDINGS_SMDS_546201,
AUTHOR = {Sichera, P. and Mazzagufo, L. and Del Grosso, A. M. and Spampinato, D.},
TITLE = {Metodi di armonizzazione per codifiche TEI cooperative: l’edizione Bellini Digital Correspondence},
YEAR = {2024},
ABSTRACT = {Il contributo illustra nel dettaglio tanto le attività quanto gli strumenti inerenti all’armonizzazione dei documenti XML-TEI codificati in maniera cooperativa da studenti di Informatica Umanistica al fine di realizzare l’edizione scientifica digitale delle lettere autografe di Vincenzo Bellini (Bellini Digital Correspondence). Si mostreranno le strategie adottate per automatizzare al massimo la fase di analisi del processo di codifica implementato in seno al progetto. Nel contesto delle attività di supporto all’armonizzazione dei dati è stato sviluppato NormaTEI, un tool per l’estrazione delle diverse scelte di codifica sia attraverso il controllo di coerenza strutturale di elementi e gerarchie XML, sia attraverso l’analisi della distribuzione delle frequenze riferite a specifici tag presenti in diverse decine di documenti XML-TEI},
KEYWORDS = {Cooperative digital scholarly edition, schema-matching, armonizzazione, NormaTEI, Bellini Digital Correspondence},
PAGES = {185--190},
URL = {https://amsacta.unibo.it/id/eprint/7721},
DOI = {10.6092/unibo/amsacta/7721},
ISSN = {2532-8816},
ISBN = {978-88-942535-7-3},
CONFERENCE_NAME = {AIUCD 2023},
BOOKTITLE = {UMANISTICA DIGITALE},
}
@INPROCEEDINGS{TOMMASI_2024_INPROCEEDINGS_TZMQ_507161,
AUTHOR = {Tommasi, A. and Zavattari, C. and Mallia, M. and Quochi, V.},
TITLE = {REST services for Corpus management Annotation and SearcH},
YEAR = {2024},
ABSTRACT = {This paper presents a back-end software that offers a set of micro web services for the general-purpose management and search of text documents and annotations. Initially developed for a digital epigraphy project, the system focuses on integrating texts and lexicons represented in different paradigms. Nonetheless, the solution is designed to be general and adaptable across various domains},
KEYWORDS = {Corpus and annotation management, Digital Epigraphy},
PAGES = {1--5},
URL = {https://iris.cnr.it/handle/20.500.14243/507161},
CONFERENCE_NAME = {CLARIN Annual Conference 2024},
BOOKTITLE = {Proceedings of the CLARIN Annual Conference 2024},
}
@INPROCEEDINGS{BARDI_2024_INPROCEEDINGS_BDDDR_557643,
AUTHOR = {Bardi, A. and Daquino, M. and Del Gratta, R. and Del Grosso, A. M. and Rosselli Del Turco, R.},
TITLE = {The ATLAS of Italian Digital Humanities: a knowledge graph of digital scholarly research on Italian Cultural Heritage},
YEAR = {2024},
ABSTRACT = {ATLAS is a project funded by the Next Generation EU program of the European Commission for 24 months (October 2023-October 2025) that aims to improve the FAIRness and exploitation of Digital Humanities (DH) projects and scholarly data about Italian cultural heritage (https://dh-atlas.github.io). DH research outputs are often not easy to discover, and risk obsolescence if not well documented and based on shared guidelines and standards. Moreover, projects are often self-referential, meaning that they may not follow metadata standards and best practices. In addition, users’ experience is limited in exploration, since there is a lack of interlinking across projects with a clear content overlap and explanations of such overlaps-including contradictory statements or disagreement. The goal of ATLAS is to identify shared metadata standards, protocols, reusable workflows, good practices, guidelines and evaluation frameworks in the Digital Humanities. To tackle the aforementioned problems in real-world scenarios and ensure the representativeness of identified guidelines, a pool of selected sources will be integrated in a knowledge graph, and reengineered with state-of-the-art Semantic Web technologies and Natural Language Processing methods. Pilot projects will help us to define guidelines and create a golden set of reference projects in the Digital Humanities. The aim is to collect sources that are published according to shareable criteria, that can be easily mined to extract research topics, inter and intra-textual relations, as well as bibliographic, literary, and thematic data. This will allow us to define quality criteria for recommending best practices to future projects. Moreover, the data extracted will be reconciled with international authority records (e.g. VIAF) and open data sources (e.g. Wikidata) to facilitate their reuse and the development of mashup applications. 
Finally, such enhanced data will be preserved and leveraged in a dedicated platform to support exploration and discovery of the landscape of DH projects, and will provide suggestions on tools and resources to scholars that are planning new projects. In summary, the ATLAS project will contribute to the Italian DH research community with four main results:-A whitebook including results of the analysis of the state of the art and good practices for FAIR scholarly data-A knowledge graph on DH projects and scholarly data on Italian Cultural Heritage, accessible online via the ATLAS web application and preserved in CLARIN.-The pilots evaluation, highlighting differences and strategies to cope with mapping knowledge, data manipulation, access and persistence of different types of digital artefacts.-A search portal dedicated to scholarly literature and data relevant to the pilots and beyond, built on top of the OpenAIRE CONNECT Gateway on Digital Humanities and Cultural Heritage},
KEYWORDS = {Digital Humanities, Knowledge Graph},
PAGES = {1},
URL = {https://zenodo.org/records/11569280},
DOI = {10.5281/zenodo.11569280},
PUBLISHER = {Zenodo},
CONFERENCE_NAME = {DARIAH 2024-Annual Event},
BOOKTITLE = {Workflows: Digital Methods for Reproducible Research Practices in the Arts and Humanities},
}
@INPROCEEDINGS{BIGGIO_2024_INPROCEEDINGS_BMC_471749,
AUTHOR = {Biggio, M. and Merone, M. and Caligiore, D.},
TITLE = {Disentangling Blink Reflexes in Multiple Sclerosis through explainable artificial intelligence systems},
YEAR = {2024},
URL = {https://iris.cnr.it/handle/20.500.14243/471749},
CONFERENCE_NAME = {Congresso scientifico annuale AISM "Brain health: rethinking the diagnosis of multiple sclerosis and related disorders"},
BOOKTITLE = {Atti del Congresso scientifico annuale AISM e la sua Fondazione "Brain health: rethinking the diagnosis of multiple sclerosis and related disorders"},
}
@INPROCEEDINGS{DIDONATO_2024_INPROCEEDINGS_D_545365,
AUTHOR = {Di Donato, F.},
TITLE = {CoARA: a che punto siamo?},
YEAR = {2024},
ABSTRACT = {Presentazione delle attività di CoARA e del capitolo nazionale italiano},
KEYWORDS = {Coara},
PAGES = {47--50},
URL = {https://www.openaccessrepository.it/records/gkz1v-y6n13},
DOI = {10.15161/oar.it/gkz1v-y6n13},
CONFERENCE_NAME = {Un lungo cammino: le nuove sfide della scienza aperta},
CONFERENCE_PLACE = {ITA},
BOOKTITLE = {Un lungo cammino: le nuove sfide della scienza aperta. Secondo convegno nazionale del gruppo di lavoro Open Science della CoPER},
}
@INPROCEEDINGS{DOOWYRYBISKA_2024_INPROCEEDINGS_DS_476501,
AUTHOR = {Dołowy Rybińska, N. and Soria, C.},
TITLE = {Do the contested languages of Italy and Poland contribute to the perception of these countries as multilingual?},
YEAR = {2024},
ABSTRACT = {The paper discusses the results of an online questionnaire conducted in 2022 to assess speakers' "naive" perception of Italy and Poland as multilingual countries. Studies of people's perceptions of the linguistic varieties present in a given territory help sociolinguists and language planners to understand the dominant linguistic ideology at a given point in time. Most European states, including Poland and Italy, have large linguistic repertoires, including state, immigrant, regional and minority languages, as well as their dialects. Safeguarding linguistic diversity in Europe is one of the most frequently stated tasks of the EU, and member states comply to a certain extent by supporting recognised indigenous languages on their territory and adopting measures to promote multilingualism through internal state regulations. However, officially recognised languages represent only a small percentage of the total number of language varieties used in Italy and Poland. Unrecognised varieties, both those perceived as languages (e.g. those of foreigners, immigrants, some minority languages) and those treated as dialects of the state language (the contested languages), in most cases receive little support. Moreover, awareness of their existence and the need to protect them is rather limited. On the basis of the answers to the questionnaire, we will discuss whether and to what extent the contested languages of Italy and Poland contribute to the folk perception and representation of Italy and Poland as multilingual countries. We will also focus on whether the lack of recognition of some language varieties leads to their neglect and consequently reduces their further chances for legal protection, support and recognition},
KEYWORDS = {Multilingualism, linguistic diversity, folk perception, sociolinguistics, contested languages},
URL = {https://iris.cnr.it/handle/20.500.14243/476501},
CONFERENCE_NAME = {CLOW4-Contested Languages in the Old World},
BOOKTITLE = {Abstracts Booklet 24th-25th 2024 Contested Languages in the Old World},
}
@INPROCEEDINGS{NODARI_2024_INPROCEEDINGS_NSCC_529563,
AUTHOR = {Nodari, R. and Soria, C. and Calamai, S. and Carella, G.},
TITLE = {Attitudes towards World Englishes and Accent Discrimination in the Italian School System},
YEAR = {2024},
ABSTRACT = {According to Kachru (1992) the global spread of English can be synthetised in a model with three concentric circles: the inner circle (e.g. UK, US), where English is the dominant mother tongue; the outer circle (e.g. India, Nigeria), where English is used as a second language in official contexts; and the expanding circle (e.g. China, Japan), where English is learned as a foreign language. This framework has influenced the teaching of English by emphasising the importance of exposing students to different varieties of World Englishes rather than focusing solely on Standard English (Kachru 1992; Seargeant, Swann 2012; Matsuda 2003, 2013). The phenomenon of World Englishes and its implications have been addressed several times; however, the question of social acceptance of non-standard varieties by teachers and students remains open (Lippi-Green 2012). This study aims at exploring possible discrimination of World Englishes accents among Italian secondary school students. 80 questionnaires were collected in two different Italian cities in the framework of a verbal guise experimental design, where students were asked to judge and rate different voices of students and teachers of English reading the same passage from a schoolbook. The following accents of English were used in the verbal guise experiments: four accents from the Inner Circle (Standard American; Standard British; African American; Multicultural London English), two from the Outer Circle (Indian; Nigerian), three from the expanding Circle (Italian; Chinese; Ukrainian). Participants were presented 9 different audio stimuli of male and female voices reading an excerpt of a school manual, with different contextualisation (teachers/students). After listening to each stimulus, participants were requested to express their agreement on a 5-point Likert scale regarding a set of adjectives describing the person just heard. 
To assess attitudes towards different accents the Stereotype Content Model (SCM, Fiske et al. 2002) was adopted. According to SCM, the two dimensions of competence and warmth organize the perception of social groups and individual. The dimension of competence is related to the perceived status, whereas the warmth dimension is related to solidarity (Conte \& Plutchik 1981). Nine adjectives were used, six for each of the competence and warmth dimension, three for the speech traits dimensions. It was then requested to guess the provenance of the speaker. This experiment aims at testing three research questions. We hypothesise that i) British English will be favoured for competence and American English for solidarity, whereas outer-and expanding circle varieties will be downgraded in comparison and perceived negatively. We then hypothesise that ii) Italian English accent will be perceived negatively for competence, but positively for solidarity. Finally, we predict that iii) students will be more critical towards teachers on the competence dimensions and, conversely, they will be more critical towards peers on the solidarity dimension},
KEYWORDS = {accent discrimination, verbal guise test, standard English, Stereotype content model, computational sociolinguistics, computational sociophonetics},
PAGES = {42--43},
URL = {https://www.filolog.uni.lodz.pl/fileadmin/Wydzialy/Wydzial_Filologiczny/PLIKI_KONFERENCJE/ACCENTS/Accents2024/Accents-2024-BoA.pdf},
PUBLISHER = {University of Lodz (Lodz, POL)},
CONFERENCE_NAME = {ACCENTS 2024 Accents in various contexts 17th International Conference on Native and Non-native Accents of English},
CONFERENCE_PLACE = {Lodz},
BOOKTITLE = {ACCENTS 2024-Accents in various contexts-17th International Conference on Native and Non-native Accents of English},
}
@INPROCEEDINGS{SORIA_2024_INPROCEEDINGS_SNC_529673,
AUTHOR = {Soria, C. and Nodari, R. and Calamai, S.},
TITLE = {Assessing Smartphone Speech Recognition across Diverse English Accents: A Preliminary Study},
YEAR = {2024},
ABSTRACT = {Voice-activated artificial intelligence in smartphones is making spoken human-device interactions increasingly common, with many users utilizing these systems for everyday tasks such as creating shopping lists, dictating messages, or querying information (Ammari et al., 2019). The success of these interactions relies heavily on the accuracy of speech recognition technology embedded in devices, which can be significantly affected by accents and dialects. Recent advancements have improved the recognition of various accents beyond standard British or American English, driven by the need to ensure equitable service and representation for diverse communities (Choe et al., 2022; Koenecke et al., 2020). Although some automatic speech recognition (ASR) systems embedded in smartphones offer recognition for certain second language (L2) English accents (Lai, 2021), research on their performance remains limited (Chan et al., 2022; Del Rio et al., 2023; Tadimeti et al., 2022). This work presents preliminary findings from a study assessing the performance of common smartphone speech recognition systems with respect to a range of L1 (native) and L2 (non-native) English accents. The study utilized 36 audio clips from the CIRCE corpus, which consisted of the same short text read aloud by male and female speakers of four L1 and nine L2 English accents. The L1 accents included Standard American, African American, Standard British, and Multicultural London English, while the L2 accents covered Indian, Nigerian, Bosnian, Italian, Turkish, Ukrainian, Chinese, German, and Russian. Each clip averaged 0.32 seconds in length. To simulate typical user experiences, the research evaluated Apple’s Siri voice recognition for two everyday tasks: message/note dictation and voice search. The audio clips were played from a laptop with voice recognition activated on an iPhone using the Notes app. 
Siri’s different English locales (USA, UK, Australia, Canada, Japan, India, New Zealand, Singapore, and South Africa) were tested for each accent. Each clip was played three times, resulting in a total of 702 transcripts. The study measured transcript accuracy using the Word Error Rate (WER) to compare and evaluate the performance of ASR systems. This new and unique comparable speech corpus provided insights into which L1 and L2 English accents are best recognized by common smartphones, as well as a comparative analysis of different automatic recognition models of local Englishes. Additionally, these preliminary results were compared with existing literature on human intelligibility of L1 and L2 accents (Verbeke and Simon, 2023)},
KEYWORDS = {automatic speech recognition, WER, English accents, L1 accents, L2 accents},
PAGES = {63--65},
URL = {https://www.filolog.uni.lodz.pl/fileadmin/Wydzialy/Wydzial_Filologiczny/PLIKI_KONFERENCJE/ACCENTS/Accents2024/Accents-2024-BoA.pdf},
PUBLISHER = {University of Lodz (Lodz, POL)},
CONFERENCE_NAME = {ACCENTS 2024 Accents in various contexts 17th International Conference on Native and Non-native Accents of English},
CONFERENCE_PLACE = {Lodz},
BOOKTITLE = {ACCENTS 2024 Accents in various contexts 17th International Conference on Native and Non-native Accents of English, Book of Abstract},
}
@techreport{ALBANESI_2024_TECHREPORT_ABGMPS_544741,
  author   = {Albanesi, D. and Bellandi, A. and Giovannetti, E. and Marchi, S. and Papini, M. and Sciolette, F.},
  title    = {Traduco: l'Applicazione Web Linguistico-Computazionale per il Progetto di Traduzione del Talmud Babilonese-Rapporto tecnico 25},
  year     = {2024},
  abstract = {La presente relazione tecnico-scientifica descrive l’attività svolta da CNR-ILC nel contesto del Progetto Traduzione Talmud Babilonese nel periodo gennaio 2024-luglio 2024. Le principali attività tecniche svolte sul sistema Traduco attualmente in produzione hanno riguardato l’aggiornamento di alcune funzionalità. Parallelamente, in continuità alle attività descritte nel documento di SAL precedente, è proseguito il lavoro di ricerca e sviluppo sui fronti della realizzazione della nuova versione di Traduco e sull’ampliamento della risorsa lessicale per l’italiano contemporaneo a supporto della funzionalità di ricerca full-text sul testo del Talmud tradotto in italiano. Inoltre, sempre in relazione alle tecnologie per l’accesso semantico alla traduzione, è stata avviata una attività di sperimentazione dell’uso di Large Language Models},
  keywords = {Lessici elettronici, rappresentazione della conoscenza, Linguistica Computazionale, traduzione di testi religiosi, traduzione assistita dal calcolatore, Large Language Models},
  url      = {https://iris.cnr.it/handle/20.500.14243/544741},
}
@techreport{ALBANESI_2024_TECHREPORT_AGMPS_544742,
  author   = {Albanesi, D. and Giovannetti, E. and Marchi, S. and Papini, M. and Sciolette, F.},
  title    = {Traduco: l'Applicazione Web Linguistico-Computazionale per il Progetto di Traduzione del Talmud Babilonese-Rapporto tecnico 26},
  year     = {2024},
  abstract = {La presente relazione tecnico-scientifica descrive l’attività svolta da CNR-ILC nel contesto del Progetto Traduzione Talmud Babilonese nel periodo agosto 2024-dicembre 2024. Le principali attività tecniche svolte sul sistema Traduco attualmente in produzione hanno riguardato l’aggiornamento di alcune funzionalità. In continuità alle attività descritte nel documento di SAL precedente è stato concluso il lavoro di sviluppo che ha portato alla realizzazione della nuova versione di Traduco. Sul fronte della ricerca è proseguito il lavoro sulla terminologia talmudica finalizzato all’integrazione delle voci terminologiche con il lessico della lingua italiana. Infine, sono proseguite le attività sperimentali di Intelligenza Artificiale con l’uso dei Large Language Models, in particolare sul fronte dell’accesso intelligente al testo talmudico},
  keywords = {Lessici elettronici, rappresentazione della conoscenza, Linguistica Computazionale, traduzione di testi religiosi, traduzione assistita dal calcolatore, Large Language Models, Intelligenza Artificiale, question answering},
  url      = {https://iris.cnr.it/handle/20.500.14243/544742},
}
@techreport{CALIGIURI_2024_TECHREPORT_CCFIS_524907,
  author   = {Caligiuri, S. and Carpita, D. and Falini, I. and Iachello, S. and Spinelli, F.},
  title    = {H2IOSC Project Handbook},
  year     = {2024},
  abstract = {The 'H2IOSC Handbook' aims to provide an overview of the H2IOSC Project’s state of the art and to introduce people who make it possible, not only to the H2IOSC community but also to a wider audience. The 'H2IOSC Handbook' is an open and dynamic document, constantly evolving, and will be updated as required throughout the project. The 'H2IOSC Handbook-V1 February 2024' is the first edition, produced in conjunction with the H2IOSC General Meeting that took place on February 6th and 7th, 2024. done by the Editorial Board},
  keywords = {Digital Transformation, Open Science, Cultural Heritage, Research Infrastructures, Social sciences, Digital humanities, Humanities},
  url      = {https://zenodo.org/records/12918010},
  doi      = {10.5281/zenodo.12918008},
}
@TECHREPORT{KALOV_2024_TECHREPORT_KFBLMH_475982,
AUTHOR = {Kalová, T. and Frontini, F. and Bracco, L. and Laetitia, D. and Meeus, J. and Hasani Mavriqi, I.},
TITLE = {Data Stewardship Career Paths: Recommendations of the EOSC Task Force Data Stewardship Curricula and Career Paths},
YEAR = {2024},
ABSTRACT = {This document provides an overview of the topic of Data Stewardship Career Paths. Our review and summary of relevant reports and papers, ongoing initiatives, projects and surveys highlight the importance of ensuring more sustainable career paths for Data Stewards. The report further argues the need for further in-depth study and documentation of this topic. In particular, the analysis identifies relevant aspects that should be considered, ranging from employment conditions and salary to scientific recognition and roles. The report provides a list of recommendations and identifies activities that can be taken by the EOSC in the areas of Partnership, Association and Projects, summarised as follows: The EOSC Association and related projects should ensure that the overview of the current situation is kept up-to-date as a reference point. A section on the EOSC Association public website should be dedicated to Data Stewardship initiatives including a dedicated bibliography. To ensure long-term sustainability, a governing body should own and maintain this "inventory" as a point of reference; future projects should be encouraged to use it as a reference and provide input. The EOSC Association should ensure collaboration with international initiatives, in particular, the RDA IG Professionalizing Data Stewardship – TF Career Tracks and ensure coordination among current activities and studies carried out within the various EOSC Horizon Europe projects, and promote and support the organisation of dedicated events. 
The current and future EOSC projects and initiatives in the field should build on the work of this task force, as well as on the results of the studies above, and extend them by Applying qualitative methods such as guided interviews or focus groups to investigate the aspects covered in section 6 (“Data Stewardship Careers-What Counts”) in more depth; Developing Data Steward Personas based on the proposed methodology detailed in Annex 1. The EOSC Partnership (EOSC Association, European Commission and Steering Board) should establish a permanent Data Stewardship expert group (including representatives from the various existing initiatives and this task force) with the following responsibilities: Develop and implement a monitoring framework that will allow the EOSC and other national and international institutions to support the career paths and development of personnel hired (at least in part) in Data Stewardship roles; Advise the Association and the relevant (ongoing and future) projects and initiatives; Issue recommendations on further activities of the Association regarding Data Stewardship. In consideration of the importance of the key role of Data Stewards in the development and implementation of the EOSC and to facilitate the exchange with and among Data Stewards, a further objective of the EOSC Association should be to assess the need for a professional network for Data Stewards, at least on the European level. The use of an innovative methodology, the Persona workshops, is recommended alongside further surveys and in-depth interviews to explore the relevant aspects of career paths and professional development of Data Stewards, including the roles and responsibilities of employers and Data Stewardship training programmes. Context: This work was carried out within the Data Stewardship Curricula and Career Paths EOSC Task Force framework, particularly its Career Paths work stream},
KEYWORDS = {career paths, data stewards, EOSC},
URL = {https://zenodo.org/records/11077722},
DOI = {10.5281/zenodo.11077722},
}
@techreport{OTTAVIANI_2024_TECHREPORT_OC_513900,
  author   = {Ottaviani, R. and Carpita, D.},
  title    = {Avvio e gestione del progetto “Humanities and cultural Heritage Italian Open Science Cloud – H2IOSC”},
  year     = {2024},
  abstract = {Rapporto tecnico-gestionale relativo all'avvio e all'implementazione del progetto H2IOSC: programmazione del procurement e del reclutamento del personale},
  keywords = {H2IOSC, e-procurement, ciclo di vita del contratto, programmazione e controllo},
  url      = {https://iris.cnr.it/handle/20.500.14243/513900},
}
@techreport{OTTAVIANI_2024_TECHREPORT_OL_513916,
  author   = {Ottaviani, R. and Luzietti, R. B.},
  title    = {La protezione dei dati personali by design e by default nell’elaborazione, gestione e diffusione del questionario per il “CENSIMENTO SUGLI ARCHIVI LETTERARI DIGITALI NATIVI” nel progetto di ricerca ALDiNa – Archivi Letterari Digitali Nativi, e impostazione della privacy policy del progetto},
  year     = {2024},
  abstract = {La protezione dei dati personali by design e by default nell’elaborazione, gestione e diffusione del questionario per il “CENSIMENTO SUGLI ARCHIVI LETTERARI DIGITALI NATIVI” nel progetto di ricerca ALDiNa – Archivi Letterari Digitali Nativi e impostazione della privacy policy del progetto},
  keywords = {H2IOSC, Survey, Questionario, Censimento, Protezione dati personali, Soggetto interessato, Intervista},
  pages    = {25},
  url      = {https://iris.cnr.it/handle/20.500.14243/513916},
  doi      = {10.32079/ISTI-TR-2024/009},
}
@techreport{QUOCHI_2024_TECHREPORT_Q_514764,
  author   = {Quochi, V.},
  title    = {Epilexo Search: un’interfaccia di fruizione di lessici antichi per il progetto ItAnt},
  year     = {2024},
  abstract = {Il medesimo documento descrive lo sviluppo di “EpiLexO Search”, una piattaforma web per la fruizione di dati relativi ai lessici elettronici collegati a materiali testuali e bibliografici, nonché a risorse lessicografiche esterne, creati attraverso la piattaforma di editing dei lessici “EpiLexO Editor”. L’obiettivo del progetto è quello di creare uno strumento che possa permettere agli utenti interessati a visualizzare tutte le informazioni peculiari relative ai dati delle iscrizioni codificate secondo gli standard dell’epigrafia digitale-in questo caso di Epidoc-e dei dati relativi al lessico computazionale e dei Linguistic Linked Open Data, tramite l’utilizzo del modello OntoLex-Lemon. Oltre alla consultazione dei lessici, EpiLexO Search include un particolare sistema per la renderizzazione dei testi epigrafici secondo le convenzioni di Leida con annessi dati LOD e dei sistemi per la reperibilità di dati da più fonti per consentire agli utenti di effettuare ricerche incrociate e avanzate. Questo documento esplora le varie fasi della progettazione della piattaforma, dettagliando le specifiche tecniche di ciascun componente e delineando il modello generale per l'organizzazione e la presentazione dei dati},
  keywords = {Digital Lexicography, Linguistic Linked Open Data},
  url      = {https://iris.cnr.it/handle/20.500.14243/514764},
}
@MISC{CARLINO_2024_MISC_C_501701,
AUTHOR = {Carlino, M.},
TITLE = {Sito web del progetto LuCET-LingUistic Complexity Evaluation in educaTion},
YEAR = {2024},
ABSTRACT = {Design of the structure and implementation (with the WordPress CMS) of the website of the project LuCET-LingUistic Complexity Evaluation in educaTion (PRIN 2022 SH4-2022KPNY3B): https://www.ilc.cnr.it/lucet (English)},
KEYWORDS = {website, dissemination, Linguistics},
URL = {https://www.ilc.cnr.it/lucet},
}
@misc{CASTELLI_2024_MISC_CCDGLLR_519247,
  author   = {Castelli, D. and Cimino, R. and Di Donato, F. and Gatt, L. and Lavitrano, M. and Lazzeri, E. and Rossi, G.},
  title    = {Processi per individuare le attività già in essere nel Paese riconducibili agli obiettivi del PNSA 2021-2027},
  year     = {2024},
  abstract = {Questo documento è stato prodotto dai membri del Tavolo di lavoro per l’implementazione del PNSA-Piano Nazionale per Scienza Aperta 2021-2027 (DM 268/2022) in risposta al secondo punto del mandato ricevuto dal MUR, consistente nel “proporre processi per individuare le attività già in essere nel Paese riconducibili agli obiettivi del PNSA 2021-2027”. Esso contiene, dunque, una proposta di processo per individuare le suddette attività già in essere, identificando l’informazione da raccogliere e suggerendo come raccoglierla e come pubblicarla. Il risultato di tale processo è una ricognizione attenta e ragionata dello stato dell’arte della Scienza Aperta in Italia, ricognizione che rappresenta un punto di partenza concreto per incidere sulla complessità e sostenibilità dell’implementazione del PNSA, permettendo di far leva sull’esistente e di identificare i gap che devono essere colmati. In questo quadro, la ricognizione costituisce anche un necessario contributo all’implementazione del nodo EOSC nazionale e dell’accordo internazionale CoARA},
  keywords = {Scienza aperta, PNSA},
  url      = {https://iris.cnr.it/handle/20.500.14243/519247},
}
@MISC{ERJAVEC_2024_MISC_EKOOAAAAAAAABBBBBBBCCLCDDDDDDDFFFGGGGGGGHIJJJKKKLLLMMMMMMMMMNNNNOPPPPPPPPPQRRRRRRSSSSTTTVVVVVVVVWYZF_483001,
AUTHOR = {Erjavec, T. and Kopp, M. and Ogrodniczuk, M. and Osenova, P. and Agerri, R. and Agirrezabal, M. and Agnoloni, T. and Aires, J. and Albini, M. and Alkorta, J. and Antiba Cartazo, I. and Arrieta, E. and Barcala, M. and Bardanca, D. and Barkarson, S. and Bartolini, R. and Battistoni, R. and Bel, N. and Bonet Ramos, M. D. M. and Calzada Pérez, M. and Cardoso, A. and Çöltekin, Ç. and Coole, M. and Darģis, R. and De Does, J. and De Libano, R. and Depoorter, G. and Depuydt, K. and Diwersy, S. and Dodé, R. and Fernandez, K. and Fernández Rei, E. and Frontini, F. and Garcia, M. and García Díaz, N. and García Louzao, P. and Gavriilidou, M. and Gkoumas, D. and Grigorov, I. and Grigorova, V. and Haltrup Hansen, D. and Iruskieta, M. and Jarlbrink, J. and Jelencsik Mátyus, K. and Jongejan, B. and Kahusk, N. and Kirnbauer, M. and Kryvenko, A. and Ligeti Nagy, N. and Ljubešić, N. and Luxardo, G. and Magariños, C. and Magnusson, M. and Marchetti, C. and Marx, M. and Meden, K. and Mendes, A. and Mochtak, M. and Mölder, M. and Montemagni, S. and Navarretta, C. and Nitoń, B. and Norén, F. M. and Nwadukwe, A. and Ojsteršek, M. and Pančur, A. and Papavassiliou, V. and Pereira, R. and Pérez Lago, M. and Piperidis, S. and Pirker, H. and Pisani, M. and Pol, H. V. D. and Prokopidis, P. and Quochi, V. and Rayson, P. and Regueira, X. L. and Rii, A. and Rudolf, M. and Ruisi, M. and Rupnik, P. and Schopper, D. and Simov, K. and Sinikallio, L. and Skubic, J. and Tamper, M. and Tungland, L. M. and Tuominen, J. and Van Heusden, R. and Varga, Z. and Vázquez Abuín, M. and Venturi, G. and Vidal Miguéns, A. and Vider, K. and Vivel Couso, A. and Vladu, A. I. and Wissik, T. and Yrjänäinen, V. and Zevallos, R. and Fišer, D.},
TITLE = {Linguistically annotated multilingual comparable corpora of parliamentary debates ParlaMint.ana 4.1},
YEAR = {2024},
ABSTRACT = {ParlaMint 4.1 is a set of comparable corpora containing transcriptions of parliamentary debates of 29 European countries and autonomous regions, mostly starting in 2015 and extending to mid-2022. The individual corpora comprise between 9 and 126 million words and the complete set contains over 1.2 billion words. The transcriptions are divided by days with information on the term, session and meeting, and contain speeches marked by the speaker and their role (e.g. chair, regular speaker). The speeches also contain marked-up transcriber comments, such as gaps in the transcription, interruptions, applause, etc. The corpora have extensive metadata, most importantly on speakers (name, gender, MP and minister status, party affiliation), on their political parties and parliamentary groups (name, coalition/opposition status, Wikipedia-sourced left-to-right political orientation, and CHES variables, https://www.chesdata.eu/). Note that some corpora have further metadata, e.g. the year of birth of the speakers, links to their Wikipedia articles, their membership in various committees, etc. The transcriptions are also marked with the subcorpora they belong to ("reference", until 2020-01-30, "covid", from 2020-01-31, and "war", from 2022-02-24). An overview of the statistics of the corpora is available on GitHub in the folder Build/Metadata, in particular for the release 4.1 at https://github.com/clarin-eric/ParlaMint/tree/v4.1/Build/Metadata. The corpora are encoded according to the ParlaMint encoding guidelines (https://clarin-eric.github.io/ParlaMint/) and schemas (included in the distribution). The ParlaMint.ana linguistic annotation includes tokenization; sentence segmentation; lemmatisation; Universal Dependencies part-of-speech, morphological features, and syntactic dependencies; and the 4-class CoNLL-2003 named entities. 
Some corpora also have further linguistic annotations, in particular PoS tagging according a language-specific scheme, with their corpus TEI headers giving further details on the annotation vocabularies and tools used. This entry contains the ParlaMint.ana TEI-encoded linguistically annotated corpora; the derived CoNLL-U files along with TSV metadata of the speeches; and the derived vertical files (with their registry file), suitable for use with CQP-based concordancers, such as CWB, noSketch Engine or KonText. Also included is the 4.1 release of the sample data and scripts available at the GitHub repository of the ParlaMint project at https://github.com/clarin-eric/ParlaMint and the log files produced in the process of building the corpora for this release. The log files show e.g. known errors in the corpora, while more information about known problems is available in the open issues at the GitHub repository of the project. This entry contains the linguistically marked-up version of the corpus, while the text version, i.e. without the linguistic annotation is also available at http://hdl.handle.net/11356/1912. Another related resource, namely the ParlaMint corpora machine translated to English ParlaMint-en.ana 4.1 can be found at http://hdl.handle.net/11356/1910. As opposed to the previous version 4.0, this version fixes a number of bugs and restructures the ParlaMint GitHub repository. The DK corpus has been linguistically re-annotated to remove bugs, while its speeches are now also marked with topics. The PT corpus has been extended to 2024-03 and the UA corpus to 2023-11, which also has improved language marking (uk vs. ru) on segments},
KEYWORDS = {ParlaCLARIN, linguistic annotation, pos-tagging, Named Entity Recognition, linguistic dependency annotation, UD},
URL = {https://iris.cnr.it/handle/20.500.14243/483001},
}
@MISC{GROSSI_2024_MISC_GHMNBBBEGHHJJKKLLMMPRRSSSTTTV_530562,
AUTHOR = {Grossi, D. and Hahn, U. and Mäs, M. and Nitsche, A. and Behrens, J. and Boehmer, N. and Brill, M. and Endriss, U. and Grandi, U. and Haret, A. and Heitzig, J. and Janssens, N. and Jonker, C. M. and Keijzer, M. A. and Kistner, A. and Lackner, M. and Lieben, A. and Mikhaylovskaya, A. and Murukannaiah, P. K. and Proietti, C. and Revel, M. and Rouméas, É. and Shapiro, E. and Sreedurga, G. and Swierczek, B. and Talmon, N. and Turrini, P. and Terzopoulou, Z. and Van De Putte, F.},
TITLE = {Enabling the Digital Democratic Revival: A Research Program for Digital Democracy},
YEAR = {2024},
ABSTRACT = {This white paper outlines a long-term scientific vision for the development of digital-democracy technology. We contend that if digital democracy is to meet the ambition of enabling a participatory renewal in our societies, then a comprehensive multi-methods research effort is required that could, over the years, support its development in a democratically principled, empirically and computationally informed way. The paper is co-authored by an international and interdisciplinary team of researchers and arose from the Lorentz Center Workshop on ``Algorithmic Technology for Democracy'' (Leiden, October 2022)},
KEYWORDS = {Computer Science - Computers and Society},
URL = {http://arxiv.org/abs/2401.16863v1},
}
@MISC{MALLIA_2024_MISC_MBBMPRTZZQ_479301,
AUTHOR = {Mallia, M. and Bandini, M. and Bellandi, A. and Murano, F. and Piccini, S. and Rigobianco, L. and Tommasi, A. and Zavattari, C. and Zinzi, M. and Quochi, V.},
TITLE = {DigItAnt. A platform for creating, linking and exploiting LOD lexica with heterogeneous resources},
YEAR = {2024},
ABSTRACT = {Poster presented at the LDL 2024 Workshop, Torino, 25/05/2024},
KEYWORDS = {Linguistic Linked Open Data, Ancient Languages, Digital Historical Linguistics, Language Technology for Digital Humanities},
URL = {https://doi.org/10.5281/zenodo.11384067},
DOI = {10.5281/zenodo.11384066},
}
@MISC{MALLIA_2024_MISC_MQ_532940,
AUTHOR = {Mallia, M. and Quochi, V.},
TITLE = {DigItAnt Search},
YEAR = {2024},
ABSTRACT = {DigItAnt-search is the GUI web application of the DigItAnt platform, designed to explore, visualise and navigate the different sources of information created or linked within the national ItAnt project (https://www.prin-italia-antica.unifi.it/). DigItAnt is an innovative platform designed to support historical linguistic and epigraphic studies, and researchers in the creation, management and consultation of digital linguistic resources for the fragmentary ancient languages. DigItAnt-search allows to explore interactively various sources of information in a unified and easily accessible environment},
KEYWORDS = {Historical linguistics, Digital epigraphy, Linguistic Open Linked Data, Web GUI application, Search interface},
URL = {https://github.com/DigItAnt/DigItAnt_search},
}
@MISC{OTTAVIANI_2024_MISC_O_513527,
AUTHOR = {Ottaviani, R.},
TITLE = {The CLARIN experience in H2IOSC Project-Improving users’ involvement with the use of learning materials created within the CLARIN network},
YEAR = {2024},
ABSTRACT = {H2IOSC-Humanities and cultural Heritage Italian Open Science Cloud aims to provide a federated and inclusive cluster of 4 Research Infrastructures in the ESFRI domain of Social and Cultural Innovation, to enable researchers from various disciplines in the fields of humanities, language technologies and cultural heritage to collaborate in research by sharing tools, services and data. Among the main activities planned in WP1 and WP8 of H2IOSC project are those of engagement and training. These activities are also inspired by the CLARIN experience with the aim of enhancing broader community involvement and reaching new interest groups. The set of actions that result from it fall under the “Engagement and training plan for H2IOSC”. The keyword of the Engagement and Training Plan is Outreach. Within the framework of the H2IOSC project, outreach can be defined as the planning of a user involvement or training program that actively involves a broad community. This involvement may take place through the creation of events, initiatives, or the dissemination of materials that not only satisfy the relevant scientific community but also reach other possible stakeholders. The main objective of outreach is to maximize the impact of research and communicate knowledge and good practices, thus contributing to positive community involvement. More generally, outreach activities also include information and orientation initiatives dedicated to promoting the knowledge of products, services, and possibilities offered by Research Infrastructures to potential users. In order to achieve this objective, the following approach will be used: 1. CLARIN Research and dissemination initiatives analyses (e.g. Clarin in a nutshell, Clarin Café, playrole for specific training) 2. Adaptation of pre-existing educational and engagement modules to the needs of H2IOSC users 3. Arrangement of engagement and training plan for H2IOSC 4. Engagement and training plan implementation 5. 
Promotion of the train-the-trainer approach The results of the initial initiatives will allow us to review the processes activated with the aim of continuous improvement both during the project's lifespan and in the subsequent phases, to maintain, develop, and ensure the sustainability of these activities within the infrastructure},
KEYWORDS = {Clarin, IR, Digital Humanities, H2IOSC},
URL = {https://iris.cnr.it/handle/20.500.14243/513527},
CONFERENCE_NAME = {CLARIN ANNUAL CONFERENCE 2024},
}
@misc{PEDONESE_2024_MISC_PKMFQS_561741,
  author   = {Pedonese, G. and Khan, A. F. and Mallia, M. and Frontini, F. and Quochi, V. and Squadrito, E.},
  title    = {Linguistic Linked Open Data for Humanists},
  year     = {2024},
  abstract = {Having achieved popularity as a way of publishing and accessing data in different fields of the sciences and for sharing large encyclopaedic datasets such as DBpedia (derived from Wikipedia), linked data is becoming more and more popular in different areas of the humanities. In this course we will present a comprehensive introduction to the creation, publication, and use of linked open data for anyone who wants to work with linguistic datasets – such as lexicons and corpora – and especially for those who come from a linguistic or humanist background. We will look at the basics of linked data and the Semantic Web and introduce the various different standards technologies that make up the Semantic Web stack before focusing on the particular case of linked data language resources. During the course we will study the most important tools, vocabularies, and resources available in the Semantic Web and provide hands-on training for the creation and querying of linguistic linked data. We will look at how Semantic Web technologies can contribute to the creation of FAIR language resources as well as how to publish your resource on the linked open data cloud. We will also show how the Semantic Web query language SPARQL can be a powerful tool for data exploration},
  keywords = {Linked Open Data, Linguistics},
  url      = {https://iris.cnr.it/handle/20.500.14243/561741},
  doi      = {10.5281/zenodo.13897931},
}
@misc{PROVOST_2024_MISC_P_475242,
  author          = {Provost, L.},
  title           = {National Stakeholder Engagement in GraspOS Pilots},
  year            = {2024},
  abstract        = {This presentation was held on 3 June 2024 in the Horizon Europe Communication and Engagement Working Group coordinated by the EOSC Association. It focuses on how the GraspOS Pilots engage with their respective communities at national level, showcasing both their geographical distribution and the outreach activities which have been carried out with national stakeholders, often in the local language},
  keywords        = {EOSC, Horizon Europe, Communication Engagement, GraspOS},
  url             = {https://doi.org/10.5281/zenodo.11482696},
  doi             = {10.5281/zenodo.11482693},
  conference_name = {EOSC Association Working Group Communication and Engagement for Horizon Europe Projects},
}
@MISC{SCIOLETTE_2024_MISC_SGMB_530422,
AUTHOR = {Sciolette, F. and Giovannetti, E. and Marchi, S. and Bellandi, A.},
TITLE = {CompL-it},
YEAR = {2024},
ABSTRACT = {CompL-it is a computational lexicon for Italian derived from LexicO (https://dspace-clarin-it.ilc.cnr.it/repository/xmlui/handle/20.500.11752/ILC-977), with the integration of following resources:-M-GLF (https://dspace-clarin-it.ilc.cnr.it/repository/xmlui/handle/20.500.11752/ILC-1002), a list of lemmatized forms generated by the morphological analyzer MAGIC (Battista and Pirrelli, 1999, Pirrelli and Battista 2000);-a set of treebanks for Italian (contained in https://lindat.cz/repository/xmlui/handle/11234/1-4611):-ISDT;-VIT;-ParTUT;-ParlaMint-it. The resource contains a morphological layer (including lemmas, inflected forms, and morphological features) and a semantic layer (including senses and relations between them). Entries are encoded according to the OntoLex-Lemon model and made available as a semantic repository},
KEYWORDS = {morphology, semantics, computational lexicon, linked open data},
URL = {https://iris.cnr.it/handle/20.500.14243/530422},
}
@MISC{SICHERA_2024_MISC_SCSMD_522482,
AUTHOR = {Sichera, P. and Cristofaro, S. and Spampinato, D. and Mazzagufo, L. and Del Grosso, A. M.},
TITLE = {CHROMA model for H2IOSC},
YEAR = {2024},
ABSTRACT = {The development of computational models and tools for philologically curated digital editions poses dual challenges: defining functional specifications for the reference community and ensuring sustainability and adherence to open science principles. Requirements analysis benefits from user stories describing application scenarios, while issues in process management and technologies require solutions for resource accessibility and longevity. The CHROMA model (http://chroma.cnr.it/) offers an integrated approach rooted in projects like "Bellini Digital Correspondence" and "Pirandello Nazionale". It treats text as a complex multidimensional object through an editorial process involving: Creating digital surrogates of primary sources via IIIF protocol; Segmentation and text recognition using HTR/OCR environments by using eScriptorium tool; Separating textual and paratextual planes; Representing structural and semantic phenomena through XML/TEI, RDF, and Domain-Specific Languages; Assisted encoding with software tools for realigning different versions of editions e.g., Bertalign and NormaTEI; Integrating linguistic and lexicographic analyses by using NLP tools; Extracting information and generating knowledge graphs by means of semantic Web technologies and Ontologies; Connecting to authority records via LOD. The edition's fruition involves interactive visualization tools like TEIPublisher or EVT. Long-term technological standards ensure academic sustainability and synergy with the H2IOSC project. This workflow is part of pilot projects of the H2IOSC infrastructure such as the "Text Transcription Environment" and will be included in the initiative's marketplace as possible tool in docker deployment flavor. The CLARIN bazaar has discussed the model's conceptual choices and explored the proposed process in depth},
KEYWORDS = {Workflow, eScriptorium, HTR, OCR, XML-TEI, NormaTEI, NLP, Digital humanities, ontology},
URL = {https://iris.cnr.it/handle/20.500.14243/522482},
DOI = {10.5281/zenodo.13913607},
CONFERENCE_NAME = {CLARIN Annual Conference 2024},
}
@misc{SICHERA_2024_MISC_SSDMC_517192,
  author   = {Sichera, P. and Spampinato, D. and Del Grosso, A. M. and Mazzagufo, L. and Cristofaro, S.},
  title    = {NormaTEI},
  year     = {2024},
  abstract = {NormaTEI is software for analyzing the content of one or more XML files. NormaTEI is designed mainly for two uses: control of encoding uniformity: when an XML/TEI edition is made up of multiple files, NormaTEI allows you to control them in an organic way, allowing you to easily identify errors or different encoding choices; encoding analysis: personalized and complex searches on the selected corpus (one or more files). The name "Norma" recalls both the operation for which the software was developed ("normalization") and Vincenzo Bellini's most famous work: NormaTEI was in fact developed during the creation of Bellini Digital Correspondence},
  keywords = {4D, XML-TEI, XML parser, XPath, TEI, harmonization, normalize, Digital edition, error detection, diffing},
  url      = {https://github.com/pierpaolosichera/NormaTEI},
  doi      = {10.5281/zenodo.12581646},
}
@misc{SPINELLI_2024_MISC_SI_526811,
  author   = {Spinelli, F. and Iachello, S.},
  title    = {H2IOSC Visual Identity},
  year     = {2024},
  abstract = {The "Visual Identity GUIDELINE" provides guidelines for the use of the H2IOSC project's visual identity, including logos and branded materials. Developed by Silvia Iachello (CNR ISPC) and Federica Spinelli (CNR OVI), members of the H2IOSC Editorial Board, this guide offers guidance on the use of PNRR project logos, research infrastructure logos, and includes access to a communication kit with ready-to-use graphics and templates for presentations and letterhead},
  keywords = {Digital humanities, Sustainability, Cultural Heritage, Digital Transformation, Open Science, Research Infrastructures, Social sciences},
  url      = {https://doi.org/10.5281/zenodo.14646251},
  doi      = {10.5281/zenodo.14646250},
}
@MISC{VANDERLEK_2024_MISC_VFFP_561743,
AUTHOR = {Van Der Lek, I. and Fišer, D. and Frontini, F. and Pedonese, G.},
TITLE = {Introduzione ai Dati Linguistici: Standard e Archivi Digitali},
YEAR = {2024},
ABSTRACT = {Il corso "Introduzione ai Dati Linguistici: Standard e Archivi Digitali" introduce gli insegnanti e gli studenti all'uso degli archivi digitali di dati della ricerca e al loro ruolo nel ciclo di vita dei dati linguistici nel contesto degli principi FAIR e delle buone pratiche della Scienza Aperta. I materiali del corso sono suddivisi in unità e sono intesi come contenuti didattici per i docenti che insegnano a livello di laurea triennale o laurea magistrale, che sono invitati a sfogliare i materiali, esportarli per l'uso nel Learning Management System della loro istituzione e adattarli ai propri scopi come ritengono opportuno. Questo corso traduce in italiano e aggiorna i materiali di: van der Lek, Iulianna; Fišer, Darja. (2023). Introduction to Language Data: Standards and Repositories. In UPSKILLS Learning Content. https://upskillsproject.eu/project/standards_repositories/. CC BY 4.0. https://creativecommons.org/licenses/by/4.0/ L'adattamento si è svolto nell'ambito del progetto Humanities and cultural Heritage Italian Open Science Cloud (https://www.h2iosc.cnr.it/), Work Package 8 "Training, Capacity Building, Engagement", a cura del personale CNR-ILC dedicato all'Attività 8.2 "Teach CLARIN, Teach with CLARIN". Progetto H2IOSC-Humanities and cultural Heritage Italian Open Science Cloud finanziato dall’Unione Europea NextGenerationEU – PNRR M4C2 – Codice progetto IR0000029 – CUP B63C22000730005},
KEYWORDS = {Dati Linguistici, Gestione dati},
URL = {https://iris.cnr.it/handle/20.500.14243/561743},
DOI = {10.5281/zenodo.13911935},
}
@article{ALZETTA_2023_ARTICLE_ADMPV_439017,
  author   = {Alzetta, C. and Dell'Orletta, F. and Miaschi, A. and Prat, E. and Venturi, G.},
  title    = {Tell me how you write and I'll tell you what you read: a study on the writing style of book reviews},
  year     = {2023},
  abstract = {The paper aims at investigating variations in the writing style of book reviews published on different social reading platforms and referring to books of different genres, which enables acquiring insights into communication strategies adopted by readers to share their reading experiences. To this end, we introduce a corpus-based study focused on the analysis of A Good Review, a novel corpus of online book reviews written in Italian, posted on Amazon and Goodreads, and covering six literary fiction genres. We rely on stylometric analysis to explore the linguistic properties and lexicon of reviews and the authors conducted automatic classification experiments using multiple approaches and feature configurations to predict either the review's platform or the literary genre. The analysis of user-generated reviews demonstrates that language is a quite variable dimension across reading platforms, but not as much across book genres. The classification experiments revealed that features modelling the syntactic structure of the sentence are reliable proxies for discerning Amazon and Goodreads reviews, whereas lexical information showed a higher predictive role for automatically discriminating the genre},
  keywords = {Stylometric analysis, Textual Genre detection, Book reviews},
  pages    = {23},
  url      = {https://www.emerald.com/insight/content/doi/10.1108/JD-04-2023-0073/full/html},
  volume   = {79},
  doi      = {10.1108/JD-04-2023-0073},
  issn     = {0022-0418},
  journal  = {JOURNAL OF DOCUMENTATION},
}
@ARTICLE{ALZETTA_2023_ARTICLE_ATK_450158,
AUTHOR = {Alzetta, C. and Torre, I. and Koceva, F.},
TITLE = {Annotation Protocol for Textbook Enrichment with Prerequisite Knowledge Graph},
YEAR = {2023},
ABSTRACT = {Extracting and formally representing the knowledge embedded in textbooks, such as the concepts explained and the relations between them, can support the provision of advanced knowledge-based services for learning environments and digital libraries. In this paper, we consider a specific type of relation in textbooks referred to as prerequisite relations (PR). PRs represent precedence relations between concepts aimed to provide the reader with the knowledge needed to understand a further concept(s). Their annotation in educational texts produces datasets that can be represented as a graph of concepts connected by PRs. However, building good-quality and reliable datasets of PRs from a textbook is still an open issue, not just for automated annotation methods but even for manual annotation. In turn, the lack of good-quality datasets and well-defined criteria to identify PRs affect the development and validation of automated methods for prerequisite identification. As a contribution to this issue, in this paper, we propose PREAP, a protocol for the annotation of prerequisite relations in textbooks aimed at obtaining reliable annotated data that can be shared, compared, and reused in the research community. PREAP defines a novel textbook-driven annotation method aimed to capture the structure of prerequisites underlying the text. The protocol has been evaluated against baseline methods for manual and automatic annotation. The findings show that PREAP enables the creation of prerequisite knowledge graphs that have higher inter-annotator agreement, accuracy, and alignment with text than the baseline methods. This suggests that the protocol is able to accurately capture the PRs expressed in the text. Furthermore, the findings show that the time required to complete the annotation using PREAP are significantly shorter than with the other manual baseline methods. 
The paper includes also guidelines for using PREAP in three annotation scenarios, experimentally tested. We also provide example datasets and a user interface that we developed to support prerequisite annotation},
KEYWORDS = {Text annotation, annotation protocol, knowledge engineering, educational textbook},
URL = {https://rdcu.be/dxjsm},
DOI = {10.1007/s10758-023-09682-6},
ISSN = {2211-1662},
JOURNAL = {TECHNOLOGY, KNOWLEDGE AND LEARNING},
}
@ARTICLE{BACCO_2023_ARTICLE_BDLMN_439016,
AUTHOR = {Bacco, L. and Dell'Orletta, F. and Lai, H. and Merone, M. and Nissim, M.},
TITLE = {A text style transfer system for reducing the physician-patient expertise gap: An analysis with automatic and human evaluations},
YEAR = {2023},
ABSTRACT = {Physicians and patients often come from different backgrounds and have varying levels of education, which can result in communication difficulties in the healthcare process. To address this expertise gap, we present a "Text Style Transfer" system. Our system uses Semantic Textual Similarity techniques based on Sentence Transformers models to create pseudo-parallel datasets from a large, non-parallel corpus of lay and expert texts. This approach allowed us to train a denoising autoencoder model (BART), overcoming the limitations of previous systems. Our extensive analysis, which includes both automatic metrics and human evaluations from both lay (patients) and expert (physicians) individuals, shows that our system outperforms state-of-the-art models and is comparable to human-provided gold references in some cases},
KEYWORDS = {Natural language processing, Text style transfer, Text simplification},
PAGES = {1--18},
URL = {https://www.sciencedirect.com/science/article/pii/S0957417423013763},
VOLUME = {233},
DOI = {10.1016/j.eswa.2023.120874},
ISSN = {0957-4174},
JOURNAL = {EXPERT SYSTEMS WITH APPLICATIONS},
}
@ARTICLE{BELLANDI_2023_ARTICLE_B_505728,
AUTHOR = {Bellandi, A.},
TITLE = {Building linked lexicography applications with LexO-server},
YEAR = {2023},
ABSTRACT = {The adoption of Semantic Web technologies in the lexicographic field, has been driven by the need to ensure the construction of lexical resources that are interoperable and can be shared and reused by the scientific communities. In this context, the OntoLex W3C working group proposed the OntoLex-Lemon model aimed at providing rich linguistic grounding for ontologies. It includes the representation of morphological and syntactic properties of lexical entries as well as their meaning with respect to an ontology or vocabulary. This article aims at presenting LexO-server, a set of REST services for the management of OntoLex-Lemon modeled lexical resources. LexO-server comes as a software backend providing data access and manipulation to frontend developers. The set of services are general enough to make possible the construction of applications oriented at different tasks, such as editing, linking, dictionary making, linguistic annotation, or NLP ones. As a demonstration of the versatility and the potential of LexO-server, we will present three web applications that rely on it},
KEYWORDS = {Semantic Web, Lexicography, Terminology, rest services},
PAGES = {937--952},
URL = {https://iris.cnr.it/handle/20.500.14243/505728},
VOLUME = {38},
NUMBER = {3},
ISSN = {2055-768X},
JOURNAL = {DIGITAL SCHOLARSHIP IN THE HUMANITIES},
}
@ARTICLE{BELLANDI_2023_ARTICLE_BP_505742,
AUTHOR = {Bellandi, A. and Piccini, S.},
TITLE = {Creating specialised dictionaries using LexO},
YEAR = {2023},
ABSTRACT = {Although the contribution of linguistics to terminology is widely recognized today, there remains a lack of tools allowing the construction of specialized dictionaries that deal with both the conceptual and the linguistic dimension of the terms. In this paper we present LexO, a collaborative web editor that was built with the aim of filling this gap. The guiding principles of LexO are the following: i) to allow terminologists to define the morphological, syntactic and semantic features of a term, w.r.t. the traditional onomasiological perspective; ii) to adhere to the open science philosophy and to the FAIR principles, so to create specialized dictionaries that can be shared and reused within the scientific community},
KEYWORDS = {Lexicography, Terminology, LexO, Linked Data, Semantic Web, OntoLex-Lemon},
PAGES = {225--250},
URL = {https://iris.cnr.it/handle/20.500.14243/505742},
VOLUME = {39},
NUMBER = {1},
ISSN = {1865-9403},
JOURNAL = {LEXICOGRAPHICA},
}
@ARTICLE{BERENIKEHERRMANN_2023_ARTICLE_BBFJPRRS_476001,
AUTHOR = {Herrmann, J. B. and Bories, A. S. and Frontini, F. and Jacquot, C. and Pielström, S. and Rebora, S. and Rockwell, G. and Sinclair, S.},
TITLE = {Tool criticism in practice. On methods, tools and aims of computational literary studies},
YEAR = {2023},
ABSTRACT = {This paper is a case-driven contribution to the discussion on the method-theory relationship in practices within the field of Computational Literary Studies (CLS). Progress in this field dedicated to the computational analysis of literary texts has long revolved around the new, digital tools: tools, as computational devices for analysis, have had here a comparatively strong status as research entities of their own, while their ontological status has remained unclear to the day. As a rule, they have widely been imported from the fields of data science and NLP, while less often being hand-tailored to specific tasks within interdisciplinary settings. Although studies within CLS are evolving to both a higher degree of specialization in method (going beyond the limitations of out-of-the-box tools) and a stronger theoretical modeling, the technological dimension remains a defining factor. An unreflective adoption of technology in the shape of tools can compromise the plausibility and the reproducibility of the results produced using these tools. Our paper presents a multi-faceted intervention to the discussion around tools, methods, and the research questions that are answered with them. It presents research perspectives first conceived at the ADHO SIG-DLS workshop Anatomy of tools: A closer look at textual DH methodologies that took place in Utrecht in July 2019. At that event, the authors discussed selected case studies to address tool criticism from several angles. Our goal was to leverage a tool-critical perspective, in order to “take stock, reflect upon and critically comment upon our own practices” within CLS. We identified Textométrie, Stylometry, and Semantic Text Mining as three central types of hands-on CLS. For each of these sub-fields, we asked: What are our tools and methods-in-use? What are the implications of using a tool-oriented perspective as opposed to a methodology-oriented one? How do either relate to research questions and theory?
These questions were explored by case-studies on an exemplary basis. The unifying perspective of this paper is an applied tool criticism – a critical inquiry leveraged towards crucial dimensions of CLS practices. Here we re-compose the original oral papers and add entirely new sections to it, to create a useful overview of the issue through a combination of perspectives. While we elaborated the thematic connections between the individual case studies, we hope the interactive spirit of an exemplary exchange remains palpable: individual research perspectives shape the case studies reported for Textométrie, Stylometry and Semantic Text Mining, are complemented by further studies showcasing CLS-specific perspectives on replicability and domain-specific research, and a short section discussing a tool inventory as a practical, community-based incarnation of tool criticism. The article reflects thus a rich array of perspectives on tool criticism, including the complementary perspective of tool defense – arguing that we need tools and methods as a basic common ground on how to carry out fundamental operations of analysis and interpretation within a community},
KEYWORDS = {tool criticism, digital literary studies, digital humanities},
URL = {https://www.digitalhumanities.org/dhq/vol/17/2/000687/000687.html},
VOLUME = {17},
NUMBER = {2},
ISSN = {1938-4122},
JOURNAL = {DIGITAL HUMANITIES QUARTERLY},
}
@ARTICLE{BIFFI_2023_ARTICLE_BGMS_454366,
AUTHOR = {Biffi, M. and Guadagnini, E. and Montemagni, S. and Sassolini, E.},
TITLE = {Il lemmario del «{GDLI}»: dati quantitativi e prime osservazioni},
YEAR = {2023},
ABSTRACT = {Dopo la realizzazione della versione elettronica del solo testo del "Grande dizionario della lingua italiana" (GDLI), si è avviato un progetto di graduale informatizzazione della sua struttura. Questo articolo ne presenta il primo risultato, vale a dire l'estrazione automatica del lemmario che è così per la prima volta quantificabile e individuabile. Una prima parte del testo è dedicata all'illustrazione della strutturazione dei contenuti del dizionario e la loro rappresentazione secondo standard internazionalmente riconosciuti (XML-TEI); la seconda presenta una prima elaborazione dei dati del lemmario estratto; la terza propone una prima analisi comparativa con i lemmari di altri dizionari della lingua italiana},
KEYWORDS = {Lessicografia, Lessicografia digitale, Lessicografia storica},
PAGES = {331--351},
URL = {https://accademiadellacrusca.it/it/riviste/articoli/slei-xl-2023/8679},
VOLUME = {40},
ISSN = {0392-5218},
JOURNAL = {STUDI DI LESSICOGRAFIA ITALIANA},
}
@ARTICLE{BRANCO_2023_ARTICLE_BEFHHJKKLNPPPSSTWZ_475961,
AUTHOR = {Branco, A. and Eskevich, M. and Frontini, F. and Hajic, J. and Hinrichs, E. and Jong, F. and Kamocki, P. and Konig, A. and Linden, K. and Navarretta, C. and Piasecki, M. and Piperidis, S. and Pitkanen, O. and Simov, K. and Skadina, I. and Trippel, T. and Witt, A. and Zinn, C.},
TITLE = {The {CLARIN} infrastructure as an interoperable language technology platform for {SSH} and beyond},
YEAR = {2023},
ABSTRACT = {CLARIN is a European Research Infrastructure Consortium developing and providing a federated and interoperable platform to support scientists in the field of the Social Sciences and Humanities in carrying-out language-related research. This contribution provides an overview of the entire infrastructure with a particular focus on tool interoperability, ease of access to research data, tools and services, the importance of sharing knowledge within and across (national) communities, and community building. By taking into account FAIR principles from the very beginning, CLARIN succeeded in becoming a successful example of a research infrastructure that is actively used by its members. The benefits CLARIN members reap from their infrastructure secure a future for their common good that is both sustainable and attractive to partners beyond the original target groups},
KEYWORDS = {Interoperability, Language resources, Language technology, Research infrastructure, Social sciences and humanities},
URL = {https://iris.cnr.it/handle/20.500.14243/475961},
DOI = {10.1007/s10579-023-09658-z},
ISSN = {1574-020X},
JOURNAL = {LANGUAGE RESOURCES AND EVALUATION},
}
@ARTICLE{BURGASSI_2023_ARTICLE_B_474453,
AUTHOR = {Burgassi, C.},
TITLE = {Maschere e vestiario. Nel nome di {Gianduia}},
YEAR = {2023},
ABSTRACT = {The usage of the word gianduia as a common noun for clothing, originating from the proper noun of the Piedmontese mask, emerges from texts dating back to the second half of the 19th century, both within and outside of Piedmont. This particular use of gianduia, which is not recorded by the reference lexicographic tools (including general, etymological, and historical dictionaries for Italian and the Piedmontese dialect), proves to be driven by specific cultural and political factors, thus serving as an emblematic case study of their influence on language. In this essay, instances of gianduia related to clothing are gathered as well as analysed according to the historical and linguistic context in which they occur},
KEYWORDS = {Deonomastic, Clothing name, Piedmontese mask Gianduia},
PAGES = {287--302},
URL = {https://www.rivisteweb.it/doi/10.61001/113132},
VOLUME = {49},
NUMBER = {2},
DOI = {10.61001/113132},
ISSN = {0394-3569},
JOURNAL = {STUDI LINGUISTICI ITALIANI},
}
@ARTICLE{BURGASSI_2023_ARTICLE_BG_437188,
AUTHOR = {Burgassi, C. and Guadagnini, E.},
TITLE = {Per studiare il vocabolario del passato. La posizione delle parole in epoca storica},
YEAR = {2023},
ABSTRACT = {This paper aims to propose a new method for describing the lexicon of a language in a specific period of its history. The first paragraph outlines the two main ideas to be found in the studies concerning both synchronic and diachronic lexicology. In the second paragraph our method for lexical inquiry is presented along with its core concepts, such as textual Corpus Representativeness, Connotation, Connotation Rate (Quoziente Connotativo, QC) and word Position in the Center-Periphery Vocabulary Model. The third paragraph sketches two possible research lines, the first one regarding the lexicon of a given historical period (Old Italian), the second dealing with the comparison between two different linguistic historical phases (Old Italian vs. Contemporary Italian)},
KEYWORDS = {Historical Lexicology, Corpus Linguistics, Word Connotation, Word Position, Center-Periphery Vocabulary Model},
PAGES = {1--18},
URL = {https://revistas.uam.es/chimera/article/view/15698},
VOLUME = {10},
DOI = {10.15366/chimera2023.10.001},
ISSN = {2386-2629},
JOURNAL = {CHIMERA},
}
@ARTICLE{CERULLI_2023_ARTICLE_CBD_455146,
AUTHOR = {Cerulli, A. and Brunato, D. and Dell'Orletta, F.},
TITLE = {Linguistic Profile of a Text and Human Ratings of Writing Quality: a Case Study on {Italian} {L1} Learner Essays},
YEAR = {2023},
ABSTRACT = {This paper presents a study based on the linguistic profiling methodology to explore the relationship between the linguistic structure of a text and how it is perceived in terms of writing quality by humans. The approach is tested on a selection of Italian L1 learners essays, which were taken from a larger longitudinal corpus of essays written by Italian L1 students enrolled in the first and second year of lower secondary school. Human ratings of writing quality by Italian native speakers were collected through a crowdsourcing task, in which annotators were asked to read pairs of essays and rated which one they believed to be better written. By analyzing these ratings, the study identifies a variety of linguistic phenomena spanning across distinct levels of linguistic description that distinguish the essays considered as 'winners' and evaluates the impact of students' errors on the human perception of writing quality},
KEYWORDS = {text quality, human ratings, Natural Language Processing, learner corpus},
PAGES = {7--34},
URL = {https://www.ai-lc.it/wp-content/uploads/2023/09/IJCOL_9_1_1_cerulli_et_al.pdf},
VOLUME = {9},
NUMBER = {1},
DOI = {10.4000/ijcol.1104},
ISSN = {2499-4553},
JOURNAL = {IJCOL},
}
@ARTICLE{CHIARELLA_2023_ARTICLE_C_459849,
AUTHOR = {Chiarella, D.},
TITLE = {Towards {Multi-AUV} Collaboration and Coordination: A Gesture-Based {Multi-AUV} Hierarchical Language and a Language Framework Comparison System},
YEAR = {2023},
ABSTRACT = {The underwater environment is a harmful environment, yet one of the richest and least exploited. For these reasons the idea of a robotic companion with the task of supporting and monitoring divers during their activities and operations has been proposed. However, the idea of a platoon of robots at the diver's disposal has never been fully addressed in these proposals due to the high cost of implementation and the usability, weight and bulk of the robots. Nevertheless, recent advancements in swarm robotics, materials engineering, deep learning, and the decreasing cost of autonomous underwater vehicles (AUVs), have rendered this concept increasingly viable. Therefore, this paper introduces, in the first part, a novel framework that integrates a revised version of a gesture-based language for underwater human-robot interaction (Caddian) based on insights gained from extensive field trials. The newly introduced objective of this framework is to enable the cooperation and coordination of an AUV team by one or more human operators, while allowing a human operator to delegate a robot leader to instruct the other robotic team members. The work, in the second part, provides an evaluation of the new language proposed thanks to a fifty million sentence corpus and describes a comparison framework, which is used to estimate it with respect to other existing underwater human-robot interaction languages},
KEYWORDS = {gesture-based language, underwater human-robot interaction, multi-AUV collaboration, language corpora and resources},
PAGES = {1208},
PAGETOTAL = {28},
URL = {https://www.mdpi.com/2077-1312/11/6/1208},
VOLUME = {11},
NUMBER = {6},
DOI = {10.3390/jmse11061208},
ISSN = {2077-1312},
JOURNAL = {JOURNAL OF MARINE SCIENCE AND ENGINEERING},
}
@ARTICLE{ERJAVEC_2023_ARTICLE_EOOLSPRKBSCDDAVPDNLCRMKDRVMF_448001,
AUTHOR = {Erjavec, T. and Ogrodniczuk, M. and Osenova, P. and Ljubesic, N. and Simov, K. and Pancur, A. and Rudolf, M. and Kopp, M. and Barkarson, S. and Steingrimsson, S. and Coltekin, C. and De Does, J. and Depuydt, K. and Agnoloni, T. and Venturi, G. and Perez, M. C. and De Macedo, L. D. and Navarretta, C. and Luxardo, G. and Coole, M. and Rayson, P. and Morkevicius, V. and Krilavicius, T. and Dargis, R. and Ring, O. and Van Heusden, R. and Marx, M. and Fiser, D.},
TITLE = {The {ParlaMint} corpora of parliamentary proceedings},
YEAR = {2023},
ABSTRACT = {This paper presents the ParlaMint corpora containing transcriptions of the sessions of the 17 European national parliaments with half a billion words. The corpora are uniformly encoded, contain rich meta-data about 11 thousand speakers, and are linguistically annotated following the Universal Dependencies formalism and with named entities. Samples of the corpora and conversion scripts are available from the project's GitHub repository, and the complete corpora are openly available via the CLARIN.SI repository for download, as well as through the NoSketch Engine and KonText concordancers and the Parlameter interface for on-line exploration and analysis},
KEYWORDS = {Parliamentary proceedings, Linguistic annotation, Universal Dependencies},
PAGES = {1--34},
URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-85124105199&origin=inward},
DOI = {10.1007/s10579-021-09574-0},
ISSN = {1574-020X},
JOURNAL = {LANGUAGE RESOURCES AND EVALUATION},
}
@ARTICLE{FAVARO_2023_ARTICLE_FBM_526790,
AUTHOR = {Favaro, M. and Biffi, M. and Montemagni, S.},
TITLE = {{POS} tagging and lemmatization of historical varieties of languages. The challenge of old {Italian}},
YEAR = {2023},
ABSTRACT = {The paper discusses the challenges of POS tagging and lemmatization of historical varieties of Italian, and reports for both tasks the results of experiments carried out in a classical supervised domain adaptation scenario using the diachronic and typologically differentiated corpus built for the "Vocabolario Dinamico dell’Italiano Moderno" (VoDIM). For what concerns POS tagging, the effectiveness of retrained models is illustrated and substantiated with quantitative data, with a specific view to linguistic annotation results obtained with respect to specific language evolution stages, domains and textual genres. For lemmatization, different customized models have been developed, including lexicon-assisted ones and models retrained with historical annotated texts. In both cases, a detailed error analysis is provided},
KEYWORDS = {Historical Varieties of Italian, POS-Tagging, Lemmatization},
PAGES = {99--120},
URL = {https://journals.openedition.org/ijcol/1325},
VOLUME = {9},
NUMBER = {2},
DOI = {10.4000/ijcol.1325},
ISSN = {2499-4553},
JOURNAL = {IJCOL},
}
@ARTICLE{FOLESANI_2023_ARTICLE_FBPTMTZNCBRDCG_460174,
AUTHOR = {Folesani, F. and Belvederi Murri, M. and Puggioni, C. and Tiberto, E. and Marella, M. and Toffanin, T. and Zerbinati, L. and Nanni, M. G. and Caruso, R. and Brunato, D. and Ravelli, A. A. and Dell'Orletta, F. and Chochinov, H. M. and Grassi, L.},
TITLE = {Linguistic markers of demoralization improvement in schizophrenia: A pilot study},
YEAR = {2023},
ABSTRACT = {Background and objectives: Individuals with schizophrenia display language impairments involving pragmatics, semantics and syntax. Language impairments may show diagnostic specificity and could relate to the ability of engaging in psychotherapy. This pilot study sought to: (1) identify linguistic features that might differentiate individuals with schizophrenia from distressed controls without psychotic symptoms; and (2) examine the association between linguistic abilities and clinical changes during psychotherapy. Methods: We recruited patients with schizophrenia and a comparison group of individuals with demoralization and distress due to cancer. Participants underwent Dignity Therapy (DT), an existentially-oriented brief psychotherapy focused on legacy and subjective dignity. Verbatim transcripts of the DT sessions were analysed using Natural Language Processing (NLP). In addition, we measured changes in levels of demoralization and dignity-related distress before and after DT, exploring the association with linguistic variables with network analysis. Results: Patients with schizophrenia could be differentiated from those with cancer-related distress using only three out of 141 linguistic variables: total number of words, number of prepositional chains and conversational elements. Across groups, better levels of discourse coherence and higher number of arguments controlled by a predicate (verb "arity") were associated with larger improvements in demoralization and, indirectly, dignity-related distress. Conclusions: Reproducible linguistic markers may be able to differentiate individuals with schizophrenia from those with less severe psychopathology, and to predict better uptake of psychotherapy independent from diagnosis. Future studies should explore whether linguistic features derived from NLP may be exploited as accessible diagnostic or prognostic markers to tailor psychotherapy and other interventions in schizophrenia},
KEYWORDS = {Schizophrenia, Dignity Therapy, Natural Language Processing, Linguistic Profiling, Psychotherapy},
URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-85153800425&origin=inward},
DOI = {10.1016/j.ejpsy.2023.03.001},
ISSN = {0213-6163},
JOURNAL = {EUROPEAN JOURNAL OF PSYCHIATRY},
}
@ARTICLE{GUADAGNINI_2023_ARTICLE_G_454365,
AUTHOR = {Guadagnini, E.},
TITLE = {Una breve storia del 'cadavere': caduti latini, corpi morti romanzi e una postilla dantesca},
YEAR = {2023},
ABSTRACT = {The designations of death, dying, and the dead have been extensively studied, especially since they are often subject to linguistic taboo and are therefore named through euphemisms and dysphemisms. This contribution will reconstruct the history of the lexical type cadaver, in parallel with corpus (mortuum), from ancient Latin to modern Romance languages: the 'X-phemic' model will be discussed, but the study will adopt a semasiological perspective},
KEYWORDS = {Lexicology, Romance Linguistics, Corpse, Dante Alighieri, Corpo morto},
PAGES = {129--152},
URL = {https://edizionicafoscari.unive.it/en/edizioni4/riviste/transcript/2023/2/una-breve-storia-del-cadavere-caduti-latini-corpi/},
VOLUME = {2},
NUMBER = {2},
DOI = {10.30687/TranScript/2785-5708/2023/04/001},
ISSN = {2785-5708},
JOURNAL = {TRANSCRIPT},
}
@ARTICLE{LENATTI_2023_ARTICLE_LPOFM_418837,
AUTHOR = {Lenatti, M. and Paglialonga, A. and Orani, V. and Ferretti, M. and Mongelli, M.},
TITLE = {Characterization of synthetic health data using rule-based artificial intelligence models},
YEAR = {2023},
ABSTRACT = {The aim of this study is to apply and characterize eXplainable AI (XAI) to assess the quality of synthetic health data generated using a data augmentation algorithm. In this exploratory study, several synthetic datasets are generated using various configurations of a conditional Generative Adversarial Network (GAN) from a set of 156 observations related to adult hearing screening. A rule-based native XAI algorithm, the Logic Learning Machine, is used in combination with conventional utility metrics. The classification performance in different conditions is assessed: models trained and tested on synthetic data, models trained on synthetic data and tested on real data, and models trained on real data and tested on synthetic data. The rules extracted from real and synthetic data are then compared using a rule similarity metric. The results indicate that XAI may be used to assess the quality of synthetic data by (i) the analysis of classification performance and (ii) the analysis of the rules extracted on real and synthetic data (number, covering, structure, cut-off values, and similarity). These results suggest that XAI can be used in an original way to assess synthetic health data and extract knowledge about the mechanisms underlying the generated data},
KEYWORDS = {Synthetic data, Auditory system, Data models, Biomedical measurement, eXplainable AI (XAI), hearing screening, rule similarity, Generative Adversarial Networks (GAN), data augmentation, rule-based models},
PAGES = {3760--3769},
URL = {https://ieeexplore.ieee.org/document/10016704},
VOLUME = {27},
NUMBER = {8},
DOI = {10.1109/JBHI.2023.3236722},
ISSN = {2168-2194},
JOURNAL = {IEEE JOURNAL OF BIOMEDICAL AND HEALTH INFORMATICS},
}
@ARTICLE{LUZIETTI_2023_ARTICLE_LM_532872,
AUTHOR = {Luzietti, R. B. and Meluzzi, C.},
TITLE = {A sociophonetic approach to stop consonant production in a {Sardinian} {Italian} community in {Yorkshire}},
YEAR = {2023},
ABSTRACT = {This research contributes to the study of phonetic attrition and the processes of construction and maintenance of speakers’ sociolinguistic identity in migratory settings. This preliminary work focuses on Sardinian immigrants in York (UK), by analysing the maintenance or loss of characteristic phonetic features of their Sardinian Italian, in particular stop consonants. Despite these limitations, the results of the acoustic analysis show that maintaining linguistic skills in Sardinian local varieties in migration settings is important for the resistance of Sardinian stop consonants to phonetic attrition. Furthermore, being members of Sardinian communities and speakers of Sardinian is critical for maintaining speakers’ identities, especially in multilingual and multicultural environments},
KEYWORDS = {consonants, linguistic variation, phonetic attrition, Sardinian Italian, sociophonetics},
PAGES = {271--288},
URL = {https://iris.cnr.it/handle/20.500.14243/532872},
VOLUME = {4},
NUMBER = {3},
DOI = {10.1558/jmbs.23094},
ISSN = {2631-8407},
JOURNAL = {JOURNAL OF MONOLINGUAL AND BILINGUAL SPEECH},
}
@ARTICLE{MAGNANI_2023_ARTICLE_MCDBCILMTMASAACSCPMETMBRCFGMMMPRS_460175,
AUTHOR = {Magnani, L. and Carmisciano, L. and Dell'Orletta, F. and Bettinardi, O. and Chiesa, S. and Imbesi, M. and Limonta, G. and Montagna, E. and Turone, I. and Martinasso, D. and Aguglia, A. and Serafini, G. and Amore, M. and Amerio, A. and Costanza, A. and Sibilla, F. and Calcagno, P. and Patti, S. and Molino, G. and Escelsior, A. and Trabucco, A. and Marzano, L. and Brunato, D. and Ravelli, A. A. and Cappucciati, M. and Fiocchi, R. and Guerzoni, G. and Maravita, D. and Macchetti, F. and Mori, E. and Paglia, C. A. and Roscigno, F. and Saginario, A.},
TITLE = {Linguistic profile automated characterisation in pluripotential clinical high-risk mental state ({CHARMS}) conditions: methodology of a multicentre observational study},
YEAR = {2023},
ABSTRACT = {Introduction Language is usually considered the social vehicle of thought in intersubjective communications. However, the relationship between language and high-order cognition seems to evade this canonical and unidirectional description (ie, the notion of language as a simple means of thought communication). In recent years, clinical high at-risk mental state (CHARMS) criteria (evolved from the Ultra-High-Risk paradigm) and the introduction of the Clinical Staging system have been proposed to address the dynamicity of early psychopathology. At the same time, natural language processing (NLP) techniques have greatly evolved and have been successfully applied to investigate different neuropsychiatric conditions. The combination of at-risk mental state paradigm, clinical staging system and automated NLP methods, the latter applied on spoken language transcripts, could represent a useful and convenient approach to the problem of early psychopathological distress within a transdiagnostic risk paradigm. Methods and analysis Help-seeking young people presenting psychological distress (CHARMS /-and Clinical Stage 1a or 1b; target sample size for both groups n=90) will be assessed through several psychometric tools and multiple speech analyses during an observational period of 1-year, in the context of an Italian multicentric study. Subjects will be enrolled in different contexts: Department of Neuroscience, Rehabilitation, Ophthalmology, Genetics, Maternal and Child Health (DINOGMI), Section of Psychiatry, University of Genoa-IRCCS Ospedale Policlinico San Martino, Genoa, Italy; Mental Health Department-territorial mental services (ASL 3-Genoa), Genoa, Italy; and Mental Health Department-territorial mental services (AUSL-Piacenza), Piacenza, Italy.
The conversion rate to full-blown psychopathology (CS 2) will be evaluated over 2 years of clinical observation, to further confirm the predictive and discriminative value of CHARMS criteria and to verify the possibility of enriching them with several linguistic features, derived from a fine-grained automated linguistic analysis of speech. Ethics and dissemination The methodology described in this study adheres to ethical principles as formulated in the Declaration of Helsinki and is compatible with International Conference on Harmonization (ICH)-good clinical practice. The research protocol was reviewed and approved by two different ethics committees (CER Liguria approval code: 591/2020-id. 10993; Comitato Etico dell'Area Vasta Emilia Nord approval code: 2022/0071963). Participants will provide their written informed consent prior to study enrolment and parental consent will be needed in the case of participants aged less than 18 years old. Experimental results will be carefully shared through publication in peer-reviewed journals, to ensure proper data reproducibility},
KEYWORDS = {Clinical High At Risk Mental State, Natural Language Processing, Linguistic profiling, Depression},
URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-85150775470&origin=inward},
VOLUME = {13},
DOI = {10.1136/bmjopen-2022-066642},
ISSN = {2044-6055},
JOURNAL = {BMJ OPEN},
}
@ARTICLE{MARZI_2023_ARTICLE_MMV_452198,
AUTHOR = {Marzi, C. and Melloni, C. and Vender, M.},
TITLE = {Finger-tracking reading profiles in monolingual and bilingual early graders},
YEAR = {2023},
ABSTRACT = {In this paper we propose an analysis of the reading behaviour of a group of Italian monolingual (n= 24) and bilingual (n= 35) 2nd schoolgraders, engaged in the tasks of reading aloud lists of isolated words and nonwords (from the DDE-2 test battery), as well as narrative connected texts displayed on the touch-screen of a common tablet, to be read either aloud or silently. A finger-tracking technique is illustrated, which provides detailed information about the reading behaviour and attention focus of early graders. Our results reveal various differences between groups. In particular, a different tracking pattern emerged in reading long, morphologically-complex word forms, correlating with a higher decoding error rate and comprehension difficulties in bilingual children compared with their monolingual peers. We suggest that the unsteady, discontinuous reading pattern for long noun and verb forms may be due to a (proto)-morphological reading strategy, with monolingual children being more successful in benefiting from a morpheme-based reading route. We also discuss the potentials of the finger-tracking technique as a tool to offer a more profound and comprehensive analysis of the reading profiles of both monolingual and bilingual readers},
KEYWORDS = {developing readers, bilingualism, L2 literacy, connected text reading, morphological processing, finger-tracking},
PAGES = {327--361},
URL = {https://www.rivisteweb.it/doi/10.1418/109051},
VOLUME = {XXII},
NUMBER = {2},
DOI = {10.1418/109051},
ISSN = {1720-9331},
JOURNAL = {LINGUE E LINGUAGGIO},
}
@ARTICLE{MARZI_2023_ARTICLE_MP_462114,
AUTHOR = {Marzi, C. and Pirrelli, V.},
TITLE = {A discriminative information-theoretical analysis of the regularity gradient in inflectional morphology},
YEAR = {2023},
ABSTRACT = {Over the last decades, several independent lines of research in morphology have questioned the hypothesis of a direct correspondence between sublexical units and their mental correlates. Word and paradigm models of morphology shifted the fundamental part-whole relation in an inflection system onto the relation between individual inflected word forms and inflectional paradigms. In turn, the use of artificial neural networks of densely interconnected parallel processing nodes for morphology learning marked a radical departure from a morpheme-based view of the mental lexicon. Lately, in computational models of Discriminative Learning, a network architecture has been combined with an uncertainty reducing mechanism that dispenses with the need for a one-to-one association between formal contrasts and meanings, leading to the dissolution of a discrete notion of the morpheme. The paper capitalises on these converging lines of development to offer a unifying information-theoretical, simulation-based analysis of the costs incurred in processing (ir)regularly inflected forms belonging to the verb systems of English, German, French, Spanish and Italian. Using Temporal Self-Organising Maps as a computational model of lexical storage and access, we show that a discriminative, recurrent neural network, based on Rescorla-Wagner's equations, can replicate speakers' exquisite sensitivity to widespread effects of word frequency, paradigm entropy and morphological (ir)regularity in lexical processing. The evidence suggests an explanatory hypothesis linking Word and paradigm morphology with principles of information theory and human perception of morphological structure. According to this hypothesis, the ways more or less regularly inflected words are structured in the mental lexicon are more related to a reduction in processing uncertainty and maximisation of predictive efficiency than to economy of storage},
KEYWORDS = {Morphological inflection, Morphological regularity, Prediction-driven processing, Discriminative learning, Lexical self-organisation, Gradient structure, Information theory, Non-linear modelling},
PAGES = {1--51},
URL = {https://doi.org/10.1007/s11525-023-09415-6},
DOI = {10.1007/s11525-023-09415-6},
ISSN = {1871-5621},
JOURNAL = {MORPHOLOGY (DORDRECHT)},
}
@ARTICLE{MAZZARINO_2023_ARTICLE_MM_460281,
AUTHOR = {Mazzarino, S. and Marzi, C.},
TITLE = {Morphological processing in {Italian} {L2} developing readers: a pilot study},
YEAR = {2023},
ABSTRACT = {In this paper we focus on the morphological competence and awareness of 23 Italian second-language (L2) school children, by comparing the reading profiles of Italian L1 and L2 children attending primary school from 2nd to 5th grades. Reading data were collected through the experimental finger-tracking protocol developed within the ReadLet project, which supports collecting and structuring behavioural reading data of short narrative texts displayed on a tablet touch-screen. The analyses reproduced the main effects that are well-attested in the developmental literature, and pointed out some differences in the behavioural profile of L2 versus L1 children, with the former being more affected by word length and frequency effects, as well as by the aloud reading task than the latter. Interestingly, however, a functional morphological segmentation strategy emerges in L2 readers processing complex inflected forms during the aloud reading task. We interpret it as a possible strategy to alleviate the extra cognitive load associated with the overt articulation of morphologically complex words within the context of a connected text},
KEYWORDS = {reading, bilingualism, morphological awareness, developing readers, word processing},
PAGES = {143--166},
URL = {https://iris.cnr.it/handle/20.500.14243/460281},
VOLUME = {XXII},
NUMBER = {1},
DOI = {10.1418/107679},
ISSN = {1720-9331},
JOURNAL = {LINGUE E LINGUAGGIO},
}
@ARTICLE{MELUZZI_2023_ARTICLE_MLN_532876,
AUTHOR = {Meluzzi, C. and Luzietti, R. B. and Nese, N.},
TITLE = {Considerazioni preliminari per una ricerca sociolinguistica sul sardo di migrazione nel Biellese},
YEAR = {2023},
ABSTRACT = {The paper deals with a preliminary sociolinguistic analysis of a corpus of first-generation Sardinian speakers who migrated to Biella, an Alpine Valley in the north-west of Italy. The data have been collected through ethnographic interviews with either single speakers or married couples who migrated from Sardinia. The analysis is conducted on the linguistic repertoires and linguistic uses emerging from the recorded interactions and on the phonetic variability of the vowel space in some selected speakers. The results show that Sardinian varieties are preserved within families but not transmitted to the youngest generations of migrants},
KEYWORDS = {Linguistic Identity, Sardinian, Sociolinguistics of migration, Sociophonetics},
PAGES = {103--124},
URL = {https://iris.cnr.it/handle/20.500.14243/532876},
VOLUME = {28},
DOI = {10.5565/rev/qdi.581},
ISSN = {2014-8828},
JOURNAL = {QUADERNS D'ITALIÀ},
}
@ARTICLE{MIASCHI_2023_ARTICLE_MABDV_439018,
AUTHOR = {Miaschi, A. and Alzetta, C. and Brunato, D. and Dell'Orletta, F. and Venturi, G.},
TITLE = {Testing the Effectiveness of the Diagnostic Probing Paradigm on Italian Treebanks},
YEAR = {2023},
ABSTRACT = {The outstanding performance recently reached by neural language models (NLMs) across many natural language processing (NLP) tasks has steered the debate towards understanding whether NLMs implicitly learn linguistic competence. Probes, i.e., supervised models trained using NLM representations to predict linguistic properties, are frequently adopted to investigate this issue. However, it is still questioned if probing classification tasks really enable such investigation or if they simply hint at surface patterns in the data. This work contributes to this debate by presenting an approach to assessing the effectiveness of a suite of probing tasks aimed at testing the linguistic knowledge implicitly encoded by one of the most prominent NLMs, BERT. To this aim, we compared the performance of probes when predicting gold and automatically altered values of a set of linguistic features. Our experiments were performed on Italian and were evaluated across BERT's layers and for sentences with different lengths. As a general result, we observed higher performance in the prediction of gold values, thus suggesting that the probing model is sensitive to the distortion of feature values. However, our experiments also showed that the length of a sentence is a highly influential factor that is able to confound the probing model's predictions},
KEYWORDS = {Neural language model, Probing tasks, Treebanks},
PAGES = {19},
URL = {https://www.mdpi.com/2078-2489/14/3/144},
VOLUME = {14},
NUMBER = {3},
DOI = {10.3390/info14030144},
ISSN = {2078-2489},
JOURNAL = {INFORMATION},
}
@ARTICLE{MURANO_2023_ARTICLE_MQDRZ_459322,
AUTHOR = {Murano, F. and Quochi, V. and Del Grosso, A. M. and Rigobianco, L. and Zinzi, M.},
TITLE = {Describing Inscriptions of Ancient Italy. The ItAnt Project and Its Information Encoding Process},
JOURNAL = {JOURNAL ON COMPUTING AND CULTURAL HERITAGE},
YEAR = {2023},
VOLUME = {16},
PAGES = {15},
DOI = {10.1145/3606703},
URL = {https://dl.acm.org/doi/pdf/10.1145/3606703},
ISSN = {1556-4711},
KEYWORDS = {text encoding, ancient languages, digital epigraphy, TEI/EpiDoc},
ABSTRACT = {This paper discusses the challenges addressed in the digital scholarly encoding of the fragmentary texts of the languages of Ancient Italy according to the TEI/EpiDoc Guidelines in XML format. This contribution describes the solutions and customisations that have been adopted for dealing with the peculiarities of our epigraphical documentation and with the formalisation of epigraphical information deemed interesting for data retrieval in a historical linguistic perspective. The making of a digital corpus consisting of new critical editions of selected inscriptions is a work carried out in the context of the project "Languages and Cultures of Ancient Italy. Historical Linguistics and Digital Models", which aims to investigate the languages of Ancient Italy by combining the traditional methods, proper to historical linguistics, with methods and technologies proper to the digital humanities and computational lexicography. More specifically, the purpose of the project is to create a collection of interrelated digital language resources which comprise: 1) the digital corpus of texts editions; 2) a computational lexicon compliant with the Web Semantic requirements; 3) a relevant bibliographic reference dataset encoded according to the FRBRoo/LRMoo specifications. Additionally, selected textual data and scientific interpretations will be encoded by using CIDOC CRM and its extensions, namely CRMtex and CRMinf. The present contribution tackles one of the main aspects of the project, and proposes significant innovations in the encoding of critical editions for epigraphic texts of fragmentary languages, which will hopefully foster future interoperability and integration with other external datasets, a paramount concern of the project},
}
@ARTICLE{NADALINI_2023_ARTICLE_NMFTLCP_501822,
AUTHOR = {Nadalini, A. and Marzi, C. and Ferro, M. and Taxitari, L. and Lento, A. and Crepaldi, D. and Pirrelli, V.},
TITLE = {Eye-voice and finger-voice spans in adults’ oral reading of connected texts},
YEAR = {2023},
ABSTRACT = {The present paper investigates the interaction between eye movements, voice articulation and the movements of the index finger dynamically pointing to a text line in oral finger-point reading of Italian. During finger-point reading, the finger appears to be ahead of the voice most of the times, by a margin that is significantly modulated by the distribution of phrasal and prosodic units in the reading text. Eye movements replicate the same effects on a different time scale. The eye is ahead of both voice and finger by a wide margin (confirming evidence observed for English and German sentence reading), while showing a tendency to re-synchronise with voice articulation at the right edge of strong prosodic units (sentence boundaries). Our evidence suggests a multicomponent view of the time span between the eye/finger and the voice. The span is shown to be the dynamic outcome of an optimally adaptive reading strategy, resulting from the interaction between individual decoding skills, the reader's phonological buffer capacity, and the structural complexity of a reading text. Proficient readers modulate their span to compensate for the different timing between word fixation and word articulation, read faster, and dynamically adjust their processing window to the meaningful, prosodic units of a text},
KEYWORDS = {finger-point reading, eye-tracking, finger-tracking, eye-voice span, finger-voice span, eye-finger coordination, parallel processing, working memory, phonological buffer, adaptive reading},
PAGES = {366--400},
URL = {https://benjamins.com/catalog/ml.00025.nad},
VOLUME = {18},
NUMBER = {3},
DOI = {10.1075/ml.00025.nad},
ISSN = {1871-1340},
JOURNAL = {THE MENTAL LEXICON},
}
@ARTICLE{PICCINI_2023_ARTICLE_PVB_519860,
AUTHOR = {Piccini, S. and Vezzani, F. and Bellandi, A.},
TITLE = {TBX and lemon: What Perspectives in Terminology?},
YEAR = {2023},
ABSTRACT = {Different solutions are offered today for modelling multilingual terminological data. In this article, we focus on the description of two approaches: on the one hand, the model proposed in the context of ISO TC 37/SC 3, based on the adoption of the Terminological Markup Framework/TermBase eXchange standards; on the other hand, the ‘Lemon’ model and, more generally, the Ontology Web Language adopted in the framework of the Semantic Web. The aim of this study is to propose a contrastive multilevel analysis between these two paradigms, with the ultimate goal of highlighting their divergences and convergences. The terminological case study chosen to test the two approaches is represented by the pathology known as ‘body dysmorphic disorder’, which poses challenges in terms of conceptual and linguistic representation. Starting from the phenomena of reconceptualization and denominative variation of this disorder, we will show that the two models are based on diverging but complementary theoretical and methodological perspectives},
KEYWORDS = {TBX, Lemon, Terminology},
PAGES = {i61--i72},
URL = {https://academic.oup.com/dsh/article/38/Supplement_1/i61/7203991},
VOLUME = {38},
NUMBER = {Supplement 1},
DOI = {10.1093/llc/fqad025},
ISSN = {2055-768X},
JOURNAL = {DIGITAL SCHOLARSHIP IN THE HUMANITIES},
}
@ARTICLE{PROIETTI_2023_ARTICLE_PC_519990,
AUTHOR = {Proietti, C. and Chiarella, D.},
TITLE = {Corrigendum to ‘The Role of Argument Strength and Informational Biases in Polarization and Bi-Polarization Effects’ (Journal of Artificial Societies and Social Simulation, (2023), 26, 2, 5, 10.18564/jasss.5164)},
YEAR = {2023},
ABSTRACT = {This corrigendum refers to ‘The Role of Argument Strength and Informational Biases in Polarization and Bi-Polarization Effects’, Journal of Artificial Societies and Social Simulation, 26 (2) 5, 2023},
KEYWORDS = {Argument Communication Theory, Argumentation, Bi-Polarization, Epistemic Vigilance, Opinion Dynamics, Polarization},
URL = {https://iris.cnr.it/handle/20.500.14243/519990},
VOLUME = {26},
NUMBER = {3},
DOI = {10.18564/jasss.5164},
ISSN = {1460-7425},
JOURNAL = {JASSS},
}
@ARTICLE{PROIETTI_2023_ARTICLE_PC_433900,
AUTHOR = {Proietti, C. and Chiarella, D.},
TITLE = {The Role of Argument Strength and Informational Biases in Polarization and Bi-Polarization Effects},
YEAR = {2023},
ABSTRACT = {This simulation research explores the informational causes of polarization and bi-polarization of opinions within groups. We define 'polarization' here as a uniform change of the opinion of the whole group in the same direction, whereas 'bi-polarization' indicates a split of two subgroups towards opposite directions. For our purposes, we have expanded the model of the Argument Communication Theory of Bi-polarization. This is an argument-based multi-agent model of opinion dynamics inspired by Persuasive Argument Theory. The original model accounts for polarization as an outcome of pure informational influence and reproduces bipolarization effects by postulating an additional mechanism of homophilous selection of communication partners. The expanded model adds two dimensions: i.e., argument strength and more sophisticated protocols of informational influence (argument communication and opinion update). Adding the first dimension, allows us to investigate whether and how the presence of stronger or weaker arguments in a discussion influences polarization and bi-polarization dynamics, as suggested by the original framework of Persuasive Arguments Theory. The second feature allows us to test whether other mechanisms related to confirmation bias and epistemic vigilance can act as a driving force of bi-polarization. For the first issue, our simulations showed that argument strength has a measurable effect. For the second, our results would indicate that, in absence of homophily, only very strong types of informational bias can lead to bi-polarization},
KEYWORDS = {Argumentation, Argument Communication Theory, Polarization, Bi-Polarization, Epistemic Vigilance, Opinion dynamics},
PAGES = {25},
URL = {https://www.jasss.org/26/2/5.html},
VOLUME = {26},
NUMBER = {2},
DOI = {10.18564/jasss.5062},
ISSN = {1460-7425},
JOURNAL = {JASSS},
}
@ARTICLE{PROVOST_2023_ARTICLE_PDTDBC_474443,
AUTHOR = {Provost, L. and Di Donato, F. and Tóth Czifra, E. and Dumouchel, S. and Blotière, E. and Chen, Y.},
TITLE = {Open Science Training in TRIPLE},
YEAR = {2023},
ABSTRACT = {This case study focuses on the online training activities on Open Science delivered within the H2020 project Transforming Research through Innovative Practices for Linked Interdisciplinary Exploration (TRIPLE, Grant Agreement 863420). The project is dedicated to building a discovery platform for the Social Sciences and Humanities (SSH) and is committed to promoting and supporting the uptake of Open Science within research practices. In order to address SSH research and training communities' needs for enhanced competencies on Open Science and for stronger support in the Findable, Accessible, Interoperable, Reusable (FAIR) management of digital training materials, two reusable outputs were produced. The work carried out is presented as a novel approach to tackle the issues related to FAIRifying research and training practices and to create training resources whose reusability and relevance reaches beyond the project lifetime and framework. The case study presents the methods by which the results were produced so as to encourage and enable their future adaptation and reuse. The TRIPLE Open Science training series (result 1) targets SSH researchers, research support personnel and infrastructure developers in need of practical tools and specific skills to integrate Open Science practices in their workflows. The training series provides 12 competence-oriented online training events in Open Access whose training materials are available as Open Educational Resources (OER). The TRIPLE Training Toolkit (result 2) targets training organisers and research performing organisations who wish to design and manage training events as OERs and increase the impact of their training following good practice. The Toolkit is an easily reproducible workflow designed to help trainers minimise the time they spend in managing training events following FAIR practice. The workflow follows a FAIR-by-design method to address the frequent findability and reusability issues related to the management of digital training resources},
KEYWORDS = {EOSC, FAIR data, Open Science, Project management, Scholarly practice, Training and education},
URL = {https://open-research-europe.ec.europa.eu/articles/3-39},
VOLUME = {3},
DOI = {10.12688/openreseurope.15430.2},
ISSN = {2732-5121},
JOURNAL = {OPEN RESEARCH EUROPE},
}
@ARTICLE{SCIOLETTE_2023_ARTICLE_SMG_462840,
AUTHOR = {Sciolette, F. and Marchi, S. and Giovannetti, E.},
TITLE = {LexicO: an Italian Computational Lexicon derived from Parole-Simple-Clips},
YEAR = {2023},
ABSTRACT = {Parole-Simple-Clips (PSC) is a computational lexicon of the Italian language, developed from 1996 to 2003 by the Institute of Computational Linguistics of the Italian National Research Council (ILC-CNR) in the context of national and European projects. The PSC resource is strongly structured, rich of data, and, for its features, may provide an edge if used in the support of text retrieval related tasks, such as full-text search. However, the lexicon still appears incomplete and presents some redundant, erroneous and missing data. This paper documents the first steps undertaken for the creation of LexicO, an Italian computational lexicon built upon PSC starting from an in depth analysis of its four linguistic layers (semantic, syntactic, morphological, and phonological) in which it is structured. As a result of this work, LexicO has been released and made freely available},
KEYWORDS = {Computational Lexicon, Parole-Simple-Clips, Linguistic Resources, Full-text Search, LexicO},
PAGES = {24},
URL = {https://iris.cnr.it/handle/20.500.14243/462840},
VOLUME = {15},
DOI = {10.6092/issn.2532-8816/15176},
ISSN = {2532-8816},
JOURNAL = {UMANISTICA DIGITALE},
}
@ARTICLE{SOLSALES_2023_ARTICLE_SAMD_439019,
AUTHOR = {Solà Sales, S. and Alzetta, C. and Moret Tatay, C. and Dell'Orletta, F.},
TITLE = {Analysing Deception in Witness Memory Through Linguistic Styles in Spontaneous Language},
YEAR = {2023},
ABSTRACT = {The act of lying and its detection have raised interest in many fields, from the legal system to our daily lives. Considering that testimonies are commonly based on linguistic parameters, natural language processing, a research field concerned with programming computers to process and analyse natural language texts or speech, is a topic of interest on this front. This study aimed to examine the linguistic styles of simulated deception and true testimonies collected with the aim of studying witness memory. Study participants were asked to act as a witness of a crime by retelling the story they had just read. Cognitive interviewing techniques were used to collect testimony under two conditions: truth and simulated deception. A sample of 48 participants volunteered to participate in the study. Analyses of the linguistic indicators and content were carried out. Specifically, we performed a comparison of testimonies of the same participant by condition to analyse the variation between (i) lexical and (ii) linguistic features and (iii) content and speech characteristics (disfluencies) depending on the narrative condition. Concerning lexical properties, adjectives were the most-varying grammatical category between truthful and deceptive testimonies. Furthermore, in the linguistic analysis, we observed that truthful testimonies were generally longer than deceptive ones in terms of the number of words and sentences and also characterised by more articulated sentence structures, and these differences were also statistically significant. Regarding the analysis of the content, cognitive criteria (details) and admitting lack of memory were more present in truthful statements. By providing an objective measure, these results are of interest in developing NLP tools for assessing the credibility of testimonies in forensics},
KEYWORDS = {Natural language processing, Simulated deception, Stylometric analysis},
PAGES = {26},
URL = {https://www.mdpi.com/2076-3425/13/2/317},
VOLUME = {13},
NUMBER = {2},
DOI = {10.3390/brainsci13020317},
ISSN = {2076-3425},
JOURNAL = {BRAIN SCIENCES},
}
@ARTICLE{VENUTIMARTINA_2023_ARTICLE_VDBTPBCM_459802,
AUTHOR = {Venuti Martina, C. and Del Grosso, A. M. and Boschetti, F. and Tessarolo, L. and Prontera, A. and Bovet, D. and Cattaneo, G. and Melis, V.},
TITLE = {La 'Galassia MQDQ': un concetto di filologia tradizionale, digitale, sostenibile},
YEAR = {2023},
ABSTRACT = {The investigation of intertextuality within a corpus of Latin poetry is the main objective of the research functions of the so-called 'Musisque Deoque Galaxy': formular recurrences, and lexical and metric-verbal co-occurrences draw a dense network of relationships between texts, where poetic memory presents itself in various modalities. This contribution aims to analyse the latest developments in the "Musisque Deoque Galaxy" both from the point of view of the tools created to enable new textual acquisitions and new analyses, and from the technological point of view, with reference to the work carried out to ensure a long-term sustainability},
KEYWORDS = {Digital textual corpora, Domain Specific Languages (DSL), Sustainability, Latin poetry, Carmina Latina Epigraphica, MQDQ Galaxy},
PAGES = {71--120},
URL = {https://iris.cnr.it/handle/20.500.14243/459802},
VOLUME = {4},
NUMBER = {1},
DOI = {10.30687/mag/2724-3923/2023/07/003},
ISSN = {2724-3923},
JOURNAL = {MAGAZÈN},
}
@INCOLLECTION{BOSCHETTI_2023_INCOLLECTION_BBDMKBT_455960,
AUTHOR = {Boschetti, F. and Bambaci, L. and Del Grosso, A. M. and Mugelli, G. and Khan, A. F. A. and Bellandi, A. and Taddei, A.},
TITLE = {Collaborative and multidisciplinary annotations of ancient texts: The Euporia system},
YEAR = {2023},
ABSTRACT = {Euporia is an annotation system originally created to study the ritual dynamics in ancient Greek tragedies from an anthropological perspective. The system is designed to be flexible enough so that it can be easily extended in other directions of multidisciplinary research. The system combines the simplicity of a web interface pared down to its essential elements with the expressivity of a domain-specific language parsed with ANTLR, that avoids the verbosity of general-purpose markup languages (such as XML-TEI) during the annotation phase. In this way, the user is focused on domain-specific tasks by writing concise annotations. Upon exportation of our data, interoperability is ensured by two measures: references to the annotated text are translated from a system based on progressive word numbers to the Canonical Text Services (CTS) system, and the annotations are translated into XML-TEI. An annotation is constituted by a text reference, a condition related to variant readings and interpretations of the same text, as well as by a sequence of tags. Tags are created by following a bottom-up approach: they are progressively introduced and reused by the domain-expert during the annotation process. During revisions, tags are grouped and mapped onto an ontology, in order to enable and to exploit the identification of relations among the tags in querying the annotated corpus. Being designed for interoperability, our approach can be extended to other research fields (e.g. philology, archaeology) through the creation of new domain-specific languages and domain-specific tagsets, in order to improve the functionalities of the Euporia system},
KEYWORDS = {Digital Humanities, Euporia, Domain Specific Languages, CoPhiLab, Digital Philology},
PAGES = {172--223},
URL = {https://iris.cnr.it/handle/20.500.14243/455960},
VOLUME = {6},
DOI = {10.1163/9789004527119_008},
PUBLISHER = {Brill Academic Publishers (Leiden, NLD)},
ISBN = {9789004527119},
CONFERENCE_PLACE = {Leiden},
BOOKTITLE = {The ancient world goes digital: case studies on archaeology, texts, online publishing, digital archiving, and preservation},
EDITOR = {Juloux, V. B. and Di Ludovico, A.},
}
@INCOLLECTION{BOSCHETTI_2023_INCOLLECTION_BD_480246,
AUTHOR = {Boschetti, F. and Del Grosso, A. M.},
TITLE = {La Collaborazione del CoPhiLab (CNR-ILC) con l’Università di Pisa nell’ambito DH},
BOOKTITLE = {Pionieri fra due culture. Informatica umanistica a Pisa in onore di Maria Simi},
EDITOR = {Salvatori, E. and Pelagatti, S. and Mannari, C.},
YEAR = {2023},
VOLUME = {3},
PUBLISHER = {Simonelli Editore (Milano, ITA)},
CONFERENCE_PLACE = {Milano},
ISBN = {9788893203166},
URL = {https://iris.cnr.it/handle/20.500.14243/480246},
KEYWORDS = {Digital Humanities, Informatica Umanistica},
ABSTRACT = {Questo contributo ha lo scopo di presentare un metodo di lavoro collaborativo tra Università di Pisa e Istituto di Linguistica Computazionale “A. Zampolli” (CNR-ILC) che si è consolidato nel tempo grazie alla condivisione di competenze umanistiche, informatiche e ingegneristiche da parte di studiosi e studenti sia per scopi di ricerca che per scopi didattici, in ambienti non solo accademici ma anche aperti all’interazione con il pubblico, come archivi e musei. Dopo aver delineato il contesto nel quale i progetti di rappresentazione e annotazione di documenti storici e letterari sono stati sviluppati, descriviamo le forze in gioco che hanno determinato i vincoli e i requisiti emersi dalle iniziative realizzate. Infine, definiamo i concetti principali del metodo e discutiamo i risultati ottenuti},
}
@INCOLLECTION{BURGASSI_2023_INCOLLECTION_B_474449,
AUTHOR = {Burgassi, C.},
TITLE = {I VOLTI DEL CAOS. Per la storia linguistica di un’idea},
YEAR = {2023},
ABSTRACT = {This paper aims to outline the relationship between the different meanings of the word chaos in the history of the Italian language. Chaos is a word of Greek derivation which is largely used in the nowadays language to express the meaning ‘extreme confusion, disorder’. Other meanings of the term reflecting its Classical – Christian origins (such as ‘abyss, deep’, ‘indistinct mass of matter’ or ‘hell’) are as well attested in the linguistic history of Italian. Particular attention is paid to evaluate how chaos was used in the Middle Ages in comparison to its current usage},
KEYWORDS = {Chao, Old Italian, Historical Semantic, Lexicology},
PAGES = {23--54},
URL = {https://iris.cnr.it/handle/20.500.14243/474449},
DOI = {10.7410/1661},
PUBLISHER = {Consiglio Nazionale delle Ricerche, Istituto di Storia dell’Europa Mediterranea (Cagliari, ITA)},
ISBN = {978-88-97317-81-4},
CONFERENCE_PLACE = {Cagliari},
BOOKTITLE = {STORIE DI IDEE NELL’EUROPA MEDITERRANEA. Trasmissione di parole e saperi nel Medioevo e nella prima Età moderna},
}
@INCOLLECTION{BURGASSI_2023_INCOLLECTION_BG_452840,
AUTHOR = {Burgassi, C. and Guadagnini, E.},
TITLE = {La marcatezza lessicale nella ricostruzione del vocabolario di epoca storica},
YEAR = {2023},
ABSTRACT = {In questo contributo si descrive un possibile impiego del concetto di "marcatezza" nel campo della lessicologia storica. Come è noto, si tratta di un concetto molto ricorrente negli studi ma di difficile definizione e di vario utilizzo, del quale qui si propone un'applicazione specifica. Rispetto a una fase storica della lingua, in una serie di lessemi che risultano "omoionimici" per un significato, la marcatezza può stabilire un ordinamento che, di tali lessemi, rispecchi le relative posizioni nell'architettura del vocabolario. A parità di contenuto denotativo, la marcatezza così concepita valuta la variazione sul piano connotativo, là dove la connotazione non riguarda la competenza linguistica ma è estrapolata dalle caratteristiche di attestazione dei lessemi in un corpus rappresentativo di riferimento. Per sostanziare l'argomentazione portiamo due esempi, il primo relativo al significato 'essere umano nei primi anni di vita', il secondo relativo al significato 'atto di violazione di una norma', nel vocabolario italiano antico},
KEYWORDS = {Lessicologia italiana, Linguistica storica, Marcatezza},
PAGES = {77--94},
URL = {https://amsacta.unibo.it/id/eprint/7465},
DOI = {10.6092/unibo/amsacta/7465},
ISBN = {9788854971264},
BOOKTITLE = {«CLUB Working Papers in Linguistics» Volume 7},
EDITOR = {Cervini, C. and Gagliardi, G.},
}
@INCOLLECTION{CAITIRUSSO_2023_INCOLLECTION_CF_469901,
AUTHOR = {Caiti Russo, G. and Frontini, F.},
TITLE = {Migrazione di testi e di codici manoscritti: risorse digitali per la ricostruzione dell'Occitania medievale},
YEAR = {2023},
ABSTRACT = {This paper offers an overview of the current panorama of digital language resources and approaches to the study of Medieval Occitan. Starting from a scattered tradition of witnesses, Occitan manuscripts are now being digitised in various projects, but not enough has been done to adopt interoperable and shared practices. By drawing from other philological traditions, and in particular the Digital Classics, we trace an inventory of best practices, tools, standards and formats that Digital Occitan Studies needs to develop in order to offer scholars access to Virtual Research environments of linked and interconnected language resources},
KEYWORDS = {Occitan, Digital Philology, Digital Editions, Virtual Research Environments, Occitano, filologia digitale, edizioni digitali, ambienti virtuali di ricerca},
PAGES = {537--568},
URL = {https://iris.cnr.it/handle/20.500.14243/469901},
DOI = {10.7410/1678},
PUBLISHER = {Casalini-ISEM-Istituto di Storia dell'Europa Mediterranea (Cagliari)},
ISBN = {978-88-97317-81-4},
CONFERENCE_PLACE = {Cagliari},
BOOKTITLE = {Storie di idee nell'Europa mediterranea: trasmissione di parole e saperi nel Medioevo e nella prima età moderna},
}
@INCOLLECTION{DRENGUBIAK_2023_INCOLLECTION_DHDF_476003,
AUTHOR = {Drengubiak, J. and Hirsch, F. and Didirková, I. and Frontini, F.},
TITLE = {The perception of voice qualities in audiobooks in the context of teaching French as a second language},
BOOKTITLE = {Literatúra vo výučbe – vyučovať literatúru; La littérature dans l'enseignement-Enseigner la littérature; Literature in teaching-Teaching literature},
YEAR = {2023},
ISBN = {978-80-555-3178-6},
URL = {https://www.pulib.sk/web/pdf/web/viewer.html?file=/web/kniznica/elpub/dokument/Drengubiak4/subor/9788055531786.pdf},
ABSTRACT = {Audiobooks are a common part of everyday life and their possibilities are also used when learning a foreign language. The article comprehensively addresses the issue of audiobooks as a variation of the Listening comprehension activity on a sample of secondary and university students. In addition to their experience with audiobooks, their attitude to listening comprehension, it examines the preferences regarding specific characteristics of the voices of the narrators. The students first determined the perceived characteristic on a scale of 1-4 in the following categories: pitch (high-low), speed (slow-fast), melodicity (monotonous-melodious), articulation (comprehensible-incomprehensible). Later, subjective ratings were assigned to these categories on a scale from strong like to strong dislike. The preference research was conducted on an excerpt of Grand Meaulnes by A. Fournier, which was recorded by two professional and two amateur narrators},
}
@INCOLLECTION{FISCHER_2023_INCOLLECTION_FBDMMM_523538,
AUTHOR = {Fischer, F. and Boschetti, F. and Del Grosso, A. M. and Montefusco, A. and Mancinelli, T. and Macchiarelli, A.},
TITLE = {Sinergie fra VeDPH e CNR-ILC in termini di condivisione della conoscenza e sostenibilità dei progetti digitali},
YEAR = {2023},
ABSTRACT = {Nel 2019, all’apertura del VeDPH, il CNR-ILC ha istituito presso il centro veneziano una propria Unità di Ricerca presso Terzi (URT), animata prevalentemente da personale del CoPhiLab, per operare in sinergia con il Dipartimento di Studi Umanistici di Ca’ Foscari su temi inerenti alla progettazione, alla creazione e alla fruizione di edizioni scientifiche digitali},
KEYWORDS = {CoPhiLab, VeDPH, Digital Scholarly Editing, Digital Humanities},
PAGES = {113--133},
URL = {http://digital.casalini.it/10.48255/9788891328373.09},
VOLUME = {7},
DOI = {10.48255/9788891328373.09},
PUBLISHER = {L'Erma di Bretschneider srl (Roma, ITA)},
ISBN = {9788891328373},
CONFERENCE_PLACE = {Roma},
BOOKTITLE = {Sinergie fra VeDPH e CNR-ILC in termini di condivisione della conoscenza e sostenibilità dei progetti digitali},
EDITOR = {Di Maro, M. and Merola, V. and Nocita, T.},
}
@INCOLLECTION{GIOVANNETTI_2023_INCOLLECTION_GSS_475249,
AUTHOR = {Giovannetti, E. and Saponaro, D. and Sciolette, F.},
TITLE = {Una rappresentazione computazionale della diversità religiosa in una prospettiva terminologica e concettuale},
YEAR = {2023},
PAGES = {497--536},
URL = {https://iris.cnr.it/handle/20.500.14243/475249},
VOLUME = {46},
DOI = {10.7410/1677},
ISBN = {978-88-97317-81-4},
BOOKTITLE = {Storie di idee nell'Europa mediterranea},
}
@INCOLLECTION{GUADAGNINI_2023_INCOLLECTION_G_469821,
AUTHOR = {Guadagnini, E.},
TITLE = {Il corpo morto in italiano antico (e in Dante)},
YEAR = {2023},
ABSTRACT = {The paper reconstructs the evolution of corpo morto, which conveyed the concept of ‘corpse’ in medieval Italian due to the absence of the lexical type cadavere. Specifically, it delves into the instances of this expression found in Dante’s Convivio and the Divine Comedy},
KEYWORDS = {Lexicology, Corpse, corpo morto, Dante},
PAGES = {403--415},
URL = {https://www.torrossa.com/it/resources/an/5749237},
DOI = {10.7410/1673},
PUBLISHER = {CNR Istituto di Storia dell'Europa Mediterranea (Cagliari, ITA)},
ISBN = {9788897317814},
CONFERENCE_PLACE = {Cagliari},
BOOKTITLE = {Storie di idee nell'Europa mediterranea: trasmissione di parole e saperi nel Medioevo e nella prima età moderna},
}
@INCOLLECTION{LUZIETTI_2023_INCOLLECTION_L_462400,
AUTHOR = {Luzietti, R. B.},
TITLE = {Evaluation of the Archivio Vi.Vo. Architecture: A Case Study on the Reuse of Legacy Data for Linguistic Purposes},
YEAR = {2023},
ABSTRACT = {The object of this paper is the evaluation of the Archivio Vi.Vo. architecture, developed within the CLARIN-IT consortium for the preservation and accessible consultation of historical oral archives. Following the first case study employing the Caterina Bueno archive, the goal is now to show how this innovative architecture is also suitable for conducting research investigations on the archival data and hosting a different type of archive. The real use case study presented in this contribution aims at employing the Angela Spinelli archive for conducting a sociophonetic investigation on Tuscan vernacular},
KEYWORDS = {Digital Humanities, Oral Archives, Reusing Data, Sociophonetics},
PAGES = {90-98},
URL = {https://iris.cnr.it/handle/20.500.14243/462400},
DOI = {10.3384/ecp198009},
PUBLISHER = {Linköping University (LIU) (Linköping, SWE)},
ISBN = {978-91-8075-254-1},
CONFERENCE_PLACE = {Linköping},
BOOKTITLE = {Selected papers from the CLARIN Annual Conference 2022},
}
@INCOLLECTION{LUZIETTI_2023_INCOLLECTION_L_572723,
AUTHOR = {Luzietti, R. B.},
TITLE = {Degemination in Tuscan rhotics: a preliminary analysis in an historical oral archive},
YEAR = {2023},
ABSTRACT = {The paper presents the first results of a preliminary sociophonetic investigation on the residual phenomenon of rhotic degemination in the Tuscan Pratese variety, through the reuse of the Angela Spinelli historical oral archive, initially conceived for other (non-linguistic) purposes. In past research, some authors reported the presence of rhotic degemination phenomena in the nearby territories investigated by the historian. However, until recent times the phenomenon has been under-investigated. To find evidence of rhotic degemination in a phonetic laboratory would now be impossible since this phenomenon embodies the residual vestige of a past tendency, challenged by the diffusion of more standard-like pronunciations in favor of the maintenance of the singleton–geminate contrast. The assumption is that the consultation of the Spinelli archive would allow to find and study the use of past non-standard forms in situations where participants narrate of life-threatening events and their speech is, therefore, less controlled, and more spontaneous},
KEYWORDS = {sociophonetics, oral history archives},
PAGES = {317-336},
DOI = {10.17469/O2111AISV000017},
BOOKTITLE = {Il parlato in ambito medico [Spoken language in the medical field]},
}
@INCOLLECTION{MONACHINI_2023_INCOLLECTION_MF_475983,
AUTHOR = {Monachini, M. and Frontini, F.},
TITLE = {Infrastrutture digitali per le scienze umane e sociali},
YEAR = {2023},
ABSTRACT = {Questo capitolo esplora il ruolo delle infrastrutture di ricerca (IR) nel promuovere la collaborazione interdisciplinare e l’innovazione tecnologica nell’ambito delle Digital Humanities. Le IR, come CLARIN e DARIAH, rappresentano nodi cruciali per l’accesso e la condivisione di risorse linguistiche, tecnologie e dati. Attraverso una panoramica dei servizi offerti, tra cui l’archiviazione, l’accesso federato e le applicazioni web, viene evidenziata la loro importanza per garantire principi FAIR (Findable, Accessible, Interoperable, Reusable) e supportare la ricerca umanistica e sociale in Europa. Il lavoro sottolinea l’impatto strategico delle IR nel favorire la condivisione delle conoscenze e l’integrazione delle risorse a livello transnazionale, contribuendo alla costruzione di ecosistemi di ricerca avanzati},
KEYWORDS = {Infrastrutture di ricerca, Digital Humanities, Principi FAIR},
PAGES = {197-213},
URL = {https://iris.cnr.it/handle/20.500.14243/475983},
VOLUME = {DIGITAL HUMANITIES. METODI, STRUMENTI, SAPERI},
PUBLISHER = {Carocci Editore},
ISBN = {978-88-290-1843-7},
BOOKTITLE = {Digital Humanities. Metodi, strumenti, saperi},
}
@INCOLLECTION{MONTEMAGNI_2023_INCOLLECTION_M_523049,
AUTHOR = {Montemagni, S.},
TITLE = {Trattamento automatico del linguaggio e Digital Humanities: metodi e strumenti, sfide},
YEAR = {2023},
ABSTRACT = {Il contributo si focalizza sul rapporto sinergico tra Trattamento Automatico della Lingua (TAL) e Digital Humanities (DH), ovvero su come metodi, modelli, strumenti e risorse per il trattamento automatico della lingua possano essere di aiuto nell’analisi e interpretazione di testi oggetto di studio nel settore delle scienze umane e sociali, su quali siano le sfide da affrontare per valorizzare questa sinergia, e quali le ricadute sui versanti scientifico e applicativo. In particolare, il contributo introduce i concetti di base relativi all’analisi linguistica del testo per il settore delle DH; senza l’ambizione di illustrarne in dettaglio metodi e tecniche, delinea lo stato dell’arte e i limiti delle tecnologie correntemente in uso, per arrivare a definire le sfide aperte con le possibili soluzioni},
KEYWORDS = {Trattamento automatico di varietà storiche della lingua, Digital Humanities, Annotazione Linguistica, Estrazione di Conoscenza},
PAGES = {160-177},
URL = {https://iris.cnr.it/handle/20.500.14243/523049},
PUBLISHER = {Carocci Editore (Roma, ITA)},
ISBN = {978-88-290-1843-7},
CONFERENCE_PLACE = {Roma},
BOOKTITLE = {Digital Humanities. Metodi, strumenti, saperi},
}
@INCOLLECTION{PICCINI_2023_INCOLLECTION_P_519747,
AUTHOR = {Piccini, S.},
TITLE = {"Eppur si muove!" Per una rappresentazione formale della variazione diacronica in terminologia},
YEAR = {2023},
ABSTRACT = {This contribution introduces the model DIATERM, devoted to computationally representing the change of terms and concepts over time. Based on three levels of analysis – textual, linguistic and ontological – this model relies on semantic web technologies (RDF, OWL, SWRL, SPARQL). In particular, the approach adopted for the representation of temporal information is based on the reification of the n-ary relations, with $n > 2$. The potential of the model will be shown through examples taken from Ferdinand de Saussure’s diachronic lexicon},
KEYWORDS = {Diachronic Terminology, Ontologie, Semantic Web, Ontolex-Lemon, Ferdinand de Saussure, Terminologia diacronica, Web Semantico},
PAGES = {569-602},
URL = {https://iris.cnr.it/handle/20.500.14243/519747},
DOI = {10.7410/1679},
ISBN = {978-88-97317-81-4},
BOOKTITLE = {Storie di idee nell'Europa mediterranea: trasmissione di parole e saperi nel Medioevo e nella prima età moderna},
}
@EDITORIAL{BURGASSI_2023_EDITORIAL_BGV_469185,
AUTHOR = {Burgassi, C. and Guadagnini, E. and Vaccaro, G.},
TITLE = {Storie di idee nell'Europa mediterranea. Trasmissione di parole e saperi nel Medioevo e nella prima Età moderna},
YEAR = {2023},
ABSTRACT = {Collected essays},
KEYWORDS = {storia delle idee, linguistica, filologia},
URL = {https://iris.cnr.it/handle/20.500.14243/469185},
VOLUME = {46},
DOI = {10.7410/1660},
PUBLISHER = {Consiglio Nazionale delle Ricerche-Istituto di Storia dell’Europa Mediterranea (Cagliari, ITA)},
ISBN = {9788897317814},
CONFERENCE_PLACE = {Cagliari},
}
@EDITORIAL{DELGROSSO_2023_EDITORIAL_DS_462861,
AUTHOR = {Del Grosso, A. M. and Spampinato, D.},
TITLE = {Bellini Digital Correspondence},
YEAR = {2023},
ABSTRACT = {Bellini Digital Correspondence (BDC) è un progetto di edizione scientifica digitale relativo alle lettere autografe di Vincenzo Bellini. Il fondo è conservato presso il Museo Belliniano di Catania. Il carteggio comprende 40 unità testuali per 35 unità codicologiche, riprodotte in 111 immagini digitali. BDC implementa una piattaforma per la filologia digitale applicata al testo belliniano la cui base critica si regge sul lavoro realizzato dalla prof.ssa Graziella Seminara nel 2017. L'edizione tiene conto di diverse tipologie di fruitori: specialisti, visitatori del museo, che usufruiscono dell'edizione all'interno del percorso museale. L'edizione digitale è stata realizzata in accordo con le linee guida dettate dalla Text Encoding Initiative e integra una fruizione via Web grazie al software Edition Visualization Technology. BDC è completamente open source e open access. Il sito Web, che accompagna l'edizione, illustra con dovizia di particolari tutte le fasi del progetto, i principi editoriali, le scelte di rappresentazione digitale del testo e l'ampio gruppo di persone coinvolte},
KEYWORDS = {Digital Humanities, Digital Scholarly Editions, Edition Visualization Technology, Edizioni Scientifiche Digitali, Vincenzo Bellini, Filologia Digitale},
URL = {http://bellinicorrespondence.cnr.it/},
PUBLISHER = {Cnr Edizioni (Roma, ITA)},
ISBN = {978-88-8080-562-5},
CONFERENCE_PLACE = {Roma},
}
@EDITORIAL{MARZI_2023_EDITORIAL_MP_452788,
AUTHOR = {Marzi, C. and Pirrelli, V.},
TITLE = {Integrative Views on Representations and Processes in Morphology},
YEAR = {2023},
ABSTRACT = {One of the most enduring conceptualisations of the language architecture rests on a modular subdivision of work between lexical representations of stored items on the one hand, and dynamic processes, modelled as procedural rules working on such items, on the other hand. In morphology, network-based approaches have suggested an alternative "integrative" view of word representations and processes, where lexical representations consist of partially overlapping activation patterns spreading over several processing units. From this integrative perspective, the resulting network is both a lexicon and a word processor. We argue that the network-based view provides a stimulating research framework for several complementary levels of language inquiry (including theoretical, computational and neuro-psychological approaches) to be fruitfully integrated into a novel, comprehensive understanding of morphology. We discuss some implications of this view and delineate prospects of progress in this area},
KEYWORDS = {morphology, mental lexicon, Connectionism, Network science, Discriminative Learning},
PAGES = {397-556},
URL = {https://link.springer.com/journal/11525/volumes-and-issues/33-4},
DOI = {10.1007/s11525-023-09416-5},
PUBLISHER = {Springer (Dordrecht, NLD)},
ISSN = {1871-5656},
CONFERENCE_PLACE = {Dordrecht},
}
@EDITORIAL{MARZI_2023_EDITORIAL_MP_450063,
AUTHOR = {Marzi, C. and Pirrelli, V.},
TITLE = {Integrative views of representations and processes in morphology: an introduction},
YEAR = {2023},
ABSTRACT = {One of the most enduring conceptualisations of the language architecture rests on a modular subdivision of work between lexical representations of stored items on the one hand, and dynamic processes, modelled as procedural rules working on such items, on the other hand. In morphology, network-based approaches have suggested an alternative “integrative” view of word representations and processes, where lexical representations consist of partially overlapping activation patterns spreading over several processing units. From this integrative perspective, the resulting network is both a lexicon and a word processor. We argue that the network-based view provides a stimulating research framework for several complementary levels of language inquiry (including theoretical, computational and neuro-psychological approaches) to be fruitfully integrated into a novel, comprehensive understanding of morphology},
KEYWORDS = {Morphology, Mental Lexicon, Connectionism, Network science, Discriminative learning},
PAGES = {397-408},
URL = {https://link.springer.com/article/10.1007/s11525-023-09416-5},
VOLUME = {33},
DOI = {10.1007/s11525-023-09416-5},
ISSN = {1871-5621},
}
@INPROCEEDINGS{ALZETTA_2023_INPROCEEDINGS_ABDMSSV_470901,
AUTHOR = {Alzetta, C. and Brunato, D. and Dell'Orletta, F. and Miaschi, A. and Sagae, K. and Sánchez Gutiérrez, C. H. and Venturi, G.},
TITLE = {LangLearn at EVALITA 2023: Overview of the Language Learning Development Task},
YEAR = {2023},
ABSTRACT = {Language Learning Development (LangLearn) is the EVALITA 2023 shared task on automatic language development assessment, which consists in predicting the evolution of the written language abilities of learners across time. LangLearn is conceived to be multilingual, relying on written productions of Italian and Spanish learners, and representative of L1 and L2 learning scenarios. A total of 9 systems were submitted by 5 teams. The results highlight the open challenges of automatic language development assessment},
URL = {https://iris.cnr.it/handle/20.500.14243/470901},
PUBLISHER = {Accademia University Press (Torino, ITA)},
ISBN = {9791255000693},
CONFERENCE_NAME = {8th Evaluation Campaign of Natural Language Processing and Speech Tools for Italian},
CONFERENCE_PLACE = {Torino},
BOOKTITLE = {Proceedings of EVALITA 2023},
}
@INPROCEEDINGS{ALZETTA_2023_INPROCEEDINGS_ADFMV_470921,
AUTHOR = {Alzetta, C. and Dell'Orletta, F. and Fazzone, C. and Miaschi, A. and Venturi, G.},
TITLE = {Unmasking the Wordsmith: Revealing Author Identity through Reader Reviews},
YEAR = {2023},
ABSTRACT = {Traditional genre-based approaches for book recommendations face challenges due to the vague definition of genres. To overcome this, we propose a novel task called Book Author Prediction, where we predict the author of a book based on user-generated reviews’ writing style. To this aim, we first introduce the ‘Literary Voices Corpus’ (LVC), a dataset of Italian book reviews, and use it to train and test machine learning models. Our study contributes valuable insights for developing user-centric systems that recommend leisure readings based on individual readers’ interests and writing styles},
URL = {https://ceur-ws.org/Vol-3596/paper4.pdf},
CONFERENCE_NAME = {9th Italian Conference on Computational Linguistics},
BOOKTITLE = {Proceedings of the 9th Italian Conference on Computational Linguistics},
}
@INPROCEEDINGS{BOSCHETTI_2023_INPROCEEDINGS_BDDFM_504563,
AUTHOR = {Boschetti, F. and Del Grosso, A. M. and Del Gratta, R. and Frontini, F. and Monachini, M.},
TITLE = {CLARIN-IT: texts, documents and new contexts},
YEAR = {2023},
ABSTRACT = {In recent years, CLARIN has increasingly broadened its interest from linguistic resources to textual resources relevant to digital humanists. This new and attractive scenario requires new technologies for texts, variants, and digital representations of primary sources, their contexts, and complex relationships. VeDPH in Venice, CNR-ILC-CoPhiLab, and ILC4CLARIN in Pisa collaborate on DH projects. Together, they are working on extracting text from manuscript page images, annotating historical graffiti on georeferenced images, and identifying text in digital images of paintings and sculptures},
KEYWORDS = {Research Infrastructure},
PAGES = {53-56},
URL = {https://iris.cnr.it/handle/20.500.14243/504563},
CONFERENCE_NAME = {CLARIN Annual Conference 2023},
BOOKTITLE = {CLARIN Annual Conference Proceedings 2023},
}
@INPROCEEDINGS{BOSCHETTI_2023_INPROCEEDINGS_BRQ_479742,
AUTHOR = {Boschetti, F. and Rigobianco, L. and Quochi, V.},
TITLE = {Domain-Specific Languages for Epigraphy: The Case of ItAnt},
YEAR = {2023},
ABSTRACT = {ItAnt is a research project devoted to the languages and cultures of ancient Italy witnessed by a digital collection of inscriptions. This contribution illustrates how the definition of a Domain-Specific Language can support the activity of the epigraphists involved in the project by increasing the human readability of the encoded data without sacrificing the compliance to standard models and formats. Finally, an example of concrete use of the encoded texts within the CLARIN-IT DigItAnt platform will be briefly described},
KEYWORDS = {Domain-specific languages, Digital Scholarly Editions, Ancient Languages, Digital Humanities, Text Representation, TEI EpiDoc},
PAGES = {5},
URL = {https://office.clarin.eu/v/CE-2023-2328_CLARIN2023_ConferenceProceedings.pdf},
CONFERENCE_NAME = {CLARIN Annual Conference 2023},
BOOKTITLE = {CLARIN Annual Conference Proceedings 2023},
}
@INPROCEEDINGS{BRUNATO_2023_INPROCEEDINGS_BDDR_455142,
AUTHOR = {Brunato, D. and Dell'Orletta, F. and Dini, I. and Ravelli, A. A.},
TITLE = {Coherent or Not? Stressing a Neural Language Model for Discourse Coherence in Multiple Languages},
YEAR = {2023},
ABSTRACT = {In this study, we investigate the capability of a Neural Language Model (NLM) to distinguish between coherent and incoherent text, where the latter has been artificially created to gradually undermine local coherence within text. While previous research on coherence assessment using NLMs has primarily focused on English, we extend our investigation to multiple languages. We employ a consistent evaluation framework to compare the performance of monolingual and multilingual models in both in-domain and out-domain settings. Additionally, we explore the model's performance in a cross-language scenario},
KEYWORDS = {text coherence, neural language models, multilingual corpora},
PAGES = {10690-10700},
URL = {https://aclanthology.org/2023.findings-acl.680},
DOI = {10.18653/v1/2023.findings-acl.680},
PUBLISHER = {Association for Computational Linguistics (Stroudsburg, USA)},
ISBN = {978-1-959429-62-3},
CONFERENCE_NAME = {61st Annual Meeting of the Association for Computational Linguistics (ACL 2023)},
CONFERENCE_PLACE = {Stroudsburg},
BOOKTITLE = {Findings of the Association for Computational Linguistics: ACL 2023},
}
@INPROCEEDINGS{CALAMAI_2023_INPROCEEDINGS_CNSC_464847,
AUTHOR = {Calamai, S. and Nodari, R. and Soria, C. and Carlucci, A.},
TITLE = {Linguistic Autobiographies. Towards the Creation of a Multilingual Resource Family},
YEAR = {2023},
ABSTRACT = {This paper describes a project aimed at creating a new resource family of multilingual and multimodal resources centered around the concept of "Linguistics of self", that is personal reflections on the role of languages in shaping one's identity. Language portrait silhouettes, drawing bilingualism, and linguistic autobiographies are different types of resources that share this common feature. We describe the resources and the criteria for their metadata annotation, focusing in particular on linguistic autobiographies, where the writer explicitly reflects on the relationship between him/herself and language. These genres are fruitfully used in different educational settings, and research has shown that they help to uncover the social, affective, and psychological dimensions of language learning. The potential of a multilingual and multimodal collection is discussed starting from data collected in Italy and Norway},
KEYWORDS = {Linguistic autobiographies, Resource families, Multilingualism},
PAGES = {23-32},
URL = {https://ecp.ep.liu.se/index.php/clarin/article/view/725/631},
DOI = {10.3384/ecp198003},
ISBN = {978-91-8075-254-1},
BOOKTITLE = {Selected papers from the CLARIN Annual Conference 2022},
}
@INPROCEEDINGS{CARDILLO_2023_INPROCEEDINGS_C_505702,
AUTHOR = {Cardillo, F. A.},
TITLE = {Baselines for Automatic Medical Image Reporting},
YEAR = {2023},
ABSTRACT = {Despite the high number of machine learning models presented in the last few years for automatically annotating medical images with deep learning models, clear baselines to compare methods upon are still missing. We present an initial set of experimentations of a standard encoder-decoder architecture with the Indiana University Chest X-ray dataset. The experiments include different convolutional architectures and decoding strategies for the recurrent decoder module. The results here presented could potentially benefit those tackling the same task in languages with fewer linguistic resources than those available in English},
KEYWORDS = {Medical Image Analysis, Neural Language Generation, Deep Learning},
PAGES = {58-74},
URL = {https://link.springer.com/chapter/10.1007/978-3-031-29717-5_4},
VOLUME = {659},
DOI = {10.1007/978-3-031-29717-5_4},
PUBLISHER = {Springer International Publishing (Cham, CHE)},
ISBN = {978-3-031-29717-5},
CONFERENCE_NAME = {1st Serbian International Conference on Applied Artificial Intelligence},
CONFERENCE_PLACE = {Cham},
BOOKTITLE = {Applied Artificial Intelligence: Medicine, Biology, Chemistry, Financial, Games, Engineering},
}
@INPROCEEDINGS{CHIARELLA_2023_INPROCEEDINGS_CCF_433913,
AUTHOR = {Chiarella, D. and Cutugno, P. and Ferretti, M.},
TITLE = {A linguistic approach of sound characterisation and polarization: first steps},
YEAR = {2023},
ABSTRACT = {The activities of the "TRIPLO: TRasporti e collegamenti Innovativi e sostenibili tra Porti e piattaforme LOgistiche" project, funded with funds from the Interregional Operational Programme Italy-France Maritime 2014-2020, have as their particular goal to increase the sustainability of commercial ports and associated logistic platforms, helping to lessen noise pollution [1][2]. In some project activities, the acoustic impact on the people exposed to noise from back port activities is evaluated in connection to how each person perceives the noise. Only technical investigations, which cannot ensure a phenomenon's universality in terms of perception, can objectively describe a phenomenon in environmental surveys [3]; A sound can be viewed as both a physical reality that can be measured using objective criteria and a sound perception phenomenon that is of a subjective character and related to the subject's psycho-physical-emotional state. Because these two traits are inextricably linked, it is not enough to just look at them independently. Driven by these motivations, we created questionnaires concerning the perception of sounds, the structure and first results of which can be consulted in [4] [5] [6]. In this article, in the first part we present a methodology to identify adjectives characterising each sound via TF-IDF (term frequency-inverse document frequency) [7][8][9][10]; in the second part we analyse the positive or negative emotions described by the adjectives given for each sound with TextBlob, a sentiment analysis classifier, and subsequently we compare the results obtained with the ones shown in [6]},
KEYWORDS = {sentiment analysis, TF-IDF, sound polarization, sound characterisation},
PAGES = {86-91},
URL = {https://iris.cnr.it/handle/20.500.14243/433913},
PUBLISHER = {Centro de Lingüística Aplicada (Santiago de Cuba, CUB)},
ISBN = {978-959-7174-41-7},
CONFERENCE_NAME = {XVIII° Simposio Internacional de Comunicación Social},
CONFERENCE_PLACE = {Santiago de Cuba},
BOOKTITLE = {Serie de Comunicación Social 2022-2023},
}
@INPROCEEDINGS{CORR_2023_INPROCEEDINGS_CDFBKTBFPDD_463579,
AUTHOR = {Corrò, E. and Danelon, N. and Forte, M. and Boschetti, F. and Kafkas, A. and Ticini, L. and Bernardini, F. and Fischer, F. and Peratello, P. and Dolcetti, F. and Delpozzo, E.},
TITLE = {The Lions of Venice Arsenal: a neuroscientific approach to Cultural Heritage},
YEAR = {2023},
ABSTRACT = {In this contribution, the authors discuss the preliminary outcomes of a neuroscience research project conducted during the Summer School in Digital and Public Humanities 2022 organized by the Venice Centre for Digital and Public Humanities (VeDPH). The research was based on a series of experiments combining electroencephalography (EEG) and eye tracking to investigate the perception of Cultural Heritage (virtual and real), in this case, the statues of lions in the Venice Arsenal. Particular attention was given to the Piraeus Lion, today at the main entrance to the Arsenal, noteworthy for having been inscribed in the second half of the 11th century AD by Varangian mercenaries with three runic inscriptions, today heavily eroded due to weathering and air pollution. This lion was originally located in the port of Piraeus (Athens) and dates back to the 4th century BC. It was stolen as war booty by a famous Venetian naval commander, Francesco Morosini in 1687 during the Ottoman Venetian war. Among neuroimaging techniques, EEG is used to detect specific states of mind, such as mental alertness, cognitive distraction and learning ability in normal and virtual reality conditions. Specifically, in cultural sectors eye tracking technology is useful to investigate actual involvement in sites of cultural interest. The data analysis showed changes in the perception of the artifact among different audiences, i.e. women and men, residents and tourists, people with and without previous knowledge on the artifact's historical background. This entails a new method of interactions between a single person, the artifact and the environment. Indeed, this experiment may indicate diversified and accelerated learning and processing, a deep immersiveness of information and different levels of feedback},
KEYWORDS = {Heritage, Neuroscience, EEG, Eye-tracking, Runic inscription, Venice Arsenal},
PAGES = {343-346},
URL = {http://www.aiucd2023.unisi.it/atti/},
PUBLISHER = {Alma Mater Studiorum-Università di Bologna (Bologna, ITA)},
ISBN = {978-88-942535-7-3},
CONFERENCE_NAME = {LA MEMORIA DIGITALE: XII CONVEGNO ANNUALE AIUCD},
CONFERENCE_PLACE = {Bologna},
BOOKTITLE = {Atti Convegno AIUCD 2023},
EDITOR = {Carbé, Emmanuela and Lo Piccolo, Gabriele and Valenti, Alessia and Stella, Francesco},
}
@INPROCEEDINGS{CRISTOFARO_2023_INPROCEEDINGS_CDMSS_516581,
AUTHOR = {Cristofaro, S. and Del Grosso, A. M. and Mazzagufo, L. and Sichera, P. and Spampinato, D.},
TITLE = {Bellini Digital Correspondence: A Model for Making Collaborative Digital Scholarly Editions},
YEAR = {2023},
ABSTRACT = {This paper presents the work carried out within the Bellini Digital Correspondence project. In particular, it outlines the activities aimed at improving the harmonization process, concerning collaborative digital scholarly editions. The study proposes a preliminary semantic approach to the harmonization process, exploiting the ontology-based mapping perspective},
KEYWORDS = {Cooperative digital scholarly edition, Schemamatching, Harmonization, NormaTEI, Bellini Digital Correspondence},
PAGES = {615-620},
URL = {https://iris.cnr.it/handle/20.500.14243/516581},
DOI = {10.1109/CiSt56084.2023.10409920},
ISBN = {978-1-6654-6133-7},
CONFERENCE_NAME = {7th IEEE Congress on Information Science and Technology (CiSt)},
BOOKTITLE = {7th IEEE Congress on Information Science and Technology (CiSt)},
}
@INPROCEEDINGS{CRISTOFARO_2023_INPROCEEDINGS_CDMSS_516520,
AUTHOR = {Cristofaro, S. and Del Grosso, A. M. and Mazzagufo, L. and Sichera, P. and Spampinato, D.},
TITLE = {Bellini Digital Correspondence: A Model for Making Collaborative Digital Scholarly Editions},
YEAR = {2023},
ABSTRACT = {This paper presents the work carried out within the Bellini Digital Correspondence project. In particular, it outlines the activities aimed at improving the harmonization process, concerning collaborative digital scholarly editions. The study proposes a preliminary semantic approach to the harmonization process, exploiting the ontology-based mapping perspective},
KEYWORDS = {Bellini Digital Correspondence, Cooperative digital scholarly edition, Harmonization, NormaTEI, Schemamatching},
PAGES = {615-620},
URL = {https://iris.cnr.it/handle/20.500.14243/516520},
DOI = {10.1109/CiSt56084.2023.10409920},
PUBLISHER = {Institute of Electrical and Electronics Engineers Inc},
ISBN = {978-1-6654-6133-7},
CONFERENCE_NAME = {7th IEEE International Congress on Information Science and Technology, CiSt 2023},
BOOKTITLE = {2023 7th IEEE Congress on Information Science and Technology (CiSt)},
}
@INPROCEEDINGS{DELGRATTA_2023_INPROCEEDINGS_DZGB_504561,
AUTHOR = {Del Gratta, R. and Zenzaro, S. and Del Grosso, A. M. and Boschetti, F.},
TITLE = {Document Analysis and Philological Operations. Is Category Theory a suitable approach?},
YEAR = {2023},
ABSTRACT = {Starting with a formal definition of the process of scholarly editing, we further formalize it by exploiting Category Theory. We then apply this formal model to automated Natural Language Processing tools, highlighting the parallelism between composition and associativity and linguistic tool pipelines. We then discuss the notion of interoperability between tools. Finally, we propose some future improvements to the proposed formal model},
KEYWORDS = {Information science, Text analysis, Pipelines, Parallel processing, Natural language processing, Interoperability, Linguistic and philological operations, Category Theory, Formal Models},
PAGES = {605-610},
URL = {https://iris.cnr.it/handle/20.500.14243/504561},
VOLUME = {5},
DOI = {10.1109/cist56084.2023.10409916},
ISBN = {978-1-6654-6133-7},
CONFERENCE_NAME = {7th IEEE Congress on Information Science and Technology (CiSt)},
BOOKTITLE = {7th IEEE Congress on Information Science and Technology (CiSt)},
}
@INPROCEEDINGS{DELGROSSO_2023_INPROCEEDINGS_DZBR_481368,
AUTHOR = {Del Grosso, A. M. and Zenzaro, S. and Boschetti, F. and Ranocchia, G.},
TITLE = {GreekSchools: Making Traditional Papyrology Machine Actionable through Domain-Driven Design},
YEAR = {2023},
ABSTRACT = {Traditional papyrology has optimized its ecdotic methods to study papyrological documents (diplomatic edition) and, simultaneously, the corresponding texts (critical edition). Prominent initiatives, such as Papyri.info, are striving to find an optimal trade-off between familiarity for traditional scholars and machine actionability for automatic processing. The approach proposed throughout this paper is based on the Domain-Driven Design (DDD) and, particularly, on the DSL-based Digital Scholarly Editions (DSEs). The work aims to create a comprehensive textual scholarship workflow implemented in a modular web environment named CoPhi Editor. The ERC GreekSchools project serves as the scientific testbench for co-designing our editing environment with a multidisciplinary team of papyrologists, philologists, linguists, and other humanists},
KEYWORDS = {Information science, Scholarships, Computational Philology, Digital Papyrology, Digital Humanities, Digital Scholarly Editing, TEI/EpiDoc},
PAGES = {621-626},
URL = {https://ieeexplore.ieee.org/document/10409929},
DOI = {10.1109/cist56084.2023.10409929},
PUBLISHER = {IEEE},
ISBN = {9781665461337},
CONFERENCE_NAME = {7th IEEE Congress on Information Science and Technology (CiSt)},
BOOKTITLE = {7th IEEE Congress on Information Science and Technology (CiSt)},
}
@INPROCEEDINGS{FAVARO_2023_INPROCEEDINGS_FSCH_499985,
AUTHOR = {Favaro, M. and Sassolini, E. and Cinini, A. and Haines, M.},
TITLE = {Un futuro digitale per gli archivi de ‘Gli Anni della Cupola’},
YEAR = {2023},
ABSTRACT = {L’articolo si inserisce tra le iniziative di recupero, salvaguardia e valorizzazione di archivi digitali conservati in formati non standard che l’Istituto di Linguistica Computazionale “A. Zampolli” sta promuovendo da alcuni anni con diverse strategie legate alla natura delle risorse testuali trattate [8, 9 e 10]. In queste iniziative l’istituto offre inoltre la possibilità di depositare gli output sull’infrastruttura internazionale CLARIN, al fine di garantirne la preservazione a lungo termine e la divulgazione. In questo particolare caso sono discussi i metodi, le criticità e le strategie di conversione di dati digitali strutturati e codificati con un sistema software proprietario, in un nuovo formato di rappresentazione in linea con gli standard internazionali TEI. Il contenuto è costituito dall’edizione completa delle fonti amministrative conservate presso l’Opera di Santa Maria del Fiore di Firenze relative al periodo dal 1417 al 1436 quando fu progettata e costruita la Cupola di Brunelleschi. L’intervento intende proporre una riflessione metodologica sulla standardizzazione di edizioni digitali obsolete, la conservazione a lungo termine e sulle problematiche legate alla condivisione dei dati con la comunità scientifica. Gli archivi hanno infatti un interesse multidisciplinare, non solo per le informazioni storiche e artistiche che vi sono contenute, ma anche per le peculiarità che riguardano la lingua in cui gli atti originali sono stati redatti: una delle più antiche e autentiche attestazioni del volgare fiorentino, usato non con intenti letterari, ma pratici.
Il processo di conversione riguarda tutti i materiali digitali, sia i metadati inseriti manualmente durante la preparazione dei testi, sia il contenuto originale degli atti, e mira a rappresentare opportunamente l’edizione digitale dei testi, ma vuole anche conservare l’apparato critico predisposto dai redattori che correda le schede di voci analitiche sulle quali si basano le funzioni di ricerca all’epoca realizzate},
KEYWORDS = {Digital Humanities, TEI mapping, corpora, knowledge discovery, knowledge representation},
PAGES = {78--84},
URL = {https://amsacta.unibo.it/id/eprint/7721/},
DOI = {10.6092/unibo/amsacta/7721},
PUBLISHER = {AIUCD-Associazione per l'informatica umanistica e la cultura digitale (SIENA, ITA)},
ISBN = {9788894253573},
CONFERENCE_NAME = {XII Convegno Annuale AIUCD: La memoria digitale},
CONFERENCE_PLACE = {SIENA},
BOOKTITLE = {La memoria digitale: forme del testo e organizzazione della conoscenza. Atti del XII Convegno Annuale AIUCD},
EDITOR = {Carbé, E.},
}
@INPROCEEDINGS{FRONTINI_2023_INPROCEEDINGS_FRK_476002,
AUTHOR = {Frontini, F. and Romary, L. and Khan, A. F. A.},
TITLE = {ISO LMF 24613-6: A Revised Syntax Semantics Module for the Lexical Markup Framework},
YEAR = {2023},
ABSTRACT = {The Lexical Markup Framework (LMF) is a meta-model for representing data in monolingual and multilingual lexical databases with a view to its use in computer applications. The "new LMF" replaces the old LMF standard, ISO 24613:2008, and is being published as a multi-part standard. This short paper introduces one of these new parts, ISO 24613-6, namely the Syntax and Semantics (SynSem) module. The SynSem module allows for the description of syntactic and semantic properties of lexemes, as well as the complex interactions between them. While the new standard remains faithful to (and backwards compatible with) the syntax and semantics coverage of the previous model, the new standard clarifies and simplifies it in a few places, which will be illustrated},
KEYWORDS = {ISO, LMF, TEI, Semantics, Syntax},
URL = {https://inria.hal.science/hal-04117132},
BOOKTITLE = {Proceedings of LDK 2023 – 4th Conference on Language, Data and Knowledge},
}
@INPROCEEDINGS{HOHENEGGER_2023_INPROCEEDINGS_HBCCDDMM_463577,
AUTHOR = {Hohenegger, H. and Boschetti, F. and Chiaravalli, I. and Ciotti, F. and De Longis, E. and Del Grosso, A. M. and Mancinelli, T. and Meschini, F.},
TITLE = {Metodologie di indagine per una nuova piattaforma: Digital Scholarly Editions Platform and Aligned Translation},
YEAR = {2023},
ABSTRACT = {La Digital Scholarly Editions Platform and Aligned Translations (DiScEPT, Progetto Straordinario FOE finanziato dal MUR: 2022-2024) è un ecosistema digitale sostenibile che integra strumenti di codifica testuale e visuale in un'interfaccia coerente che consente sia la costituzione e curatela di Digital Scholarly Editions (DSE) sia la loro pubblicazione e fruizione. A tal fine sono stati sviluppati protocolli di ricerca empirica (qualitativa e quantitativa). Qui presentiamo un sistema di interviste strutturate da somministrare alle figure professionali che operano nel campo delle DSE. Il fine è raccogliere le loro esigenze e i requisiti per progettare una piattaforma che ad esse risponda},
KEYWORDS = {Survey questionnaires, Needs and Requirements Gathering, Digital Scholarly Editions, Aligned Translations},
PAGES = {111--113},
URL = {http://www.aiucd2023.unisi.it/atti/},
PUBLISHER = {Alma Mater Studiorum-Università di Bologna (Bologna, ITA)},
ISBN = {978-88-942535-7-3},
CONFERENCE_NAME = {LA MEMORIA DIGITALE: XII CONVEGNO ANNUALE AIUCD},
CONFERENCE_PLACE = {Siena},
BOOKTITLE = {LA MEMORIA DIGITALE ATTI DEL XII CONVEGNO ANNUALE AIUCD Siena, 5-7 giugno 2023},
EDITOR = {Carbé, E. and Lo Piccolo, G. and Valenti, A. and Stella, F.},
}
@INPROCEEDINGS{KHAN_2023_INPROCEEDINGS_KPJCE_461981,
AUTHOR = {Khan, A. F. A. and McCrae, J. P. and Minaya Gómez, F. J. and Cruz González, R. and Díaz-Vera, J. E.},
TITLE = {Some Considerations in the Construction of a Historical Language WordNet},
YEAR = {2023},
ABSTRACT = {This article describes the manual construction of a part of the Old English WordNet (Old-EWN) covering the semantic field of emotion terms. This manually constructed part of the wordnet is to be eventually integrated with the automatically generated/manually checked part covering the whole of the rest of the Old English lexicon (currently under construction). We present the workflow for the definition of these emotion synsets on the basis of a dataset produced by a specialist in this area. We also look at the enrichment of the original Global WordNet Association Lexical Markup Framework (GWA LMF) schema to include the extra information which this part of the OldEWN requires. In the final part of the article we discuss how the wordnet style of lexicon organisation can be used to share and disseminate research findings/datasets in lexical semantics},
KEYWORDS = {old english, wordnet, lexical resources},
URL = {https://www.hitz.eus/gwc2023/sites/default/files/aurkezpenak/GWC2023_paper_3631.pdf},
CONFERENCE_NAME = {Global WordNet Conference 2023},
BOOKTITLE = {Proceedings of the 12th Global Wordnet Conference},
}
@INPROCEEDINGS{MARTELLI_2023_INPROCEEDINGS_MBCCCGKKKKLLNOPQSSTUN_479241,
AUTHOR = {Martelli, F. and Bejgu, A. S. and Campagnano, C. and Cibej, J. and Costa, R. and Gantar, A. and Kallas, J. and Koeva, S. and Koppel, K. and Krek, S. and Langemets, M. and Lipp, V. and Nimb, S. and Olsen, S. and Pedersen, B. S. and Quochi, V. and Salgado, A. and Simon, L. and Tiberius, C. and Urena Ruiz, R. J. and Navigli, R.},
TITLE = {XL-WA: a Gold Evaluation Benchmark for Word Alignment in 14 Language Pairs},
YEAR = {2023},
ABSTRACT = {Word alignment plays a crucial role in several Natural Language Processing tasks, such as lexicon injection and cross-lingual label projection. The evaluation of word alignment systems relies heavily on manually-curated datasets, which are not always available, especially in mid- and low-resource languages. In order to address this limitation, we propose XL-WA, a novel entirely manually-curated evaluation benchmark for word alignment covering 14 language pairs. We illustrate the creation process of our benchmark and compare statistical and neural approaches to word alignment in both language-specific and zero-shot settings, thus investigating the ability of state-of-the-art models to generalize on unseen language pairs. We release our new benchmark at: https://github.com/SapienzaNLP/XL-WA},
KEYWORDS = {Deep Learning, Multilinguality, Natural Language Processing, Word Alignment},
PAGES = {9},
URL = {https://iris.cnr.it/handle/20.500.14243/479241},
VOLUME = {3596},
PUBLISHER = {CEUR-WS},
CONFERENCE_NAME = {9th Italian Conference on Computational Linguistics, CLiC-it 2023},
BOOKTITLE = {Proceedings of the Ninth Italian Conference on Computational Linguistics},
}
@INPROCEEDINGS{MIASCHI_2023_INPROCEEDINGS_MPD_520527,
AUTHOR = {Miaschi, A. and Papucci, M. and Dell'Orletta, F.},
TITLE = {Lost in Labels: An Ongoing Quest to Optimize Text-to-Text Label Selection for Classification},
YEAR = {2023},
ABSTRACT = {In this paper, we present an evaluation of the influence of label selection on the performance of a Sequence-to-Sequence Transformer model in a classification task. Our study investigates whether the choice of words used to represent classification categories affects the model’s performance, and if there exists a relationship between the model’s performance and the selected words. To achieve this, we fine-tuned an Italian T5 model on topic classification using various labels. Our results indicate that the different label choices can significantly impact the model’s performance. That being said, we did not find a clear answer on how these choices affect the model performances, highlighting the need for further research in optimizing label selection},
KEYWORDS = {encoder-decoder, label selection, topic classification},
URL = {https://iris.cnr.it/handle/20.500.14243/520527},
VOLUME = {3596},
BOOKTITLE = {Proceedings of the 9th Italian Conference on Computational Linguistics CLiC-it 2023: Venice, Italy, November 30-December 2, 2023},
}
@INPROCEEDINGS{NAHLI_2023_INPROCEEDINGS_NGKB_481366,
AUTHOR = {Nahli, O. and Gugliotta, E. and Khlif, N. and Benotto, G.},
TITLE = {Challenges and Progress in Constructing Arabic Dialect Corpora and Linguistic tools: A Focus on Moroccan and Tunisian Dialects},
YEAR = {2023},
ABSTRACT = {Given the lack of resources for Arabic dialects, the construction of corpora, lexical resources, and tools is a non-trivial challenge. The focus of the article is to describe our in-progress work to address these deficiencies. We start with Moroccan and Tunisian dialects to provide annotated corpora and corpus-based lexical resources. We also aim to extend an existing morphological engine with linguistic resources built \emph{ad hoc} for each dialect. In addition, we develop an integrated component in the morphological engine to better address linguistic and sociolinguistic characteristics while preserving the integrity of dialectal texts},
KEYWORDS = {Arabic dialects, Moroccan dialect, Tunisian dialect, corpora, lexical resources, Aramorph},
PAGES = {293--298},
URL = {https://ieeexplore.ieee.org/document/10410009},
DOI = {10.1109/cist56084.2023.10410009},
PUBLISHER = {IEEE (USA)},
ISBN = {978-1-6654-6133-7},
CONFERENCE_NAME = {7th IEEE Congress on Information Science and Technology (CiSt)},
CONFERENCE_PLACE = {USA},
BOOKTITLE = {2023 7th IEEE Congress on Information Science and Technology (CiSt)},
}
@INPROCEEDINGS{PROIETTI_2023_INPROCEEDINGS_PVY_467363,
AUTHOR = {Proietti, C. and Velázquez Quesada, F. R. and Yuste Ginel, A.},
TITLE = {An Abstract Look at Awareness Models and Their Dynamics},
YEAR = {2023},
ABSTRACT = {This work builds upon a well-established research tradition on modal logics of awareness. One of its aims is to export tools and techniques to other areas within modal logic. To this end, we illustrate a number of significant bridges with abstract argumentation, justification logics, the epistemic logic of knowing-what and deontic logic, where basic notions and definitional concepts can be expressed in terms of the awareness operator combined with the box modality. Furthermore, these conceptual links point to interesting properties of awareness sets beyond those standardly assumed in awareness logics, i.e. positive and negative introspection. We show that the properties we list are characterised by corresponding canonical formulas, so as to obtain a series of off-the-shelf axiomatisations for them. As a second focus, we investigate the general dynamics of this framework by means of event models. Of specific interest in this context is to know under which conditions, given a model that satisfies some property, the update with an event model keeps it within the intended class. This is known as the closure problem in general dynamic epistemic logics. As a main contribution, we prove a number of closure theorems providing sufficient conditions for the preservation of our properties. Again, these results enable us to axiomatize our dynamic logics by means of reduction axioms},
KEYWORDS = {Awareness Logics, Dynamic Epistemic Logics, Deontic Logics, Event Models},
PAGES = {455--469},
URL = {https://iris.cnr.it/handle/20.500.14243/467363},
VOLUME = {379},
DOI = {10.4204/EPTCS.379},
ISSN = {2075-2180},
CONFERENCE_NAME = {TARK 2023},
BOOKTITLE = {ELECTRONIC PROCEEDINGS IN THEORETICAL COMPUTER SCIENCE},
EDITOR = {Verbrugge, R.},
}
@INPROCEEDINGS{PROIETTI_2023_INPROCEEDINGS_PY_477062,
AUTHOR = {Proietti, C. and Yuste Ginel, A.},
TITLE = {On the instantiation of argument-incomplete argumentation frameworks},
YEAR = {2023},
ABSTRACT = {Argument-incomplete argumentation frameworks provide an intuitive way of representing uncertainty in argumentative contexts. It is however possible that, taking structured argumentation as a reference point, the general assumptions of these models present the same risks of hasty generalization attributed to some abstract argumentation models, as they do not have a structured counterpart. Here, we focus on a specific instantiation of argument-incomplete argumentation frameworks: rooting the uncertainty about arguments in the uncertainty about the application of ASPIC-inference rules. We show (Proposition 1) that the abovementioned risk is concrete. Therefore a more fine-grained representation of uncertainty at the abstract level is needed, which we provide with implicative argument-incomplete argumentation frameworks and prove to work (Theorem 1)},
KEYWORDS = {abstract argumentation, Incompleteness, structured argumentation, uncertainty},
PAGES = {1--7},
URL = {https://ceur-ws.org/Vol-3546/paper12.pdf},
VOLUME = {3546},
CONFERENCE_NAME = {7th Workshop on Advances in Argumentation in Artificial Intelligence (AI$^3$)},
BOOKTITLE = {7th Workshop on Advances in Argumentation in Artificial Intelligence},
}
@INPROCEEDINGS{SCIOLETTE_2023_INPROCEEDINGS_SMG_452910,
AUTHOR = {Sciolette, F. and Marchi, S. and Giovannetti, E.},
TITLE = {Towards a New Computational Lexicon for Italian: building the morphological layer by harmonizing and merging existing resources},
YEAR = {2023},
ABSTRACT = {The present work illustrates the first steps towards the construction of a new computational lexicon for the Italian language. Following an analysis of existing lexical resources, it was decided to use LexicO as the reference base. In this first phase a resource of nearly 800,000 inflected forms was produced, accompanied by lemmas and morphological traits, obtained by integrating the available data in LexicO with those coming from two support sources: the tool MAGIC and a selection of Italian treebanks},
KEYWORDS = {computational lexicon, lexical resources, morphology, morphological harmonization},
PAGES = {5},
URL = {https://ceur-ws.org/Vol-3596/short20.pdf},
CONFERENCE_NAME = {9th Italian Conference on Computational Linguistics},
BOOKTITLE = {Proceedings of the 9th Italian Conference on Computational Linguistics},
EDITOR = {Boschetti, F. and Lebani, G. E. and Magnini, B. and Novielli, N.},
}
@INPROCEEDINGS{ZENZARO_2023_INPROCEEDINGS_Z_479566,
AUTHOR = {Zenzaro, S.},
TITLE = {On the role of models and modularity in the design and development of Digital Humanities tools},
YEAR = {2023},
ABSTRACT = {This article emphasizes the importance of defining models and building modular software for digital humanities tools. In particular, we address the availability of modular models for tools as a necessity to cope with the rapidly changing technological landscape that has produced a large set of short-lived tools. We propose an approach that aims to mitigate the effects of software obsolescence that leverages modular models},
KEYWORDS = {digital humanities, models, modularity, tools, obsolescence},
PAGES = {611--614},
URL = {https://ieeexplore.ieee.org/servlet/opac?punumber=10409867},
DOI = {10.1109/cist56084.2023.10409925},
ISBN = {978-1-6654-6133-7},
CONFERENCE_NAME = {7th IEEE Congress on Information Science and Technology (CiSt)},
BOOKTITLE = {2023 7th IEEE Congress on Information Science and Technology (CiSt)},
}
@INPROCEEDINGS{ZENZARO_2023_INPROCEEDINGS_ZDBR_463578,
AUTHOR = {Zenzaro, S. and Del Grosso, A. M. and Boschetti, F. and Ranocchia, G.},
TITLE = {Ease the collaboration making Scholarly Editions: the GreekSchools case study},
YEAR = {2023},
ABSTRACT = {CophiEditor is a Digital Scholarly Editing Web platform based on Domain Specific Languages (DSL-based DSE). We are developing this platform in the context of the GreekSchools-885222 ERC project in which it is being used for the constitutio textus of Philodemus of Gadara's Arrangement of the Philosophers. The digital papyrological edition of these texts is challenging in many ways, as most of the Herculaneum papyri are highly fragmentary because they are carbonized and damaged. One of the main goals of the CophiEditor is to provide a full-fledged collaborative environment in order to support the scholar's editorial work. In this poster we show how the progress of CophiEditor eases the collaboration between scholars and the role played by the Web Annotation Data Model (WADM) for data representation and interchange},
KEYWORDS = {Domain Specific Language, Computational Philology, Digital Philology, Web Annotation Data Model, DSE tools},
PAGES = {230--232},
URL = {http://www.aiucd2023.unisi.it/atti/},
PUBLISHER = {Alma Mater Studiorum-Università di Bologna (Bologna, ITA)},
ISBN = {978-88-942535-7-3},
CONFERENCE_NAME = {LA MEMORIA DIGITALE: XII CONVEGNO ANNUALE AIUCD},
CONFERENCE_PLACE = {Siena},
BOOKTITLE = {La memoria digitale: forme del testo e organizzazione della conoscenza. Atti del XII Convegno Annuale AIUCD},
EDITOR = {Carbé, E. and Lo Piccolo, G. and Valenti, A. and Stella, F.},
}
@INPROCEEDINGS{KHAN_2023_INPROCEEDINGS_KCCDFJ_475981,
AUTHOR = {Khan, A. F. A. and Cavallaro, M. and Cruz González, R. and Díaz Vera, J. and Frontini, F. and Minaya Gómez, F. J.},
TITLE = {Constructing an Old English WordNet: The Case of Guilt},
YEAR = {2023},
PAGES = {122--124},
URL = {https://iris.unive.it/retrieve/0f226d38-e332-418b-9b14-d5558d1a0d9d/AIUCD2023.pdf},
BOOKTITLE = {La Memoria Digitale. Forme Del Testo e Organizzazione Della Conoscenza. Atti Del XII Convegno Annuale AIUCD},
}
@INPROCEEDINGS{SICILIANO_2023_INPROCEEDINGS_SD_452907,
AUTHOR = {Siciliano, A. and Del Grosso, A. M.},
TITLE = {Giorgio Bassani's notes between tradition and innovation},
BOOKTITLE = {Digital Humanities 2023. Collaboration as Opportunity},
EDITOR = {Scholger, W. and Vogeler, G. and Tasovac, T. and Baillot, A. and Helling, P.},
CONFERENCE_NAME = {Digital Humanities 2023. Collaboration as Opportunity},
PUBLISHER = {ADHO},
YEAR = {2023},
DOI = {10.5281/zenodo.7961822},
URL = {https://doi.org/10.5281/zenodo.8107868},
KEYWORDS = {Digital Humanities, Digital Philology, Digital Scholarly Editions, Giorgio Bassani},
ABSTRACT = {This contribution illustrates the preliminary results of the project concerning Giorgio Bassani's personal library. The project provides both a printed traditional edition of the notes he wrote on his books and the development of a digital environment to browse and analyze them},
}
@TECHREPORT{ALBANESI_2023_TECHREPORT_ABGMPS_544724,
AUTHOR = {Albanesi, D. and Bellandi, A. and Giovannetti, E. and Marchi, S. and Papini, M. and Sciolette, F.},
TITLE = {Traduco: l'Applicazione Web Linguistico-Computazionale per il Progetto di Traduzione del Talmud Babilonese-Rapporto tecnico 24},
YEAR = {2023},
INSTITUTION = {CNR-ILC},
ABSTRACT = {La presente relazione tecnico-scientifica descrive l’attività svolta da CNR-ILC nel contesto del Progetto Traduzione Talmud Babilonese nel periodo luglio 2023-dicembre 2023. Le principali attività tecniche svolte sul sistema Traduco attualmente in produzione hanno riguardato l’aggiornamento di alcune funzionalità. Parallelamente, in continuità alle attività descritte nel documento di SAL precedente, è proseguito il lavoro di ricerca e sviluppo su due fronti: i) la realizzazione della nuova versione di Traduco, ii) l’ampliamento della risorsa lessicale per l’italiano contemporaneo a supporto della funzionalità di ricerca full-text sul testo del Talmud tradotto in italiano},
KEYWORDS = {Lessici elettronici, rappresentazione della conoscenza, Linguistica Computazionale, traduzione di testi religiosi, traduzione assistita dal calcolatore},
URL = {https://iris.cnr.it/handle/20.500.14243/544724},
}
@TECHREPORT{ALBANESI_2023_TECHREPORT_AGMPS_452915,
AUTHOR = {Albanesi, D. and Giovannetti, E. and Marchi, S. and Papini, M. and Sciolette, F.},
TITLE = {Traduco: l'Applicazione Web Linguistico-Computazionale per il Progetto di Traduzione del Talmud Babilonese-Rapporto tecnico 23},
YEAR = {2023},
INSTITUTION = {CNR-ILC},
ABSTRACT = {La presente relazione tecnico-scientifica descrive l'attività svolta da ILC-CNR nel contesto del Progetto Traduzione Talmud Babilonese nel periodo gennaio 2023-giugno 2023. Le principali attività tecniche svolte sul sistema Traduco attualmente in produzione sono state la risoluzione di bug e l'aggiornamento di alcune funzionalità. Parallelamente, è proseguito il lavoro di ricerca e sviluppo su due fronti: i) la realizzazione della nuova versione di Traduco, ii) l'ampliamento della risorsa lessicale per l'italiano contemporaneo a supporto della funzionalità di ricerca full-text sul testo del Talmud tradotto in italiano},
KEYWORDS = {Lessici elettronici, rappresentazione della conoscenza, Linguistica Computazionale, traduzione di testi religiosi, traduzione assistita dal calcolatore},
PAGES = {13},
URL = {https://iris.cnr.it/handle/20.500.14243/452915},
}
@TECHREPORT{CARNIANI_2023_TECHREPORT_CP_454363,
AUTHOR = {Carniani, E. and Papini, M.},
TITLE = {Maia: Una piattaforma aperta e collaborativa per la lessicografia elettronica, l'annotazione del testo e il linking testo-lessico-Consultazione e compilazione del lessico},
YEAR = {2023},
PAGES = {13},
URL = {https://iris.cnr.it/handle/20.500.14243/454363},
KEYWORDS = {Linguistica Computazionale, Lessici elettronici, Lexicon editor, Text annotation, Digital lexicography, text-lexical connection},
ABSTRACT = {La presente relazione tecnico-scientifica descrive l'attività svolta sull'interfaccia web Maia nel periodo marzo 2023-dicembre 2023. In particolare riportiamo le attività tecniche svolte sulla parte di creazione e manipolazione del lessico},
}
@TECHREPORT{CASTELLI_2023_TECHREPORT_CDCCCCDGLMPR_457314,
AUTHOR = {Castelli, D. and De Simone, G. and Cancedda, F. and Candela, L. and Colcelli, V. and Conte, R. and Di Donato, F. and Giannini, S. and Lazzeri, E. and Mangiaracina, S. and Puccinelli, R. and Ranchino, M.},
TITLE = {Roadmap Scienza Aperta},
YEAR = {2023},
INSTITUTION = {Consiglio Nazionale delle Ricerche},
ADDRESS = {Roma},
ABSTRACT = {La scienza aperta è un paradigma che influenza le pratiche di produzione e condivisione di conoscenza. Obiettivo di questa roadmap è delineare un percorso per la realizzazione e diffusione di pratiche e politiche di scienza aperta all'interno del Consiglio Nazionale delle Ricerche},
KEYWORDS = {Open Science, Open Access, Roadmap},
PAGES = {23},
URL = {https://publications.cnr.it/doc/482044},
PUBLISHER = {CNR (Roma, ITA)},
CONFERENCE_PLACE = {Roma},
}
@TECHREPORT{MALLIA_2023_TECHREPORT_M_524256,
AUTHOR = {Mallia, M.},
TITLE = {Epilexo stack: descrizione della struttura e personalizzazioni},
YEAR = {2023},
URL = {https://iris.cnr.it/handle/20.500.14243/524256},
KEYWORDS = {architettura software, docker stack, devops},
ABSTRACT = {Il documento descrive la piattaforma che ospita l’interfaccia “EpiLexO” dal punto di vista strutturale e sistemistico. Questo documento include informazioni su come effettuare personalizzazioni in base all’ambiente in cui viene sviluppato},
}
@TECHREPORT{MALLIA_2023_TECHREPORT_M_437138,
AUTHOR = {Mallia, M.},
TITLE = {Epilexo: uno strumento per la creazione, modifica e interlinking di lessici antichi},
YEAR = {2023},
ABSTRACT = {Il presente documento descrive lo sviluppo di "EpiLexo", una piattaforma web per la creazione, l'aggiornamento e la revisione di lessici elettronici collegati a materiali testuali e bibliografici, nonché a risorse lessicografiche esterne. L'applicazione è stata sviluppata nel contesto del progetto ItAnt ovvero "Lingue e culture dell'Italia antica: linguistica storica e modelli digitali" (finanziato dal MUR-PRIN 2017-2017XJLE8J). L'obiettivo è quello di creare uno strumento che possa migliorare la modifica dei lessici e il collegamento tra questi ultimi e le risorse epigrafiche. Il rapporto definisce l'architettura funzionale generale della soluzione che viene implementata all'interno del progetto},
KEYWORDS = {digital lexicography, digital humanities, linguistic linked open data},
URL = {https://doi.org/10.5281/zenodo.7736679},
DOI = {10.5281/zenodo.7736679},
}
@MISC{BARONI_2023_MISC_B_462402,
AUTHOR = {Baroni, P.},
TITLE = {CoPhiLab Web Site},
YEAR = {2023},
URL = {https://cophilab.ilc.cnr.it},
KEYWORDS = {Filologia Collaborativa, Filologia Cooperativa, Digital Humanities, Digital Scholarly Editing, risorse digitali, strumenti digitali, mondo mediterraneo antico, mondo mediterraneo medievale, mondo mediterraneo rinascimentale, greco, latino, arabo, ebraico, italiano, dialetti italiani, lingue minoritarie europee},
ABSTRACT = {Web site of CNR-ILC Laboratory "CoPhiLab-Laboratory of Collaborative and Cooperative Philology", powered by WordPress, developed in English},
}
@MISC{BARONI_2023_MISC_B_461442,
AUTHOR = {Baroni, P.},
TITLE = {PRIN-20204EJYRX CWALM: Project Web Site},
YEAR = {2023},
URL = {https://cwalm.ilc.cnr.it},
KEYWORDS = {lexical model, corpus, Contemporary Written Arabic},
ABSTRACT = {Web site of the project CWALM-A Lexical Corpus-based Model of Contemporary Written Arabic (PRIN 2020 Call | ERC Fields SH4 and PE6 | Prot. No. 20204EJYRX), powered by WordPress, developed in English},
}
@MISC{CARLINO_2023_MISC_C_462407,
AUTHOR = {Carlino, M.},
TITLE = {Sito web www.ilc.cnr.it},
YEAR = {2023},
ABSTRACT = {Design of the structure, implementation with the WordPress CMS and updating of the contents of the institutional site of the Cnr-Istituto di Linguistica Computazionale "Antonio Zampolli" (CNR-ILC): https://www.ilc.cnr.it Bilingual site (Italian and English)},
KEYWORDS = {website, dissemination, sito web},
URL = {https://www.ilc.cnr.it},
}
@MISC{CASTELLI_2023_MISC_CCDGLLR_519138,
AUTHOR = {Castelli, D. and Cimino, R. and Di Donato, F. and Gatt, L. and Lavitrano, M. and Lazzeri, E. and Rossi, G.},
TITLE = {Piano Nazionale della Scienza Aperta: ruolo ed azioni prioritarie},
YEAR = {2023},
URL = {https://iris.cnr.it/handle/20.500.14243/519138},
KEYWORDS = {scienza aperta, Piano nazionale scienza aperta},
ABSTRACT = {La Scienza Aperta definisce la nuova normalità nella collaborazione e comunicazione scientifica. Questa si basa sulla condivisione dei prodotti della ricerca e sulla rimozione delle barriere alla loro diffusione, verifica e riproduzione, alla attribuzione dei meriti effettivi ed al controllo di qualità e di efficacia degli investimenti in ricerca. Il Piano Nazionale per la Scienza Aperta (PNSA) del 2022 imposta gli obiettivi per implementare uno scenario in cui la nuova normalità si possa affermare in linea con gli sviluppi della scienza aperta a livello europeo e dello European Open Science Cloud (EOSC). Questo documento inquadra il PNSA nell’ambito nazionale ed europeo, evidenziando gli effetti della sua implementazione nel contesto della ricerca e dell’innovazione nazionale. Esso inoltre introduce un primo insieme di azioni prioritarie per la sua attuazione identificate dal Tavolo di Lavoro istituito dalla Direzione generale dell’internazionalizzazione e della comunicazione del MUR},
}
@MISC{FRONTINI_2023_MISC_F_456225,
AUTHOR = {Frontini, F.},
TITLE = {Words and the Company they Keep: Digital corpora and infrastructures for the foreign language classroom},
CONFERENCE_NAME = {Didattica della lingua, della cultura e cittadinanza attiva: sfide educative contemporanee-Seminari LEND Modena},
YEAR = {2023},
URL = {https://iris.cnr.it/handle/20.500.14243/456225},
KEYWORDS = {corpora, didattica L2, tecnologie del linguaggio},
ABSTRACT = {We give an overview of corpora \& language technologies and their use in foreign language teaching},
}
@MISC{GIOVANNETTI_2023_MISC_GABCGMPS_452912,
AUTHOR = {Giovannetti, E. and Albanesi, D. and Bellandi, A. and Carniani, E. and Guidi, L. and Marchi, S. and Papini, M. and Sciolette, F.},
TITLE = {Maia},
YEAR = {2023},
URL = {https://github.com/klab-ilc-cnr/Maia},
KEYWORDS = {maia, linked open data, e-lexicography, text annotation, lexical linking, collaborative tools},
ABSTRACT = {Maia is an open and collaborative web tool based on semantic web and linked open data technologies for text annotation, e-lexicography, and lexical linking},
}
@MISC{GUADAGNINI_2023_MISC_G_454367,
AUTHOR = {Guadagnini, E.},
TITLE = {[recensione] Toscana bilingue (1260 ca.-1430 ca.). Per una storia sociale del tradurre medievale},
YEAR = {2023},
KEYWORDS = {Volgarizzamenti, Traduttologia, Storia medievale},
PAGES = {239--243},
URL = {https://iris.cnr.it/handle/20.500.14243/454367},
VOLUME = {87},
ISSN = {0035-1458},
}
@MISC{MALLIA_2023_MISC_MQ_545243,
AUTHOR = {Mallia, M. and Quochi, V.},
TITLE = {EpiLexO},
YEAR = {2023},
ABSTRACT = {EpiLexO is a user friendly web application for the creation and editing of an integrated system of language resources for ancient fragmentary languages centered on the lexicon, in compliance with current digital humanities and Linked Open Data principles. EpiLexo allows for the editing of lexica with all relevant cross-references: for their linking to their testimonies, as well as to bibliographic information and other (external) resources and common vocabularies. This front-end application rests on a Service-Oriented Architecture with two main back-end components, the LexO-server (handle) and the CASH-server (1github), which manage lexica and textual documents respectively via Rest-ful APIs web-services, plus additional services for the management of other aspects such as access and authentication, XML rendering, etc. All code is available on https://github.com/DigItAnt/. The application has been developed in the context of a project on the languages of fragmentary attestation of ancient Italy, but can be applied to other similar contexts},
KEYWORDS = {Historical linguistics, Digital epigraphy, Linguistic Open Linked Data, Web GUI application, Lexicon Editor},
URL = {https://github.com/DigItAnt/LexO-angular-dev},
}
@MISC{MAZZAGUFO_2023_MISC_MSGS_525144,
AUTHOR = {Mazzagufo, L. and Sichera, P. and Del Grosso, A. M. and Spampinato, D.},
TITLE = {Bellini Digital Correspondence meets MEI},
YEAR = {2023},
ABSTRACT = {In this contribution, we show some features of the BDC digital scholarly edition along with some strategies implemented to automate, wherever possible, the process of textual encoding, analysis and normalisation, as well as some perspectives on the work in progress concerning the encoding of epistolary-related music materials in MEI. Paper presented at the joint MEC TEI conference 2023. "Encoding Cultures" September 4-8, 2023 | Paderborn, Germany},
KEYWORDS = {Bellini Digital Correspondence, Vincenzo Bellini, TEI-MEI, Digital scholarly edition, multimedia museum},
URL = {https://iris.cnr.it/handle/20.500.14243/525144},
DOI = {10.5281/zenodo.8335048},
CONFERENCE_NAME = {“Encoding Cultures”, the 2023 joint MEC and TEI conference},
}
@MISC{PAPINI_2023_MISC_P_453900,
AUTHOR = {Papini, M.},
TITLE = {Maia: Una piattaforma aperta e collaborativa per la lessicografia elettronica, l'annotazione del testo e il linking testo-lessico-Gestione del corpus e annotazione del testo},
YEAR = {2023},
ABSTRACT = {La presente relazione tecnico-scientifica descrive l'attività svolta sull'interfaccia web Maia nel periodo marzo 2023-dicembre 2023. In particolare riportiamo le attività tecniche svolte sulla parte di manipolazione del Corpus e annotazione del testo},
KEYWORDS = {Linguistica Computazionale, Lessici elettronici, Lexicon editor, Text annotation, Digital lexicography, text-lexical connection},
}
@MISC{PAPINI_2023_MISC_P_453898,
AUTHOR = {Papini, M.},
TITLE = {Maia: Una piattaforma aperta e collaborativa per la lessicografia elettronica, l'annotazione del testo e il linking testo-lessico-Autenticazione e gestione utenti},
YEAR = {2023},
ABSTRACT = {La presente relazione tecnico-scientifica descrive l'attività svolta sull'interfaccia web Maia nel periodo marzo 2023-dicembre 2023. In particolare riportiamo le attività tecniche svolte sulla parte di autenticazione e gestione utenti},
KEYWORDS = {Linguistica Computazionale, Lessici elettronici, Lexicon editor, Text annotation, Digital lexicography, text-lexical connection},
PAGES = {7},
}
@MISC{PROVOST_2023_MISC_P_475287,
AUTHOR = {Provost, L. M.},
TITLE = {[FOSSR Training] Managing data within the social science infrastructures: the role of FOSSR. Module 1 Research Data and Open Science},
YEAR = {2023},
ABSTRACT = {Module 1 of the course on Research Data and Open Science for the FOSSR online training Managing data within the social science infrastructure: the role of FOSSR, held on 6 November 2023},
KEYWORDS = {Open Science, Training, Research Data Management},
URL = {https://zenodo.org/records/10074214},
DOI = {10.5281/ZENODO.10074214},
}
@MISC{PROVOST_2023_MISC_PM_475263,
AUTHOR = {Provost, L. and Mihalenas, V.},
TITLE = {GraspOS Poster},
YEAR = {2023},
ABSTRACT = {GraspOS is a Horizon Europe research project focused on creating an open research assessment dataspace. This poster presents the aims, outcomes, methodology and pilot studies of the project},
KEYWORDS = {GraspOS, Horizon Europe, EOSC},
URL = {https://zenodo.org/records/8075017},
DOI = {10.5281/ZENODO.8075017},
}
@MISC{SALVATORI_2023_MISC_SDKC_504961,
AUTHOR = {Salvatori, E. and Del Grosso, A. M. and Kortobi, N. and Cardamone, R.},
TITLE = {Statuti di Monterosso. Edizione digitale},
YEAR = {2023},
ABSTRACT = {Edizione critica digitale con traduzione in italiano degli Statuti di Monterosso degli inizi del XV secolo conservati in un manoscritto cartaceo dell’età moderna. Il progetto è nato dalla collaborazione tra il LabCD (Laboratorio di Cultura Digitale, centro interdipartimentale dell’Università di Pisa) e il comune di Monterosso a Mare (SP), finalizzata alla realizzazione di progetti, tesi di laurea triennale e magistrale e ricerche volti alla pubblicazione e valorizzazione dei beni documentali e storico/architettonici del CMM e della diffusione della “conoscenza storica”. L’edizione ha l’obiettivo di rappresentare correttamente il primo testo normativo di quella comunità nel modo più corretto, efficace e fruibile possibile},
KEYWORDS = {Digital Humanities, Digital Scholarly Editions, Edizione Scientifica Digitale},
URL = {https://iris.cnr.it/handle/20.500.14243/504961},
ISBN = {9788894443059},
}
@MISC{SICHERA_2023_MISC_SSDC_530821,
AUTHOR = {Sichera, P. and Spampinato, D. and Del Grosso, A. M. and Cristofaro, S.},
TITLE = {ZoneRW: v0.5-beta (7th IEEE CiSt'23)},
YEAR = {2023},
ABSTRACT = {ZoneRW is a WYSIWYG tool that, starting from the declaration of the surfaces with the relative graphic and zone tags, shows the zones encoded in the TEI file with the relative xml:id attributes, allowing them to be modified on the fly (updating the coordinates, adding or removing zone) generating the relative TEI code. The result on the screen can be exported to images. Environment ZoneRW is developed using 4th Dimension. Among the many features of the 4D platform, the native XML support with the Apache Foundation's Xerces library, the access to the structure through the DOM (Document Object Model) standard, the management of the SVG (Scalable Vector Graphics) format, both as visualization that creation and modification. Installation on Windows download the Windows folder, unzip the archive you downloaded and run ZoneRW.exe; on MacOSX download the MacOSX folder and unzip the compressed archive contained in "Installer 4D". Install 4D.18.6. Once 4D is installed, use the 4D application to open ZoneRW (probably located in /Applications/4D v18.6/ folder); open the 4D.app file; then choose "File-\textgreater{} Open-\textgreater{} Local application-\textgreater{} " and open the ZoneRW.4dbase package you downloaded. XML-TEI specifications In the start window, click on the "XML folder" space to select the folder containing the XML files, and on the "Picture folder" space to select the folder containing the images. The chosen settings will be stored for subsequent program starts. After clicking on "Start", ZoneRW shows the list of files from the folder set at startup. When the user chooses a file, ZoneRW shows the images recalled in the file. Once an image has been chosen, ZoneRW loads it from the folder set for image search. 
ZoneRW searches for the image: in the folder set at startup; in a subfolder having the same name as the image file; in a subfolder having the same name as the XML file without the extension; in a subfolder having the same name as the XML file without the extension by replacing the ". " with the "_" character. If the image has been found, ZoneRW looks for the tag related to the chosen page; intercepted the element, ZoneRW searches among the children the tag to find the corresponding image (@url attribute); the declared size (@width attribute), in order to calculate a possible scale ratio between image and coordinates; all tags (even nested) to draw the zones on the screen. The list of zones is populated with the values of the attributes @xml: id, @rendition, and the coordinates with @points, @ulx, @uly, @lrx and @lry. The relative id is shown in the upper left corner of each area. Functionality How to use the ZoneRW main window. The "Aggiungi zona" and "Elimina zona" buttons respectively add or delete a zone. The "Genera TEI" button inserts the text containing the zones in XML-TEI format on the clipboard. The "Export image" button exports a file with the image shown. It is possible to modify the zone data manually by entering the coordinates. When the cursor is in the zone list, you can move between the lines with the up/down arrow keys. When the cursor is in the ulx or uly columns, clicking on the image, the coordinates of the point at the top left are automatically updated based on the click. Same thing when the cursor is on lrx and lry. The "Edit" check box hides the lists of documents and images in order to avoid changing pages when editing zones. When clicking on the image in order to update one of the ulx, uly, lrx or lry coordinates, the cursor remains in the coordinate field. By activating the "Click \& validate" check box, the cursor automatically moves to the next coordinate or creates a new zone if necessary. 
When the cursor is in the points column, each click generates a new vertex for the irregular polygon defined by the points in the points field. Area currently being edited is colored yellow Areas defined as coordinates of a rectangle are colored red. Areas defined as coordinates of a polygon are colored purple. A horizontal thermometer allows you to change the zoom level of the image. It is possible to export zones in XML-TEI text. It is possible to export zones in images. Usage tips The use of the "Click \& validate" check box is very useful when entering zones. For fine correction operations it is more useful to keep the check box deactivated so that you can click several times on the same coordinate until you find the correct position. Clicking on the image scroll bar is a click, so if the cursor is on ulx, uly, lrx, lry or points the click will be intercepted as a new coordinate. Then to scroll, go to one of the other elements of the zone list or use the mouse/trackpad scroll function},
KEYWORDS = {4D, Bellini Digital Correspondence, XML parser, XPath, ROI, Region of Interest},
URL = {https://github.com/pierpaolosichera/ZoneRW},
DOI = {10.5281/zenodo.5599509},
}
@ARTICLE{ACHENBACH_2022_ARTICLE_ABDDDFKV_431678,
AUTHOR = {Achenbach, K. and Błaszczyńska, M. and De Paoli, S. and Di Donato, F. and Dumouchel, S. and Forbes, P. and Kraker, P. and Vignoli, M.},
TITLE = {Defining discovery: Is Google Scholar a discovery platform? An essay on the need for a new approach to scholarly discovery},
YEAR = {2022},
ABSTRACT = {This essay discusses the concept of discovery, intended as content discovery, and defines it in the new context of Open Science, with a focus on Social Sciences and Humanities (SSH). Starting from the example of Google Scholar, the authors argue that this well-established service does not address the current needs, practices, and variety of discovery. Alternatives in terms of technical choices, features, and governance, do however exist, offering richer and more open discovery. The paper presents, in particular, the implementations and research work of the H2020 project TRIPLE (Transforming Research through Innovative Practices for Linked Interdisciplinary Exploration). Dedicated to the building of a discovery platform for the SSH, the project is meant to address the specificities and evolution of discovery in this field. Prevailing scholarly resource platforms like Google Scholar limit discovery by focussing only on publications, and favouring through their algorithm well-cited papers, English content, and discipline-specific resources. A limitation in the context of cross-disciplinary and collaborative Open Science, such a service more specifically hinders discovery in the SSH. Characterized by a fragmented landscape, a variety of languages, data types, and outputs, research in the SSH requires services that fully exploit discovery potentialities. Moreover, a survey conducted within the TRIPLE project showed that most SSH researchers use Google Scholar as their starting point, and that they recognise the lack of control they have with this system. Beyond the extension of features and content, transparency is the other important criterion for the building of an open infrastructure serving the research community. 
In light of this, we present the GoTriple platform, which exploits today's technological potential and incorporates the best known functionalities, in order to unveil more and innovative scholarly outputs and lead to international and interdisciplinary research project collaborations},
KEYWORDS = {GoTRIPLE, discovery, TRIPLE},
URL = {https://open-research-europe.ec.europa.eu/articles/2-28/v1},
DOI = {10.12688/openreseurope.14318.1},
ISSN = {2732-5121},
JOURNAL = {OPEN RESEARCH EUROPE},
}
@ARTICLE{ACHENBACH_2022_ARTICLE_ABDDDFKV_530149,
AUTHOR = {Achenbach, K. and Błaszczyńska, M. and De Paoli, S. and Di Donato, F. and Dumouchel, S. and Forbes, P. and Kraker, P. and Vignoli, M.},
TITLE = {Defining discovery: Is Google Scholar a discovery platform? An essay on the need for a new approach to scholarly discovery},
YEAR = {2022},
ABSTRACT = {This essay discusses the concept of discovery, intended as content discovery, and defines it in the new context of Open Science, with a focus on Social Sciences and Humanities (SSH). Starting from the example of Google Scholar, the authors show that this well established service does not address the current needs, practices, and variety of discovery. Alternatives in terms of technical choices, features, and governance, do however exist, offering richer and more open discovery. The paper presents in particular the implementations and research work of the H2020 project TRIPLE (Transforming Research through Innovative Practices for Linked Interdisciplinary Exploration). Dedicated to the building of a discovery platform for the SSH, the project is meant to address the specificities and evolution of discovery in this field. Prevailing scholarly resource platforms like Google Scholar limit discovery by focussing only on publications, and favouring through their algorithm well-cited papers, English content, and discipline-specific resources. A limitation in the context of cross-disciplinary and collaborative Open Science, such a service more specifically hinders discovery in the SSH. Characterized by a fragmented landscape, a variety of languages, data types, and outputs, research in the SSH requires services that fully exploit discovery potentialities. Moreover, a survey conducted within the TRIPLE project showed that most SSH researchers use Google Scholar as their starting point, and that they recognise the lack of control they have with this system},
KEYWORDS = {Open Science, Content discovery, Information seeking, Social Sciences, Humanities, Infrastructure, Search engines, Multilingualism},
PAGES = {1--22},
URL = {https://open-research-europe.ec.europa.eu/articles/2-28},
DOI = {10.12688/openreseurope.14318.2},
ISSN = {2732-5121},
JOURNAL = {OPEN RESEARCH EUROPE},
}
@ARTICLE{ANGELIS_2022_ARTICLE_AVTSGPCM_437313,
AUTHOR = {Angelis, D. and Vacca, F. and Tofanicchio, V. and Strimpakos, J. and Giacovazzo, G. and Pavone, G. and Coccurello, F. and Marinelli, R.},
TITLE = {Sex Differences in Neuropathy: The Paradigmatic Case of MetFormin},
YEAR = {2022},
ABSTRACT = {As a widely prescribed anti-diabetic drug, metformin has been receiving novel attention for its analgesic potential. In the study of the complex etiology of neuropathic pain (NeP), male and female individuals exhibit quite different responses characterized by higher pain sensitivity and greater NeP incidence in women. This "gender gap" in our knowledge of sex differences in pain processing strongly limits the sex-oriented treatment of patients suffering from NeP. Besides, the current investigation of the analgesic potential of metformin has not addressed the "gender gap" problem. Hence, this study focuses on metformin and sex-dependent analgesia in a murine model of NeP induced by chronic constriction injury of the sciatic nerve. We investigated sexual dimorphism in signaling pathways involved by 7 days of metformin administration, such as changes in AMP-activated protein kinase and the positive regulation of autophagy machinery, discovering that metformin affected in a sexually dimorphic manner the immunological and inflammatory response to nerve lesion. These effects were complemented by morphological and adaptive changes occurring after peripheral nerve injury. Altogether these data can contribute to explaining a number of potential mechanisms responsible for the complete recovery from NeP found in male mice, as opposed to the failure of long-lasting recovery in female animals. © 2022 by the authors},
KEYWORDS = {allodynia, AMPK, autophagy, leptin, macrophage, metformin, neurofilament, neuropathic pain, sex difference, TNFα},
PAGES = {22},
URL = {https://www.mdpi.com/1422-0067/23/23/14503},
VOLUME = {23},
NUMBER = {23},
DOI = {10.3390/ijms232314503},
ISSN = {1422-0067},
JOURNAL = {INTERNATIONAL JOURNAL OF MOLECULAR SCIENCES (ONLINE)},
}
@ARTICLE{ARMASELU_2022_ARTICLE_AAKLMTUVV_444088,
AUTHOR = {Armaselu, F. and Apostol, E. S. and Khan, A. F. A. and Liebeskind, C. and McGillivray, B. and Truică, C. O. and Utka, A. and Valunaite Oleskeviciene, G. and Van Erp, M.},
TITLE = {LL(O)D and NLP perspectives on semantic change for humanities research},
YEAR = {2022},
ABSTRACT = {This paper presents an overview of the LL(O)D and NLP methods, tools and data for detecting and representing semantic change, with its main application in humanities research. The paper's aim is to provide the starting point for the construction of a workflow and set of multilingual diachronic ontologies within the humanities use case of the COST Action Nexus Linguarum, European network for Web-centred linguistic data science, CA18209. The survey focuses on the essential aspects needed to understand the current trends and to build applications in this area of study},
KEYWORDS = {Linguistic linked open data, natural language processing, semantic change, ontologies, humanities},
URL = {https://iris.cnr.it/handle/20.500.14243/444088},
DOI = {10.3233/SW-222848},
ISSN = {2210-4968},
JOURNAL = {SEMANTIC WEB (ONLINE)},
}
@ARTICLE{BACCO_2022_ARTICLE_BRADVVDMPD_446362,
AUTHOR = {Bacco, L. and Russo, F. and Ambrosio, L. and D'Antoni, F. and Vollero, L. and Vadala, G. and Dell'Orletta, F. and Merone, M. and Papalia, R. and Denaro, V.},
TITLE = {Natural language processing in low back pain and spine diseases: A systematic review},
YEAR = {2022},
ABSTRACT = {Natural Language Processing (NLP) is a discipline at the intersection between Computer Science (CS), Artificial Intelligence (AI), and Linguistics that leverages unstructured human-interpretable (natural) language text. In recent years, it gained momentum also in health-related applications and research. Although preliminary, studies concerning Low Back Pain (LBP) and other related spine disorders with relevant applications of NLP methodologies have been reported in the literature over the last few years. It motivated us to systematically review the literature comprised of two major public databases, PubMed and Scopus. To do so, we first formulated our research question following the PICO guidelines. Then, we followed a PRISMA-like protocol by performing a search query including terminologies of both technical (e. g., natural language and computational linguistics) and clinical (e. g., lumbar and spine surgery) domains. We collected 221 non-duplicated studies, 16 of which were eligible for our analysis. In this work, we present these studies divided into sub-categories, from both tasks and exploited models' points of view. Furthermore, we report a detailed description of techniques used to extract and process textual features and the several evaluation metrics used to assess the performance of the NLP models. However, what is clear from our analysis is that additional studies on larger datasets are needed to better define the role of NLP in the care of patients with spinal disorders},
KEYWORDS = {natural language processing, Low Back Pain, Survey},
URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-85135163810\&origin=inward},
VOLUME = {9},
DOI = {10.3389/fsurg.2022.957085},
ISSN = {2296-875X},
JOURNAL = {FRONTIERS IN SURGERY},
}
@ARTICLE{BELLANDI_2022_ARTICLE_B_505727,
AUTHOR = {Bellandi, A.},
TITLE = {Le Risorse Linguistiche nell’era del Web Semantico},
YEAR = {2022},
ABSTRACT = {The application of digital technologies in lexicography and terminology is becoming increasingly pervasive. The Semantic Web offers a great potential for representing data in order to process it, understand its meaning, and share it across different scientific communities. In this area scientific communities defined computational models for the representation of linguistic data together with best practices for their use. However, applications for managing this data in the context of the Semantic Web, are a few. This paper fills this gap by presenting a set of web services that are general enough to be used as a basis for the development of task-oriented lexicography and terminology applications, such as editing, data visualization, querying, and using for linguistic/conceptual full-text searches. The final part of the contribution will describe some use cases of the presented services},
KEYWORDS = {Semantic Web, Lexicography, Terminology, OntoLex-Lemon},
PAGES = {31--50},
URL = {https://iris.cnr.it/handle/20.500.14243/505727},
VOLUME = {(1-2)},
ISSN = {1594-2201},
JOURNAL = {AIDA INFORMAZIONI (ONLINE)},
}
@ARTICLE{BIFFI_2022_ARTICLE_BDFGMS_458632,
AUTHOR = {Biffi, M. and De Blasi, F. and Favaro, M. and Guadagnini, E. and Montemagni, S. and Sassolini, E.},
TITLE = {Parole in rete / reti di parole. Possibili impieghi didattici dei grandi vocabolari storici digitalizzati},
YEAR = {2022},
ABSTRACT = {After a brief presentation of the great historical dictionaries of Italian, which are free to use online thanks to the digitalisation work carried out by the Accademia della Crusca, the contribution offers a number of examples of how these tools can be used for educational purposes. Finally, further didactic uses are described, which will be made possible thanks to the advanced digital tools that the Accademia della Crusca and the Istituto di Linguistica Computazionale "Antonio Zampolli" del Consiglio Nazionale delle Ricerche (ILC) are currently working on},
KEYWORDS = {Lessicografia italiana, Didattica dell'italiano, Lessicografia digitale},
PAGES = {143--188},
URL = {https://italianoascuola.unibo.it/article/view/14866},
VOLUME = {4},
DOI = {10.6092/issn.2704-8128/14866},
ISSN = {2704-8128},
JOURNAL = {ITALIANO A SCUOLA},
}
@ARTICLE{BIFFI_2022_ARTICLE_BG_413333,
AUTHOR = {Biffi, M. and Guadagnini, E.},
TITLE = {«Le citazioni riconducono il dizionario nell'ambito della letteratura e della vita»: un primo sguardo d'insieme sui citati del GDLI},
YEAR = {2022},
ABSTRACT = {During the refinement of the computerised version of the Grande dizionario della lingua italiana, carried out by the Accademia della Crusca in collaboration with the Istituto di linguistica computazionale (CNR-Pisa), the Index of cited authors was fully corrected and digitally acquired. The contribution presents some data, now available for the first time thanks to the conversion into electronic format of the vocabulary and its bibliography, useful for closer study of the sources used in Battaglia. The examples cited in the entries represent, as is well known, the heart of the GDLI and at the same time one of the most intensely discussed aspects by scholars. The perception that we have and have had of this aspect of the dictionary, however, does not always correspond to the actual data. Given the size of the corpus of the entries, only the overall view made possible by digital interrogation allows an objective assessment},
KEYWORDS = {Lessicografia italiana, Storia della lingua italiana},
PAGES = {351--386},
URL = {https://accademiadellacrusca.it/it/riviste/articoli/slei-xxxix-2022/7599},
VOLUME = {XXXIX},
ISSN = {0392-5218},
JOURNAL = {STUDI DI LESSICOGRAFIA ITALIANA},
}
@ARTICLE{BRANCATO_2022_ARTICLE_BB_430687,
AUTHOR = {Brancato, D. and Burgassi, C.},
TITLE = {IL DE' BENIFIZII DI BENEDETTO VARCHI. VERSO L'EDIZIONE},
YEAR = {2022},
ABSTRACT = {This article examines the main linguistic features in Benedetto Varchi's translation of Seneca's De beneficiis (Florence, Torrentino, 1554) in preparation for a critical edition of the text. It provides the essential information about the cultural context of the work, including its origins, sources, as well as the specific linguistic features of the target text, in particular the translator's programmatic claims and strategies. The analysis uncovers new cultural and linguistic aspects that were hitherto unknown, such as the connection between Varchi and the viceroyal family of Pedro de Toledo in Naples, the relationship between source and target texts (with emphasis to the editions of Seneca's Opera omnia edited by Erasmus), and the translation techniques that reveal Varchi's sustained use of lexical (idioms in particular) and syntactic traits of spoken Florentine (fiorentino vivo)},
KEYWORDS = {Benedetto Varchi, Seneca, Traduzione, De beneficiis},
PAGES = {208--236},
URL = {https://iris.cnr.it/handle/20.500.14243/430687},
VOLUME = {48},
NUMBER = {2},
DOI = {10.61001/108416},
ISSN = {0394-3569},
JOURNAL = {STUDI LINGUISTICI ITALIANI},
}
@ARTICLE{BRUNATO_2022_ARTICLE_BDV_440157,
AUTHOR = {Brunato, D. and Dell'Orletta, F. and Venturi, G.},
TITLE = {Linguistically-Based Comparison of Different Approaches to Building Corpora for Text Simplification: A Case Study on Italian},
YEAR = {2022},
ABSTRACT = {In this paper, we present an overview of existing parallel corpora for Automatic Text Simplification (ATS) in different languages focusing on the approach adopted for their construction. We make the main distinction between manual and (semi)-automatic approaches in order to investigate in which respect complex and simple texts vary and whether and how the observed modifications may depend on the underlying approach. To this end, we perform a two-level comparison on Italian corpora, since this is the only language, with the exception of English, for which there are large parallel resources derived through the two approaches considered. The first level of comparison accounts for the main types of sentence transformations occurring in the simplification process, the second one examines the results of a linguistic profiling analysis based on Natural Language Processing techniques and carried out on the original and the simple version of the same texts. For both levels of analysis, we chose to focus our discussion mostly on sentence transformations and linguistic characteristics that pertain to the morpho-syntactic and syntactic structure of the sentence},
KEYWORDS = {linguistic complexity, corpus construction, text simplification},
PAGES = {1--19},
URL = {https://www.frontiersin.org/articles/10.3389/fpsyg.2022.707630/full},
VOLUME = {13},
DOI = {10.3389/fpsyg.2022.707630},
ISSN = {1664-1078},
JOURNAL = {FRONTIERS IN PSYCHOLOGY},
}
@ARTICLE{BRUNATO_2022_ARTICLE_BMD_414977,
AUTHOR = {Brunato, D. and Mattei, A. and Dell'Orletta, F.},
TITLE = {Analisi della scrittura giovanile da una prospettiva linguistico-computazionale: il caso di studio della Fanfiction},
YEAR = {2022},
ABSTRACT = {This paper presents a study aimed at characterizing the linguistic style of an emerging literary genre of the web, particularly appreciated by teens and young adults: fanfiction. By relying on Natural Language Processing approaches, and in particular on the methodology of linguistic profiling applied to a novel corpus of Italian fanfiction stories inspired by the fantasy saga "Harry Potter", we investigate the relationship between linguistic style and 'success', measured in terms of number of reviews obtained by the readers. We show that it is possible to detect a set of features, among a wide set of linguistic ones modeling lexical, morpho-syntactic and syntactic phenomena, which help more in discriminating between 'successful' and 'unsuccessful' fanfics},
KEYWORDS = {stilometria computazionale, linguistic profiling, fanfiction},
PAGES = {171--189},
URL = {https://iris.cnr.it/handle/20.500.14243/414977},
VOLUME = {2021/3},
ISSN = {0033-9725},
JOURNAL = {RASSEGNA ITALIANA DI LINGUISTICA APPLICATA},
}
@ARTICLE{BRUNATO_2022_ARTICLE_BV_420475,
AUTHOR = {Brunato, D. and Venturi, G.},
TITLE = {Why is this language complex? Cherry-pick the optimal set of features in multilingual treebanks},
YEAR = {2022},
ABSTRACT = {This paper investigates linguistic complexity across natural languages from a corpus-based perspective and relies on the assumptions of linguistic profiling as a methodological framework. We focus in particular on the domain of syntactic complexity and analyze the distribution of a set of features taken as proxies of complexity phenomena at the sentence level, which were extracted from 63 treebanks annotated according to the Universal Dependencies formalism. This dataset guarantees that the features considered are modeling the same linguistic phenomena in different treebanks, allowing reliable comparison among languages. We show that our approach is able to identify tendencies of structural proximity between languages not necessarily in line with typologically-supported classification, thus shedding light on new corpus-based findings},
KEYWORDS = {Linguistic Complexity, Linguistic Profiling, Universal Dependencies},
PAGES = {59--72},
URL = {https://www.degruyter.com/document/doi/10.1515/lingvan-2021-0017/html},
DOI = {10.1515/lingvan-2021-0017},
ISSN = {2199-174X},
JOURNAL = {LINGUISTICS VANGUARD},
}
@ARTICLE{CARRARI_2022_ARTICLE_CABDFFGGMMMPRSB_516090,
AUTHOR = {Carrari, E. and Aglietti, C. and Bellandi, A. and Dibari, C. and Ferrini, F. and Fineschi, S. and Galeotti, P. and Giuntoli, A. and Manganelli Del Fa, R. and Moriondo, M. and Mozzo, M. and Padovan, G. and Riminesi, C. and Selvi, F. and Bindi, M.},
TITLE = {The management of plants and their impact on monuments in historic gardens: Current threats and solutions},
YEAR = {2022},
ABSTRACT = {The conservation of historic gardens is crucial for safeguarding monumental, aesthetic, historical, ecological and economic values in many countries of the World, as well as associated services, such as carbon stock, microclimate and water regulation, biodiversity conservation, pollution removal, and recreation. In historic gardens, architectural and sculpture elements coexist with an abundant plant component, which is currently often precarious due to senescence processes occurring nowadays. Unhealthy plants and reduced structural stability of trees represent a threat for both garden artistic structures and buildings, as well for the visitors’ safety. Awareness in garden managers about the most relevant and current threats is necessary for garden conservation. This review, through a global survey of the literature since 1990, addresses two main questions (1) which are the most relevant threats on historic gardens vegetation as affected by environmental, biological and anthropogenic causes, and how do they impact on monuments? (2) Which are related strategies to counteract these threats? Regarding the whole analysed period, the impact of the biotic component on monuments was the most discussed threat; in recent years a growing concern on the effects of climate change and pathogens and pests on historic garden plants also emerged. Strategies to address current and future challenges of historic gardens are hereby identified from experiences reported in worldwide literature and discussed. Best practices are collected in tables to provide managers of historic gardens with a valuable tool and guide to conserve and enhance their value. Due to the heterogeneity of the threats to be addressed, a multidisciplinary approach to ensure the conservation of historic gardens is recommended},
KEYWORDS = {Heritage gardens, Biodeterioration, Climate change, Veteran tree management, Phytosanitary control, Alien species},
PAGES = {127727-1-127727-15},
URL = {https://www.sciencedirect.com/science/article/abs/pii/S1618866722002709},
VOLUME = {76},
DOI = {10.1016/j.ufug.2022.127727},
ISSN = {1618-8667},
JOURNAL = {URBAN FORESTRY \& URBAN GREENING},
}
@ARTICLE{DELFANTE_2022_ARTICLE_D_448012,
AUTHOR = {Del Fante, D.},
TITLE = {Metaphors and pandemics: Spanish Flu and Coronavirus in US newspapers. A case-study},
YEAR = {2022},
ABSTRACT = {Der internationale Ausbruch des Coronavirus hat unser Leben radikal verändert und die Stabilität unserer heutigen Gesellschaften in Frage gestellt. Es ist jedoch nicht das erste Mal, dass die Menschheit mit einer globalen Pandemie konfrontiert ist. Die Spanische Grippe von 1918 führte zu einer der tödlichsten Pandemien aller Zeiten. Bei der Frage, wie wir über Gesundheit und Krankheit denken und sprechen, spielen Metaphern eine bedeutende Rolle. Wenn man versteht, wie das Coronavirus und die Spanische Grippe im Zeitungsdiskurs metaphorisch dargestellt werden, ist es einfacher, den sprachlichen Prozess zu beleuchten, durch den Metaphern wirken, und zu verstehen, inwieweit sozio-historisch-kulturelle Bedingungen die Aktualisierung einer Metapher beeinflussen können. Die Arbeit zeigt, dass Metaphern in beiden Zeitkontexten durchgängig vorhanden sind und das Coronavirus und die Spanische Grippe in ähnlicher Weise metaphorisch dargestellt werden. Dies könnte darauf hindeuten, dass es eine Pandemie-Rhetorik gibt, die über den spezifischen soziokulturellen und politischen Kontext hinausgeht: eine Reaktion auf eine Bedrohung in Form einer Pandemie, die tief mit der menschlichen Natur verbunden ist},
KEYWORDS = {conceptual metaphor, corpus assisted discourse studies, health communication, corpus linguistics},
PAGES = {143--184},
URL = {https://www.metaphorik.de/sites/www.metaphorik.de/files/journal-pdf/32-2022_6_del-fante_0.pdf},
VOLUME = {32},
JOURNAL = {METAPHORIK.DE},
}
@ARTICLE{DELFANTE_2022_ARTICLE_D_439555,
AUTHOR = {Del Fante, D.},
TITLE = {Review: A Corpus-Based Analysis of Ideological Bias: Migration in the British Press},
YEAR = {2022},
KEYWORDS = {Migration Studies, Newspaper Discourse, Corpus Linguistics, Corpus Approaches to Discourse Analysis},
PAGES = {137--139},
URL = {https://journals.sagepub.com/doi/10.1177/14614456211073219a},
VOLUME = {24},
NUMBER = {1},
DOI = {10.1177/14614456211073219a},
JOURNAL = {DISCOURSE STUDIES},
}
@ARTICLE{DELFANTE_2022_ARTICLE_DG_444870,
AUTHOR = {Del Fante, D. and Di Nunzio, G. M.},
TITLE = {OCR Correction for Corpus-assisted Discourse Studies: A Case Study of Old Newspapers},
YEAR = {2022},
ABSTRACT = {L'uso di software di riconoscimento OCR per convertire i caratteri stampati in testo digitale è uno strumento fondamentale per quanto riguarda l'ambito di studio degli approcci diacronici all'analisi del discorso politico attraverso i corpora (CADS studies). Tuttavia, i software OCR non sono totalmente affidabili, e il loro tasso di fallibilità può compromettere l'analisi. Questo articolo propone un approccio qualitativo-quantitativo al rilevamento e alla correzione degli errori post scansione OCR al fine di sviluppare una metodologia per migliorare la qualità dei corpora all'interno degli studi storici. Abbiamo applicato la metodologia sviluppata a due casi di studio su giornali dell'inizio del XX secolo per l'analisi linguistica delle rappresentazioni metaforiche delle migrazioni e delle pandemie. Il risultato di questo progetto consiste in un insieme di regole che sono valide per diversi contesti e applicabili a diversi corpora e che possono essere riutilizzate. La procedura proposta, in termini di leggibilità computazionale, ha lo scopo di rendere più leggibile e ricercabile la vasta gamma di corpora di testi storici che sono, al momento, solo parzialmente utilizzabili dato l'alto tasso di errore derivante da un software di riconoscimento OCR},
KEYWORDS = {Corpus-assisted Discourse Studies, OCR detection, OCR correction, OCR post-processing, Text Mining},
PAGES = {99--124},
URL = {https://umanisticadigitale.unibo.it/article/view/13689},
VOLUME = {11},
DOI = {10.6092/issn.2532-8816/13689},
ISSN = {2532-8816},
JOURNAL = {UMANISTICA DIGITALE},
}
@ARTICLE{DELGRATTA_2022_ARTICLE_DDZBB_446354,
AUTHOR = {Del Gratta, R. and Del Grosso, A. M. and Zenzaro, S. and Boschetti, F. and Bambaci, L.},
TITLE = {La Filologia come sistema dinamico},
YEAR = {2022},
ABSTRACT = {In this article we introduce a formal approach to the evolution of documents with particular attention to the philological perspective and the typical related issues. We propose a mathematical model capable of formalizing various complex phenomena in various research fields such as Computational Linguistics, Digital Philology and Software Engineering, in particular when this is applied to the analysis of documents and texts of historical and literary interest},
KEYWORDS = {computational philology, formal philology, digital humanities},
PAGES = {1--20},
URL = {https://umanisticadigitale.unibo.it/article/view/13684},
VOLUME = {13},
DOI = {10.6092/issn.2532-8816/13684},
ISSN = {2532-8816},
JOURNAL = {UMANISTICA DIGITALE},
}
@article{DIDONATO_2022_ARTICLE_D_474445,
  author   = {Di Donato, F.},
  title    = {Una questione di qualità o una formalità? L'Agreement on Reforming Research Assessment e il processo di riforma della valutazione della ricerca in Europa},
  journal  = {BOLLETTINO TELEMATICO DI FILOSOFIA POLITICA},
  year     = {2022},
  pages    = {22},
  issn     = {1591-4305},
  doi      = {10.5281/zenodo.7433047},
  url      = {https://commentbfp.sp.unipi.it/francesca-di-donato-una-questione-di-qualita-o-una-formalita-lagreement-on-reforming-research-assessment-e-il-processo-di-riforma-della-valutazione-della-ricerca-in-europa/},
  keywords = {Coara, riforma della valutazione della ricerca, scienza aperta},
  abstract = {L’Agreement on Reforming Research Assessment è stato pubblicato il 20 luglio 2022, al termine di un processo avviato dalla Commissione europea all’inizio del 2021. L’articolo espone gli elementi fondamentali dell’accordo, ricostruisce la genesi e le tappe del processo e presenta il contesto culturale e politico in cui si è definito. Inoltre, vengono proposti alcuni primi elementi per la definizione di roadmap e piani d'azione necessari a tradurre i principi e gli impegni dell’accordo in una serie di criteri e indicatori per la valutazione di istituzioni, di progetti di ricerca e di singoli ricercatori. In conclusione sono presentate alcune riflessioni sulle sfide da affrontare e sulle opportunità che la riforma della valutazione offre},
}
@ARTICLE{FERRARI_2022_ARTICLE_FPBVV_420230,
AUTHOR = {Ferrari, A. and Pirrotta, L. and Bonciani, M. and Venturi, G. and Vainieri, M.},
TITLE = {Higher readability of institutional websites drives the correct fruition of the abortion pathway: A cross-sectional study},
YEAR = {2022},
ABSTRACT = {In Italy, abortion services are public: therefore, health Institutions should provide clear and easily readable web-based information. We aimed to 1) assess variation in abortion services utilisation; 2) analyse the readability of institutional websites informing on induced abortion; 3) explore whether easier-to-read institutional websites influenced the correct fruition of abortion services. We identified from the 2021 administrative databases of Tuscany all women having an abortion, and—among them—women having an abortion with the certification provided by family counselling centres, following the pathway established by law. We assessed variation in total and certified abortion rates by computing the Systematic Component of Variation. We analysed the readability of the Tuscan health authorities' websites using the readability assessment tool READ-IT. We explored how institutional website readability influenced the odds of having certified abortions by running multilevel logistic models, considering health authorities as the highest-level variables. We observed high variation in the correct utilization of the abortion pathway in terms of certified abortion rates. The READ-IT scores showed that the most readable text was from the Florence Teaching Hospital website. Multilevel models revealed that higher READ-IT scores, corresponding to more difficult texts, resulted in lower odds of certified abortions. Large variation in the proper fruition of abortion pathways occurs in Tuscany, and such variation may depend on readability of institutional websites informing on induced abortion. Therefore, health Institutions should monitor and improve the readability of their websites to ensure proper and more equitable access to abortion},
KEYWORDS = {abortion services, readability assessment},
PAGES = {1--13},
URL = {https://journals.plos.org/plosone/article?id=10.1371/journal.pone.0277342},
VOLUME = {17},
NUMBER = {11},
DOI = {10.1371/journal.pone.0277342},
ISSN = {1932-6203},
JOURNAL = {PLOS ONE},
}
@ARTICLE{GUADAGNINI_2022_ARTICLE_G_420054,
AUTHOR = {Guadagnini, E.},
TITLE = {Alessandro Manzoni tra l'ancudine e l'incudine},
YEAR = {2022},
ABSTRACT = {In Fermo e Lucia the phrase tra l'incudine e il martello appears. After having eliminated it in the "seconda minuta", in the Ventisettana Alessandro Manzoni reinserts (essere) tra l'ancudine e il martello, and this idiomatic expression remains in the Quarantana. The paper highlights particular aspects in order to explain the reasons that may have led Manzoni to prefer ancudine to incudine, before and after his journey to Tuscany},
KEYWORDS = {Alessandro Manzoni, Toscanismo, Latinismo},
PAGES = {161--169},
URL = {https://iris.cnr.it/handle/20.500.14243/420054},
VOLUME = {18},
ISSN = {1724-9074},
JOURNAL = {LA LINGUA ITALIANA},
}
@ARTICLE{KHAN_2022_ARTICLE_KCDGGGILMMPPRT_444090,
AUTHOR = {Khan, A. F. A. and Chiarcos, C. and Declerck, T. and Gifu, D. and González Blanco García, E. and Gracia, J. and Ionov, M. and Labropoulou, P. and Mambrini, F. and McCrae, J. P. and Pagé Perron, É. and Passarotti, M. and Ros Muñoz, S. and Truică, C. O.},
TITLE = {When linguistics meets web technologies. Recent advances in modelling linguistic linked data},
YEAR = {2022},
ABSTRACT = {This article provides a comprehensive and up-to-date survey of models and vocabularies for creating linguistic linked data (LLD) focusing on the latest developments in the area and both building upon and complementing previous works covering similar territory. The article begins with an overview of some recent trends which have had a significant impact on linked data models and vocabularies. Next, we give a general overview of existing vocabularies and models for different categories of LLD resource. After which we look at some of the latest developments in community standards and initiatives including descriptions of recent work on the OntoLex-Lemon model, a survey of recent initiatives in linguistic annotation and LLD, and a discussion of the LLD metadata vocabularies META-SHARE and lime. In the next part of the paper, we focus on the influence of projects on LLD models and vocabularies, starting with a general survey of relevant projects, before dedicating individual sections to a number of recent projects and their impact on LLD vocabularies and models. Finally, in the conclusion, we look ahead at some future challenges for LLD models and vocabularies. The appendix to the paper consists of a brief introduction to the OntoLex-Lemon model},
KEYWORDS = {Linguistic linked data, FAIR, corpora, annotation, language resources, OntoLex-Lemon, Digital Humanities, metadata, models, lexicon, language identification},
URL = {https://iris.cnr.it/handle/20.500.14243/444090},
DOI = {10.3233/SW-222859},
ISSN = {2210-4968},
JOURNAL = {SEMANTIC WEB (ONLINE)},
}
@ARTICLE{MARZI_2022_ARTICLE_MNMMP_419693,
AUTHOR = {Marzi, C. and Narzisi, A. and Milone, A. and Masi, G. and Pirrelli, V.},
TITLE = {Reading behaviors through patterns of finger-tracking in Italian children with autism spectrum disorder},
YEAR = {2022},
ABSTRACT = {The paper proposes an ecological and portable protocol for the large-scale collection of reading data in high-functioning autism spectrum disorder (ASD) children based on recording the finger movements of a subject reading a text displayed on a tablet touchscreen. By capitalizing on recent evidence that movements of a finger that points to a scene or text during visual exploration or reading may approximate eye fixations, we focus on recognition of written content and function words, pace of reading, and accuracy in reading comprehension. The analysis showed significant differences between typically developing and ASD children, with the latter group exhibiting greater variation in levels of reading ability, slower developmental pace in reading speed, less accurate comprehension, greater dependency on word length and word frequency, less significant prediction-based processing, as well as a monotonous, steady reading pace with reduced attention to weak punctuation. Finger-tracking patterns provides evidence that ASD readers may fail to integrate single word processing into major syntactic structures and lends support to the hypothesis of an impaired use of contextual information to predict upcoming stimuli, suggesting that difficulties in perception may arise as difficulties in prediction},
KEYWORDS = {reading, autism, finger-tracking, developing readers, prediction-driven processing},
PAGES = {1--17},
URL = {https://www.mdpi.com/2076-3425/12/10/1316},
VOLUME = {12},
NUMBER = {10},
EID = {1316},
DOI = {10.3390/brainsci12101316},
ISSN = {2076-3425},
JOURNAL = {BRAIN SCIENCES},
}
@ARTICLE{MIASCHI_2022_ARTICLE_MBDV_417257,
AUTHOR = {Miaschi, A. and Brunato, D. P. and Dell'Orletta, F. and Venturi, G.},
TITLE = {On Robustness and Sensitivity of a Neural Language Model: A Case Study on Italian L1 Learner Errors},
YEAR = {2022},
ABSTRACT = {In this paper, we propose a comprehensive linguistic study aimed at assessing the implicit behavior of one of the most prominent Neural Language Models (NLM) based on Transformer architectures, BERT (Devlin et al., 2019), when dealing with a particular source of noisy data, namely essays written by L1 Italian learners containing a variety of errors targeting grammar, orthography and lexicon. Differently from previous works, we focus on the pre-training stage and we devise two complementary evaluation tasks aimed at assessing the impact of errors on sentence-level inner representations in terms of semantic robustness and linguistic sensitivity. While the first evaluation perspective is meant to probe the model's ability to encode the semantic similarity between sentences also in the presence of errors, the second type of probing task evaluates the influence of errors on BERT's implicit knowledge of a set of raw and morpho-syntactic properties of a sentence. Our experiments show that BERT's ability to compute sentence similarity and to correctly encode multi-leveled linguistic information of a sentence are differently modulated by the category of errors and that the error hierarchies in terms of robustness and sensitivity change across layer-wise representations},
KEYWORDS = {Natural Language Processing, Neural Language Model, Interpretability},
PAGES = {426--438},
URL = {https://doi.org/10.1109/TASLP.2022.3226333},
VOLUME = {31},
DOI = {10.1109/TASLP.2022.3226333},
ISSN = {2329-9290},
JOURNAL = {IEEE/ACM TRANSACTIONS ON AUDIO, SPEECH, AND LANGUAGE PROCESSING},
}
@ARTICLE{MIASCHI_2022_ARTICLE_MSBDV_443057,
AUTHOR = {Miaschi, A. and Sarti, G. and Brunato, D. P. and Dell'Orletta, F. and Venturi, G.},
TITLE = {Probing Linguistic Knowledge in Italian Neural Language Models across Language Varieties},
YEAR = {2022},
ABSTRACT = {In this paper, we present an in-depth investigation of the linguistic knowledge encoded by the transformer models currently available for the Italian language. In particular, we investigate how the complexity of two different architectures of probing models affects the performance of the Transformers in encoding a wide spectrum of linguistic features. Moreover, we explore how this implicit knowledge varies according to different textual genres and language varieties},
KEYWORDS = {Neural Language Models, Interpretability, Language Varieties},
PAGES = {25--44},
URL = {http://www.aaccademia.it/ita/scheda-libro?aaref=1518},
DOI = {10.4000/ijcol.965},
ISSN = {2499-4553},
JOURNAL = {IJCOL},
}
@ARTICLE{NAHLI_2022_ARTICLE_ND_446546,
AUTHOR = {Nahli, O. and Del Grosso, A. M.},
TITLE = {Structuring Arabic lexical and morphological resources using TEI: theory and practice},
YEAR = {2022},
ABSTRACT = {An Arabic word can be described according to its lexical and morphological information. The lexical information, conveyed by the root, consists of both semantic meaning and syntactic properties (e.g. parts of speech). The morphological information, encoded by patterns, is useful to group the words having similar syntactic, inflectional and semantic behaviour. Lexical analysis and morphological analysis have been separately described since the very first studies of the Arabic language. Although several scholarly works have illustrated Arabic lexicon models that encode semantic meanings, a systematic description of word patterns is still strongly lacking. In this work, we have implemented an exhaustive resource consisting of two levels: lexical and morphological. The lexical level collects information extracted from the dictionary al=qāmūs al=muḥīṭ. The morphological level describes pattern formalization, which allows to enrich word descriptions with additional semantic, morphosyntactic and inflectional information. To build our digital resource, taking into account primary source, lexical requirements, and reusability, we followed the guidelines provided by the Text Encoding Initiative (abbreviated as TEI). In particular, we adopted the TEI module for the encoding of digital dictionaries and lexicons to formally represent the medieval al=qāmūs al=muḥīṭ dictionary. Given the complexity of describing the morphological information present in the patterns, we also used the TEI module devoted to encoding feature structures. Consequently, we are building an exhaustive resource formed by the lexical and the morphological blocks. These two components are distinct but complementary resources where the lexical data are connected to morphological information. In addition, the morphological resource can be used as a stand-alone tool that allows the morphological analyzers to capture aspects of meaning that cannot be identified by current systems},
KEYWORDS = {classical Arabic dictionary, digital lexicography, al=qāmūs al=muḥīṭ, word patterns, TEI, feature structures},
PAGES = {3--14},
URL = {https://www.innove.org/ijist/index.php/ijist/article/view/191/146},
VOLUME = {5},
NUMBER = {3},
DOI = {10.57675/IMIST.PRSM/ijist-v5i3.191},
ISSN = {2550-5114},
JOURNAL = {INTERNATIONAL JOURNAL OF INFORMATION SCIENCE AND TECHNOLOGY},
}
@ARTICLE{NAHLI_2022_ARTICLE_NSBB_446539,
AUTHOR = {Nahli, O. and Sanna, A. and Bandini, M. and Boschetti, F.},
TITLE = {Commerce Numérique: traffic signals for the crossroads between cultures},
YEAR = {2022},
ABSTRACT = {Commerce is a literary French journal founded by Princess Margherita Caetani, involving three prestigious collaborators: Paul Valéry, Léon-Paul Fargue, Valéry Larbaud. It is composed by 29 volumes published between 1924 and 1932. Each volume collects different literary material of various well-known and unknown writers as poems or novels, translating some of the most important authors like Joyce, T. S. Eliot, Pirandello, Ungaretti, Saint-John Perse, Rilke, Hofmannsthal. Considering the historical, literary, and cultural importance of the Commerce journal, our project "Commerce numérique" aims to digitize and to make the journal contents freely available online to both the general public and the research community. This article presents how the journal was encoded. Also, we give importance to the coding of poems present in Commerce. Indeed, some poems are original in another language and they are accompanied by their French translation. Other poems are a French-translated form without original text. In order to fully and accurately express the phenomena and their structures, we have adopted some aspects of the TEI framework, which we will explain in detail. Particular attention was paid to the French translation of a Moroccan Arabic poem from the 13th century. On the one hand, the original Arabic poetry is interesting because it presents some aspects of the Moroccan dialect and some aspects of the oral text. On the other hand, the study and the encoding of Arabic poetry in parallel to its translation highlight some important structural differences between Arabic poetry and Western poetry},
KEYWORDS = {Commerce Journal, OCR, TEI encoding, literary journal, digital resources, Arabic poetry},
PAGES = {36--45},
URL = {https://www.innove.org/ijist/index.php/ijist/article/view/193/149},
VOLUME = {5},
NUMBER = {3},
DOI = {10.57675/IMIST.PRSM/ijist-v5i3.193},
ISSN = {2550-5114},
JOURNAL = {INTERNATIONAL JOURNAL OF INFORMATION SCIENCE AND TECHNOLOGY},
}
@ARTICLE{PIRROTTA_2022_ARTICLE_PGTBVD_445825,
AUTHOR = {Pirrotta, L. and Guidotti, E. and Tramontani, C. and Bignardelli, E. and Venturi, G. and De Rosis, S.},
TITLE = {COVID-19 vaccinations: An overview of the Italian national health system's online communication from a citizen perspective},
YEAR = {2022},
ABSTRACT = {COVID-19 vaccine hesitancy is still widespread. During the pandemic, the internet has been the preferred channel for health-related information, especially for less-educated citizens who tend to be the most hesitant about vaccination. A well-structured web communication strategy could help both to overcome vaccine hesitancy and to ensure equity in healthcare service access. This study investigated how the various regional and local health authorities in Italy used their institutional websites to inform users about COVID-19 vaccinations between March and April 2021. We browsed 129 institutional websites, checking the availability, quality and quantity, actionability and readability of information using a literature-based common grid. Descriptive statistics and statistical tests were performed. The online public dissemination of COVID-19 vaccination information in Italy was fragmented, both across and within regions. The side effects of vaccinations, were often not reported on the websites, thus missing an opportunity to enhance vaccination uptake. More focus should also be placed on readability, since readability indexes showed that they were difficult to understand. Our research revealed that several actions could be implemented to enhance online communication on COVID-19 vaccination. For instance, simplifying texts can make them more understandable and the information reported actionable},
KEYWORDS = {Vaccination Communication, Readability Assessment, Online Information, Covid-19},
PAGES = {970--979},
URL = {https://www.sciencedirect.com/science/article/pii/S0168851022002184},
VOLUME = {126},
NUMBER = {10},
DOI = {10.1016/j.healthpol.2022.08.001},
ISSN = {0168-8510},
JOURNAL = {HEALTH POLICY},
}
@ARTICLE{RUSSO_2022_ARTICLE_RCCP_505401,
AUTHOR = {Russo, I. and Comandini, G. and Caselli, T. and Patti, V.},
TITLE = {Share and Shout: Proto-Slogans in Online Political Communities},
YEAR = {2022},
ABSTRACT = {This paper proposes a methodology for investigating populism on social media by analyzing the emergence of proto-slogans, defined as nominal utterances (NUs) typical of a political community on social media. We extracted more than 700.000 comments from the public Facebook pages of two Italian populist parties’ leaders (Matteo Salvini and Luigi Di Maio) during the week preceding the 2019 European elections (i.e., from May 20 to May 26, 2019). These comments have been automatically clustered and manually annotated to find proto-slogans created by the parties’ supporters. Our manual annotation consists of four layers, namely: Nominal Utterances (NUs), a syntactic device widely used for slogans; Slogans for NUs with a slogan function; Top-down/Bottom-up, to recognize the slogans produced by the politicians and those produced by supporters; Proto-slogans, for NUs devoid of specific political content that nonetheless express partisanship and support for the leaders},
KEYWORDS = {political communication, slogans, populism},
PAGES = {33--49},
URL = {https://jlcl.org/article/download/228/226},
VOLUME = {35},
NUMBER = {2},
ISSN = {2190-6858},
JOURNAL = {JOURNAL FOR LANGUAGE TECHNOLOGY AND COMPUTATIONAL LINGUISTICS},
}
@ARTICLE{SAPONARO_2022_ARTICLE_SGS_455990,
AUTHOR = {Saponaro, D. and Giovannetti, E. and Sciolette, F.},
TITLE = {From Religious Sources to Computational Resources: Approach and Case Study on Hebrew Terms and Concepts},
YEAR = {2022},
ABSTRACT = {This paper introduces a methodology for the creation of a digital representation of a religious case study integrating textual, linguistic, and conceptual entities. The description of a holistic model of text, to be used as the backbone of the computational resource that needs to be built, is provided. The proposed case study, focusing on the semantic field of "face" in Jewish religion, is first introduced from the point of view of the scholar and then translated, with the support of digital tools, into the relative computational representation},
KEYWORDS = {religious studies, Hebrew terminology, ontology},
PAGES = {21},
URL = {https://iris.cnr.it/handle/20.500.14243/455990},
VOLUME = {XXVII},
ISSN = {2282-4499},
JOURNAL = {MATERIA GIUDAICA},
}
@ARTICLE{SICILIANO_2022_ARTICLE_SD_446341,
AUTHOR = {Siciliano, A. and Del Grosso, A. M.},
TITLE = {Dalla stampa al digitale: Un modello di codifica per l'edizione delle postille di Giorgio Bassani},
YEAR = {2022},
ABSTRACT = {The notes Giorgio Bassani wrote on his books represent a privileged access to his workshop, allowing us to reconstruct the genesis of the works and the intellectual profile of an important 20th century writer. When it comes to publishing, however, they pose numerous problems of classification, representation and systematisation of the data, against which the digital tool proves to be extremely advantageous. This contribution reflects on this theme, presenting the prototype of a digital scholarly edition built on the case study of Bassani's annotations to La scuola dell'uomo by Guido Calogero (Firenze, Sansoni, 1939) and reasoning on the important potential of XML-TEI markup in the treatment and representation of a complex, structured and sometimes elusive textual object such as the note},
KEYWORDS = {Digital Humanities, Digital Philology, Computational Philology, Postille, Giorgio Bassani},
PAGES = {1--26},
URL = {https://umanisticadigitale.unibo.it/article/view/13688},
VOLUME = {13},
DOI = {10.6092/issn.2532-8816/13688},
ISSN = {2532-8816},
JOURNAL = {UMANISTICA DIGITALE},
}
@BOOK{VENTURI_2022_BOOK_VCD_440167,
AUTHOR = {Venturi, G. and Cimino, A. and Dell'Orletta, F.},
TITLE = {La fede dichiarata. Un'analisi linguistico-computazionale},
YEAR = {2022},
ABSTRACT = {Il volume indaga l'apporto di tecnologie basate sul Natural Language Processing (NLP) all'analisi di un corpus di trascrizioni di 164 interviste orali raccolte durante la ricerca 2017 sulla "Religiosità in Italia". Gli autori illustrano metodologie e strumenti che permettono di trasformare l'informazione implicitamente contenuta nelle interviste in informazione esplicitamente strutturata. Il risultato finale di questo processo interpretativo spazia dall'acquisizione di conoscenze lessicali e terminologiche complesse alla loro organizzazione in strutture proto-concettuali, fino ad arrivare alla qualificazione dell'atteggiamento con il quale l'intervistato si esprime. Il lettore viene accompagnato a scoprire quale sia il valore aggiunto delle analisi basate su NLP e quali nuovi orizzonti di ricerca siano aperti da queste analisi},
KEYWORDS = {Knowledge Extraction, Knowledge Organization},
PAGES = {1--181},
URL = {https://iris.cnr.it/handle/20.500.14243/440167},
PUBLISHER = {Franco Angeli Editore},
ADDRESS = {Milano},
ISBN = {978-88-351-2146-6},
CONFERENCE_PLACE = {Milano},
}
@INCOLLECTION{CALAMAI_2022_INCOLLECTION_CPPCSM_437431,
AUTHOR = {Calamai, S. and Piccardi, D. and Pretto, N. and Candeo, G. and Stamuli, F. M. and Monachini, M.},
TITLE = {Not Just Paper: Enhancement of Archive Cultural Heritage},
YEAR = {2022},
ABSTRACT = {Oral archives and digital technologies have gone hand-in-hand for a very long time. Both sides benefit from this interdisciplinary junction: technology enhances the preservation and diffusion of oral materials, while exploiting them to develop cutting-edge tools for their treatment. This chapter deals with an Italian instantiation of this mutual relationship: the Archivio Vi.Vo. project. Offering innovative solutions concerning metadata, audio restoration, description, and access, Archivio Vi.Vo. aims to build an online platform to host the oral archives from Tuscany. The project is powered by CLARIN-IT, which guarantees its compliance with standards and offers resources for data access and discoverability. Archivio Vi.Vo. has not been built from scratch: it is instead a cross-fertilization of previous initiatives and research projects (e.g., the Gra.fo project). Moreover, the chapter presents the related, contemporary work of a multidisciplinary group striving to synthesize a Vademecum for future generations of oral archive researchers. Lastly, a brief list of tentative ideas for future developments of the Archivio Vi.Vo. platform will be presented},
KEYWORDS = {digital oral archives, research infrastructures, models for digital preservation},
URL = {https://www.degruyter.com/document/isbn/9783110767377/html},
DOI = {10.1515/9783110767377-025},
PUBLISHER = {Walter De Gruyter \& Co},
ADDRESS = {Berlin},
ISBN = {9783110767377},
CONFERENCE_PLACE = {Berlin},
BOOKTITLE = {CLARIN: The Infrastructure for Language Resources},
EDITOR = {Fišer, D. and Witt, A.},
}
@INCOLLECTION{CREPALDI_2022_INCOLLECTION_CFMNPT_415388,
AUTHOR = {Crepaldi, D. and Ferro, M. and Marzi, C. and Nadalini, A. and Pirrelli, V. and Taxitari, L.},
TITLE = {Finger movements and eye movements during adults' silent and oral reading},
YEAR = {2022},
ABSTRACT = {Using a common tablet and a web application, we can record the finger movements of a reader that is concurrently reading and finger-pointing a text displayed on the tablet touchscreen. In a preliminary analysis of "finger-tracking" data of early-graders we showed that finger movements can replicate established reading effects observed in more controlled settings. Here, we analyse and discuss reading evidence collected by (i) tracking the finger movements of adults reading a short essay displayed on a tablet touchscreen, and (ii) tracking the eye movements of adults reading a comparable text displayed on the screen of a computer. Texts in the two conditions were controlled for linguistic complexity and page layout. In addition, we tested adults' comprehension in both silent and oral reading, by asking them multiple-choice questions after reading each text. We show and discuss the reading evidence that the two (optical and tactile) protocols provide, and to what extent they show comparable effects. We conclude with some remarks on the importance of ecology and portability of protocols for large-scale collection of naturalistic reading data},
KEYWORDS = {Reading, finger-tracking, digital technology},
PAGES = {443--471},
URL = {https://link.springer.com/book/9783030998905},
PUBLISHER = {Springer},
ADDRESS = {Dordrecht},
ISBN = {978-3-030-99890-5},
CONFERENCE_PLACE = {Dordrecht},
BOOKTITLE = {Developing Language and Literacy: Studies in Honor of Dorit Diskin Ravid},
EDITOR = {Levie, R. and Bar On, A. and Ashkenazi, O. and Dattner, E. and Brandes, G.},
}
@INCOLLECTION{DEJONG_2022_INCOLLECTION_DVFVFW_446352,
AUTHOR = {De Jong, F. and Van Uytvanck, D. and Frontini, F. and Van Den Bosch, A. and Fišer, D. and Witt, A.},
TITLE = {Language Matters. The European Research Infrastructure CLARIN, Today and Tomorrow},
YEAR = {2022},
ABSTRACT = {CLARIN stands for "Common Language Resources and Technology Infrastructure". In 2012 CLARIN ERIC was established as a legal entity with the mission to create and maintain a digital infrastructure to support the sharing, use, and sustainability of language data (in written, spoken, or multimodal form) available through repositories from all over Europe, in support of research in the humanities and social sciences and beyond. Since 2016 CLARIN has had the status of Landmark research infrastructure and currently it provides easy and sustainable access to digital language data and also offers advanced tools to discover, explore, exploit, annotate, analyse, or combine such datasets, wherever they are located. This is enabled through a networked federation of centres: language data repositories, service centres, and knowledge centres with single sign-on access for all members of the academic community in all participating countries. In addition, CLARIN offers open access facilities for other interested communities of use, both inside and outside of academia. Tools and data from different centres are interoperable, so that data collections can be combined and tools from different sources can be chained to perform operations at different levels of complexity. The strategic agenda adopted by CLARIN and the activities undertaken are rooted in a strong commitment to the Open Science paradigm and the FAIR data principles. This also enables CLARIN to express its added value for the European Research Area and to act as a key driver of innovation and contributor to the increasing number of industry programmes running on data-driven processes and the digitalization of society at large},
KEYWORDS = {research infrastructure, language resources, service interoperability, innovation, SSH, language technology, open science},
PAGES = {31-58},
URL = {https://www.degruyter.com/document/doi/10.1515/9783110767377-002/html},
DOI = {10.1515/9783110767377-002},
PUBLISHER = {Walter De Gruyter Inc (Boston/Berlin/Munich, USA)},
ISBN = {978-3-11-076737-7},
CONFERENCE_PLACE = {Boston/Berlin/Munich},
BOOKTITLE = {CLARIN: The Infrastructure for Language Resources},
}
@INCOLLECTION{DELFANTE_2022_INCOLLECTION_DFMQ_419162,
AUTHOR = {Del Fante, D. and Frontini, F. and Monachini, M. and Quochi, V.},
TITLE = {Italian Language Resources. From CLARIN-IT to the VLO and Back: Sketching a Methodology for Monitoring LRs Visibility},
YEAR = {2022},
ABSTRACT = {This paper sketches a user-oriented, qualitative methodology for both (i) monitoring the existence and availability of language resources relevant for a given CLARIN national community and language and (ii) assessing the offering potential of CLARIN, in terms of Language Resources provided to national consortia. From the user perspective, the methodology has been applied to investigate the visibility of language resources available for Italian within the CLARIN central services, in particular the Virtual Language Observatory. As a proof-of-concept, the methodology has been tested on the resources available through the CLARIN-IT data centres, but, ideally, it could be applied by any national data centre aiming to assess the existence of LRs in CLARIN for any given languages and check their accessibility for the interested users. It is thus argued that such an assessment might be a useful instrument in the hands of national coordinators and centre managers for (i) bringing to the fore both strengths and critical issues about their data providing community and (ii) for planning targeted actions to improve and increase both visibility and accessibility of their LRs},
KEYWORDS = {Virtual Language Observatory, CLARIN-IT, CLARIN-ERIC, Qualitative Assessment Methodology, User Involvement},
PAGES = {10-22},
URL = {https://ecp.ep.liu.se/index.php/clarin/article/view/413/371},
DOI = {10.3384/9789179294441},
ISBN = {978-91-7929-444-1},
BOOKTITLE = {Selected Papers from the CLARIN Annual Conference 2021},
}
@INCOLLECTION{MENANT_2022_INCOLLECTION_MGFFMMC_412939,
AUTHOR = {Menant, G. and Frontini, F. and Fujiwara, M. and Martin, C.},
TITLE = {Approches numériques des questions d'auctorialité. Le corpus Challe},
YEAR = {2022},
ABSTRACT = {La contribution se concentre sur l'application d'approches textométriques et d'identification d'auteur à l'oeuvre de Robert Challe},
KEYWORDS = {Robert Challe, attribution d'auteur, textométrie},
PAGES = {167-192},
URL = {https://iris.cnr.it/handle/20.500.14243/412939},
DOI = {10.48611/isbn.978-2-406-13347-6.p.0167},
PUBLISHER = {Editions Classiques Garnier (Paris, FRA)},
ISBN = {978-2-406-13347-6},
CONFERENCE_PLACE = {Paris},
BOOKTITLE = {Observer la vie littéraire. Études littéraires et numériques},
EDITOR = {Alexandre, D. and Roe, G.},
}
@INCOLLECTION{SCIOLETTE_2022_INCOLLECTION_SG_447932,
AUTHOR = {Sciolette, F. and Giovannetti, E.},
TITLE = {Un modello per domarli tutti: verso una rappresentazione del testo come esplicitazione di documento, lingua e contenuto},
YEAR = {2022},
ABSTRACT = {The aim of this research is to describe the first steps towards the theoretical elaboration of a holistic model to represent textual information. The focus of the model is the definition of "text", with its different dimensions, as a "diasystem". The set of elements, organized into distinct but strictly interconnected systems, wherein each element has an effect on the whole diasystem, is described in a model structured in the following components: graphic, linguistic, documental, discursive, and conceptual. In this work, the first attempts in the modeling of text will be shown through two case studies: the Babylonian Talmud and the DiTMAO (Dictionary of Old Occitan medico-botanical terminology)},
KEYWORDS = {textual model, holistic model, diasystem, model of text},
PAGES = {145-157},
URL = {http://www.aitla.it/images/pdf/StudiAItLA14/009_AItLA14_ScioletteGiovannetti.pdf},
PUBLISHER = {Officinaventuno (Milano, ITA)},
ISBN = {978-88-97657-51-4},
CONFERENCE_PLACE = {Milano},
BOOKTITLE = {Fare linguistica applicata con le digital humanities},
EDITOR = {Saturno, J. and Spreafico, L.},
}
@INCOLLECTION{VAGIONAKIS_2022_INCOLLECTION_VDBBDMM_446355,
AUTHOR = {Vagionakis, I. and Del Gratta, R. and Boschetti, F. and Baroni, P. and Del Grosso, A. M. and Mancinelli, T. and Monachini, M.},
TITLE = {'Cretan Institutional Inscriptions' Meets CLARIN-IT},
YEAR = {2022},
ABSTRACT = {This paper presents 'Cretan Institutional Inscriptions', a resource in the domain of Digital Epigraphy developed at the Ca' Foscari University of Venice and supported by CLARIN-IT as part of its actions addressed to initiatives, projects and events in the field of Social Sciences and Humanities. The paper begins with a brief outline of the project within which the resource was created and then goes into a more in-depth description of the main methodologies used to develop the resource (EpiDoc and EFES) and of their benefits. The paper then focuses on the cooperation of the project with the Venice Centre of Digital and Public Humanities and the Italian node of CLARIN, also illustrating the dockerization process applied to the resource hosted on the CLARIN-IT servers. Some desiderata for future developments are outlined as well. The paper ends with some remarks about the widening of CLARIN horizons towards Digital Epigraphy and on the role of its K-Centres in this respect},
KEYWORDS = {Digital Epigraphy, Digital Classics, Ancient Greek, Crete, Institutions, Text Encoding Initiative, TEI, EpiDoc, EpiDoc Front-End Services, EFES, Virtual Language Observatory, Dockerization, ILC4CLARIN, CLARIN-IT, CLARIN},
PAGES = {139-150},
URL = {https://ecp.ep.liu.se/index.php/clarin/article/view/424/382},
DOI = {10.3384/9789179294441},
ISBN = {978-91-7929-444-1},
BOOKTITLE = {Selected Papers from the CLARIN Annual Conference 2021},
EDITOR = {Monachini, M. and Eskevich, M.},
}
@EDITORIAL{MELERO_2022_EDITORIAL_MSS_444080,
AUTHOR = {Melero, M. and Sakti, S. and Soria, C.},
TITLE = {Proceedings of The 1st Annual Meeting of the ELRA/ISCA Special Interest Group on Under-Resourced Languages (SIGUL2022)},
YEAR = {2022},
ABSTRACT = {Proceedings of the SIGUL 2022 workshop},
KEYWORDS = {conference proceedings, less-resourced languages, language resources, NLP},
URL = {https://aclanthology.org/events/lrec-2022/#2022-sigul-1},
ISBN = {979-10-95546-91-7},
}
@EDITORIAL{MONACHINI_2022_EDITORIAL_ME_420369,
AUTHOR = {Monachini, M. and Eskevich, M.},
TITLE = {Selected Papers from the CLARIN Annual Conference 2021},
YEAR = {2022},
ABSTRACT = {This volume presents the highlights of the 10th CLARIN Annual Conference 2021. The conference was held on 27th-29th September 2021 and because of the COVID-19 pandemic, for the second year in a row a virtual format had to be adopted. CLARIN, the Common Language Resources and Technology Infrastructure, is a virtual platform that is accessible for everyone interested in language. CLARIN offers access to language resources, technology, and knowledge, and enables cross-country collaboration among academia, industry, policy-makers, cultural institutions, and the general public. Researchers, students, and citizens are offered access to digital language resources and technology services to deploy, connect, analyse and sustain such resources. In line with the Open Science agenda, CLARIN enables scholars from the Social Sciences and Humanities (SSH) and beyond to engage in and contribute to cutting-edge, data-driven research based on language data in a range of formats and modalities},
KEYWORDS = {Language Resource Infrastructure},
PAGES = {1-212},
URL = {https://iris.cnr.it/handle/20.500.14243/420369},
DOI = {10.3384/9789179294441},
ISBN = {978-91-7929-444-1},
}
@EDITORIAL{DEJONG_2022_EDITORIAL_DM_420371,
AUTHOR = {De Jong, F. and Monachini, M.},
TITLE = {Introduction. Selected papers from the CLARIN Annual Conference 2021},
YEAR = {2022},
ABSTRACT = {CLARIN, the Common Language Resources and Technology Infrastructure, is a virtual platform that is accessible for everyone interested in language. CLARIN offers access to language resources, technology, and knowledge, and enables cross-country collaboration among academia, industry, policy-makers, cultural institutions, and the general public. Researchers, students, and citizens are offered access to digital language resources and technology services to deploy, connect, analyse and sustain such resources. In line with the Open Science agenda, CLARIN enables scholars from the Social Sciences and Humanities (SSH) and beyond to engage in and contribute to cutting-edge, data-driven research based on language data in a range of formats and modalities},
KEYWORDS = {Language Resource Infrastructure},
PAGES = {i-v},
URL = {https://iris.cnr.it/handle/20.500.14243/420371},
DOI = {10.3384/9789179294441},
ISBN = {978-91-7929-444-1},
EDITOR = {Monachini, M. and Eskevich, M.},
}
@INPROCEEDINGS{AGNOLONI_2022_INPROCEEDINGS_ABFMMQRV_446358,
AUTHOR = {Agnoloni, T. and Bartolini, R. and Frontini, F. and Montemagni, S. and Marchetti, C. and Quochi, V. and Ruisi, M. and Venturi, G.},
TITLE = {Making Italian Parliamentary Records Machine-Actionable: the Construction of the ParlaMint-IT corpus},
YEAR = {2022},
ABSTRACT = {This paper describes the process of acquisition, cleaning, interpretation, coding and linguistic annotation of a collection of parliamentary debates from the Senate of the Italian Republic covering the COVID-19 pandemic emergency period and a former period for reference and comparison according to the CLARIN ParlaMint prescriptions. The corpus contains 1199 sessions and 79,373 speeches for a total of about 31 million words, and was encoded according to the ParlaCLARIN TEI XML format. It includes extensive metadata about the speakers, sessions, political parties and parliamentary groups. As required by the ParlaMint initiative, the corpus was also linguistically annotated for sentences, tokens, POS tags, lemmas and dependency syntax according to the universal dependencies guidelines. Named entity annotation and classification is also included. All linguistic annotation was performed automatically using state-of-the-art NLP technology with no manual revision. The Italian dataset is freely available as part of the larger ParlaMint 2.1 corpus deposited and archived in CLARIN repository together with all other national corpora. It is also available for direct analysis and inspection via various CLARIN services and has already been used both for research and educational purposes},
KEYWORDS = {parliamentary debates, CLARIN ParlaMint, corpus creation, corpus annotation},
PAGES = {117-124},
URL = {https://aclanthology.org/2022.parlaclarin-1.17/},
PUBLISHER = {European Language Resources Association ELRA (Paris, FRA)},
ISBN = {979-10-95546-85-6},
CONFERENCE_NAME = {Workshop ParlaCLARIN III within the 13th Language Resources and Evaluation Conference},
CONFERENCE_PLACE = {Paris},
BOOKTITLE = {Proceedings of The Workshop ParlaCLARIN III within the 13th Language Resources and Evaluation Conference},
}
@INPROCEEDINGS{BARREIRO_2022_INPROCEEDINGS_BGGBLEGMRKCPPAA_506141,
AUTHOR = {Barreiro, A. and De Souza, J. G. C. and Gatt, A. and Bhatt, M. and Lloret, E. and Erdem, A. and Gkatzia, D. and Moniz, H. and Russo, I. and Kepler, F. and Calixto, I. and Paprzycki, M. and Portet, F. and Augenstein, I. and Alhasani, M.},
TITLE = {Multi3generation: multitask, multilingual, multimodal language generation},
YEAR = {2022},
ABSTRACT = {This paper presents the Multitask, Multilingual, Multimodal Language Generation COST Action–Multi3Generation (CA18231), an interdisciplinary network of research groups working on different aspects of language generation. This “meta-paper” will serve as reference for citations of the Action in future publications. It presents the objectives, challenges and the links for the achieved outcomes},
KEYWORDS = {natural language generation},
PAGES = {347-348},
URL = {https://iris.cnr.it/handle/20.500.14243/506141},
BOOKTITLE = {Proceedings of the 23rd Annual Conference of the European Association for Machine Translation},
}
@INPROCEEDINGS{BOSCHETTI_2022_INPROCEEDINGS_BBDDGNZ_446353,
AUTHOR = {Boschetti, F. and Burgassi, C. and Del Gratta, R. and Del Grosso, A. M. and Guadagnini, E. and Nahli, O. and Zenzaro, S.},
TITLE = {Il Laboratorio di Filologia Collaborativa e Cooperativa (CoPhiLab) del CNR-ILC: dati, strumenti, servizi e infrastrutture},
YEAR = {2022},
ABSTRACT = {Questo contributo illustra le attività e le risorse del Laboratorio di Filologia Collaborativa e Cooperativa (CoPhiLab) dell'Istituto di Linguistica Computazionale "A. Zampolli" del Consiglio Nazionale delle Ricerche (CNR-ILC), con particolare attenzione all'uso delle infrastrutture di ricerca nazionali e internazionali},
KEYWORDS = {Filologia Computazionale, Modelli Formali, Lingua Araba, Domain-Specific Languages, Ingegneria del Software},
PAGES = {45-50},
URL = {https://www.eventi.garr.it/it/conf22},
DOI = {10.26314/GARR-Conf22-proceedings},
PUBLISHER = {Associazione Consortium GARR (Roma, ITA)},
ISBN = {978-88-946629-1-7},
CONFERENCE_NAME = {CondiVisioni. La rete come strumento per costruire il futuro},
CONFERENCE_PLACE = {Roma},
BOOKTITLE = {CONDIVISIONI La rete come strumento per costruire il futuro},
EDITOR = {Mieli, M. and Volpe, C.},
}
@INPROCEEDINGS{CACIOLI_2022_INPROCEEDINGS_CCDMDZ_446349,
AUTHOR = {Cacioli, G. and Cerretini, G. and Di Pietro, C. and Maenza, S. and Rosselli Del Turco, R. and Zenzaro, S.},
TITLE = {There and back again: what to expect in the next EVT version},
YEAR = {2022},
ABSTRACT = {Developing software as complex as EVT requires a significant amount of time and resources. As a result, the release frequency of new versions has never been particularly high, especially for major versions. The first release of EVT 1 dates back to 2014, in 2016 we published the first alpha version of EVT 2, after which more complete versions followed: a beta1 in 2017, and a beta2 in 2020. Not only did it take three years between the two beta versions of EVT 2, but we still don't see the light for a 1.0 version. What has happened in the meantime? How is it possible that a stable version for EVT 1 was achieved relatively quickly, and development slowed down significantly thereafter? This talk aims at updating the Italian DH community about the current status of EVT and its future prospects with regard to the next version (EVT 3)},
KEYWORDS = {XML-TEI, filologia d'autore, mark-up, varianti, Saba},
PAGES = {212-217},
URL = {http://amsacta.unibo.it/6848/1/Proceedings_AIUCD2022.pdf#page=222},
DOI = {10.6092/unibo/amsacta/6848},
ISBN = {9788894253566},
CONFERENCE_NAME = {AIUCD 2022. Culture digitali. Intersezioni: filosofia, arti, media},
BOOKTITLE = {AIUCD 2022-Proceedings. Culture digitali. Intersezioni: filosofia, arti, media},
EDITOR = {Ciracì, F. and Miglietta, G. and Gatto, C.},
}
@INPROCEEDINGS{CHIARCOS_2022_INPROCEEDINGS_CGIKKT_444084,
AUTHOR = {Chiarcos, C. and Gkirtzou, K. and Ionov, M. and Kabashi, B. and Khan, F. and Truică, C.},
TITLE = {Modelling Collocations in OntoLex-FrAC},
YEAR = {2022},
ABSTRACT = {Following presentations of frequency and attestations, and embeddings and distributional similarity, this paper introduces the third cornerstone of the emerging OntoLex module for Frequency, Attestation and Corpus-based Information, OntoLex-FrAC. We provide an RDF vocabulary for collocations, established as a consensus over contributions from five different institutions and numerous data sets, with the goal of eliciting feedback from reviewers, workshop audience and the scientific community in preparation of the final consolidation of the OntoLex-FrAC module, whose publication as a W3C community report is foreseen for the end of this year. The novel collocation component of OntoLex-FrAC is described in application to a lexicographic resource and corpus-based collocation scores available from the web, and finally, we demonstrate the capability and genericity of the model by showing how to retrieve and aggregate collocation information by means of SPARQL, and its export to a tabular format, so that it can be easily processed in downstream applications},
URL = {https://iris.cnr.it/handle/20.500.14243/444084},
ISBN = {979-10-95546-92-4},
}
@INPROCEEDINGS{COLOMBO_2022_INPROCEEDINGS_CG_443112,
AUTHOR = {Colombo, M. and Giovannetti, E.},
TITLE = {La Visualizzazione Grafica di Sensi e Relazioni Semantiche di un Lessico Computazionale della Lingua Italiana},
YEAR = {2022},
ABSTRACT = {La visualizzazione, intesa come ausilio alla consultazione e alla ricerca, può giocare un ruolo fondamentale nella fruizione di dati linguistici e di conoscenza. Attraverso la rappresentazione di una risorsa lessicale o di una ontologia sotto forma di grafo, ad esempio, uno studioso ha la possibilità di farsi un'idea immediata delle relazioni che intercorrono tra i vari elementi di un lessico (di lingua o specialistico) o dei concetti che formalizzano un determinato dominio. In questo contributo presentiamo un'applicazione web based per la visualizzazione grafica della componente semantica di un lessico computazionale dell'italiano. Il grafo è stato sviluppato con Cytoscape.js, una libreria Javascript per la creazione di grafi. L'interfaccia al grafo, sviluppata come applicazione Angular, offre un primo insieme di funzionalità di interazione per la navigazione e la manipolazione della risorsa lessico-semantica},
KEYWORDS = {human-computer interaction, lessico computazionale, grafi, Visualizzazione grafica di risorse linguistiche, rappresentazione della conoscenza},
PAGES = {155-160},
URL = {http://amsacta.unibo.it/6848/1/Proceedings_AIUCD2022.pdf},
DOI = {10.6092/unibo/amsacta/6848},
EDITOR = {Ciracì, F. and Miglietta, G. and Gatto, C.},
ISBN = {9788894253566},
CONFERENCE_NAME = {AIUCD 2022},
BOOKTITLE = {AIUCD 2022-Culture digitali. Intersezioni: filosofia, arti, media. Proceedings della 11a conferenza nazionale},
}
@INPROCEEDINGS{COSTA_2022_INPROCEEDINGS_CSRKCTAKRS_444087,
AUTHOR = {Costa, R. and Salgado, A. and Ramos, M. and Khan, F. and Carvalho, S. and Tasovac, T. and Almeida, B. and Khemakhem, M. and Romary, L. and Silva, R.},
TITLE = {Integrating Terminological and Ontological Principles into a Lexicographic Resource},
YEAR = {2022},
ABSTRACT = {In this paper we will present the research that is taking place at the NOVA CLUNL where an international team is working on a financed project MORDigital. MORDigital's goal is to encode the selected editions of Diccionario da Lingua Portugueza by António de Morais Silva (MOR), first published in 1789},
URL = {https://iris.cnr.it/handle/20.500.14243/444087},
}
@INPROCEEDINGS{DELFANTE_2022_INPROCEEDINGS_DFMQ_416549,
AUTHOR = {Del Fante, D. and Frontini, F. and Monachini, M. and Quochi, V.},
TITLE = {CLARIN-IT: An Overview on the Italian Clarin Consortium After Six Years of Activity},
YEAR = {2022},
ABSTRACT = {This paper offers an overview of the Italian CLARIN consortium after six years since its establishment. The members, the centres and the repositories and the most important collections are described. Lastly, in order to showcase the visibility and the accessibility of Language Resources provided by CLARIN-IT from a user-perspective, we show how Italian resources are findable within CLARIN ERIC},
KEYWORDS = {Language Resources, Data Repositories and Archives, Research Infrastructures, CLARIN},
PAGES = {8},
URL = {http://ceur-ws.org/Vol-3160/short21.pdf},
PUBLISHER = {CEUR-WS.org (Aachen, DEU)},
CONFERENCE_NAME = {Italian Research Conference on Digital Libraries},
CONFERENCE_PLACE = {Aachen},
BOOKTITLE = {Proceedings of the 18th Italian Research Conference on Digital Libraries},
EDITOR = {Di Nunzio, G. M. and Portelli, B. and Redavid, D. and Silvello, G.},
}
@INPROCEEDINGS{DIDONATO_2022_INPROCEEDINGS_DP_446877,
AUTHOR = {Di Donato, F. and Provost, L. M.},
TITLE = {The TRIPLE Training Toolkit. From online training on Open Science to the design and delivery of Open Educational Resources: an example of FAIR-ification of digital training resources and workflows},
YEAR = {2022},
ABSTRACT = {This paper presents the work performed within the task dedicated to online training and guidelines on Open Science and the EOSC in the EU-funded project TRIPLE (Transforming Research through Innovative Practices for Linked Interdisciplinary Exploration, Grant Agreement n. 863420). In light of the need for a common understanding of recent European Open Science advancements and to spur the uptake and implementation of Open Science practices within SSH research and training communities, this task produced two kinds of outputs. The TRIPLE Open Science training series is a series of 12 open and reusable training events specifically designed to up-skill researchers in FAIR and Open Science. The TRIPLE Training Toolkit is an open workflow for trainers to reproduce and adapt to organise training events following a FAIR-by-design method},
KEYWORDS = {open science, training},
PAGES = {56-61},
URL = {https://www.garr.it/it/chi-siamo/documenti/selected-papers/selected-papers-conferenza-2022/6090-conferenza-2022-selected-papers-09-di-donato},
DOI = {10.26314/GARR-Conf22-proceedings},
ISBN = {978-88-946629-1-7},
CONFERENCE_NAME = {GARR Conference 2022-Condivisioni. La rete come strumento per costruire il futuro},
BOOKTITLE = {GARR 2022 Conference proceedings},
}
@INPROCEEDINGS{FAVARO_2022_INPROCEEDINGS_FBM_533921,
AUTHOR = {Favaro, M. and Biffi, M. and Montemagni, S.},
TITLE = {Trattamento automatico del linguaggio e varietà storiche di italiano: la sfida della lemmatizzazione},
YEAR = {2022},
ABSTRACT = {Il contributo si propone di illustrare alcune delle risorse sviluppate all’interno del progetto TrAVaSI (Trattamento Automatico di Varietà Storiche di Italiano). Ci si concentrerà sulla creazione di corpora annotati e lessici morfologici per il miglioramento dell’accuratezza del processo di lemmatizzazione. I risultati sono ottenuti attraverso l’estensione dei dizionari morfologici e l’addestramento del modulo di lemmatizzazione con corpora rappresentativi delle varietà storiche della lingua trattate. Sono presentati i risultati di uno studio preliminare sulle tipologie di errore di lemmatizzazione riscontrate nei diversi approcci},
KEYWORDS = {TAL, corpora, lessici morfologici, varietà storiche della lingua},
PAGES = {393-399},
URL = {https://iris.cnr.it/handle/20.500.14243/533921},
PUBLISHER = {VADISTAT PressEditor-Edizioni Erranti (Cosenza, ITA)},
ISBN = {979-12-80153-30-2},
CONFERENCE_NAME = {16th International Conference on Statistical Analysis of Textual Data (JADT22)},
CONFERENCE_PLACE = {Cosenza},
BOOKTITLE = {Proceedings of the 16th International Conference on Statistical Analysis of Textual Data (JADT22)},
EDITOR = {Misuraca, M. and Scepi, G. and Spano, M.},
}
@INPROCEEDINGS{FAVARO_2022_INPROCEEDINGS_FGSBM_533922,
AUTHOR = {Favaro, M. and Guadagnini, E. and Sassolini, E. and Biffi, M. and Montemagni, S.},
TITLE = {Towards the Creation of a Diachronic Corpus for Italian: a Case Study on the GDLI Quotations},
YEAR = {2022},
ABSTRACT = {In this paper we describe some experiments related to a corpus derived from an authoritative historical Italian dictionary, namely the Grande dizionario della lingua italiana (‘Great Dictionary of Italian Language’, in short GDLI). Thanks to the digitization and structuring of this dictionary, we have been able to set up the first nucleus of a diachronic annotated corpus that selects—according to specific criteria, and distinguishing between prose and poetry—some of the quotations that within the entries illustrate the different definitions and sub-definitions. In fact, the GDLI presents a huge collection of quotations covering the entire history of the Italian language and thus ranging from the Middle Ages to the present day. The corpus was enriched with linguistic annotation and used to train and evaluate NLP models for POS tagging and lemmatization, with promising results},
KEYWORDS = {Diachronic Corpus, Adaptation of Annotation Tools, Historical Dictionaries},
PAGES = {94-100},
URL = {http://www.lrec-conf.org/proceedings/lrec2022/workshops/LT4HALA/pdf/2022.lt4hala2022-1.13.pdf},
PUBLISHER = {European Language Resources Association (ELRA) (Paris, FRA)},
ISBN = {979-10-95546-78-8},
CONFERENCE_NAME = {2nd Workshop on Language Technologies for Historical and Ancient Languages (LT4HALA 2022)},
CONFERENCE_PLACE = {Paris},
BOOKTITLE = {Proceedings of the 2nd Workshop on Language Technologies for Historical and Ancient Languages},
EDITOR = {Sprugnoli, R. and Passarotti, M.},
}
@INPROCEEDINGS{GAMBA_2022_INPROCEEDINGS_GFBM_446356,
AUTHOR = {Gamba, F. and Frontini, F. and Broeder, D. and Monachini, M.},
TITLE = {Language Technologies for the Creation of Multilingual Terminologies. Lessons Learned from the SSHOC Project},
YEAR = {2022},
ABSTRACT = {This paper is framed in the context of the SSHOC project and aims at exploring how Language Technologies can help in promoting and facilitating multilingualism in the Social Sciences and Humanities (SSH). Although most SSH researchers produce culturally and societally relevant work in their local languages, metadata and vocabularies used in the SSH domain to describe and index research data are currently mostly in English. We thus investigate Natural Language Processing and Machine Translation approaches in view of providing resources and tools to foster multilingual access and discovery to SSH content across different languages. As case studies, we create and deliver as freely, openly available data a set of multilingual metadata concepts and an automatically extracted multilingual Data Stewardship terminology. The two case studies allow as well to evaluate performances of state-of-the-art tools and to derive a set of recommendations as to how best apply them. Although not adapted to the specific domain, the employed tools prove to be a valid asset to translation tasks. Nonetheless, validation of results by domain experts proficient in the language is an unavoidable phase of the whole workflow},
KEYWORDS = {language resource infrastructures, Multilingual terminologies, data curation},
PAGES = {154-163},
URL = {https://aclanthology.org/2022.lrec-1.17},
PUBLISHER = {European Language Resources Association ELRA (Paris, FRA)},
ISBN = {979-10-95546-72-6},
CONFERENCE_NAME = {13th Conference on Language Resources and Evaluation (LREC 2022)},
CONFERENCE_PLACE = {Paris},
BOOKTITLE = {Proceedings of the 13th Language Resources and Evaluation Conference},
}
@INPROCEEDINGS{HIRSCH_2022_INPROCEEDINGS_HFDD_419303,
AUTHOR = {Hirsch, F. and Frontini, F. and Didirková, I. and Drengubiak, J.},
TITLE = {Esthétique de la voix dans les livres audio en langue française},
YEAR = {2022},
ABSTRACT = {Cette recherche vise à étudier les préférences des auditeurs concernant les voix des livres audio. Des échantillons de 8 voix masculines et 7 voix féminines ont été extraits de différents livres audio et analysés. Une enquête a été réalisée pour obtenir le point de vue de 69 auditeurs en répondant à des questions sur les caractéristiques vocales. Les résultats montrent que les choix des participants dépendent du genre littéraire. En effet, les voix masculines sont préférées pour les romans de science-fiction et les voix féminines pour la littérature pour enfants et les romans contemporains. Néanmoins, les autres genres littéraires testés ne correspondent pas à une voix spécifique. Concernant le débit, une préférence a été notée pour des essais lus avec un débit de parole plus lent, alors que les auditeurs préfèrent un débit de parole plus rapide pour les romans érotiques},
KEYWORDS = {audiobooks, voice esthetics, speech},
URL = {https://doi.org/10.1051/shsconf/202213808004},
DOI = {10.1051/shsconf/202213808004},
CONFERENCE_NAME = {8e Congrès Mondial de Linguistique Française},
BOOKTITLE = {SHS Web of Conferences},
VOLUME = {138},
}
@INPROCEEDINGS{KHAN_2022_INPROCEEDINGS_KGGDVMOSS_444085,
AUTHOR = {Khan, F. and Gómez, F. J. M. and González, R. C. and Diakoff, H. and Vera, J. E. D. and McCrae, J. P. and O'Loughlin, C. and Short, W. M. and Stolk, S.},
TITLE = {Towards the Construction of a WordNet for Old English},
YEAR = {2022},
ABSTRACT = {In this paper we will discuss our preliminary work towards the construction of a WordNet for Old English, taking our inspiration from other similar WN construction projects for ancient languages such as Ancient Greek, Latin and Sanskrit. The Old English WordNet (OldEWN) will build upon this innovative work in a number of different ways which we articulate in the article, most importantly by treating figurative meaning as a 'first-class citizen' in the structuring of the semantic system. From a more practical perspective we will describe our plan to utilize a pre-existing lexicographic resource and the naisc system to automatically compile a provisional version of the WordNet which will then be checked and enriched by Old English experts},
URL = {https://iris.cnr.it/handle/20.500.14243/444085},
}
@INPROCEEDINGS{MARCHI_2022_INPROCEEDINGS_MCDG_443132,
AUTHOR = {Marchi, S. and Colombo, M. and Dattilo, D. and Giovannetti, E.},
TITLE = {Un esperimento di visualizzazione grafica della terminologia del Talmud babilonese},
YEAR = {2022},
ABSTRACT = {L'impiego di tecnologie di information visualization nel settore delle digital humanities può aprire nuove frontiere di ricerca. Le informazioni veicolate attraverso modalità grafiche, infatti, possono apparire agli studiosi più immediatamente comprensibili e le interfacce grafiche realizzate fornire inediti paradigmi di studio e di manipolazione dei dati analizzati. Il caso d'uso sperimentale illustrato in questo contributo è stato concepito per fornire allo studioso una modalità visiva, immediata, per l'analisi comparativa del contenuto terminologico di un corpus testuale},
KEYWORDS = {Visualizzazione grafica di risorse testuali, terminologia, linguistica computazionale, tf-idf, grafi},
PAGES = {239--241},
URL = {http://amsacta.unibo.it/6848/1/Proceedings_AIUCD2022.pdf},
DOI = {10.6092/unibo/amsacta/6848},
ISBN = {9788894253566},
CONFERENCE_NAME = {AIUCD 2022},
BOOKTITLE = {AIUCD 2022-Culture digitali. Intersezioni: filosofia, arti, media. Proceedings della 11a conferenza nazionale},
}
@INPROCEEDINGS{MIASCHI_2022_INPROCEEDINGS_MRD_443056,
AUTHOR = {Miaschi, A. and Ravelli, A. and Dell'Orletta, F.},
TITLE = {Punctuation Restoration in Spoken Italian Transcripts with Transformers},
YEAR = {2022},
ABSTRACT = {In this paper, we propose an evaluation of a Transformer-based punctuation restoration model for the Italian language. Experimenting with a BERT-base model, we perform several fine-tuning with different training data and sizes and tested them in an in- and cross-domain scenario. Moreover, we conducted an error analysis of the main weaknesses of the model related to specific punctuation marks. Finally, we test our system either quantitatively and qualitatively, by offering a typical task-oriented and a perception-based acceptability evaluation},
KEYWORDS = {nlp, transformer models, punctuation restoration},
PAGES = {245--260},
URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-85135083576\&origin=inward},
VOLUME = {13196},
SERIES = {Lecture Notes in Artificial Intelligence},
DOI = {10.1007/978-3-031-08421-8_17},
CONFERENCE_NAME = {AIxIA 2021-Advances in Artificial Intelligence},
BOOKTITLE = {Proceedings of AIxIA 2021-Advances in Artificial Intelligence},
}
@INPROCEEDINGS{NARTENI_2022_INPROCEEDINGS_NFRM_415728,
AUTHOR = {Narteni, S. and Ferretti, M. and Rampa, V. and Mongelli, M.},
TITLE = {Bag-of-Words Similarity in eXplainable AI},
YEAR = {2022},
ABSTRACT = {eXplainable AI (XAI) does not only lie in the interpretation of the rules generated by AI systems, but also in the evaluation and selection, among many rules automatically generated by large datasets, of those that are more relevant and meaningful for domain experts. With this work, we propose a method for evaluation of similarity between rules, which identifies similar rules, or very different ones, by exploiting techniques developed for Natural Language Processing (NLP). We evaluate the similarity of if-then rules by interpreting them as sentences and generating a similarity matrix acting as an enabler for domain experts to analyse the generated rules and thus discover new knowledge. Rule similarity may be applied to rule analysis and manipulation in different scenarios: the first one deals with rule analysis and interpretation, while the second scenario refers to pruning unnecessary rules within a single ruleset. Rule similarity allows also the automatic comparison and evaluation of rulesets. Two different examples are provided to evaluate the effectiveness of the proposed method for rules analysis for knowledge extraction and rule pruning},
KEYWORDS = {eXplainable AI, Rule similarity, Cosine similarity, Bag-of-words, Physical fatigue detection, Vehicle platooning},
PAGES = {835--851},
URL = {https://link.springer.com/chapter/10.1007/978-3-031-16078-3_58},
VOLUME = {2},
DOI = {10.1007/978-3-031-16078-3_58},
PUBLISHER = {Springer Nature Switzerland (Basel, CHE)},
ISBN = {978-3-031-16078-3},
CONFERENCE_NAME = {SAI Intelligent Systems Conference 2022},
CONFERENCE_PLACE = {Basel},
BOOKTITLE = {Intelligent Systems and Applications Proceedings of the 2022 Intelligent Systems Conference (IntelliSys) Volume 2},
EDITOR = {Arai, K.},
}
@INPROCEEDINGS{PAPUCCI_2022_INPROCEEDINGS_PDMD_415084,
AUTHOR = {Papucci, M. and De Nigris, C. and Miaschi, A. and Dell'Orletta, F.},
TITLE = {Evaluating Text-To-Text Framework for Topic and Style Classification of Italian texts},
YEAR = {2022},
ABSTRACT = {In this paper, we propose an extensive evaluation of the first text-to-text Italian Neural Language Model (NLM), IT5 [1], on a classification scenario. In particular, we test the performance of IT5 on several tasks involving both the classification of the topic and the style of a set of Italian posts. We assess the model in two different configurations, single- and multi-task classification, and we compare it with a more traditional NLM based on the Transformer architecture (i.e. BERT). Moreover, we test its performance in a few-shot learning scenario. We also perform a qualitative investigation on the impact of label representations in modeling the classification of the IT5 model. Results show that IT5 could achieve good results, although generally lower than the BERT model. Nevertheless, we observe a significant performance improvement of the Text-to-text model in a multi-task classification scenario. Finally, we found that altering the representation of the labels mainly impacts the classification of the topic},
KEYWORDS = {bert, style classification, t5, text-to-text, topic classification, transformers},
PAGES = {56--70},
URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-85143252156\&origin=inward},
VOLUME = {3287},
CONFERENCE_NAME = {Sixth Workshop on Natural Language for Artificial Intelligence, NL4AI 2022},
}
@INPROCEEDINGS{PELLINO_2022_INPROCEEDINGS_PSDS_445886,
AUTHOR = {Pellino, S. and Sichera, P. and Del Grosso, A. M. and Spampinato, D.},
TITLE = {Dalla codifica alla fruizione: l'edizione digitale Bellini Digital Correspondence},
YEAR = {2022},
ABSTRACT = {L'articolo illustra le attività svolte per la realizzazione dell'edizione scientifica digitale delle lettere autografe belliniane (Bellini Digital Correspondence). Il progetto si inserisce in un contesto didattico finalizzato alla rappresentazione e fruizione della corrispondenza del maestro catanese. In seno alle attività è stato sviluppato un tool di gestione delle regioni d'interesse e la personalizzazione del software EVT},
KEYWORDS = {Digital scholarly edition, correspondence, software design, XSLT, Vincenzo Bellini},
PAGES = {163--168},
URL = {http://amsacta.unibo.it/6848/1/Proceedings_AIUCD2022.pdf},
DOI = {10.6092/unibo/amsacta/6848},
PUBLISHER = {Alma Mater Studiorum-Università di Bologna (Bologna, ITA)},
ISBN = {9788894253566},
CONFERENCE_NAME = {XI Conferenza annuale AIUCD. Culture digitali. Intersezioni: filosofia, arti, media},
CONFERENCE_PLACE = {Bologna},
BOOKTITLE = {Proceedings della XI conferenza nazionale AIUCD-Culture digitali. Intersezioni: filosofia, arti, media},
EDITOR = {Ciracì, F. and Miglietta, G. and Gatto, C.},
}
@INPROCEEDINGS{PUCCETTI_2022_INPROCEEDINGS_PRDD_521513,
AUTHOR = {Puccetti, G. and Rogers, A. and Drozd, A. and Dell'Orletta, F.},
TITLE = {Outlier dimensions that disrupt transformers are driven by frequency},
YEAR = {2022},
ABSTRACT = {While Transformer-based language models are generally very robust to pruning, there is the recently discovered outlier phenomenon: disabling only 48 out of 110M parameters in BERT-base drops its performance by nearly 30\% on MNLI. We replicate the original evidence for the outlier phenomenon and we link it to the geometry of the embedding space. We find that in both BERT and RoBERTa the magnitude of hidden state coefficients corresponding to outlier dimensions correlates with the frequency of encoded tokens in pre-training data, and it also contributes to the “vertical” self-attention pattern enabling the model to focus on the special tokens. This explains the drop in performance from disabling the outliers, and it suggests that to decrease anisotropicity in future models we need pre-training schemas that would better take into account the skewed token distributions},
KEYWORDS = {Large Language Models, Mechanistic interpretability, Natural Language Processing},
PAGES = {1286--1304},
URL = {https://aclanthology.org/2022.findings-emnlp.93/},
DOI = {10.18653/v1/2022.findings-emnlp.93},
PUBLISHER = {Association for Computational Linguistics (ACL)},
ISBN = {978-1-959429-43-2},
CONFERENCE_NAME = {EMNLP 2022-Findings of the Association for Computational Linguistics},
BOOKTITLE = {Findings of the Association for Computational Linguistics: EMNLP 2022},
EDITOR = {Goldberg, Y. and Kozareva, Z. and Zhang, Y.},
}
@INPROCEEDINGS{QUOCHI_2022_INPROCEEDINGS_QBKMMPRTZ_412363,
AUTHOR = {Quochi, V. and Bellandi, A. and Khan, F. and Mallia, M. and Murano, F. and Piccini, S. and Rigobianco, L. and Tommasi, A. and Zavattari, C.},
TITLE = {From Inscriptions to Lexica and Back: A Platform for Editing and Linking the Languages of Ancient Italy},
YEAR = {2022},
ABSTRACT = {Available language technology is hardly applicable to scarcely attested ancient languages, yet their digital semantic representation, though challenging, is an asset for the purpose of sharing and preserving existing cultural knowledge. In the context of a project on the languages and cultures of ancient Italy, we took up this challenge. This paper thus describes the development of a user friendly web platform, EpiLexO, for the creation and editing of an integrated system of language resources for ancient fragmentary languages centered on the lexicon, in compliance with current digital humanities and Linked Open Data principles. EpiLexO allows for the editing of lexica with all relevant cross-references: for their linking to their testimonies, as well as to bibliographic information and other (external) resources and common vocabularies. The focus of the current implementation is on the languages of ancient Italy, in particular Oscan, Faliscan, Celtic and Venetic; however, the technological solutions are designed to be general enough to be potentially applicable to different contexts and scenarios},
KEYWORDS = {Digital Epigraphy, Restsprachen, Lexicon Editing and Linking, tools for DH},
PAGES = {59--67},
URL = {https://aclanthology.org/2022.lt4hala-1.0/},
PUBLISHER = {European Language Resources Association (ELRA) (Paris, FRA)},
ISBN = {979-10-95546-78-8},
CONFERENCE_NAME = {Second Workshop on Language Technologies for Historical and Ancient Languages (LT4HALA 2022)},
CONFERENCE_PLACE = {Paris},
BOOKTITLE = {Proceedings of the Second Workshop on Language Technologies for Historical and Ancient Languages (LT4HALA 2022)},
EDITOR = {Sprugnoli, R. and Passarotti, M.},
}
@INPROCEEDINGS{QUOCHI_2022_INPROCEEDINGS_QBMTZ_412366,
AUTHOR = {Quochi, V. and Bellandi, A. and Mallia, M. and Tommasi, A. and Zavattari, C.},
TITLE = {Supporting Ancient Historical Linguistics and Cultural Studies with EpiLexO},
YEAR = {2022},
ABSTRACT = {This contribution presents a system of independent software components meant to support the creation of ecosystems of interrelated language data (i.e. lexica linked to textual testimonies, concepts, metadata, bibliographic references, and other external lexical resources) according to the current state-of-the-art representational models for the semantic web. The system is implemented as a set of autonomous servers exposing Restful APIs that in principle can serve different frontend applications and use cases. In this work they serve the EpiLexO GUI application designed and geared to support scholars of ancient languages of fragmentary attestation in their studies. The development of both the back-ends and the front-end is still work in progress, but a first version is ready for use},
KEYWORDS = {tools for DH, ancient languages, restsprachen, lexicon editor, corpus management, lexicon-text linking},
PAGES = {39--43},
URL = {https://office.clarin.eu/v/CE-2022-2118-CLARIN2022_ConferenceProceedings.pdf},
NUMBER = {CE-2022-2118},
CONFERENCE_NAME = {CLARIN Annual Conference 2022},
BOOKTITLE = {CLARIN Annual Conference Proceedings 2022},
EDITOR = {Erjavec, T. and Eskevich, M.},
}
@INPROCEEDINGS{RUSSO_2022_INPROCEEDINGS_R_475282,
AUTHOR = {Russo, I.},
TITLE = {Creative Text-to-Image Generation: Suggestions for a Benchmark},
YEAR = {2022},
ABSTRACT = {Language models for text-to-image generation can output good quality images when referential aspects of pictures are evaluated. The generation of creative images is not under scrutiny at the moment, but it poses interesting challenges: should we expect more creative images using more creative prompts? What is the relationship between prompts and images in the global process of human evaluation? In this paper, we want to highlight several criteria that should be taken into account for building a creative text-to-image generation benchmark, collecting insights from multiple disciplines (e.g., linguistics, cognitive psychology, philosophy, psychology of art)},
KEYWORDS = {artificial creativity, text-to-image models},
PAGES = {145--154},
URL = {https://aclanthology.org/2022.nlp4dh-1.18},
PUBLISHER = {Association for Computational Linguistics},
ISBN = {978-1-955917-75-9},
CONFERENCE_NAME = {Workshop on Natural Language Processing for Digital Humanities},
BOOKTITLE = {Proceedings of the 2nd International Workshop on Natural Language Processing for Digital Humanities},
EDITOR = {Hämäläinen, Mika and Alnajjar, Khalid and Partanen, Niko and Rueter, Jack},
}
@INPROCEEDINGS{ZAMPARELLI_2022_INPROCEEDINGS_ZABCDHV_448002,
AUTHOR = {Zamparelli, R. and Chowdhury, S. A. and Brunato, D. and Chesi, C. and Dell'Orletta, F. and Hasan, A. and Venturi, G.},
TITLE = {SemEval-2022 Task 3: PreTENS-Evaluating Neural Networks on Presuppositional Semantic Knowledge},
YEAR = {2022},
ABSTRACT = {We report the results of the SemEval 2022 Task 3, PreTENS, on evaluation the acceptability of simple sentences containing constructions whose two arguments are presupposed to be or not to be in an ordered taxonomic relation. The task featured two sub-tasks articulated as: (i) binary prediction task and (ii) regression task, predicting the acceptability in a continuous scale. The sentences were artificially generated in three languages (English, Italian and French). 21 systems, with 8 system papers were submitted for the task, all based on various types of fine-tuned transformer systems, often with ensemble methods and various data augmentation techniques. The best systems reached an F1-macro score of 94.49 (sub-task1) and a Spearman correlation coefficient of 0.80 (sub-task2), with interesting variations in specific constructions and/or languages},
KEYWORDS = {Neural Networks, Presuppositional Knowledge, Evaluation},
PAGES = {228--238},
URL = {https://aclanthology.org/2022.semeval-1.29.pdf},
CONFERENCE_NAME = {16th International Workshop on Semantic Evaluation (SemEval-2022)},
BOOKTITLE = {16th International Workshop on Semantic Evaluation (SemEval-2022)},
}
@INPROCEEDINGS{ZENZARO_2022_INPROCEEDINGS_ZDBR_446342,
AUTHOR = {Zenzaro, S. and Del Grosso, A. M. and Boschetti, F. and Ranocchia, G.},
TITLE = {Verso la definizione di criteri per valutare soluzioni di scholarly editing digitale: il caso d'uso GreekSchools},
YEAR = {2022},
ABSTRACT = {Il contributo propone alcuni criteri di valutazione per l'analisi degli approcci all'editing testuale. Dopo averli presentati brevemente, si mostra come sono stati applicati alle attività finora svolte nel contesto del progetto ERC-885222 GreekSchools per quanto riguarda la progettazione e lo sviluppo di una piattaforma web collaborativa che fa uso di linguaggi specifici di dominio (DSL) finalizzata allo studio scientifico e alla pubblicazione di testi papiracei mediante edizioni critiche digitali},
KEYWORDS = {DSL linguaggi specifici di dominio, filologia computazionale, ingegneria del software, papirologia digitale, Domain Driven Design},
PAGES = {20--25},
URL = {http://amsacta.unibo.it/6848/1/Proceedings_AIUCD2022.pdf#page=30},
DOI = {10.6092/unibo/amsacta/6848},
ISBN = {9788894253566},
CONFERENCE_NAME = {AIUCD 2022. Culture digitali. Intersezioni: filosofia, arti, media},
BOOKTITLE = {AIUCD 2022-Proceedings. Culture digitali. Intersezioni: filosofia, arti, media},
EDITOR = {Ciracì, F. and Miglietta, G. and Gatto, C.},
}
@INPROCEEDINGS{MARINETTI_2022_INPROCEEDINGS_MMQBBDPRSZMMM_436338,
AUTHOR = {Marinetti, A. and Murano, F. and Quochi, V. and Ballerini, M. and Boschetti, F. and Del Grosso, A. M. and Piccini, S. and Rigobianco, L. and Solinas, P. and Zinzi, M. and Monachini, M. and Mallia, M. and Middei, E.},
TITLE = {Challenges in Encoding Fragmentary Attested Languages},
YEAR = {2022},
ABSTRACT = {The ItAnt project investigates the languages of ancient Italy, whose only attestation consists in epigraphic evidence, focusing on Venetic, Oscan, Faliscan and Celtic languages. For this purpose, the project combines the traditional method proper to historical linguistics with the setting up of digital technologies, developing computational tools specifically designed to create a digital set of interrelated resources},
KEYWORDS = {digital epigraphy, eLexicography, Linguistic Linked Open Data, Text Encoding},
URL = {https://ciegl2022.sciencesconf.org/resource/page/id/30},
CONFERENCE_NAME = {XVI Congresso Internazionale di Epigrafia greca e latina},
}
@INPROCEEDINGS{MARZI_2022_INPROCEEDINGS_MNFMMVPTP_413387,
AUTHOR = {Marzi, C. and Narzisi, A. and Ferro, M. and Masi, G. and Milone, A. and Viglione, V. and Pelagatti, S. and Tomassini, I. and Pirrelli, V.},
TITLE = {Patterns of finger-tracking in Italian early readers with Autism Spectrum Disorder},
YEAR = {2022},
ABSTRACT = {Background: Of late, the synergistic interaction of eye and hand movements in the exploration of a visual scene displayed on a computer touchscreen was shown to provide a congruent signature of the "attention maps" of subjects with autism spectrum disorders (ASD). A familiar context where this visual and tactile interaction is exploited is when children use the finger of their dominant hand to point the letters of written words as they are reading, particularly at early stages of their literacy development. In the present work, a dedicated app running on a common tablet is used to capture and analyse the finger-tracking behaviour of children with ASD while they are reading few episodes of a connected text on the tablet touchscreen. The reader's voice is also recorded through the tablet built-in microphone. The sliding movements of the finger across the tablet touchscreen are discretized into a series of densely distributed "touch events", which are then mapped onto the text lines in much the same way eye fixations are projected onto a sequence of words using an eye-tracker. Reading texts are linguistically annotated, to control for levels of reading difficulty, and finger-tracking times are associated with linguistic glosses. Objectives: Investigate patterns of finger-tracking as a potential non biological marker for identification of children with ASD. Methods: A preliminary analysis is offered of evidence of the finger-tracking behaviour of 20 Italian children with high functioning ASD, aged 7-11 years, while they are engaged in reading. A grade-matched control group of children with typical development was included. Patterns of finger-tracking are assessed in connection with three complementary aspects of reading behaviour: (1) word recognition, (2) pace of reading of multi-word intonation units, and (3) text comprehension, controlled by asking children a few multiple-choice questions on text content after each reading session. Results: Considerable variation in levels of reading ability was observed in the ASD sample, with a few children showing clear evidence of impaired reading comprehension. However, fluent readers with ASD exhibit the same correlation between accurate decoding (assessed by measuring per-word reading speed) and high levels of reading comprehension found in controls. Likewise, decoding rates were found to significantly increase with increasing grade levels, following the typical developmental pattern observed in controls. On a less local level of linguistic analysis, the reading pace of ASD readers fails to be modulated according to major syntactic structures, punctuation marks and direct speech turns, an effect concomitant with a flat prosodic intonation of oral reading. Conclusions: Preliminary findings confirm the heterogeneous nature of reading skills in children with ASD, showing that the use of a tablet screen as a tactile interface for visual perception analysis can offer a robust experimental protocol for large-scale, multimodal collection of naturalistic data for extensive assessment of readers with ASD},
KEYWORDS = {reading, autism, finger-tracking, developing readers, prediction-driven processing},
PAGES = {192},
URL = {https://cdn.ymaws.com/www.autism-insar.org/resource/resmgr/files/insar_2022/2022_Abstract_Book.pdf},
VOLUME = {2022},
CONFERENCE_NAME = {INSAR},
BOOKTITLE = {2022 annual meeting abstract book},
}
@INPROCEEDINGS{MARZI_2022_INPROCEEDINGS_MP_415389,
AUTHOR = {Marzi, C. and Pirrelli, V.},
TITLE = {An information-theoretic analysis of the inflectional regular-irregular gradient for optimal processing units},
YEAR = {2022},
ABSTRACT = {Prediction-driven word processing defines the human ability to anticipate upcoming input words in recognition. From this perspective, input word forms need to be processed as quickly and efficiently as possible. Under the reasonable assumption that spoken words are memorized and processed as word trees (e.g. Marslen-Wilson's "cohorts"), the larger the size of the cohort of an input word at a certain point in time (and the later its uniqueness point), the harder and slower to process the word is. Regularly and irregularly inflected verb forms have different stem family sizes and different uniqueness points. Using a Recurrent Neural Network (RNN) as a computational model of the human lexical processor, we explore here how their distributional and structural properties may affect (optimal) processing strategies},
KEYWORDS = {Morphological inflection, prediction-driven processing, discriminability, non-linearity, learnability},
PAGES = {50--51},
URL = {https://archive.nytud.hu/imm20/abstracts/main.pdf},
CONFERENCE_NAME = {20th International Morphology Meeting-(Dedicated to the memory of Ferenc Kiefer)},
BOOKTITLE = {Book of Abstracts of the 20th International Morphology Meeting-Dedicated to the memory of Ferenc Kiefer},
}
@INPROCEEDINGS{RANOCCHIA_2022_INPROCEEDINGS_RPVPFVAMRRCPPZBDE_446348,
AUTHOR = {Ranocchia, G. and Puglia, E. and Vassallo, C. and Pernigotti, C. and Fleischer, K. and Verhasselt, G. and Alessandrelli, M. and Miliani, C. and Romano, F. P. and Rosi, F. and Caliri, C. and Pavone, D. P. and Preisler, Z. and Zenzaro, S. and Boschetti, F. and Del Grosso, A. M. and Enea, A.},
TITLE = {The Greek philosophical schools according to Europe's earliest history of philosophy. Towards a new pioneering critical edition of Philodemus' Arrangement of the Philosophers},
YEAR = {2022},
CONFERENCE_NAME = {XXXth International Congress of Papyrology},
URL = {https://iris.cnr.it/handle/20.500.14243/446348},
KEYWORDS = {papyrology, digital papyrology, digital humanities, digital cultural heritage},
ABSTRACT = {Our knowledge about Greek philosophical schools is mostly second-hand and based on Diogenes Laërtius' Lives of Eminent Philosophers (3rd century AD) and Philodemus' Arrangement of the Philosophers (75-50 BC), a treatise in several books which represents the earliest 'history of philosophy' to have reached us directly from antiquity. From this work exclusively preserved by the Herculaneum papyri we may derive a virtually systematic account of the history of Greek philosophical schools, which is unique in its kind},
}
@TECHREPORT{ALBANESI_2022_TECHREPORT_ABCGMPS_447933,
AUTHOR = {Albanesi, D. and Bellandi, A. and Colombo, M. and Giovannetti, E. and Marchi, S. and Papini, M. and Sciolette, F.},
TITLE = {Traduco: l'Applicazione Web Linguistico-Computazionale per il Progetto di Traduzione del Talmud Babilonese-Rapporto tecnico 21},
YEAR = {2022},
PAGES = {23},
URL = {https://iris.cnr.it/handle/20.500.14243/447933},
KEYWORDS = {Traduzione Assistita dal Calcolatore, Traduzione Collaborativa, Lessici elettronici, rappresentazione della conoscenza, Linguistica Computazionale, traduzione di testi religiosi},
ABSTRACT = {La presente relazione tecnico-scientifica descrive l'attività svolta da ILC-CNR nel contesto del Progetto Traduzione Talmud Babilonese nel periodo novembre 2021-aprile 2022. Le principali attività tecniche svolte sul sistema Traduco sono state la risoluzione di bug e l'implementazione di nuove funzionalità richieste. Parallelamente, è stata realizzata una applicazione per la consultazione del corpus biblico e sono proseguite le attività volte alla visualizzazione di risorse lessicali tramite grafi e per l'analisi, l'allineamento di testi, l'aggiornamento e la conversione del lessico computazionale PSC da utilizzarsi per la consultazione avanzata, su base morfologica e semantica, del testo talmudico tradotto in italiano},
}
@TECHREPORT{ALBANESI_2022_TECHREPORT_ACGMPS_414174,
AUTHOR = {Albanesi, D. and Colombo, M. and Giovannetti, E. and Marchi, S. and Papini, M. and Sciolette, F.},
TITLE = {Traduco: l'Applicazione Web Linguistico-Computazionale per il Progetto di Traduzione del Talmud Babilonese-Rapporto tecnico 22},
YEAR = {2022},
ABSTRACT = {La presente relazione tecnico-scientifica descrive l'attività svolta da ILC-CNR nel contesto del Progetto Traduzione Talmud Babilonese nel periodo maggio 2022-dicembre 2022. Le principali attività tecniche svolte sul sistema Traduco sono state la risoluzione di bug e l'implementazione di nuove funzionalità richieste. Parallelamente, è proseguito il lavoro di ricerca e sviluppo su tre fronti: i) la nuova versione di Traduco, ii) la visualizzazione grafica di risorse lessicali, e iii) la ricerca full-text sul testo del Talmud tradotto in italiano},
KEYWORDS = {Traduzione Assistita dal Calcolatore, Traduzione Collaborativa, Lessici elettronici, rappresentazione della conoscenza, Linguistica Computazionale, traduzione di testi religiosi, ricerca full-text},
PAGES = {40},
URL = {https://iris.cnr.it/handle/20.500.14243/414174},
}
@TECHREPORT{ALBANESI_2022_TECHREPORT_AGP_447934,
AUTHOR = {Albanesi, D. and Giovannetti, E. and Papini, M.},
TITLE = {Traduco: l'Applicazione Web Linguistico-Computazionale per il Progetto di Traduzione del Talmud Babilonese-rapporto integrativo 4},
YEAR = {2022},
PAGES = {15},
URL = {https://iris.cnr.it/handle/20.500.14243/447934},
KEYWORDS = {Linguistica Computazionale, Traduzione di Testi Religiosi, Traduzione Assistita dal Calcolatore, Traduzione Collaborativa, Sviluppo front-end},
ABSTRACT = {La presente relazione tecnico-scientifica descrive l'attività svolta da ILC-CNR nel contesto delle attività di progetto previste dalla convenzione integrativa stipulata tra PTTB e ILC-CNR in data 10/07/2018 e condotte nel periodo febbraio 2021-gennaio 2022},
}
@TECHREPORT{ANTONINI_2022_TECHREPORT_ADFNPRSSSTT_445394,
AUTHOR = {Antonini, G. and Dell'Orletta, F. and Filippetti, A. and Nuzzolese, A. G. and Palaia, R. and Reale, E. and Saccone, M. and Sfameni, C. and Spinello, A. O. and Trufelli, L. and Tuzi, F.},
TITLE = {Le attività dipartimentali di monitoraggio e programmazione della ricerca nel settore delle scienze umane, sociali e del patrimonio culturale: metodologie, processi, risultati e soluzioni proposte per lo sviluppo di un sistema CNR integrato e multi livello per il monitoraggio e la programmazione della ricerca},
YEAR = {2022},
ABSTRACT = {Il Dipartimento Scienze Umane e Sociali, Patrimonio Culturale (DSU) del CNR, con la fattiva collaborazione di tutti gli Istituti ad esso afferenti, ha condotto un'iniziativa finalizzata a migliorare l'efficacia dei processi di monitoraggio e programmazione delle attività progettuali, infrastrutturali e di ricerca. È stato costituito uno specifico gruppo di lavoro che, interagendo costruttivamente con gli Istituti, ha svolto attività di studio e analisi con l'obiettivo di elaborare una proposta di revisione/aggiornamento delle Aree strategiche e delle relative Aree progettuali dipartimentali. Il presente rapporto illustra il percorso che ha portato a tale risultato e fornisce una serie di elementi utili a verificare l'efficacia delle modalità di conduzione dei lavori: dalle metodologie adottate alle attività di rilevazione e analisi dei dati e delle informazioni raccolti con metodi diversi; dall'analisi dei settori di interesse nello scenario più ampio di livello nazionale, europeo e internazionale al ruolo delle scienze sociali, delle discipline umanistiche e del patrimonio culturale in ambito CNR; dalla disamina di tutti gli elementi informativi, una volta disponibili, alla proposta di aggiornamento dell'impianto programmatico delle attività progettuali e di ricerca dipartimentali. Infine, sono evidenziate alcune delle principali criticità riconducibili prevalentemente al contesto organizzativo-gestionale, con particolare riferimento alle misure organizzative, ai metodi e agli strumenti dedicati al monitoraggio e alla programmazione scientifica},
KEYWORDS = {Monitoraggio della ricerca, programmazione della ricerca, Scienze umane - sociali e del patrimonio culturale, PIANO TRIENNALE DI ATTIVITÀ DEL CONSIGLIO NAZIONALE DELLE RICERCHE},
PAGES = {103},
URL = {https://iris.cnr.it/handle/20.500.14243/445394},
INSTITUTION = {Consiglio Nazionale delle Ricerche},
PUBLISHER = {Consiglio Nazionale delle Ricerche (Roma, ITA)},
CONFERENCE_PLACE = {Roma},
}
@TECHREPORT{BANTOUNA_2022_TECHREPORT_BMPNGLSDTDSMKKVBDDDCHHBDLPVHAGBCDBCFLACJPAFLBODJBMSPFTDCBGS_462389,
AUTHOR = {Bantouna, A. and Mavrakis, G. C. and Pantazi, N. and Ntemou, A. and Giannopoulou, N. and Labrousi, V. and Stavroulaki, V. and Demestichas, P. and Tzifa, E. and Demesticha, K. and Stenos, I. and Mitrou, M. and Kritikou, Y. and Kominou, A. and Vlaheas, P. and Bourgos, P. and Drigopoulou, I. and Dimitriadis, I. and Dimiropoulou, P. and Chietera, A. and Haugeard, J. E. and Hoornenborg, Y. and Busonera, G. and Del Rio, M. and Lianas, L. and Pireddu, L. and Versaci, F. and Henrik Vincent, P. and Aspegren, O. and Grangetto, M. and Bertero, L. and Cassoni, P. and D'Agata, F. and Bergui, M. and Cavagnino, D. and Fiandrotti, A. and Lucenteforte Daniele Perlo, M. and Aldinucci, M. and Cardillo, F. A. and Javier García Viartola, F. and Puente Mur, D. and Aznar, J. and Fernandez, A. and Lasso Elisa Ionascu, F. and Barseti, L. and Oniga, D. and Dobran, R. and Jianu, M. and Bolocan, V. and Medar, C. and Sutra, G. and Poli, J. P. and Friedmann, E. and Teijeiro, T. and De La Iglesia Vayá, M. and Canalini, L. and Bolelli, F. and Grana, C. and Silva, T.},
TITLE = {DEEPHEALTH-D6.2 Validation of DeepHealth platforms and use cases},
YEAR = {2022},
ABSTRACT = {Final report on the validation of DeepHealth platforms and use cases (WP6, T6.2)},
KEYWORDS = {HPC, Machine Learning, Artificial Intelligence},
URL = {https://iris.cnr.it/handle/20.500.14243/462389},
}
@TECHREPORT{DELGRATTA_2022_TECHREPORT_D_413871,
AUTHOR = {Del Gratta, R.},
TITLE = {Installing and configuring CLARIN-DSPACE on UBUNTU 22.04 LTS},
YEAR = {2022},
ABSTRACT = {This note describes various procedures to install the CLARIN-DSPACE repository at the Institute for Computational Linguistics "A. Zampolli"},
KEYWORDS = {CLARIN, CLARIN-DSPACE, Repository, Installation Guide},
PAGES = {1--67},
URL = {https://iris.cnr.it/handle/20.500.14243/413871},
}
@TECHREPORT{DIDONATO_2022_TECHREPORT_DEPKVVKTTLPTCB_412097,
AUTHOR = {Di Donato, F. and Eskevich, M. and Provost, L. M. and Kraker, P. and Van Uytvanck, D. and Vignoli, M. and König, A. and Thiel, C. and Tetteh Ocansey, J. and Lombardo, T. and Pohle, S. and Tóth-Czifra, E. and Chen, Y. and Blotière, E.},
TITLE = {D6.5 Report on Open Science within the EOSC},
YEAR = {2022},
ABSTRACT = {The report Open Science within the EOSC collects the findings of T6.3 EOSC guidelines training and advocacy on Open Science, whose main goal is to produce, adapt and reuse general and specific guidelines to implement Open Science practices in disciplinary contexts, as well as to provide training to the SSH community on Open Science practices, tools and EOSC related content. In T6.3 we delivered 12 training sessions and all training materials are published in open access. In addition, we designed, developed and implemented an open workflow for the definition and management of the Open Science Training series, through the definition of a TRIPLE Training Toolkit, which reproduces the guidelines that have been designed and implemented to produce FAIR-by-design training events. This set of documents constitutes section 1 of the present deliverable. Moreover, section 2 of the report presents four use-cases which address Open Science-related issues from different perspectives. The first subsection (CNR) sheds light on pathways for interdisciplinary collaboration and managing networking challenges. The second subsection (OKMAPS) addresses the need for improved discoverability of resources across research publications, research data and research projects. The third (CLARIN) shows how the connection between data, tools and publications can be implemented and made public. A model is explored to enrich the metadata about language resource data and tools from the CLARIN Resource Families with related publications, making use of the GoTriple platform. This cross-connects the CLARIN Virtual Language Observatory, the SSHOC Open Marketplace and the GoTriple platform. The last subsection (CESSDA) examines the balance between making data more accessible and aligning with legal restrictions. It explains how data is aligned internally to make them easily harvestable, and how, in turn, enrichment features from EOSC (OpenAIRE) and GoTriple systems will be used to improve data at their original sources},
KEYWORDS = {open science, training},
URL = {https://zenodo.org/record/7360227},
}
@TECHREPORT{DIDONATO_2022_TECHREPORT_DPLVPTCB_431679,
AUTHOR = {Di Donato, F. and Provost, L. and Lombardo, T. and Vignoli, M. and Pohle, S. and Tóth-Czifra, E. and Chen, Y. and Blotière, E.},
TITLE = {TRIPLE Training Toolkit (0.1)},
YEAR = {2022},
ABSTRACT = {The TRIPLE Training Toolkit is part of the work performed by Work Package 6 (WP6) under Task 6.3 in the TRIPLE Project (Transforming Research through Linked Interdisciplinary Exploration). The project is funded by the European Commission, under Grant Agreement No. 863420 and will run for 42 months starting from October 2019. The TRIPLE Open Science Training Series focuses on the design and delivery of competence-oriented training to address the specific and general needs of the research community on Open Science topics and on the EOSC. The experiment enabled a reflection on the current challenges to make FAIR-by-design training resources and how to overcome them. The following files are deposited in Zenodo to serve as a reference for those wishing to reproduce this experiment within their own institution or for their own training activities. Please note that the training series are still ongoing and as such the present document and the files listed below will be followed by updated versions by the end of the project (2023)},
KEYWORDS = {open science, training, TRIPLE},
URL = {https://doi.org/10.5281/zenodo.6256198},
DOI = {10.5281/zenodo.6256198},
}
@TECHREPORT{MARTELLI_2022_TECHREPORT_MMCNVUFQKKLDTTCSKIDGM_412365,
AUTHOR = {Martelli, F. and Maru, M. and Campagnano, C. and Navigli, R. and Velardi, P. and Ureña-Ruiz, R. and Frontini, F. and Quochi, V. and Kallas, J. and Koppel, K. and Langemets, M. and De Does, J. and Tempelaars, R. and Tiberius, C. and Costa, R. and Salgado, A. and Krek, S. and Čibej, J. and Dobrovoljc, K. and Gantar, P. and Munda, T.},
TITLE = {D3.8 Lexical-semantic analytics for NLP},
YEAR = {2022},
ABSTRACT = {The present document illustrates the work carried out in task 3.3 (work package 3) focused on lexical-semantic analytics for Natural Language Processing (NLP). This task aims at computing analytics for lexical-semantic information such as words, senses and domains in the available resources, investigating their role in NLP applications. Specifically, this task concentrates on three research directions, namely i) sense clustering, in which grouping senses based on their semantic similarity improves the performance of NLP tasks such as Word Sense Disambiguation (WSD), ii) domain labeling of text, in which the lexicographic resources made available by the ELEXIS project for research purposes allow better performances to be achieved, and finally iii) analysing the diachronic distribution of senses, for which a software package is made available. In this deliverable, we illustrate the research activities aimed at achieving the aforementioned goals and put forward suggestions for future works. Importantly, we stress the crucial role played by high-quality lexical-semantic resources when investigating such linguistic aspects and their impact on NLP applications. To this end, as an additional contribution, we address the paucity of manually annotated data in the lexical-semantic research field and introduce the ELEXIS parallel sense-annotated dataset, a novel entirely manually annotated dataset available in 10 European languages and featuring 5 annotation layers},
KEYWORDS = {research infrastructures, lexicography, lexical resources, word-sense disambiguation, WSD, sense-annotated language data, multilinguality},
PAGES = {67},
URL = {https://elex.is/wp-content/uploads/ELEXIS_D3_8_Lexical-Semantic_Analytics_for_NLP_final_report.pdf},
}
@TECHREPORT{TASOVAC_2022_TECHREPORT_TTBBBCUFHHMKKKKMMMMMQARSSVWWZ_446092,
AUTHOR = {Tasovac, T. and Tiberius, C. and Bamberg, C. and Bellandi, A. and Burch, T. and Costa, R. and Ďurčo, M. and Frontini, F. and Hennemann, J. and Heylen, K. and Jakubíček, M. and Khan, F. and Klee, A. and Kosem, I. and Kovář, V. and Matuška, O. and McCrae, J. and Monachini, M. and Mörth, K. and Munda, T. and Quochi, V. and Repar, A. and Roche, C. and Salgado, A. and Sievers, H. and Váradi, T. and Weyand, S. and Woldrich, A. and Zhanial, S.},
TITLE = {D5.3 Overview of Online Tutorials and Instruction Manuals},
YEAR = {2022},
ABSTRACT = {The ELEXIS Curriculum is an integrated set of training materials which contextualizes ELEXIS tools and services inside a broader, systematic pedagogic narrative. This means that the goal of the ELEXIS Curriculum is not simply to inform users about the functionalities of particular tools and services developed within the project, but to show how such tools and services are a) embedded in both lexicographic theory and practice; and b) representative of and contributing to the development of digital skills among lexicographers. The scope and rationale of the curriculum are described in more detail in the Deliverable D5.2 Guidelines for Producing ELEXIS Tutorials and Instruction Manuals. The goal of this deliverable, as stated in the project DOW, is to provide "a clear, structured overview of tutorials and instruction manuals developed within the project."},
KEYWORDS = {ELEXIS, lexicography, training materials},
PAGES = {31},
URL = {https://elex.is/wp-content/uploads/ELEXIS_D5_3_Overview-of-Online-Tutorials-and-Instruction-Manuals.pdf},
}
@THESIS{OTTAVIANI_2022_THESIS_O_513782,
AUTHOR = {Ottaviani, R.},
TITLE = {Digitalizzazione e gestione documentale nelle Pubbliche Amministrazioni: analisi del caso concreto dell’Istituto di Tecnologie della Comunicazione, dell’Informazione e della Percezione-Tecip},
YEAR = {2022},
ABSTRACT = {Breve relazione sulla revisione delle procedure di un Istituto universitario, finalizzata all'introduzione di una modalità operativa rispondente ai requisiti della norma ISO 9001:2015},
URL = {https://iris.cnr.it/handle/20.500.14243/513782},
}
@MISC{BARONI_2022_MISC_B_462844,
AUTHOR = {Baroni, P.},
TITLE = {SIGUL Web Site},
YEAR = {2022},
ABSTRACT = {Web site of SIGUL-Special Interest Group on Under-resourced Languages},
KEYWORDS = {under-resourced languages, digital diversity, digital survival},
URL = {https://www.sigul.eu},
}
@MISC{BOSCHETTI_2022_MISC_BD_455957,
AUTHOR = {Boschetti, F. and Del Grosso, A. M.},
TITLE = {Una bussola per navigare nei mari digitali: il ruolo di un K-Centre CLARIN per le esigenze degli studiosi},
YEAR = {2022},
ABSTRACT = {The contribution will give an overview about the structure of the Common Language Research Infrastructure (CLARIN) and its initiatives devoted to the DH, both at the European and at the national level as well as the activities of a new CLARIN Knowledge Centre: the DiPText-KC. Furthermore, it will introduce the practices that we suggest for a workflow to digit(al)ize texts and how to host projects in ILC4CLARIN through the assistance of the DiPText-KC},
KEYWORDS = {Digital Humanities, CLARIN, DiPText-KC, CoPhiLab, Digital Philology},
URL = {https://iris.cnr.it/handle/20.500.14243/455957},
}
@MISC{BOSCHETTI_2022_MISC_BDGZ_455955,
AUTHOR = {Boschetti, F. and Del Grosso, A. M. and Guadagnini, E. and Zenzaro, S.},
TITLE = {L'annotazione del testo},
YEAR = {2022},
ABSTRACT = {Il contributo illustra le potenzialità offerte dall'uso dei Linguaggi Specifici di Dominio (DSL) per la produzione di note, commenti, apparati e testi scientifici. Il modello Euporia e l'approccio DSL-Based DSE sono richiamati come possibile alternativa alla codifica mediante XML/TEI per la produzione di edizioni scientifiche digitali},
KEYWORDS = {Digital Humanities, Filologia Digitale, Domain Specific Languages, Euporia, DSL-based DSE},
URL = {https://iris.cnr.it/handle/20.500.14243/455955},
CONFERENCE_NAME = {Filologia Digitale e Testi Italiani Antichi. Verso un sistema integrato di ricerca},
}
@MISC{BOSCHETTI_2022_MISC_BDMTP_455948,
AUTHOR = {Boschetti, F. and Del Grosso, A. M. and Macchiarelli, A. and Tanozzi, F. and Puliero, J.},
TITLE = {The Remains of the Text-Natural Language Processing},
YEAR = {2022},
ABSTRACT = {The seminar presents some digital technologies for the study of texts of literary nature mediated by the use of computational tools. Specifically, the following topics are addressed: a) Coronelli's Epitome Cosmografica; b) Aratus' Phaenomena and the art of composing acrostics; c) Latin poets between astronomy and mythology; d) Lemmatisation and Semi-automated linguistic analysis of Latin texts; e) Musisque Deoque: a powerful instrument to study intertextuality},
KEYWORDS = {Digital Humanities, Digital Philology, Summer School, MQD, NLP},
URL = {https://www.unive.it/data/33113/2/60398},
}
@MISC{DELGROSSO_2022_MISC_D_462937,
AUTHOR = {Del Grosso, A. M.},
TITLE = {Forme di elaborazione per il Codice Pelavicino Digitale. Usare, Riusare ed Estendere l'Edizione},
YEAR = {2022},
ABSTRACT = {Il contributo illustra alcune attività condotte in seno al progetto di edizione digitale denominato "Codice Pelavicino". In particolare la presentazione si focalizza sulla rappresentazione dei termini notevoli, sulla presentazione del testo in formato PDF e sulla specificità della codifica come componente di un sistema FAIR},
KEYWORDS = {Codice Pelavicino, Digital Humanities, Filologia Digitale, Edition Visualization Technology, XML/TEI},
URL = {https://pelavicino.labcd.unipi.it/},
CONFERENCE_NAME = {L'edizione digitale del Codice Pelavicino-Presentazione del lavoro completo},
}
@MISC{DELGROSSO_2022_MISC_DZB_462878,
AUTHOR = {Del Grosso, A. M. and Zenzaro, S. and Boschetti, F.},
TITLE = {CNR-ILC team e il progetto ERC 885222-GreekSchools},
YEAR = {2022},
ABSTRACT = {Presentazione del team di lavoro e delle attività svolte in seno al progetto ERC 885222-GreekSchools durante il convegno di Papirologia Ercolanese organizzato dal 5 al 9 settembre 2022 presso il Castello Pasquini di Castiglioncello (Livorno)},
KEYWORDS = {Digital Humanities, Digital Papyrology, Digital Scholarly Edition, ERC, GreekSchools, DSL-based DSE},
URL = {https://greekschools.eu},
CONFERENCE_NAME = {Convegno di Papirologia Ercolanese},
}
@MISC{FRONTINI_2022_MISC_FBQMMZUW_441101,
AUTHOR = {Frontini, F. and Bellandi, A. and Quochi, V. and Monachini, M. and Mörth, K. and Zhanial, S. and Ďurčo, M. and Woldrich, A.},
TITLE = {CLARIN Tools and Resources for Lexicographic Work},
YEAR = {2022},
ABSTRACT = {This course introduces lexicographers to the CLARIN Research Infrastructure and highlights language resources and tools useful for lexicographic practices. The course consists of two parts. In Part 1, you will learn about CLARIN, its technical and knowledge infrastructure, and about how to deposit and find lexical resources in CLARIN. In Part 2, you will become acquainted with CLARIN tools that can be used to create lexical resources},
KEYWORDS = {CLARIN, lexicography},
URL = {https://elexis.humanistika.org/id/UnwYPq70Dewbn7XDEjsMM},
}
@MISC{MARCHI_2022_MISC_M_458610,
AUTHOR = {Marchi, S.},
TITLE = {LexicO scripts: a collection of perl scripts and mysql queries to build LexicO starting from Parole-Simple-Clips},
YEAR = {2022},
ABSTRACT = {Collezione di script in perl e di query SQL per la costruzione di LexicO a partire da Parole-Simple-Clips},
URL = {https://iris.cnr.it/handle/20.500.14243/458610},
}
@MISC{MARCHI_2022_MISC_M_458611,
AUTHOR = {Marchi, S.},
TITLE = {PSC critical entries: a PHP web site to consult them},
YEAR = {2022},
ABSTRACT = {Insieme di script PHP per l'interrogazione della risorsa Parole-Simple-Clips memorizzata in un DBMS (MySQL)},
URL = {https://iris.cnr.it/handle/20.500.14243/458611},
}
@MISC{MARTELLI_2022_MISC_MNKKGKNSOLKKDUSLVGLQMFTTCSIM_446359,
AUTHOR = {Martelli, F. and Navigli, R. and Krek, S. and Kallas, J. and Gantar, P. and Koeva, S. and Nimb, S. and Sandford Pedersen, B. and Olsen, S. and Langemets, M. and Koppel, K. and Üksik, T. and Dobrovoljc, K. and Ureña-Ruiz, R. and Sancho-Sánchez, J. and Lipp, V. and Váradi, T. and Győrffy, A. and László, S. and Quochi, V. and Monachini, M. and Frontini, F. and Tiberius, C. and Tempelaars, R. and Costa, R. and Salgado, A. and Čibej, J. and Munda, T.},
TITLE = {Parallel sense-annotated corpus ELEXIS-WSD 1.0},
YEAR = {2022},
ABSTRACT = {ELEXIS-WSD is a parallel sense-annotated corpus in which content words (nouns, adjectives, verbs, and adverbs) have been assigned senses. Version 1.0 contains sentences for 10 languages: Bulgarian, Danish, English, Spanish, Estonian, Hungarian, Italian, Dutch, Portuguese, and Slovene. The corpus was compiled by automatically extracting a set of sentences from WikiMatrix (Schwenk et al., 2019), a large open-access collection of parallel sentences derived from Wikipedia, using an automatic approach based on multilingual sentence embeddings. The sentences were manually validated according to specific formal, lexical and semantic criteria (e.g. by removing incorrect punctuation, morphological errors, notes in square brackets and etymological information typically provided in Wikipedia pages). To obtain a satisfying semantic coverage, we filtered out sentences with less than 5 words and less than 2 polysemous words. Subsequently, in order to obtain datasets in the other nine target languages, for each selected sentence in English, the corresponding WikiMatrix translation into each of the other languages was retrieved. If no translation was available, the English sentence was translated manually. The resulting corpus is comprised of 2,024 sentences for each language},
KEYWORDS = {Word Sense Disambiguation, corpus parallelo, disambiguazione automatica del senso, annotazione semantica multilingue},
URL = {https://iris.cnr.it/handle/20.500.14243/446359},
}
@MISC{MARZI_2022_MISC_MP_448878,
AUTHOR = {Marzi, C. and Pirrelli, V.},
TITLE = {Psycholinguistic Research on Inflectional Morphology in the Romance Languages},
YEAR = {2022},
ABSTRACT = {Over the past decades, psycholinguistic aspects of word processing have made a considerable impact on views of language theory and language architecture. In the quest for the principles governing the ways human speakers perceive, store, access, and produce words, inflection issues have provided a challenging realm of scientific inquiry, and a battlefield for radically opposing views. It is somewhat ironic that some of the most influential cognitive models of inflection have long been based on evidence from an inflectionally impoverished language like English, where the notions of inflectional regularity, (de)composability, predictability, phonological complexity, and default productivity appear to be mutually implied. An analysis of more "complex" inflection systems such as those of Romance languages shows that this mutual implication is not a universal property of inflection, but a contingency of poorly contrastive, nearly isolating inflection systems. Far from presenting minor faults in a solid, theoretical edifice, Romance evidence appears to call into question the subdivision of labor between rules and exceptions, the on-line processing vs. long-term memory dichotomy, and the distinction between morphological processes and lexical representations. A dynamic, learning-based view of inflection is more compatible with this data, whereby morphological structure is an emergent property of the ways inflected forms are processed and stored, grounded in universal principles of lexical self-organization and their neuro-functional correlates},
KEYWORDS = {Romance language morphology, paradigms, inflectional classes, lexical self-organisation, frequency effects, priming, discriminative learning, lexical blocking, long-term and short-term memory},
PAGES = {1-44},
URL = {https://oxfordre.com/linguistics/view/10.1093/acrefore/9780199384655.001.0001/acrefore-9780199384655-e-709},
DOI = {10.1093/acrefore/9780199384655.013.709},
PUBLISHER = {Oxford University Press (Oxford, GBR)},
ISBN = {9780199384655},
CONFERENCE_PLACE = {Oxford},
EDITOR = {Loporcaro, M.},
}
@MISC{PROVOST_2022_MISC_P_475284,
AUTHOR = {Provost, L. M.},
TITLE = {La formazione online sulla Scienza Aperta nell'ambito del progetto H2020 TRIPLE, e il TRIPLE Training Toolkit},
YEAR = {2022},
ABSTRACT = {Il seminario presenta il lavoro svolto nell'ambito del task dedicato alla formazione online e alle linee guida sull’Open Science e l'European Open Science Cloud (EOSC) nel progetto Horizon 2020 TRIPLE (Transforming Research through Innovative Practices for Linked Interdisciplinary Exploration, Grant Agreement n. 863420). In particolare, sono presentati due risultati riutilizzabili prodotti per supportare l'adozione e l'implementazione di pratiche aperte all'interno delle comunità di ricerca e formazione nelle Scienze Sociali e Umanistiche (SSH). Il primo è la TRIPLE Open Science Training Series (https://project.gotriple.eu/training/), una serie di 12 eventi di formazione online progettata per migliorare le competenze dei ricercatori in materia di FAIR e Open Science. Il secondo è il TRIPLE Training Toolkit (https://doi.org/10.5281/zenodo.6256198), un workflow aperto dedicato ai formatori per organizzare eventi di formazione secondo il metodo FAIR-by-design},
KEYWORDS = {TRIPLE, Training, Open Science, Scienza Aperta, EOSC},
URL = {https://zenodo.org/records/7078752},
DOI = {10.5281/ZENODO.7078752},
CONFERENCE_NAME = {Seminari del CNR-ILC},
}
@MISC{QUOCHI_2022_MISC_QB_446071,
AUTHOR = {Quochi, V. and Bellandi, A.},
TITLE = {LexO editor: the basics-video tutorial},
YEAR = {2022},
ABSTRACT = {Video tutorial sull'uso di LexO, un editor di lessici secondo il modello Ontolex-lemon. Il tutorial è parte dell'ELEXIS training programme disponibile sulla piattaforma DARIAH-teach},
KEYWORDS = {lexicon editor, video tutorial, training material, lexO, online web application},
URL = {https://www.youtube.com/watch?v=9KE0laMaTAs\&list=PLoD829qNERpYKq8JRkY4EIGgZCdi0QHOd},
}
@MISC{SCIOLETTE_2022_MISC_SGM_455982,
AUTHOR = {Sciolette, F. and Giovannetti, E. and Marchi, S.},
TITLE = {LexicO},
YEAR = {2022},
ABSTRACT = {LexicO is a resource deriving from Parole-Simple-Clips (http://hdl.handle.net/20.500.11752/ILC-88). This resource contains all four levels of linguistic information represented in PSC (phonology, morphology, syntax, and semantics) which have been automatically analysed to find redundant, erroneous and missing data. The updating process that led to the current version of LexicO starting from PSC included: i) the removal of all sure redundant entries (i.e. duplicates) belonging to all four linguistic levels; ii) the creation of tables dedicated to candidate redundants, detected by considering specific similarities amongst entries; iii) the correction of missing semantic and syntax-semantics interface relations amongst the entries of the lexicon},
KEYWORDS = {computational lexicon, Lexical Database, semantics, morphology, syntax, phonology},
URL = {https://dspace-clarin-it.ilc.cnr.it/repository/xmlui/handle/20.500.11752/ILC-977},
}
@MISC{VENUTI_2022_MISC_VD_462938,
AUTHOR = {Venuti, M. and Del Grosso, A. M.},
TITLE = {La Galassia Musisque Deoque},
YEAR = {2022},
ABSTRACT = {Il contributo illustra il lavoro di riorganizzazione della galassia MQDQ in un sistema distribuito e collaborativo, facendo uso di Domain Specific Languages accanto alla modalità tradizionale di codifica mediante XML/TEI},
KEYWORDS = {Digital Humanities, Filologia Digitale, MQDQ, Filologia Collaborativa, Domain Specific Languages},
URL = {https://iris.cnr.it/handle/20.500.14243/462938},
CONFERENCE_NAME = {Maratona DH},
}
@MISC{ZENZARO_2022_MISC_ZBD_420372,
AUTHOR = {Zenzaro, S. and Boschetti, F. and Del Grosso, A. M.},
TITLE = {Relazione sugli avanzamenti della piattaforma per il progetto GreekSchools},
YEAR = {2022},
ABSTRACT = {Relazione sugli avanzamenti della piattaforma per il progetto GreekSchools},
KEYWORDS = {GreekSchools, Digital Humanities, Digital papyrology},
URL = {https://iris.cnr.it/handle/20.500.14243/420372},
}
@MISC{ZENZARO_2022_MISC_ZDB_462863,
AUTHOR = {Zenzaro, S. and Del Grosso, A. M. and Boschetti, F.},
TITLE = {CophiEditor \& Viewer},
YEAR = {2022},
ABSTRACT = {Piattaforma di Filologia Digitale, Computazionale, Collaborativa e Cooperativa in sviluppo presso CNR-ILC nel contesto del progetto ERC Advanced Grant 885222-GreekSchools "The Greek Philosophical Schools according to Europe's earliest 'history of philosophy'. Towards a new pioneering critical edition of Philodemus' Arrangement of the Philosophers". La piattaforma implementa il modello di Edizioni Scientifiche Digitali DSL-based DSE},
KEYWORDS = {Digital Humanities, Filologia Digitale, Filologia Computazionale, Filologia Collaborativa, Edizione Scientifica Digitale, GreekSchools, DSL-based DSE},
URL = {https://cophi.github.io/gs-data-service-api/#/},
}
@ARTICLE{BACCO_2021_ARTICLE_BCDM_444101,
AUTHOR = {Bacco, L. and Cimino, A. and Dell'Orletta, F. and Merone, M.},
TITLE = {Explainable sentiment analysis: A hierarchical transformer-based extractive summarization approach},
YEAR = {2021},
ABSTRACT = {In recent years, the explainable artificial intelligence (XAI) paradigm is gaining wide research interest. The natural language processing (NLP) community is also approaching the shift of paradigm: building a suite of models that provide an explanation of the decision on some main task, without affecting the performances. It is not an easy job for sure, especially when very poorly interpretable models are involved, like the almost ubiquitous (at least in the NLP literature of the last years) transformers. Here, we propose two different transformer-based methodologies exploiting the inner hierarchy of the documents to perform a sentiment analysis task while extracting the most important (with regards to the model decision) sentences to build a summary as the explanation of the output. For the first architecture, we placed two transformers in cascade and leveraged the attention weights of the second one to build the summary. For the other architecture, we employed a single transformer to classify the single sentences in the document and then combine the probability scores of each to perform the classification and then build the summary. We compared the two methodologies by using the IMDB dataset, both in terms of classification and explainability performances. To assess the explainability part, we propose two kinds of metrics, based on benchmarking the models' summaries with human annotations. We recruited four independent operators to annotate few documents retrieved from the original dataset. Furthermore, we conducted an ablation study to highlight how implementing some strategies leads to important improvements on the explainability performance of the cascade transformers model},
KEYWORDS = {Natural Language Processing, Sentiment Analysis, Explainable AI},
URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-85114289346\&origin=inward},
VOLUME = {10},
DOI = {10.3390/electronics10182195},
ISSN = {2079-9292},
JOURNAL = {ELECTRONICS},
}
@ARTICLE{BELLANDI_2021_ARTICLE_B_446103,
AUTHOR = {Bellandi, A.},
TITLE = {LexO: an open-source system for managing OntoLex-Lemon resources},
YEAR = {2021},
ABSTRACT = {The adoption of Semantic Web technologies and the Linked Data paradigm has been driven by the need to ensure the construction of resources that are at the same time interoperable, shareable and reusable by the scientific community. OntoLex-Lemon, which exploits the expressive power of ontologies, has come to be the de facto standard model for the representation of lexica and terminologies. The number of users potentially interested in editing or consuming OntoLex-Lemon data is thus very large. Unfortunately, the use of ontology editors for constructing such language resources can be very tedious due to the complexity and verbosity of the model, which heavily relies on specific modeling technicalities. This underlines the importance of developing tools and services that facilitate the creation and editing of resources and bring lexicography and terminology closer to the Semantic Web. In this paper we present LexO, a collaborative web editor for easily building and managing lexical and terminological resources in the context of the Semantic Web, based on the OntoLex-Lemon model. It makes the model accessible to users who do not possess the needed technical skills, thus allowing for wider adoption of new technological advances in the Semantic Web},
KEYWORDS = {OntoLex-Lemon, e-lexicography, Terminology, Semantic Web, Linked Data, LexO},
PAGES = {1093-1126},
URL = {https://link.springer.com/article/10.1007/s10579-021-09546-4},
VOLUME = {55 (4)},
DOI = {10.1007/s10579-021-09546-4},
ISSN = {1574-020X},
JOURNAL = {LANGUAGE RESOURCES AND EVALUATION},
}
@ARTICLE{BENOTTO_2021_ARTICLE_B_530941,
AUTHOR = {Benotto, G.},
TITLE = {Can an author style be unveiled through word distribution?},
YEAR = {2021},
ABSTRACT = {The inclusion of semantic features in the stylometric analysis of literary texts appears to be poorly investigated. In this work, we experiment with the application of Distributional Semantics to a corpus of Italian literature to test if words distribution can convey stylistic cues. To verify our hypothesis, we have set up an Authorship Attribution experiment. Indeed, the results we have obtained suggest that the style of an author can reveal itself through words distribution too},
KEYWORDS = {Authorship attribution, Stylometry, Plagiarism},
URL = {https://iris.cnr.it/handle/20.500.14243/530941},
VOLUME = {15 (1)},
ISSN = {1938-4122},
JOURNAL = {DIGITAL HUMANITIES QUARTERLY},
}
@ARTICLE{BOSCHETTI_2021_ARTICLE_B_420377,
AUTHOR = {Boschetti, F.},
TITLE = {INTERPRETAZIONE E VOLONTÀ DI INTERPRETAZIONE TRA LINGUISTICA COMPUTAZIONALE E LITERARY COMPUTING},
YEAR = {2021},
ABSTRACT = {Interpretation and will to interpret between computational linguistics and literary computing · By building on Rajna's comparison between Angelica and Europa, this article tries to reflect on quantitative methods applied to literary criticism in the digital era, which are largely borrowed from computational linguistics. According to Royce, every interpretation starts first of all from a will to interpret, consistent with the principles of the community to which the interpreters feel they belong. Thus, it is important to consider the new methods of interpretation in their historical perspective and widen the view from the primary sources to the traditions of studies documented in the secondary sources. This approach can help to establish fruitful links among different communities of interpretation},
KEYWORDS = {Digital hermeneutics, Digital philology, Literary criticism, Intertextuality, Computational linguistics},
PAGES = {211-225},
URL = {https://iris.cnr.it/handle/20.500.14243/420377},
VOLUME = {46 (1-2)},
DOI = {10.19272/202101602009},
ISSN = {0392-6915},
JOURNAL = {LINGUISTICA E LETTERATURA},
}
@ARTICLE{BOSCHETTI_2021_ARTICLE_BM_420376,
AUTHOR = {Boschetti, F. and Mugelli, G.},
TITLE = {Il metodo Euporia per creare nuovi archivi digitali sulla tragedia greca},
YEAR = {2021},
ABSTRACT = {This article illustrates Euporia, i.e. a method for annotating literary texts based on Domain-Specific Languages. The annotation systems developed using this method are modeled on the needs of the users, their specific habits of studying and annotating texts, and the aims of their research. The two case studies discussed in this contribution show the application of the method in the context of two projects focused on the texts of Greek tragedy: on the one hand, a didactic project based on Aeschylus' Persians, on the other hand, a research project in the field of anthropology of the ancient world, based on the entire corpus of the Greek tragedy. The discussion aims to illustrate how text annotation through DSL can have both a didactic function and a scientific interest},
KEYWORDS = {Domain-Specific Languages, textual annotation, Ancient Greek Tragedy},
PAGES = {83-113},
URL = {https://ojs.cimedoc.uniba.it/index.php/fc/article/view/1381},
VOLUME = {7},
DOI = {10.15162/2465-0951/1381},
ISSN = {2465-0951},
JOURNAL = {FUTUROCLASSICO FCL},
}
@ARTICLE{CARDILLO_2021_ARTICLE_CS_402940,
AUTHOR = {Cardillo, F. and Straccia, U.},
TITLE = {Fuzzy OWL-Boost: learning fuzzy concept inclusions via real-valued boosting},
YEAR = {2021},
ABSTRACT = {OWL ontologies are nowadays a quite popular way to describe structured knowledge in terms of classes, relations among classes and class instances. In this paper, given an OWL ontology and a target class T, we address the problem of learning fuzzy concept inclusion axioms that describe sufficient conditions for being an individual instance of T (and to which degree). To do so, we present FUZZY OWL-BOOST that relies on the Real AdaBoost boosting algorithm adapted to the (fuzzy) OWL case. We illustrate its effectiveness by means of an experimentation with several ontologies},
KEYWORDS = {OWL Ontology, Machine Learning, Fuzzy Logic, Boosting},
PAGES = {164-186},
URL = {https://www.sciencedirect.com/science/article/abs/pii/S0165011421002426},
VOLUME = {438 (2022)},
DOI = {10.1016/j.fss.2021.07.002},
ISSN = {0165-0114},
JOURNAL = {FUZZY SETS AND SYSTEMS},
}
% NOTE(review): the last author was recorded as "Enrico Zappa, L."; it is re-split here on the assumption that Zappa is the family name and Enrico a middle name. Confirm against the publisher record.
@ARTICLE{CHINELLO_2021_ARTICLE_CRFDBE_401397,
AUTHOR = {Chinello, A. and Richichi, V. and Fanelli, M. and Dell'Orletta, F. and Boschetti, F. and Zappa, L. E.},
TITLE = {La semantica del potere nella rappresentazione materna e paterna: uno studio-pilota linguistico e computazionale dei siti proana in {Italia}},
YEAR = {2021},
ABSTRACT = {Numerose ricerche hanno cercato di tratteggiare le caratteristiche relazionali dei genitori con figlie affette da Anoressia Nervosa (AN) utilizzando metodi strutturati (interviste, questionari). Considerando il modello delle polarità semantiche, il presente studio pilota vuole esplorare la presenza della semantica del potere, tipica delle famiglie con AN, nei commenti degli utenti di 10 blog pro-anoressia attraverso l'analisi testuale (T-LAB), focalizzando l'attenzione sulle rappresentazioni delle due figure genitoriali. Le analisi mostrano un'alta frequenza dei commenti riguardanti la figura materna e paterna, associate a specifici sentimenti (colpa, conflitto), all'interno di una vasta rete di attori sociali. La rappresentazione materna risulta essere associata a tematiche riguardanti la semantica del potere, il controllo e la conversazione su tematiche alimentari. Alternativamente, la figura paterna risulta essere maggiormente legata ai simboli del potere lavorativo-economico e al tema della mancanza. Questi risultati, sebbene preliminari, suggeriscono la presenza di alcuni termini legati al potere anche negli utenti di blog pro-anoressia in linea a quanto già mostrato in pazienti con AN},
KEYWORDS = {natural language processing, anoressia},
URL = {https://iris.cnr.it/handle/20.500.14243/401397},
VOLUME = {68},
ISSN = {0030-5391},
JOURNAL = {ORIENTAMENTI PEDAGOGICI},
}
@ARTICLE{CININI_2021_ARTICLE_CCFFMMN_391604,
AUTHOR = {Cinini, A. and Cutugno, P. and Ferraris, C. and Ferretti, M. and Marconi, L. and Morgavi, G. and Nerino, R.},
TITLE = {Final results of the {NINFA} project: impact of new technologies in the daily life of elderly people},
YEAR = {2021},
ABSTRACT = {Background: The paper presents the work carried out within NINFA (iNtelligent Integrated Network For Aged people), a project for the wellbeing of the elderly people at home. Aims: The impact of new technologies on elderly people is evaluated with respect to the three main topics faced by NINFA. Methods: NINFA was structured into three main topics: (1) active user engagement from the very beginning of the planning stage: the use of specially designed questionnaires to evaluate the acceptability of new technology in general and robot caregiver specifically; (2) assessment of the well-being through non-invasive techniques: natural language processing for language change monitoring in elderly subjects; (3) automated assessment of motor and cognitive functions at home: systems to deliver tests and exergames through user interfaces compliant with elderly subjects. Results: The analysis shows that there is no a priori closure to support the technology, but it must not be invasive and must allow social interactions. The study of speech transcripts shows that a large variations in the number of words used to describe the same situation could be a sign on the onset of cognitive impairments. The specifically designed systems highlight, after the training period, significant improvements in the performances of the participants and a satisfaction with regards to the systems usability. Conclusions: The outcomes of NINFA project highlight some important aspects of the relationship between elderly people and new technologies concerning: engagement and acceptability, assessment of the wellbeing and of the modifications of motor, cognitive and language functions},
KEYWORDS = {User Engagement, Wellbeing assessment, Linguistic and Cognitive Analysis, Movement Analysis, Exergames, At-Home monitoring, Postural stability},
PAGES = {1213--1222},
URL = {https://link.springer.com/content/pdf/10.1007/s40520-019-01357-6.pdf},
VOLUME = {33},
DOI = {10.1007/s40520-019-01357-6},
ISSN = {1720-8319},
JOURNAL = {AGING CLINICAL AND EXPERIMENTAL RESEARCH (ONLINE)},
}
@ARTICLE{DELGRATTA_2021_ARTICLE_DBBS_449188,
AUTHOR = {Del Gratta, R. and Boschetti, F. and Bambaci, L. and Sarnari, F.},
TITLE = {Document analysis and Textual philology: A Formal Perspective},
YEAR = {2021},
ABSTRACT = {We introduce a formal approach to document and text analysis. The method proposed herein results in a mathematical model/framework which can formalize different challenges in research fields such as computational linguistics, digital philology, and software engineering, principally if applied to document and text analysis. We examine texts and documents from an evolutionary perspective, where both corruption and correction are involved. We describe document evolution via fibre bundles formalism. We also provide other examples to demonstrate the capabilities of the model},
KEYWORDS = {Formal model, document analysis, evolutionary approach, fibre bundles},
PAGES = {5--15},
URL = {https://www.innove.org/ijist/index.php/ijist/article/view/192},
VOLUME = {5},
NUMBER = {1},
ISSN = {2550-5114},
JOURNAL = {INTERNATIONAL JOURNAL OF INFORMATION SCIENCE AND TECHNOLOGY},
}
@ARTICLE{DELGRATTA_2021_ARTICLE_DGPC_402216,
AUTHOR = {Del Gratta, R. and Goggi, S. and Pardelli, G. and Calzolari, N.},
TITLE = {The {LRE Map}: what does it tell us about the last decade of our field?},
YEAR = {2021},
ABSTRACT = {The LRE Map of Language Resources was introduced at LREC 2010. Its intended purpose was: "to shed light on the vast amount of resources that represent the background of the research presented at LREC" (Calzolari et al. in: Calzolari et al. (eds) Proceedings of the seventh international conference on language resources and evaluation (LREC'10). European Language Resources Association (ELRA), Valletta, 2010). It also aimed at a change of culture in the field, actively engaging each researcher both in the documentation task about resources and in sharing resources. When we started to use it regularly also in other conferences, it became clear that it was an innovative instrument able to provide a picture of the field and its evolution as reflected by the creation and use of Language Resources. After 9 years we revisit the Map, considerably extending the data analysed in an LREC 2018 paper. The LRE Map data analysed here have been provided by the authors of 21 conferences during the phase of submission of papers, and contain information about 9405 resources. We analyse the LRE Map data from many different viewpoints and the paper reports on the global picture, along the many Map dimensions, on different trends emerging from a diachronic perspective and finally on some comparisons between five editions of the two major conferences present in the Map: LREC and COLING},
KEYWORDS = {LR infrastructure, metadata, LR documentation},
PAGES = {259--283},
URL = {https://link.springer.com/article/10.1007/s10579-020-09520-6},
VOLUME = {55},
NUMBER = {1},
DOI = {10.1007/s10579-020-09520-6},
ISSN = {1574-020X},
JOURNAL = {LANGUAGE RESOURCES AND EVALUATION},
}
@ARTICLE{DELGROSSO_2021_ARTICLE_DFMTN_400710,
AUTHOR = {Del Grosso, A. M. and Fihri, D. and Mohajir, M. E. and Tonazzini, A. and Nahli, O.},
TITLE = {Challenges in the digital analysis of historical laminated manuscripts},
YEAR = {2021},
ABSTRACT = {In this paper, we analyze and discuss the characteristics of a system for the effective digital preservation and fruition of historical manuscripts degraded by the process of lamination. The most significant degradation caused by lamination is that the parchment or paper support loses its flatness, and usually presents ripples and warnings. This, together with the affixed translucent varnish, dramatically impair the digital acquisition process, so that light reflections in the more disparate directions affect the digital images. A digital system to contrast this irreversible and progressive degradation and to enable an effective access to the fragile asset should provide a number of functionalities: specialized digitization, able to avoid reflections as much as possible; image enhancement, devised to correct the residual degradations and enhance the text for an easier legibility; semi-automatic transcription of the virtually restored pages; and, finally, scholarly encoding and linguistic analysis, which should adapt existing tools to the specificity of the primary source (writing system and language). As a case study, we will make reference to the "Poem in Rajaz on medicine", written by Abubacer in the XII century, and conserved in the Al Quaraouiyine Library located in Fez, Morocco. The feasibility study for the realization of such a system is of general utility, in that it can provide guidelines for the digitization, the enhancement and the text encoding of the many laminated manuscripts conserved in other historical archives. On the other hand, from the cultural heritage point of view, the experimentation on the "Poem in Rajaz on medicine" could foster the systematic philological and ontological study of a unique piece of our documental heritage: the longest poem of medieval Islamic medical literature},
KEYWORDS = {Cultural Heritage Digital Safeguard, Historical Manuscript Digitization, Document Image Processing, Linguistic Analysis, Ontological Analysis},
PAGES = {34--43},
URL = {https://innove.org/ijist/index.php/ijist/article/view/190},
VOLUME = {5},
NUMBER = {1},
DOI = {10.57675/IMIST.PRSM/ijist-v5i1.190},
ISSN = {2550-5114},
JOURNAL = {INTERNATIONAL JOURNAL OF INFORMATION SCIENCE AND TECHNOLOGY},
}
% NOTE(review): PAGES holds a single number (17), which looks like a page count rather than a page range; the DOI suffix suggests the article number is 103357. Value left as recorded - confirm against the publisher record.
@ARTICLE{FANTONI_2021_ARTICLE_FCCADP_401396,
AUTHOR = {Fantoni, G. and Coli, E. and Chiarello, F. and Apreda, R. and Dell'Orletta, F. and Pratelli, G.},
TITLE = {Text mining tool for translating terms of contract into technical specifications: Development and application in the railway sector},
YEAR = {2021},
ABSTRACT = {Tenders or technical terms contain a large quantity of both technical, legal, managerial information mixed in a nested and complex net of relationships. Extracting technical and design information from a document whose aim is both legal and technical, and that is written using several specific jargons, is not a trivial task: the purpose of the research is to try to detect, extract, split and assign information from the text of a tender in an automatic way. It means being able to understand technical and legal terms and organize them in multiple ways: according to product structure, internal organisational structure, etc. The focus is in providing a handy tool that could speed up and facilitate human analysis and allow tackling also the process of transforming customer's requirements into design specifications. The approach chosen to overcome the various issues is to support state-of-the-art Computational Linguistic tools with a wide Knowledge Base. The latter has been constructed both manually and automatically and comprises not only keywords but also concepts, relationships and regular expressions. The implementation of the methodology has been carried out during a project for AnsaldoBreda S. p. A. (now Hitachi Rail Europe). A case study about the tender for a high-speed train has been included to show the functioning and output of the entire software system},
KEYWORDS = {Contract terms, Technical requirements, Natural language processing},
PAGES = {17},
URL = {https://iris.cnr.it/handle/20.500.14243/401396},
VOLUME = {124},
DOI = {10.1016/j.compind.2020.103357},
ISSN = {0166-3615},
JOURNAL = {COMPUTERS IN INDUSTRY},
}
@ARTICLE{GIOVANNETTI_2021_ARTICLE_GABDDM_396547,
AUTHOR = {Giovannetti, E. and Albanesi, D. and Bellandi, A. and Dattilo, D. and Del Grosso, A. M. and Marchi, S.},
TITLE = {An ontology of masters of the {Babylonian Talmud}},
YEAR = {2021},
ABSTRACT = {The purpose of this research is to build an ontology of the masters appearing in the Babylonian Talmud (BT). The ontology built so far has been shared as a Linked Open Data and it will be linked to existing vocabularies. This work has been developed in the context of the Babylonian Talmud Translation Project, where more than eighty Talmudists are working together, since 2012, at the translation (comprehensive of explicative notes and glossaries) of the Talmud into Italian. The construction of the resource has involved the application of tools leveraging on computational linguistics approaches. The ontology, already describing more than 500 masters, constitutes the first portion of a more comprehensive Talmudic Knowledge Base where the text itself, the terminology, the entities, and the concepts constituting the BT will be formalized and linked to each other},
KEYWORDS = {ontology, babylonian talmud, terminology, word alignment, linked open data, semantic web, knowledge representation},
PAGES = {725--737},
URL = {https://academic.oup.com/dsh/article-abstract/37/3/725/6410110},
VOLUME = {37},
NUMBER = {3},
DOI = {10.1093/llc/fqab043},
ISSN = {2055-7671},
JOURNAL = {DIGITAL SCHOLARSHIP IN THE HUMANITIES},
}
@ARTICLE{GOMEZCHAVEZ_2021_ARTICLE_GRCB_395179,
AUTHOR = {Gomez Chavez, A. and Ranieri, A. and Chiarella, D. and Birk, A.},
TITLE = {Underwater Vision-Based Gesture Recognition: A Robustness Validation for Safe Human-Robot Interaction},
YEAR = {2021},
ABSTRACT = {Underwater robotics requires very reliable and safe operations. This holds especially for missions in cooperation with divers who are-despite the significant advancements of marine robotics in recent years-still essential for many underwater operations. Possible application cases of underwater human-robot collaboration include marine science, archeology, oil-and gas production (OGP), handling of unexploded ordnance (UXO), e. g., from WWII ammunition dumped in the seas, or inspection and maintenance of marine infrastructure like pipelines, harbors, or renewable energy installations-to name just a few examples. We present a fully integrated approach to Underwater Human Robot Interaction (U-HRI) in form of a front-end for gesture recognition combined with a back-end with a full language interpreter. The gesture-based language is derived from the existing standard gestures for communication between human divers. It enables a diver to issue single commands as well as complex mission specifications to an Autonomous Underwater Vehicle (AUV) as demonstrated in several field trials. The gesture recognition is an essential component of the overall approach. It requires high reliability under the challenging conditions of the underwater domain. There is especially a high amount of variation in visual data due to various effects in the underwater image formation. We hence investigate in this article different Machine Learning (ML) methods for robust diver gesture recognition. This includes a classical ML approach and four state-of-the-art Deep Learning (DL) methods. Furthermore, we introduce a physically realistic way to use range information for adding underwater haze to produce meaningful additional data from existing real-world data. This can be of interest for creating evaluation data for underwater perception in general or to produce additional training data for ML-based approaches},
KEYWORDS = {Gesture recognition, gesture-based language, underwater human-robot interaction, data augmentation, deep learning},
PAGES = {67--78},
URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-85107221665\&origin=inward},
VOLUME = {28},
NUMBER = {3},
DOI = {10.1109/MRA.2021.3075560},
ISSN = {1070-9932},
JOURNAL = {IEEE ROBOTICS AND AUTOMATION MAGAZINE},
}
@ARTICLE{GUADAGNINI_2021_ARTICLE_G_399858,
AUTHOR = {Guadagnini, E.},
TITLE = {3.5. {Paolo e Francesca} per bambini, {Paolo e Francesca} per adulti: censure, revisioni, riletture},
YEAR = {2021},
ABSTRACT = {Selezione e commento di alcune riletture della vicenda di Paolo e Francesca (Dante, Inf. 5)},
KEYWORDS = {Dante Alighieri, riscritture, fumetto, letteratura per l'infanzia},
URL = {http://www.arabeschi.it/35-paolo-e-francesca-per-bambini-adulti-censure-revisioni-riletture/},
VOLUME = {17},
ISSN = {2282-0876},
JOURNAL = {ARABESCHI},
}
@ARTICLE{GUADAGNINI_2021_ARTICLE_G_401370,
AUTHOR = {Guadagnini, E.},
TITLE = {Les volgarizzamenti des « {Métamorphoses} » ovidiennes: notes sur les traductions italiennes par {Arrigo Simintendi} et {Giovanni Bonsignori}},
YEAR = {2021},
ABSTRACT = {L'on connaît deux traductions italiennes médiévales des Métamorphoses: celle faite par le notaire Arrigo Simintendi dans la première moitié du XIVe siècle et la traduction-commentaire de Giovanni Bonsignori (1375 environ). Ces deux oeuvres proposent deux "modèles" de livre différents et présentent deux stratégies distinctes de traduction, que nous allons essayer de décrire brièvement},
URL = {https://iris.cnr.it/handle/20.500.14243/401370},
DOI = {10.48611/isbn.978-2-406-11996-8.p.0145},
ISSN = {2115-6360},
JOURNAL = {CAHIERS DE RECHERCHES MÉDIÉVALES ET HUMANISTES},
}
% NOTE(review): the second and third authors were recorded as "E Díazvera, J." and "Javier Minaya Gómez, F."; they are re-split here on the assumption that the family names are Díaz-Vera and Minaya Gómez. Confirm against the publisher record.
@ARTICLE{KHAN_2021_ARTICLE_KEJCM_441096,
AUTHOR = {Khan, F. and Díaz-Vera, J. E. and Minaya Gómez, F. J. and Cruz González, R. and Monachini, M.},
TITLE = {Mapping Conceptual Variation through {A Thesaurus of Old English} and {Evoke}: Towards a Topical Thesaurus of {Old English} Emotional Expressions},
YEAR = {2021},
ABSTRACT = {The topic of figurative language in Old English (OE) has recently become the focus of substantial research. In this article, the authors will describe work on the semantic description of the lexicon of shame words in OE and in particular the taxonomical organisation of this lexicon on the basis of different kinds of semantic mappings (metonymic, metaphorical). Next, they will explore the use of the Evoke platform as a means of visualising and navigating this lexicon and show how it can be used to enrich A Thesaurus of Old English (TOE). The authors also describe ongoing work on the modelling and publication of this data as a linked data resource consisting of a lexicon and a taxonomy in SKOS of different kinds of metaphoric/metonymic sense shifts},
KEYWORDS = {semantic mappings, metaphor, metonymy, Old English, shame, emotions, onomasiology},
PAGES = {442--456},
URL = {https://doi.org/10.1163/18756719-12340238},
DOI = {10.1163/18756719-12340238},
ISSN = {1875-6719},
JOURNAL = {AMSTERDAMER BEITRÄGE ZUR ÄLTEREN GERMANISTIK},
}
@ARTICLE{LACIVITA_2021_ARTICLE_LLCCFLCIBFT_518412,
AUTHOR = {La Civita, E. and Liotti, A. and Cennamo, M. and Crocetto, F. and Ferro, M. and Liguoro, P. and Cimmino, A. and Imbimbo, C. and Beguinot, F. and Formisano, P. and Terracciano, D.},
TITLE = {Peri-prostatic adipocyte-released {TGFβ} enhances prostate cancer cell motility by upregulation of connective tissue growth factor},
YEAR = {2021},
ABSTRACT = {Periprostatic adipose tissue (PPAT) has emerged as a key player in the prostate cancer (PCa) microenvironment. In this study, we evaluated the ability of PPAT to promote PCa cell migration, as well as the molecular mechanisms involved. Methods: We collected conditioned mediums from in vitro differentiated adipocytes isolated from PPAT taken from PCa patients during radical prostatectomy. Migration was studied by scratch assay. Results: Culture with CM of human PPAT (AdipoCM) promotes migration in two different human androgen-independent (AI) PCa cell lines (DU145 and PC3) and upregulated the expression of CTGF. SB431542, a well-known TGFβ receptor inhibitor, counteracts the increased migration observed in presence of AdipoCM and decreased CTGF expression, suggesting that a paracrine secretion of TGFβ by PPAT affects motility of PCa cells. Conclusions: Collectively, our study showed that factors secreted by PPAT enhanced migration through CTGF upregulation in AI PCa cell lines. These findings reveal the potential of novel therapeutic strategies targeting adipocyte-released factors and TGFβ/CTGF axis to fight advanced PCa dissemination},
KEYWORDS = {adipocytes, Cell migration, Peri-prostatic adipose tissue, Prostate cancer, TGFβ1},
URL = {https://www.mdpi.com/2227-9059/9/11/1692},
VOLUME = {9},
NUMBER = {11},
DOI = {10.3390/biomedicines9111692},
ISSN = {2227-9059},
JOURNAL = {BIOMEDICINES},
}
% The record stored the volume as "67 (102517)"; 102517 matches the DOI suffix, so it is kept as the article identifier in EID rather than as an issue number.
@ARTICLE{MARZI_2021_ARTICLE_MGSV_424727,
AUTHOR = {Marzi, C. and Greco, A. and Scilingo, E. and Vanello, N.},
TITLE = {Towards a model of arousal change after affective word pronunciation based on electrodermal activity and speech analysis},
YEAR = {2021},
ABSTRACT = {In this paper, we explore the possibility of building a model of subject arousal by exploiting the acquisition and the analysis of speech and electrodermal activity (EDA). Several issues have to be addressed to reach this goal as the estimation of the relationship between arousal and behavioral measures and the reliability of EDA signal during speech production. To accomplish this task, we will investigate the relation among EDA, speech activity and subject arousal, during isolated affective word pronunciation. Our results show that significant information on subject arousal can be obtained by analyzing EDA during the processing of out-of-context words with an emotional content in a reading aloud task. Based on a sample of eighteen Italian participants, we observed a significant relation between EDA features and self-reported arousal scores. Quantitative models relating EDA and speech-derived features are proposed and discussed. We found that increasing values of tonic and phasic components of EDA signals correspond to increasing self-assessed arousal scores; Mel-frequency cepstral analysis of speech was also shown to carry relevant information about subject arousal, with a significant inverse relation to self-assessed scores. Our results suggest how the analysis of concurrent acquisition of EDA and speech features may offer a valid approach for the prediction of subject arousal during speech production, as well as a method for validating self-assessment ratings themselves},
KEYWORDS = {speech, electrodermal activity, statistical models, arousal, word pronunciation},
PAGES = {1--8},
URL = {http://www.elsevier.com/locate/bspc},
VOLUME = {67},
EID = {102517},
DOI = {10.1016/j.bspc.2021.102517},
ISSN = {1746-8094},
JOURNAL = {BIOMEDICAL SIGNAL PROCESSING AND CONTROL},
}
% The issue number is not in the original record; NUMBER = 1 is taken from the URL path (vol13_1) and the DOI (2021.13.01.03).
@ARTICLE{MIASCHI_2021_ARTICLE_MBD_402654,
AUTHOR = {Miaschi, A. and Brunato, D. P. and Dell'Orletta, F.},
TITLE = {A {NLP}-based stylometric approach for tracking the evolution of {L1} written language competence},
YEAR = {2021},
ABSTRACT = {In this study we present a Natural Language Processing (NLP)-based stylometric approach for tracking the evolution of written language competence in Italian L1 learners. The approach relies on a wide set of linguistically motivated features capturing stylistic aspects of a text, which were extracted from students' essays contained in CItA (Corpus Italiano di Apprendenti L1), the first longitudinal corpus of texts written by Italian L1 learners enrolled in the first and second year of lower secondary school. We address the problem of modeling written language development as a supervised classification task consisting in predicting the chronological order of essays written by the same student at different temporal spans. The promising results obtained in several classification scenarios allow us to conclude that it is possible to automatically model the highly relevant changes affecting written language evolution across time, as well as identifying which features are more predictive of this process. In the last part of the article, we focus the attention on the possible influence of background variables on language learning and we present preliminary results of a pilot study aiming at understanding how the observed developmental patterns are affected by information related to the school environment of the student},
KEYWORDS = {stylometry, computational linguistics, language competence},
PAGES = {71--105},
URL = {https://www.jowr.org/abstracts/vol13_1/Miaschi_et_al_2021_13_1_abstract.html},
VOLUME = {13},
NUMBER = {1},
DOI = {10.17239/jowr-2021.13.01.03},
ISSN = {2030-1006},
JOURNAL = {JOURNAL OF WRITING RESEARCH},
}
@ARTICLE{MONACHINI_2021_ARTICLE_MSCPB_533011,
AUTHOR = {Monachini, M. and Stamuli, F. M. and Calamai, S. and Pretto, N. and Bianchi, S.},
TITLE = {The Grey-Side of Audio Archives},
YEAR = {2021},
ABSTRACT = {Archives often include documents that can hardly be considered publications or grey literature as such, yet they maintain their documentary value and play a role of primary sources for the specialists. These documents, indeed, can help archivists to reveal the sedimentation process of the archive itself and to preserve the authentic context of the documentary production. They also appear to be very useful for the community of researchers and scholars. This happens more frequently with oral archives which include ‘non-conventional sources’, thus bringing together audio documents, fieldworks notes, correspondence, slipcases, analogic compact cassettes or open reels. At the cross-road of two disciplines, Archival Science and Grey Literature, this paper aims to argue the applicability of the concept of grey literature to this wide range of documentary materials, by showing the experience of Archivio Vi. Vo, a regional project aiming at building a model for archiving, preserving, managing and disseminating audio documents},
KEYWORDS = {oral archives infrastructures archival science grey literature},
PAGES = {41--44},
URL = {https://iris.cnr.it/handle/20.500.14243/533011},
VOLUME = {17},
NUMBER = {1},
ISSN = {1574-180X},
JOURNAL = {The Grey Journal},
}
% The issue number is not in the original record; NUMBER = 1 is taken from the URL path (vol/15/1). The ":8081" port was dropped from the URL host.
% NOTE(review): PAGES holds a single number (17), which may be a page count rather than a page range - confirm against the publisher record.
@ARTICLE{MUGELLI_2021_ARTICLE_MBBDKT_449240,
AUTHOR = {Mugelli, G. and Boschetti, F. and Bellandi, A. and Del Gratta, R. and Khan, A. and Taddei, A.},
TITLE = {Annotating ritual in ancient {Greek} tragedy: A bottom-up approach in action},
YEAR = {2021},
ABSTRACT = {EuporiaRAGT is one of the pilot projects that adopt the Euporia system as a digital support to an historico-anthropological research on the form and function of rituals in the texts of ancient Greek tragedy. This paper describes the bottom-up approach adopted in the project: During the annotation stage, performed with a Domain Specific Language designed with a user-centred approach, the domain expert can annotate ritual and religious phenomena, with the possibility of registering different textual and interpretive variants; the design of a search engine, in a second phase of the work, allows the database to be tested and reorganized. Finally, the construction of an ontology allows to structure the tags, in order to perform complex queries on the database},
KEYWORDS = {digital philology, dsl, ancient Greek},
PAGES = {17},
URL = {http://digitalhumanities.org/dhq/vol/15/1/000538/000538.html},
VOLUME = {15},
NUMBER = {1},
ISSN = {1938-4122},
JOURNAL = {DIGITAL HUMANITIES QUARTERLY},
}
@ARTICLE{PICCINI_2021_ARTICLE_P_448305,
AUTHOR = {Piccini, S.},
TITLE = {Termes et théories de {Ferdinand de Saussure} dans le {Manuel d'accentuation grecque} de {Bally}},
YEAR = {2021},
ABSTRACT = {In 1945 Charles Bally published his last work, the Manuel d'accentuation grecque. In this small handbook of almost 130 pages, the laws and the principles governing the accent in Greek are described in a clear and innovative way, through the introduction of new categories and new terms. This article aims at demonstrating that the original approach used by Bally in his handbook was strongly influenced by the ideas that Saussure elaborated during his Course of Lithuanian held at the University of Geneva in 1901-1902},
KEYWORDS = {Greek accent, Lithuanian accent, Saussure's Course of Lithuanian, acrotonic accent, mesotonic accent, Charles Bally, Manuel d'accentuation grecque},
PAGES = {85--103},
URL = {https://revues.droz.org/index.php/CFS/article/view/CFS_73_85-103},
VOLUME = {73},
DOI = {10.47421/CFS73_85-103},
ISSN = {0068-516X},
JOURNAL = {CAHIERS FERDINAND DE SAUSSURE},
}
@ARTICLE{PICCINI_2021_ARTICLE_P_519787,
AUTHOR = {Piccini, S.},
TITLE = {La correspondance de {Saussure} à {Niedermann} (1904-1908). L’école de {Saussure}: admirer et pourtant ne pas comprendre},
YEAR = {2021},
ABSTRACT = {This paper examines two letters and two visit cards written between 1904 and 1908 by Ferdinand de Saussure to his colleague Max Niedermann. This correspondence, so far unpublished, is preserved in the Niedermann Fund of the Public and University Library (BPU) in Neuchâtel. The analysis focuses mainly on the letter written on the 18th of July 1904, where Saussure addresses, albeit briefly, some methodological issues on the correct formulation of phonetic changes, anticipating to Niedermann a crucial aspect of his theoretical thought, i. e. the distinction between the synchronic and diachronic order},
KEYWORDS = {Max Niedermann, Spécimen d'un Précis de Phonétique historique latine, Phonetic change, Diachrony},
PAGES = {141--164},
URL = {https://revues.droz.org/CFS/article/view/CFS_72_141-164/pdf},
VOLUME = {72},
ISSN = {0068-516X},
JOURNAL = {CAHIERS FERDINAND DE SAUSSURE},
}
% NOTE(review): the record stored the volume as "15 (2)", but the URL path reads vol/15/3. The recorded issue (2) is kept in NUMBER - confirm against the publisher record.
@ARTICLE{PICCINI_2021_ARTICLE_PBG_396586,
AUTHOR = {Piccini, S. and Bellandi, A. and Giovannetti, E.},
TITLE = {A Model for Representing Diachronic Terminologies: the {Saussure} Case Study},
YEAR = {2021},
ABSTRACT = {The aim of this article is to present a model for representing in an explicit and formal way the diachronic evolution of concepts and terms in a given domain, so that this formalization can be machine-actionable. The approach we here propose is based on Semantic Web technologies in order to guarantee interoperability and reuse across scientific communities of diachronic terminological resources that can be thus easily accessed, interconnected and mutually enriched. More specifically, the representation of dynamic evolution of terms and concepts was performed in OWL using the N-ary relations mechanisms. In addition, a set of SWRL rules was set up, in order to automatically identify the evolution of the concepts evoked within a text, as well as the terms representing these concepts. Our model was adopted to formally represent diachronic aspects of Saussure's terminology as they emerge from his works. An example will be provided to highlight the potential of such a knowledge structuration for gaining a wider understanding of the profound terminological and conceptual changes brought about by the paradigmatic and epistemological revolutions in sciences},
KEYWORDS = {diachronic terminology, Saussure's terminology, semantic web, linked data},
URL = {http://digitalhumanities.org/dhq/vol/15/3/000549/000549.html},
VOLUME = {15},
NUMBER = {2},
ISSN = {1938-4122},
JOURNAL = {DIGITAL HUMANITIES QUARTERLY},
}
@ARTICLE{PROIETTI_2021_ARTICLE_PY_395537,
AUTHOR = {Proietti, C. and Yuste Ginel, A.},
TITLE = {Dynamic epistemic logics for abstract argumentation},
YEAR = {2021},
ABSTRACT = {This paper introduces a multi-agent dynamic epistemic logic for abstract argumentation. Its main motivation is to build a general framework for modelling the dynamics of a debate, which entails reasoning about goals, beliefs, as well as policies of communication and information update by the participants. After locating our proposal and introducing the relevant tools from abstract argumentation, we proceed to build a three-tiered logical approach. At the first level, we use the language of propositional logic to encode states of a multi-agent debate. This language allows to specify which arguments any agent is aware of, as well as their subjective justification status. We then extend our language and semantics to that of epistemic logic, in order to model individuals' beliefs about the state of the debate, which includes uncertainty about the information available to others. As a third step, we introduce a framework of dynamic epistemic logic and its semantics, which is essentially based on so-called event models with factual change. We provide completeness results for a number of systems and show how existing formalisms for argumentation dynamics and unquantified uncertainty can be reduced to their semantics. The resulting framework allows reasoning about subtle epistemic and argumentative updates—such as the effects of different levels of trust in a source—and more in general about the epistemic dimensions of strategic communication},
KEYWORDS = {Abstract argumentation, Dynamic epistemic logic, Awareness logics, Multi-agent argumentation frameworks, Persuasion, Strategic Argumentation},
PAGES = {1-60},
URL = {https://link.springer.com/article/10.1007/s11229-021-03178-5#citeas},
DOI = {10.1007/s11229-021-03178-5},
ISSN = {0039-7857},
JOURNAL = {SYNTHESE},
}
@ARTICLE{SALVATI_2021_ARTICLE_SR_416964,
AUTHOR = {Salvati, L. and Russo, I.},
TITLE = {Indicatori di complessità nel parlato degli insegnanti di italiano L2: un'analisi quantitativa},
YEAR = {2021},
ABSTRACT = {Sul parlato dell'insegnante di L2 (identificato anche come teacher talk) esiste una vasta letteratura, in particolare per quanto riguarda l'insegnamento dell'inglese come lingua seconda. Agli approcci di carattere più teorico-normativo si accompagnano, negli ultimi trenta anni, approcci che prendono spunto dalle tecniche di analisi della linguistica dei corpora e che si focalizzano su casi di studio specifici, andando a verificare su dati concreti le ipotesi formulate dalla teoria. L'ipotesi di base di questo ambito di ricerca è che gli insegnanti compiono—in maniera non sempre consapevole e pianificata—degli adeguamenti nel loro modo di parlare di fronte ad una classe di apprendenti. Tali adeguamenti riguardano più livelli linguistici e variano di intensità a seconda del livello complessivo di competenza degli apprendenti. Nel presente lavoro ci proponiamo di analizzare quantitativamente la complessità del parlato di insegnanti madrelingua di italiano L2 raccolto e trascritto durante lezioni appartenenti a due livelli del Quadro comune europeo di riferimento per le lingue: apprendimento, insegnamento, valutazione (QCER, Council of Europe, 2002 [2001]), A1 e B1. Una parte delle trascrizioni riguarda lezioni svolte in classe (corpus ParInIt, Parlato di Insegnanti di Italiano), nella quale vi è compresenza fisica tra insegnante e apprendenti, un secondo corpus è invece composto da lezioni somministrate online in maniera asincrona, tramite un canale YouTube (corpus Oneworlditaliano). Proponiamo una classificazione degli adeguamenti rispetto alla quale l'analisi quantitativa della complessità degli indicatori linguistici verificherà se è possibile distinguere sia tra il livello A1 e il livello B1 nel corpus raccolto in presenza e nel corpus relativo alle lezioni on line.
L'obiettivo finale è comprendere se un'analisi quantitativa dei dati possa aiutare ad individuare gli adeguamenti e le modifiche linguistiche attuate dai docenti per favorire una maggiore comprensibilità dell'input da parte degli apprendenti},
KEYWORDS = {teacher talk, corpus linguistics, complessità lessicale},
PAGES = {122-132},
URL = {https://riviste.unimi.it/index.php/promoitals/article/view/17132/15088},
VOLUME = {13 (2)},
ISSN = {2037-3597},
JOURNAL = {ITALIANO LINGUADUE},
}
@ARTICLE{VARGAS_2021_ARTICLE_VCDS_400917,
AUTHOR = {Vargas, A. M. and Cominelli, L. and Dell'Orletta, F. and Scilingo, E. P.},
TITLE = {Verbal communication in robotics: a study on salient terms, research fields and trends in the last decades based on a computational linguistic analysis},
YEAR = {2021},
ABSTRACT = {Verbal communication is an expanding field in robotics showing a significant increase in both the industrial and research field. The application of verbal communication in robotics aims to reach a natural human-like interaction with robots. In this study, we investigated how salient terms related to verbal communication in robotics have evolved over the years, what are the topics that recur in the related literature, and what are their trends. The study is based on a computational linguistic analysis conducted on a database of 7,435 scientific publications over the last 2 decades. This comprehensive dataset was extracted from the Scopus database using specific key-words. Our results show how relevant terms of verbal communication evolved, which are the main coherent topics and how they have changed over the years. We highlighted positive and negative trends for the most coherent topics and the distribution over the years for the most significant ones. In particular, verbal communication resulted in being highly relevant for social robotics. Potentially, achieving natural verbal communication with a robot can have a great impact on the scientific, societal, and economic role of robotics in the future},
KEYWORDS = {social robotics, affective computing, speech synthesis, speech generation, computational linguistic analysis, data mining, topic modeling, verbal communication},
URL = {https://iris.cnr.it/handle/20.500.14243/400917},
DOI = {10.3389/fcomp.2020.591164},
ISSN = {2624-9898},
JOURNAL = {FRONTIERS IN COMPUTER SCIENCE},
}
@BOOK{MARZI_2021_BOOK_M_443291,
AUTHOR = {Marzi, C.},
TITLE = {Modelling the morphological lexicon-A computational approach to mono- and bilingual learning and processing of verb inflection},
YEAR = {2021},
ABSTRACT = {This work aims at defining an explanatory model of the morphological lexicon as a dynamic system of word learning and processing in both mono- and bilingual contexts. The main focus is on exploring some relevant aspects of the paradigmatic organisation of the mental lexicon in language learning, based on a dynamic analysis of mono- and bilingual contexts. The proposed interdisciplinary approach to lexical acquisition combines theoretically-motivated accounts, psycho-cognitive evidence and methodologies, and machine learning technologies. In particular, I will take into account those basic psychological and cognitive mechanisms that are considered as crucial in language acquisition: (i) the ability to perceive recurrent morphological structures (invariances) in varying temporal contexts, (ii) the capability to access/activate time series of symbols in the short term memory and to selectively integrate them with long term memory expectations, (iii) the attitude towards building novel forms through analogical extension of intra- and inter-paradigmatic relations (generalisation). This investigation is pursued through a computational model based on a recurrent Self-Organising Map, with Hebbian connections defined over a temporal layer (Temporal Self-Organising Map, TSOM), providing a principled algorithmic account of effects of lexical acquisition, processing and access. The computational simulation of a biologically inspired neural architecture of the mental lexicon offers the possibility to reproduce a wide range of conditions of mono- and bi-lingual input exposure, and to illustrate the dynamic of word acquisition and the emergence of morphological organisation. The proposed model provides an adaptive multifactorial account of morphology acquisition affected by a variety of input factors, such as word frequency distributions, paradigm regularity and wordlikeness, whereby lexical perception and organisation are grounded in memory-based processing strategies. 
In addition, it suggests a processing-based notion of morpheme, as a by-product of processing dynamics, with paradigms emerging as specialised surface relations between inflected forms},
KEYWORDS = {morphology, learning and processing, monolingual and bilingual acquisition, verb inflection, artificial neural networks, temporal self-organising maps},
PAGES = {5-171},
URL = {https://iris.cnr.it/handle/20.500.14243/443291},
PUBLISHER = {Franco Angeli (Milano, ITA)},
ISBN = {978-88-351-3548-7},
CONFERENCE_PLACE = {Milano},
}
@INCOLLECTION{BOSCHETTI_2021_INCOLLECTION_BDMBMR_443434,
AUTHOR = {Boschetti, F. and Del Gratta, R. and Monachini, M. and Buzzoni, M. and Monella, P. and Rosselli Del Turco, R.},
TITLE = {"Tea for two": the Archive of the Italian Latinity of the Middle Ages Meets the CLARIN Infrastructure},
YEAR = {2021},
ABSTRACT = {This paper gives an overview of the Latin resources, from the ALIM project, hosted and described at the ILC4CLARIN repository},
KEYWORDS = {Latin resources, CLARIN, corpus, repository},
PAGES = {37-46},
URL = {https://ecp.ep.liu.se/index.php/clarin/issue/view/1/37},
ISBN = {978-91-7929-609-4},
BOOKTITLE = {Selected Papers from the CLARIN Annual Conference 2020},
EDITOR = {Navarretta, Costanza and Eskevich, Maria},
}
@INCOLLECTION{BOSCHETTI_2021_INCOLLECTION_BDS_449235,
AUTHOR = {Boschetti, F. and Del Grosso, A. M. and Spinazzè, L.},
TITLE = {La galassia Musisque Deoque: storia e prospettive},
YEAR = {2021},
ABSTRACT = {The resources in support of Latin scholars created under the scientific direction of Paolo Mastandrea are numerous; the undertaking of Musisque Deoque, which aims at equipping the entire corpus of ancient Latin poetry with "significant variants", is the most emblematic effort, open to further developments. Looking at the general history of these projects, we try to trace the future path of the "Musisque Deoque galaxy" within Open Science},
KEYWORDS = {Classical philology, Latin poetry, Intertextuality, Open data, FAIR principles},
PAGES = {405-419},
URL = {https://edizionicafoscari.unive.it/media/pdf/books/978-88-6969-558-2/978-88-6969-558-2-ch-26.pdf},
DOI = {10.30687/978-88-6969-557-5/026},
PUBLISHER = {Edizioni Ca' Foscari (Venezia, ITA)},
ISBN = {978-88-6969-557-5},
CONFERENCE_PLACE = {Venezia},
BOOKTITLE = {Paulo maiora canamus-Raccolta di studi per Paolo Mastandrea},
}
@INCOLLECTION{CAPPA_2021_INCOLLECTION_CFG_444774,
AUTHOR = {Cappa, C. and Ferro, M. and Giulivi, S.},
TITLE = {Valutare l'efficienza di lettura in classe, fra "ecologia" e tecnologie},
YEAR = {2021},
ABSTRACT = {La sperimentazione AEREST ha consentito la creazione di un protocollo in grado di offrire una valutazione accurata e dettagliata delle abilità di lettura e comprensione del testo. Lo strumento si è rivelato semplice da utilizzare per gli insegnanti, ed è stato accolto con curiosità e interesse dagli allievi, certamente attratti dal supporto utilizzato per la somministrazione (il tablet), ma anche dai testi, che sono stati scelti e adattati con particolare cura. L'analisi dei dati ha consentito di identificare una considerevole varietà di profili di lettori, per i quali sarà possibile progettare percorsi di potenziamento mirati. Come già accennato, si è potuta constatare l'efficacia dello strumento nell'identificazione di allievi le cui difficoltà (pur evidenti agli occhi degli insegnanti) non vengono rilevate dai test comunemente utilizzati per la valutazione, ma la cui lettura non può essere considerata 'efficiente'. Costituiscono esempi in questo senso gli allievi che decodificano in modo accurato e veloce, con buone prestazioni nella comprensione all'ascolto, ma che manifestano difficoltà nella comprensione di un testo in lettura silente, poiché in questa attività devono integrare la decodifica con l'accesso al significato. Un ulteriore esempio è costituito dagli allievi che ottengono buoni risultati in tutti i test, impiegando però un tempo eccessivamente lungo per svolgerli. Nella prospettiva qui adottata, anche per questi allievi è necessario individuare strategie di supporto volte a evitare che le attività scolastiche, in particolare i compiti a casa, occupino una parte troppo ampia del tempo dell'allievo, togliendo spazio al gioco, allo svago, agli interessi personali e alla socializzazione. Questi ultimi sono aspetti che, come sottolinea la Carta internazionale dei diritti dei bambini (1959), rivestono un'importanza cruciale per il processo di crescita e il benessere generale di ciascuno. 
Oltre alle difficoltà, il protocollo AEREST consente di mettere in evidenza le prestazioni eccellenti, grazie alla struttura dei test e alle caratteristiche dei testi e delle domande che li accompagnano. Capire a fondo come "funzionano" gli allievi è indispensabile per poterli sostenere al meglio negli apprendimenti, indipendentemente dalla presenza o meno di un'"etichetta" diagnostica. Gli insegnanti hanno in questo senso una grande responsabilità, e uno strumento come AEREST, grazie anche all'implementazione su piattaforma tecnologica, può aiutarli in quella che forse è la loro principale sfida quotidiana: fare in modo che le difficoltà scolastiche non siano vissute come barriere all'apprendimento, al successo scolastico, alle opportunità professionali, alla realizzazione personale, ma come soglie da superare e da trasformare in trampolini di lancio},
KEYWORDS = {efficienza di lettura, decodifica, comprensione, scuola primaria},
PAGES = {49-69},
URL = {https://buponline.com/prodotto/disturbi-specifici-dellapprendimento-e-insegnamento-linguistico/},
PUBLISHER = {Bononia University Press (Bologna, ITA)},
ISBN = {978-88-6923-829-1},
CONFERENCE_PLACE = {Bologna},
BOOKTITLE = {Didattica dell'italiano},
EDITOR = {Garulli, V. and Pasetti, L. and Viale, M.},
}
@INCOLLECTION{CHAHINIAN_2021_INCOLLECTION_CBFDJPRSDT_394922,
AUTHOR = {Chahinian, N. and Bonnabaud La Bruyère, T. and Frontini, F. and Delenne, C. and Julien, M. and Panckhurst, R. and Roche, M. and Sautot, L. and Deruelle, L. and Teisseire, M.},
TITLE = {WEIR-P: An Information Extraction Pipeline for the Wastewater Domain},
YEAR = {2021},
ABSTRACT = {We present the MeDO project, aimed at developing resources for text mining and information extraction in the wastewater domain. We developed a specific Natural Language Processing (NLP) pipeline named WEIR-P (WastewatEr InfoRmation extraction Platform) which identifies the entities and relations to be extracted from texts, pertaining to information, wastewater treatment, accidents and works, organizations, spatio-temporal information, measures and water quality. We present and evaluate the first version of the NLP system which was developed to automate the extraction of the aforementioned annotation from texts and its integration with existing domain knowledge. The preliminary results obtained on the Montpellier corpus are encouraging and show how a mix of supervised and rule-based techniques can be used to extract useful information and reconstruct the various phases of the extension of a given wastewater network. While the NLP and Information Extraction (IE) methods used are state of the art, the novelty of our work lies in their adaptation to the domain, and in particular in the wastewater management conceptual model, which defines the relations between entities. French resources are less developed in the NLP community than English ones. The datasets obtained in this project are another original aspect of this work},
KEYWORDS = {Wastewater, text mining, Information extraction, NLP, NER, Domain adapted systems},
PAGES = {171-188},
URL = {https://www.springer.com/gp/book/9783030750176},
PUBLISHER = {Springer Nature Switzerland (Basel, CHE)},
ISBN = {978-3-030-75017-6},
CONFERENCE_PLACE = {Basel},
BOOKTITLE = {Research Challenges in Information Science-15th International Conference, RCIS 2021, Limassol, Cyprus, May 11-14, 2021, Proceedings},
}
@INCOLLECTION{CUTUGNO_2021_INCOLLECTION_CFCM_420847,
AUTHOR = {Cutugno, P. and Ferretti, M. and Chiarella, D. and Marconi, L.},
TITLE = {A Linguistic preliminary study about noise perception},
YEAR = {2021},
ABSTRACT = {The activities of the project "TRIPLO: TRasporti e collegamenti Innovativi e sostenibili tra Porti e piattaforme Logistiche", financed with the resources of the Interregional Operational Programme Italy-France Maritime 2014-2020, have as specific objective to improve the sustainability of commercial ports and related logistic platforms, contributing to the reduction of noise pollution [1][2]. Some activities in the project are aimed at assessing the acoustic impact on the population exposed to noise generated by back port activities, in relation to individual perception. In environmental surveys, only technical investigations can objectively describe a phenomenon [3], but at the same time they do not guarantee its universality with respect to perception; a sound can be considered both as a physical phenomenon, and therefore measurable through objective parameters, and as a phenomenon linked to sound perception, of a subjective nature and consequent to the psycho-physical-emotional state of the subject. These two characteristics are strictly interdependent, so it is insufficient to limit to examine them separately. The population constitutes a precious source of information in the evaluation of the quality of the space in which they live or work, suggesting the relationships between environment, comfort and productivity. It is therefore important to use subjective investigation tools through which the opinion of the population can become a valid support to traditional methods of analysis and improve the overall evaluation},
KEYWORDS = {noise perception, questionnaire, applied linguistics},
PAGES = {57-61},
URL = {https://iris.cnr.it/handle/20.500.14243/420847},
PUBLISHER = {Centro de Lingüística Aplicada (Santiago de Cuba, CUB)},
ISBN = {978-959-7174-40-0},
CONFERENCE_PLACE = {Santiago de Cuba},
BOOKTITLE = {Contribuciones a la Lingüística y a la Comunicación Social. Tributo a Vitelio Ruiz Hernández},
}
@INCOLLECTION{DOLOWYRYBINSKA_2021_INCOLLECTION_DS_421904,
AUTHOR = {Dolowyrybinska, N. and Soria, C.},
TITLE = {Surveying the ethnolinguistic vitality of two contested languages. The case of Kashubian and Piedmontese},
YEAR = {2021},
ABSTRACT = {In this chapter we present the results of a Polish-Italian research project aimed at evaluating and comparing the vitality of two contested languages: Kashubian in Poland and Piedmontese in Italy},
KEYWORDS = {ethnolinguistic vitality, contested languages},
PAGES = {125-142},
URL = {https://benjamins.com/catalog/wlp.8.07dol?srsltid=AfmBOoorsncLmdcBkTj2Av942qvxVn2_jBD3WzR1tREhvcUM4YFZkDr-},
DOI = {10.1075/wlp.8.07dol},
PUBLISHER = {John Benjamins (Amsterdam, NLD)},
ISBN = {9789027208040},
CONFERENCE_PLACE = {Amsterdam},
BOOKTITLE = {Contested Languages. The hidden multilingualism of Europe},
}
@INCOLLECTION{GIULIVI_2021_INCOLLECTION_GCF_444779,
AUTHOR = {Giulivi, S. and Cappa, C. and Ferro, M.},
TITLE = {Le difficoltà di lettura. Limiti o soglie calpestabili?},
YEAR = {2021},
ABSTRACT = {'Se alzi un muro, pensa a ciò che resta fuori', scrive Italo Calvino in uno dei suoi romanzi più celebri, Il barone rampante. Quante volte alziamo muri, nelle situazioni e negli ambiti più disparati, magari senza che ce ne sia volontà o consapevolezza? La scuola, paradossalmente, è forse uno dei contesti in cui più spesso ciò accade. Non per negligenza, né per carenza di competenze-almeno nella maggioranza dei casi-ma perché la complessità dell'universo educativo, e di una classe, è spesso difficile da afferrare, accettare, accogliere, gestire, percepire come un valore. Il problema è che, in certi casi, a restare fuori dal muro sono le opportunità di apprendimento degli allievi, il loro benessere scolastico ed extrascolastico, le loro possibilità future. La lettura e le opportunità di accesso al testo possono costituire uno dei migliori trampolini di lancio, oppure una delle maggiori barriere, verso un'educazione adeguata, verso la possibilità di partecipazione attiva nella società, verso future opportunità accademiche e professionali. Le abilità legate alla lettura, la maggiore o minore efficienza con cui l'allievo le sviluppa costituiscono anche una delle principali fonti di complessità in classe. Da qualche tempo si assiste in Ticino a una crescente attenzione verso le difficoltà e i disturbi della lettura. I docenti sono sempre più sensibili, informati e aggiornati sul tema. Ciò che ancora sfugge, tuttavia, è l'estrema eterogeneità dei profili dei 'piccoli lettori', e la reale natura delle difficoltà che possono manifestarsi in età scolare. Consideriamo, per esempio, una delle cause di tali difficoltà: la dislessia, il disturbo specifico dell'apprendimento (DSA) che impedisce l'automatizzazione della decodifica del testo scritto. Si tratta di un disturbo di origine neurobiologica; ciò non significa, tuttavia, che si manifesti in modi sempre uguali o costanti nel tempo. 
Ogni dislessia (o altro DSA) è diversa da ogni altra e ogni dislessia evolve nel tempo insieme all'allievo. Come ricorda Giovanni Bollea, fondatore della neuropsichiatria infantile in Italia, "i disturbi dei bambini sono disturbi che cambiano in persone che cambiano" (Bollea, 1980). I DSA possono cambiare per una molteplicità di fattori, che spaziano dalle caratteristiche cognitive ed emotive del singolo, a quelle dei contesti in cui vive, agisce, apprende: la scuola, la famiglia, gli spazi di svago e socializzazione. Riuscire a gestire a scuola questo genere di complessità significa creare le condizioni per trasformare potenziali barriere in trampolini di lancio; significa permettere a tutti gli allievi, anche a coloro che devono fare i conti con un disturbo o una difficoltà di lettura, di trarre il massimo dal luogo primariamente preposto agli apprendimenti e all'educazione},
KEYWORDS = {scuola primaria, didattica, apprendimento},
PAGES = {32-37},
URL = {https://iris.cnr.it/handle/20.500.14243/444779},
BOOKTITLE = {Scuola Ticinese},
EDITOR = {Biffi, C. and Falconi, R.},
}
@INCOLLECTION{GUADAGNINI_2021_INCOLLECTION_G_426116,
AUTHOR = {Guadagnini, E.},
TITLE = {Scripta},
YEAR = {2021},
ABSTRACT = {Il concetto di "scripta" negli studi linguistici romanzi},
KEYWORDS = {linguistica italiana, linguistica romanza},
PAGES = {125-151},
URL = {http://www.carocci.it/index.php?option=com_content\&view=article\&id=98},
VOLUME = {VI},
PUBLISHER = {Carocci (Roma, ITA)},
ISBN = {9788829004294},
CONFERENCE_PLACE = {Roma},
BOOKTITLE = {Storia dell'italiano scritto, vol. VI, Supporti, forme, pratiche di scrittura},
}
@INCOLLECTION{ONIGA_2021_INCOLLECTION_OCPGBPCCGMCFTA_448229,
AUTHOR = {Oniga, D. and Cantalupo, B. and Perlo, D. and Grangetto, M. and Bolelli, F. and Pollastri, F. and Cancilla, M. and Canalini, L. and Grana, C. and Muñoz Alcalde, C. and Cardillo, F. A. and Florea, M. and Tartaglione, E. and Aldinucci, M.},
TITLE = {Applications of AI and HPC in the Health Domain},
YEAR = {2021},
ABSTRACT = {This chapter presents the applications of artificial intelligence (AI) and high-computing performance (HPC) in the health domain, illustrated by the description of five of the use cases that are developed in the DeepHealth project. In the context of the European Commission supporting the use of AI and HPC in the health sector, DeepHealth Project is helping health experts process large quantities of images, putting at their disposal DeepLearning and computer vision techniques, combined in the DeepHealth toolkit and HPC infrastructures. The DeepHealth toolkit is tested and validated through 15 use cases, each of them representing a biomedical application. The most promising use cases are described in the chapter, which concludes with the value proposition and the benefits that DeepHealth toolkit offers to future end users},
KEYWORDS = {artificial intelligence, high performance computing},
PAGES = {217-239},
URL = {https://www.taylorfrancis.com/chapters/edit/10.1201/9781003176664-11/applications-ai-hpc-health-domain-dana-oniga-barbara-cantalupo-enzo-tartaglione-daniele-perlo-marco-grangetto-marco-aldinucci-federico-bolelli-federico-pollastri-michele-cancilla-laura-canalini-costantino-grana-cristina-muñoz-alcalde-franco-alberto-cardillo-monica-florea},
DOI = {10.1201/9781003176664-11},
PUBLISHER = {CRC Press-Taylor \& Francis Group (London, GBR)},
ISBN = {9781003176664},
CONFERENCE_PLACE = {London},
BOOKTITLE = {HPC, Big Data, and AI Convergence Towards Exascale: Challenge and Vision},
}
@INCOLLECTION{PANCKHURST_2021_INCOLLECTION_PF_397005,
AUTHOR = {Panckhurst, R. and Frontini, F.},
TITLE = {An Internationally Fair Mediated Digital Discourse Corpus: Improving Knowledge on Reuse},
YEAR = {2021},
ABSTRACT = {In this paper, the authors present a French Mediated Digital Discourse corpus, (88milSMS http://88milsms.huma-num.fr https://hdl.handle.net/11403/comere/cmr-88milsms). Efforts were undertaken over the years to ensure its publication according to the best practices and standards of the community, thus guaranteeing compliance with FAIR principles and CLARIN recommendations with pertinent scientific and pedagogical reuse. Since knowledge on how resources are reused is sometimes difficult to obtain, ways of improving this are also envisaged},
KEYWORDS = {Reuse, FAIR, SMS, corpus},
PAGES = {185-193},
URL = {https://ecp.ep.liu.se/index.php/clarin/article/view/20},
VOLUME = {180},
DOI = {10.3384/ecp18020},
BOOKTITLE = {Selected Papers from the CLARIN Annual Conference 2020},
}
@INCOLLECTION{PICCINI_2021_INCOLLECTION_PABG_396587,
AUTHOR = {Piccini, S. and Abrate, M. and Bellandi, A. and Giovannetti, E.},
TITLE = {Rappresentazione, costruzione e visualizzazione di risorse terminologiche diacroniche nell'era del web semantico},
YEAR = {2021},
ABSTRACT = {This article introduces the model DIATERM, devoted to representing the diachronic evolution of concepts and terms in a given domain, according to Semantic Web standards and Linked Data technologies. The approach adopted for the representation of temporal information is based on the reification of N-ary relationships. DIATERM is articulated on three levels, textual, terminological and conceptual. Each level can be affected, more or less simultaneously, by change. The use of SWRL rules allows to automatically assign temporal information, thus facilitating the construction of the terminological resource and highlighting any inconsistencies. Two examples of interrogation and visualization of diachronic terminological resources will be illustrated. The first example is taken from the resource dedicated to the astronomical terminology introduced by Christopher Clavius in his Commentary on the Sacrobosco's Tractatus de Sphaera. The second example is taken from the electronic lexicon of Ferdinand de Saussure's linguistic terminology},
KEYWORDS = {computational terminology, diachronic terminology, ontology, semantic web, linked data},
PAGES = {125-139},
URL = {https://iris.cnr.it/handle/20.500.14243/396587},
DOI = {10.36253/978-88-5518-364-2.12},
PUBLISHER = {Firenze University Press (Firenze, ITA)},
ISBN = {978-88-5518-363-5},
CONFERENCE_PLACE = {Firenze},
BOOKTITLE = {Terminologie e vocabolari Lessici specialistici e tesauri, glossari e dizionari},
EDITOR = {Grimaldi, C. and Zanola, M. T.},
}
@INCOLLECTION{STAMULI_2021_INCOLLECTION_SCM_441302,
AUTHOR = {Stamuli, F. M. and Calamai, S. and Monachini, M.},
TITLE = {L'Archivio Vi.Vo.: una piattaforma per la conservazione e l'accesso alle fonti orali in Toscana},
YEAR = {2021},
ABSTRACT = {Archivio Vi.Vo. si colloca nel quadro di programmazione e finanziamento per il triennio 2019-2021 previsto dall'Accordo di valorizzazione del patrimonio archivistico e bibliografico tra Regione Toscana e Soprintendenza Archivistica e Biblioteconomica della Toscana. L'obiettivo del progetto è la realizzazione di un modello ed una piattaforma per la salvaguardia e la fruizione delle fonti orali e audio-visive in vari ambiti disciplinari. La piattaforma mette in sicurezza la documentazione sonora e audiovisiva prodotta in Toscana attraverso processi di digitalizzazione di tipo filologico ed è integrata all'interno di CLARIN-II, nodo italiano della infrastruttura europea CLARIN-ERIC},
KEYWORDS = {Archivi orali, Preservazione, Infrastrutture},
PAGES = {533-540},
URL = {https://iris.cnr.it/handle/20.500.14243/441302},
PUBLISHER = {Centro Studi Piemontesi (Torino, ITA)},
ISBN = {978-88-8262-272-5},
CONFERENCE_PLACE = {Torino},
BOOKTITLE = {Documenti sonori. Voce, suono, musica in archivi e raccolte},
EDITOR = {Brunetti, D. and Robotti, D. and Salvalaggio, E.},
}
@EDITORIAL{BOSCHETTI_2021_EDITORIAL_BDS_446360,
AUTHOR = {Boschetti, F. and Del Grosso, A. M. and Salvatori, E.},
TITLE = {AIUCD 2021-DH per la società: e-guaglianza, partecipazione, diritti e valori nell'era digitale-DHs for society: e-quality, participation, rights and values in the Digital Age},
YEAR = {2021},
ABSTRACT = {All the extended abstracts published in this volume have received favourable reviews by experts in the field of DH, through an anonymous double-blind peer review process under the responsibility of the AIUCD 2021 Scientific Committee. The AIUCD 2021 conference program is available online https://aiucd2021.labcd.unipi.it/},
KEYWORDS = {Digital Humanities, AIUCD, informatica umanistica},
PAGES = {624},
URL = {https://aiucd2021.labcd.unipi.it/wp-content/uploads/2021/05/AIUCD2021_BOA-versione3A.pdf},
DOI = {10.6092/unibo/amsacta/6712},
ISBN = {9788894253559},
}
@EDITORIAL{BURGASSI_2021_EDITORIAL_BGV_445814,
AUTHOR = {Burgassi, C. and Guadagnini, E. and Vaccaro, G.},
TITLE = {Migrazioni linguistiche e trasmissioni culturali in Italia (secoli XIII-XV)},
YEAR = {2021},
ABSTRACT = {Il terzo volume della collana Plurilinguismo e Migrazioni si concentra sui temi della traduzione, un'istanza storica fondamentale per l'area italoromanza antica che può essere intesa sia nel senso ristretto di riproposizione puntuale di un testo in una lingua diversa da quella originale sia, in senso lato, come operazione che importa nella lingua locale un contenuto originariamente espresso in altra lingua. Migrazioni linguistiche e trasmissioni culturali in Italia (secoli XIII-XV) adotta la traduzione, entro i due poli di senso ora definiti, come punto di vista privilegiato per lo studio della lingua e della cultura italiana del Medioevo: i nove contributi raccolti affrontano temi e problemi relativi a traduzioni dal latino e dal francese, rispetto a testi composti originariamente dall'Antichità all'epoca coeva, caratterizzati da tradizioni "passive" o "attive" (secondo la terminologia classica)},
KEYWORDS = {Traduzione, Volgarizzamenti, Eredità classica},
URL = {https://www.cnr.it/sites/default/files/public/media/attivita/editoria/collana_plurimi/PLURIMI_3_2021.pdf},
DOI = {10.36173/PLURIMI-2021-3},
PUBLISHER = {CNR EDIZIONI (ROMA, ITA)},
ISBN = {9788880804888},
CONFERENCE_PLACE = {ROMA},
}
@EDITORIAL{MONACHINI_2021_EDITORIAL_ME_420368,
AUTHOR = {Monachini, M. and Eskevich, M.},
TITLE = {CLARIN Annual Conference Proceedings},
YEAR = {2021},
ABSTRACT = {CLARIN2021 is organised for the wider Humanities and Social Sciences communities in order to exchange ideas and experiences within the CLARIN infrastructure. This includes the design, construction and operation of the CLARIN infrastructure, the data, tools and services that it contains or for which there is a need, its actual use by researchers, its relation to other infrastructures and projects, and the CLARIN Knowledge Sharing Infrastructure},
KEYWORDS = {Language Resource Infrastructure},
PAGES = {1-178},
URL = {https://iris.cnr.it/handle/20.500.14243/420368},
}
@EDITORIAL{SALVATORI_2021_EDITORIAL_SBD_455965,
AUTHOR = {Salvatori, E. and Boschetti, F. and Del Grosso, A. M.},
TITLE = {DH per la società: e-guaglianza, partecipazione, diritti e valori nell'era digitale (Selected Papers AIUCD 2021)},
YEAR = {2021},
ABSTRACT = {Curatela dei selected paper (Dossier) della conferenza AIUCD2021},
KEYWORDS = {Digital Humanities, AIUCD2021, AIUCD, Umanistica Digitale, Informatica Umanistica},
PAGES = {1-197},
URL = {https://umanisticadigitale.unibo.it/issue/view/1033},
ISSN = {2532-8816},
}
@EDITORIAL{NAHLI_2021_EDITORIAL_NTL_400711,
AUTHOR = {Nahli, O. and Tonazzini, A. and Legnaioli, S.},
TITLE = {Special Issue on Digital preservation of Written Heritage and Text Processing Technology-Preface},
YEAR = {2021},
ABSTRACT = {[Extract] The notion of “written heritage” concerns the immense field regarding written culture. It is difficult to attempt a definition of written heritage. In very general terms, it can be said that it includes any surface containing something written. Different writing supports can be involved, such as papyri, parchments, manuscripts, books, but also contemporary type of medium, such as posters, newspapers, magazines, etc. The written cultural heritage such as general written records are means of communication through space and time of costumes, culture, and beliefs. They constitute the archive of the evolution of mentality, knowledge, sciences, and arts and are considered guardians of the language},
KEYWORDS = {preservation, written heritage},
PAGES = {1-4},
URL = {https://www.innove.org/ijist/index.php/ijist/issue/view/14},
VOLUME = {5 (1)},
ISSN = {2550-5114},
}
@INPROCEEDINGS{ALBERTIN_2021_INPROCEEDINGS_AMB_440996,
AUTHOR = {Albertin, G. and Miaschi, A. and Brunato, D.},
TITLE = {On the role of textual connectives in sentence comprehension: A new dataset for Italian},
YEAR = {2021},
ABSTRACT = {In this paper we present a new evaluation resource for Italian aimed at assessing the role of textual connectives in the comprehension of the meaning of a sentence. The resource is arranged in two sections (acceptability assessment and cloze test), each one corresponding to a distinct challenge task conceived to test how subtle modifications involving connectives in real usage sentences influence the perceived acceptability of the sentence by native speakers and Neural Language Models (NLMs). Although the main focus is the presentation of the dataset, we also provide some preliminary data comparing human judgments and NLMs performance in the two tasks},
KEYWORDS = {neural language models, textual connectives, sentence acceptability},
URL = {http://ceur-ws.org/Vol-3033/paper16.pdf},
VOLUME = {3033},
CONFERENCE_NAME = {8th Italian Conference on Computational Linguistics (CLIC-it 2021)},
}
@INPROCEEDINGS{BRUNO_2021_INPROCEEDINGS_BGCMF_446977,
AUTHOR = {Bruno, E. and Giulivi, S. and Cappa, C. and Marini, M. and Ferro, M.},
TITLE = {Evaluating the accuracy of decoding in children who read aloud},
YEAR = {2021},
ABSTRACT = {Digital tools based on automatic speech recognition (ASR) could be a useful support for teachers in assessing the reading skills of the students. We focus on the evaluation of the decoding accuracy of children with grade level ranging from the 3rd to the 6th performing a reading aloud task on a narrative text displayed on an ordinary tablet using the ReadLet platform. On the basis of previously collected data, we built a gold dataset with sentences characterised by the audio data, the original text to be read, and the text actually spoken by the child. By using the open-source Kaldi toolkit an ASR system based on the GMM-HMM model was trained on the training portion of the gold dataset. The accuracy of the ASR system was calculated as the ability to correctly decode the test audio data with respect to the annotated text, and the decoding accuracy of the children was estimated by measuring the gap between the results obtained with the annotated text and the original text. A consistent trend with increasing grade level was found in terms of word correctness, substitutions and insertions, while the trained model appears to be significantly able to evaluate the children decoding accuracy},
KEYWORDS = {speech recognition, decoding accuracy, reading aloud, voice parameters, Kaldi, GMM-HMM acoustic model},
PAGES = {145-148},
URL = {https://iris.cnr.it/handle/20.500.14243/446977},
DOI = {10.36253/978-88-5518-449-6},
PUBLISHER = {Firenze University Press (Firenze, ITA)},
ISBN = {978-88-5518-449-6},
CONFERENCE_NAME = {12th International Workshop on Models and Analysis of Vocal Emissions for Biomedical Applications (MAVEBA'21)},
CONFERENCE_PLACE = {Firenze},
BOOKTITLE = {Proceedings of the 12th International Workshop on Models and Analysis of Vocal Emissions for Biomedical Applications (MAVEBA'21)},
EDITOR = {Manfredi, C.},
}
@INPROCEEDINGS{CALAMAI_2021_INPROCEEDINGS_CPSPCBM_446744,
AUTHOR = {Calamai, S. and Pretto, N. and Stamuli, F. M. and Piccardi, D. and Candeo, G. and Bianchi, S. and Monachini, M.},
TITLE = {COMMUNITY-BASED SURVEY AND ORAL ARCHIVE INFRASTRUCTURE IN THE ARCHIVIO VI. VO. PROJECT},
YEAR = {2021},
ABSTRACT = {Audio and audiovisual archives are at the crossroads of different fields of knowledge, yet they require common solutions for both their long-term preservation and their description, availability, use and reuse. Archivio Vi. Vo. is an Italian project financed by the Tuscany Region, aiming to (i) explore methods for long-term preservation and secure access to oral sources and (ii) develop an infrastructure under the CLARIN-IT umbrella offering several services for scholars from different domains interested in oral sources. This paper describes the project's infrastructure and its methodology through a case study on the Caterina Bueno's audio archive},
KEYWORDS = {inglese},
URL = {https://iris.cnr.it/handle/20.500.14243/446744},
DOI = {10.3384/ecp180},
ISBN = {978-91-7929-609-4},
CONFERENCE_NAME = {CLARIN2020 Annual Conference},
BOOKTITLE = {SELECTED PAPERS FROM THE CLARIN ANNUAL CONFERENCE 2020},
EDITOR = {Navarretta, C. and Eskevich, M.},
}
@INPROCEEDINGS{DEMATTEI_2021_INPROCEEDINGS_DLDN_445812,
AUTHOR = {De Mattei, L. and Lai, H. and Dell'Orletta, F. and Nissim, M.},
TITLE = {Human Perception in Natural Language Generation},
YEAR = {2021},
ABSTRACT = {We take a collection of short texts, some of which are human-written, while others are automatically generated, and ask subjects, who are unaware of the texts' source, whether they perceive them as human-produced. We use this data to fine-tune a GPT-2 model to push it to generate more human-like texts, and observe that the production of this fine-tuned model is indeed perceived as more human-like than that of the original model. Contextually, we show that our automatic evaluation strategy correlates well with human judgements. We also run a linguistic analysis to unveil the characteristics of human-vs machine-perceived language},
KEYWORDS = {Natural Language Generation, Neural Language Models, Evaluation},
PAGES = {15-23},
URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-85123713456\&origin=inward},
DOI = {10.18653/v1/2021.gem-1.2},
ISBN = {978-1-954085-67-1},
CONFERENCE_NAME = {First Workshop on Generation Evaluation and Metrics (GEM 2021)},
BOOKTITLE = {Proceedings of the First Workshop on Generation Evaluation and Metrics (GEM 2021)},
}
@INPROCEEDINGS{DELFANTE_2021_INPROCEEDINGS_DD_417365,
AUTHOR = {Del Fante, D. and Di Nunzio, G. M.},
TITLE = {A Quantitative/Qualitative Approach to {OCR} Error Detection and Correction in Old Newspapers for Corpus-assisted Discourse Studies},
YEAR = {2021},
ABSTRACT = {The use of OCR software to convert printed characters to digital text is a fundamental tool within diachronic approaches to Corpus-assisted Discourse Studies because allow researchers to expand their interest by making many texts available and analysable through a computer. However, OCR software are not totally accurate, and the resulting error rate compromises their effectiveness. This paper proposes a mixed qualitative-quantitative approach to OCR error detection and correction in order to develop a methodology for compiling historical corpora. The proposed approach consists of three main steps: corpus creation, OCR detection and correction, and application of the automatic rules. The rules are implemented in R using a "tidyverse" approach for a better reproducibility of the experiments},
KEYWORDS = {OCR, OCR POST-PROCESSING CORRECTION, Historical Newspapers},
URL = {http://ceur-ws.org/Vol-2816/paper5.pdf},
CONFERENCE_NAME = {Proceedings of the 17th Italian Research Conference on Digital Libraries, Padua, Italy (virtual event due to the Covid-19 pandemic), February 18-19, 2021},
}
@INPROCEEDINGS{DELFANTE_2021_INPROCEEDINGS_DFMQ_447069,
AUTHOR = {Del Fante, D. and Frontini, F. and Monachini, M. and Quochi, V.},
TITLE = {CLARIN-IT Resources in CLARIN ERIC-a Bird's-Eye View},
YEAR = {2021},
ABSTRACT = {The paper investigates the visibility of CLARIN-IT language resources within the services of the CLARIN ERIC central infrastructure, notably the Virtual Language Observatory, the Switchboard and the Federated Content Search, from a user perspective in order to identify possible issues. While the experiment focused on one national consortium, the ultimate goal is to develop an assessment methodology that can be used by any national consortia aiming to review the accessibility of their resources and tools within the CLARIN central services},
KEYWORDS = {FAIR, research infrastructure for SSH, language resources, findability, CLARIN},
PAGES = {129-133},
URL = {https://office.clarin.eu/v/CE-2021-1923-CLARIN2021_ConferenceProceedings.pdf},
ISSN = {2021-1923},
CONFERENCE_NAME = {CLARIN Annual Conference 2021},
}
@INPROCEEDINGS{DELGRATTA_2021_INPROCEEDINGS_DBDB_446363,
AUTHOR = {Del Gratta, R. and Boschetti, F. and Del Grosso, A. M. and Bambaci, L.},
TITLE = {La Filologia come sistema dinamico: qualche considerazione preliminare},
YEAR = {2021},
ABSTRACT = {In questo articolo introduciamo un approccio formale all'evoluzione dei documenti con particolare attenzione alla prospettiva filologica e alle problematiche tipiche connesse. Proponiamo un modello/framework matematico in grado di formalizzare diversi fenomeni complessi in vari ambiti di ricerca quali la Linguistica Computazionale, la Filologia Digitale e l'Ingegneria del Software, in particolare quando questa viene applicata all'analisi di documenti e testi di interesse storico-letterario},
KEYWORDS = {approccio evoluzionistico, modello formale, analisi documentale e testuale, sistema dinamico, filologia computazionale},
PAGES = {484-490},
URL = {http://amsacta.unibo.it/6712/1/AIUCD2021_BOA-versione3A.pdf#page=500},
VOLUME = {AIUCD2021},
DOI = {10.6092/unibo/amsacta/6712},
ISBN = {9788894253559},
CONFERENCE_NAME = {AIUCD 2021-DH per la società: e-guaglianza, partecipazione, diritti e valori nell'era digitale-DHs for society: e-quality, participation, rights and values in the Digital Age},
BOOKTITLE = {AIUCD 2021-DH per la società: e-guaglianza, partecipazione, diritti e valori nell'era digitale-DHs for society: e-quality, participation, rights and values in the Digital Age. Book of extended abstracts of the 10th national conference},
}
@INPROCEEDINGS{DELGROSSO_2021_INPROCEEDINGS_DFENT_387319,
AUTHOR = {Del Grosso, A. M. and Fassi Fihri, D. and El Mohajir, M. and Nahli, O. and Tonazzini, A.},
TITLE = {Digital safeguard of laminated historical manuscripts: the treatise "Poem in Rajaz on medicine" as a case study},
YEAR = {2021},
ABSTRACT = {In this paper, we analyze and discuss the characteristics of a system for the effective digital preservation and fruition of historical manuscripts degraded by the process of lamination. As a case study, we will make reference to the "Poem in Rajaz on medicine", written by Abubacer in the XII century, and conserved in the Al Quaraouiyine Library located in Fez, Morocco. The conceived system should have at least four main functionalities: image acquisition (i. e. digitization), image enhancement, text encoding, and linguistic analysis. Based on the evaluation of the manuscript damages, the acquisition set up should be designed in such a way to be able to avoid reflections as much as possible. Suitable digital image processing techniques should also be devised to correct the residual degradations and enhance the text for an easier legibility. Finally, semi-automatic transcription, scholarly encoding and linguistic analysis, to be performed on the virtually restored pages, should adapt existing tools to the specificity of the primary source writing system and language. The feasibility study for the realization of such a system is of general utility, in that it can provide guidelines for the digitization, the enhancement and the text encoding of the many laminated manuscripts conserved in other historical archives. On the other hand, from the cultural heritage point of view, the experimentation on the "Poem in Rajaz on medicine" could foster the systematic philological and ontological study of a unique piece of our documental heritage: the longest poem of medieval Islamic medical literature},
KEYWORDS = {Cultural Heritage, Digital Safeguard, Historical Manuscript Digitization, Document Image Processing, Linguistic Analysis, Ontological Analysis},
PAGES = {192-197},
URL = {https://ieeexplore.ieee.org/document/9357192},
DOI = {10.1109/CiSt49399.2021.9357192},
PUBLISHER = {IEEE (345 E 47TH ST, NEW YORK, NY 10017 USA, USA)},
ISBN = {978-1-7281-6646-9},
CONFERENCE_NAME = {6th IEEE International Congress on Information Science and Technology (IEEE CiSt)},
CONFERENCE_PLACE = {345 E 47TH ST, NEW YORK, NY 10017 USA},
BOOKTITLE = {2020 6TH IEEE CONGRESS ON INFORMATION SCIENCE AND TECHNOLOGY (IEEE CIST'20)},
}
@INPROCEEDINGS{DIDONATO_2021_INPROCEEDINGS_DDMP_447058,
AUTHOR = {Di Donato, F. and Dumouchel, S. and Monachini, M. and Pohle, S.},
TITLE = {The discovery platform GOTRIPLE: An EOSC service for social sciences and humanities research},
YEAR = {2021},
ABSTRACT = {In this paper we present TRIPLE-Transforming Research through Innovative Practices for Linked Interdisciplinary Exploration-an on-going project funded as part of the European Horizon 2020 programme INFRAEOSC-02-2019 "Prototyping new innovative services" (2019-2023). The project's main objective is to develop a multilingual and multicultural discovery solution for the social sciences and humanities (SSH), which will provide a single access point that allows users to explore, find, access and reuse materials such as literature, data, projects and researcher profiles at European scale. The paper first provides an overview of TRIPLE's main goals and impacts. It then describes the methodology adopted for the design and development of the project platform, GOTRIPLE. Finally, it contextualises the project within the European research landscape, and more specifically in the European Open Science Cloud (EOSC) ecosystem. In the conclusion, some current challenges and open issues are presented},
KEYWORDS = {EOSC, Open Science, scholarly communication, discoverability, OPERAS, TRIPLE},
PAGES = {31-38},
URL = {http://amsacta.unibo.it/6712/1/AIUCD2021_BOA-versione3A.pdf},
DOI = {10.6092/unibo/amsacta/6712},
CONFERENCE_NAME = {AIUCD 2021-DH per la società: e-guaglianza, partecipazione, diritti e valori nell'era digitale},
BOOKTITLE = {AIUCD 2021-Book of Extended Abstracts. p. 624},
EDITOR = {Boschetti, F. and Del Grosso, A. M. and Salvatori, E.},
}
@INPROCEEDINGS{FERRETTI_2021_INPROCEEDINGS_FCCMDCM_395180,
AUTHOR = {Ferretti, M. and Chiarella, D. and Cutugno, P. and Marconi, L. and Di Feo, G. and Cerniglia, A. and Magrini, A.},
TITLE = {A linguistic and psychoacoustic study for questionnaire analysis: first results},
YEAR = {2021},
ABSTRACT = {This research is inspired by the consideration that language represents a significant dimension of perception and description of the soundscape. A language is a strategic tool that can consistently describe the qualities of physical acoustic environments, introducing an efficient metric to describe the sound perception by people. In this paper, we explore the possibility of using sentiment analysis for extracting the emotional impact of noise from lists of adjectives that describe sounds. To address this, an investigation campaign was conducted to identify the Italian adjectives that best describe the noise sources associated with port and retro-port infrastructures. 402 Italian university students responded to a listening experiment. They were asked to associate adjectives with audios. The association of these adjectives with the sources of sound formed the basis for sentiment analysis. Psychoacoustic parameters were calculated following measurements and processed for each of the sounds administered to look for possible correlations between the different perceptual aspects. The first results show how industrial or traffic sounds are as expected associated with negative sentiment whereas natural sounds evoke positive emotions. The proposed sentiment analysis, in connection with the psychoacoustic investigations developed, provides a framework for future research in the investigation of sound perception},
KEYWORDS = {Sound perception, Sentiment Analysis, Psychoacoustics, Acoustics, Synesthesia},
PAGES = {1181-1188},
URL = {https://www.iiav.org/icsv27/},
VOLUME = {1 (6)},
PUBLISHER = {Society of Acoustics (USA)},
ISBN = {978-83-7880-799-5},
CONFERENCE_NAME = {27th International Congress on Sound and Vibration (ICSV27)},
CONFERENCE_PLACE = {USA},
BOOKTITLE = {Proceedings of the 27th International Congress on Sound and Vibration},
}
@INPROCEEDINGS{GALLO_2021_INPROCEEDINGS_GBFFR_397311,
AUTHOR = {Gallo, G. and Buscemi, F. and Ferro, M. and Figuera, M. and Riela, P. M.},
TITLE = {Abstracting Stone Walls for Visualization and Analysis},
YEAR = {2021},
ABSTRACT = {An innovative abstraction technique to represent both mathematically and visually some geometric properties of the facing stones in a wall is presented. The technique has been developed within the W. A. L. (L) Project, an interdisciplinary effort to apply Machine Learning techniques to support and integrate archaeological research. More precisely the paper introduces an original way to "abstract" the complex and irregular 3D shapes of stones in a wall with suitable ellipsoids. A wall is first digitized into a unique 3D point cloud and it is successively segmented into the sub-meshes of its stones. Each stone mesh is then "summarized" by the inertial ellipsoid relative to the point cloud of its vertices. A wall is in this way turned into a "population" of ellipsoid shapes statistical properties of which may be processed with Machine Learning algorithms to identify typologies of the walls under study. The paper also reports two simple case studies to assess the effectiveness of the proposed approach},
KEYWORDS = {Quantitative archaeology, Data visualization, Machine learning in Cultural Heritage, Photogrammetry applied to archaeology},
PAGES = {215-222},
URL = {https://iris.cnr.it/handle/20.500.14243/397311},
VOLUME = {12667},
DOI = {10.1007/978-3-030-68787-8_15},
PUBLISHER = {Springer Nature Switzerland (Basel, CHE)},
ISBN = {978-3-030-68787-8},
CONFERENCE_PLACE = {Basel},
BOOKTITLE = {Pattern Recognition. ICPR International Workshops and Challenges},
EDITOR = {Del Bimbo, A. and Cucchiara, R. and Sclaroff, S. and Farinella, G. M. and Mei, T. and Bertini, M. and Escalante, H. J. and Vezzani, R.},
}
@INPROCEEDINGS{GIOVANNETTI_2021_INPROCEEDINGS_GABMPS_446010,
AUTHOR = {Giovannetti, E. and Albanesi, D. and Bellandi, A. and Marchi, S. and Papini, M. and Sciolette, F.},
TITLE = {The role of a computational lexicon for query expansion in full-text search},
YEAR = {2021},
ABSTRACT = {This work describes the first experiments conducted with a computational lexicon of Italian in a context of query expansion for full-text search. An application, composed of a graphical user interface and backend services to access the lexicon and the database containing the corpus to be queried, was developed. The text was morphologically analysed to improve the precision of the search process. Some examples of queries are given to show the potential of a text search approach supported by a complex and stratified lexical resource},
KEYWORDS = {full-text search, computational lexicon, query expansion},
PAGES = {162-168},
URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-85121247840\&origin=inward},
VOLUME = {3033},
DOI = {10.4000/books.aaccademia.10417},
PUBLISHER = {Accademia University Press (Torino, ITA)},
ISBN = {9791280136947},
CONFERENCE_NAME = {CLiC-it 2021 Italian Conference on Computational Linguistics 2021},
CONFERENCE_PLACE = {Torino},
BOOKTITLE = {Proceedings of the Eighth Italian Conference on Computational Linguistics (CLiC-it 2021)},
EDITOR = {Fersini, E. and Passarotti, M. and Patti, V.},
}
@INPROCEEDINGS{IAVARONE_2021_INPROCEEDINGS_IBD_440176,
AUTHOR = {Iavarone, B. and Brunato, D. and Dell'Orletta, F.},
TITLE = {Sentence Complexity in Context},
YEAR = {2021},
ABSTRACT = {We study the influence of context on how humans evaluate the complexity of a sentence in English. We collect a new dataset of sentences, where each sentence is rated for perceived complexity within different contextual windows. We carry out an in-depth analysis to detect which linguistic features correlate more with complexity judgments and with the degree of agreement among annotators. We train several regression models, using either explicit linguistic features or contextualized word embeddings, to predict the mean complexity values assigned to sentences in the different contextual windows, as well as their standard deviation. Results show that models leveraging explicit features capturing morphosyntactic and syntactic phenomena perform always better, especially when they have access to features extracted from all contextual sentences},
URL = {https://iris.cnr.it/handle/20.500.14243/440176},
DOI = {10.18653/v1/2021.cmcl-1.23},
ISBN = {978-1-954085-35-0},
}
@INPROCEEDINGS{IAVARONE_2021_INPROCEEDINGS_IMBGSVDG_445809,
AUTHOR = {Iavarone, B. and Morelli, M. S. and Brunato, D. and Ghiasi, S. and Scilingo, E. P. and Vanello, N. and Dell'Orletta, F. and Greco, A.},
TITLE = {Analyzing the Interaction between the Reader's Voice and the Linguistic Structure of the Text: a Preliminary Study},
YEAR = {2021},
ABSTRACT = {In this study, we present a preliminary analysis of the relationship between the linguistic profile of a text and the voice properties of the reader aiming to improve the speech-based emotion recognition systems. To this aim, we recorded the speech signals from a group of 32 healthy volunteers reading aloud neutral and affective texts and used the BioVoice toolbox to compute some of the main speech features. The selected texts were analyzed to quantify their lexical, morpho-syntactic, and syntactic content. Correlation and Support Vector Regressor analyses between linguistic and speech features have shown a significant modulation of some voice acoustic properties performed by the linguistic structure of the text. Particularly, a significant effect was shown on some specific speech features often used for the assessment of human emotional state (e. g., F0). This suggests that the lexical, morpho-syntactic, and syntactic properties could play an important role in the emotional dynamics of a person},
KEYWORDS = {Natural Language Processing, Speech analysis, linguistic profile},
URL = {https://iris.cnr.it/handle/20.500.14243/445809},
DOI = {10.36253/978-88-5518-449-6},
ISBN = {978-88-5518-448-9},
CONFERENCE_NAME = {12th INTERNATIONAL WORKSHOP "MODELS AND ANALYSIS OF VOCAL EMISSIONS FOR BIOMEDICAL APPLICATIONS"},
BOOKTITLE = {Proceedings of 12th INTERNATIONAL WORKSHOP "MODELS AND ANALYSIS OF VOCAL EMISSIONS FOR BIOMEDICAL APPLICATIONS"},
}
@INPROCEEDINGS{KELLI_2021_INPROCEEDINGS_KLKVLBMHDVTV_443454,
AUTHOR = {Kelli, A. and Lindén, K. and Kamocki, P. and Vider, K. and Labropoulou, P. and Birtonas, R. and Mantrov, V. and Hannesschläger, V. and Del Gratta, R. and Värv, A. and Tavits, G. and Vutt, A.},
TITLE = {The Interplay of Legal Regimes of Personal Data, Intellectual Property and Freedom of Expression in Language Research},
YEAR = {2021},
ABSTRACT = {Sometimes legal scholars get relevant but baffling questions from laypersons like: "The reference to a work is personal data, so does the GDPR actually require me to anonymise it? Or, as my voice data is personal data, does the GDPR automatically give me access to a speech recognizer using my voice sample? Or, can I say anything about myself without the GDPR requiring the web host to anonymise or remove the post? What can I say about others like politicians? And, what can researchers say about patients in a research report?" Based on these questions, the authors address the interaction of intellectual property and data protection law in the context of data minimisation and attribution rights, access rights, trade secret protection, and freedom of expression},
KEYWORDS = {Legal aspects, research data},
PAGES = {154-159},
URL = {https://office.clarin.eu/v/CE-2021-1923-CLARIN2021_ConferenceProceedings.pdf},
ISSN = {2021-1923},
CONFERENCE_NAME = {CLARIN Annual Conference 2021},
BOOKTITLE = {CLARIN Annual Conference 2021},
EDITOR = {Monachini, M. and Eskevich, M.},
}
@INPROCEEDINGS{MARTELLI_2021_INPROCEEDINGS_MNKTKGKNPOLKKDUSLVGLQMFTCSIM_443238,
AUTHOR = {Martelli, F. and Navigli, R. and Krek, S. and Tiberius, C. and Kallas, J. and Gantar, P. and Koeva, S. and Nimb, S. and Pedersen, B. S. and Olsen, S. and Langemets, M. and Koppel, K. and Üksik, T. and Dobrovoljc, K. and Ureña Ruiz, R. J. and Sancho Sánchez, J. L. and Lipp, V. and Váradi, T. and Győrffy, A. and László, S. and Quochi, V. and Monachini, M. and Frontini, F. and Tempelaars, R. and Costa, R. and Salgado, A. and Čibej, J. and Munda, T.},
TITLE = {Designing the ELEXIS Parallel Sense-Annotated Dataset in 10 European Languages},
YEAR = {2021},
ABSTRACT = {Over the course of the last few years, lexicography has witnessed the burgeoning of increasingly reliable automatic approaches supporting the creation of lexicographic resources such as dictionaries, lexical knowledge bases and annotated datasets. In fact, recent achievements in the field of Natural Language Processing and particularly in Word Sense Disambiguation have widely demonstrated their effectiveness not only for the creation of lexicographic resources, but also for enabling a deeper analysis of lexical-semantic data both within and across languages. Nevertheless, we argue that the potential derived from the connections between the two fields is far from exhausted. In this work, we address a serious limitation affecting both lexicography and Word Sense Disambiguation, i. e. the lack of high-quality sense-annotated data and describe our efforts aimed at constructing a novel entirely manually annotated parallel dataset in 10 European languages. For the purposes of the present paper, we concentrate on the annotation of morpho-syntactic features. Finally, unlike many of the currently available sense-annotated datasets, we will annotate semantically by using senses derived from high-quality lexicographic repositories},
KEYWORDS = {Digital lexicography, Word Sense Disambiguation, Computational Linguistics, Corpus Linguistics, Natural Language Processing},
PAGES = {377-395},
URL = {https://static-curis.ku.dk/portal/files/279888836/eLex_2021_22_pp377_395.pdf},
VOLUME = {2021},
PUBLISHER = {Lexical Computing (Brno, CZE)},
CONFERENCE_NAME = {eLex 2021},
CONFERENCE_PLACE = {Brno},
BOOKTITLE = {Electronic lexicography in the 21st century (eLex 2021): Post-editing lexicography},
}
@INPROCEEDINGS{MESSINA_2021_INPROCEEDINGS_MBCMPSN_400472,
AUTHOR = {Messina, L. and Busso, L. and Combei, C. R. and Miaschi, A. and Pannitto, L. and Sarti, G. and Nissim, M.},
TITLE = {A dissemination workshop for introducing young Italian students to NLP},
YEAR = {2021},
ABSTRACT = {We describe and make available the game-based material developed for a laboratory run at several Italian science festivals to popularize NLP among young students},
KEYWORDS = {nlp, teaching},
PAGES = {52-54},
URL = {https://www.aclweb.org/anthology/2021.teachingnlp-1.7},
ISBN = {978-1-954085-36-7},
CONFERENCE_NAME = {5th Workshop on Teaching NLP},
BOOKTITLE = {Proceedings of the 5th Workshop on Teaching NLP},
}
@INPROCEEDINGS{MIASCHI_2021_INPROCEEDINGS_MABDV_446048,
AUTHOR = {Miaschi, A. and Alzetta, C. and Brunato, D. and Dell'Orletta, F. and Venturi, G.},
TITLE = {Probing tasks under pressure},
YEAR = {2021},
ABSTRACT = {Probing tasks are frequently used to evaluate whether the representations of Neural Language Models (NLMs) encode linguistic information. However, it is still questioned if probing classification tasks really enable such investigation or they simply hint for surface patterns in the data. We present a method to investigate this question by comparing the accuracies of a set of probing tasks on gold and automatically generated control datasets. Our results suggest that probing tasks can be used as reliable diagnostic methods to investigate the linguistic information encoded in NLMs representations},
KEYWORDS = {Neural Language Models, Linguistic probing, Treebanks},
PAGES = {1-7},
URL = {http://ceur-ws.org/Vol-3033/paper29.pdf},
VOLUME = {3033},
CONFERENCE_NAME = {8th Italian Conference on Computational Linguistics (CLIC-it 2021)},
}
@INPROCEEDINGS{MIASCHI_2021_INPROCEEDINGS_MBDV_400474,
AUTHOR = {Miaschi, A. and Brunato, D. P. and Dell'Orletta, F. and Venturi, G.},
TITLE = {What Makes My Model Perplexed? A Linguistic Investigation on Neural Language Models Perplexity},
YEAR = {2021},
ABSTRACT = {This paper presents an investigation aimed at studying how the linguistic structure of a sentence affects the perplexity of two of the most popular Neural Language Models (NLMs), BERT and GPT-2. We first compare the sentence-level likelihood computed with BERT and the GPT-2's perplexity showing that the two metrics are correlated. In addition, we exploit linguistic features capturing a wide set of morpho-syntactic and syntactic phenomena showing how they contribute to predict the perplexity of the two NLMs},
KEYWORDS = {nlp, interpretability, deep learning},
PAGES = {40-47},
URL = {https://www.aclweb.org/anthology/2021.deelio-1.5},
ISBN = {978-1-954085-30-5},
CONFERENCE_NAME = {2nd Workshop on Knowledge Extraction and Integration for Deep Learning Architectures},
BOOKTITLE = {Proceedings of the 2nd Workshop on Knowledge Extraction and Integration for Deep Learning Architectures},
}
@INPROCEEDINGS{MIASCHI_2021_INPROCEEDINGS_MRD_443055,
AUTHOR = {Miaschi, A. and Ravelli, A. A. and Dell'Orletta, F.},
TITLE = {Evaluating Transformer Models for Punctuation Restoration in Italian},
YEAR = {2021},
ABSTRACT = {In this paper, we propose an evaluation of a Transformer-based punctuation restoration model for the Italian language. Experimenting with a BERT-base model, we perform several fine-tuning with different training data and sizes and tested them in an in- and cross-domain scenario. Moreover, we offer a comparison in a multilingual setting with the same model fine-tuned on English transcriptions. Finally, we conclude with an error analysis of the main weaknesses of the model related to specific punctuation marks},
KEYWORDS = {transformer models, nlp, punctuation restoration},
URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-85121647978\&origin=inward},
VOLUME = {3015},
CONFERENCE_NAME = {5th Workshop on Natural Language for Artificial Intelligence (NL4AI 2021)},
}
@INPROCEEDINGS{MONACHINI_2021_INPROCEEDINGS_MSCPB_446737,
AUTHOR = {Monachini, M. and Stamuli, M. F. and Calamai, S. and Pretto, N. and Bianchi, S.},
TITLE = {The Grey-side of Audio Archives},
YEAR = {2021},
ABSTRACT = {Archives often include documents that can hardly be considered publications or grey literature as such, yet they maintain their documentary value and play a role of primary sources for the specialists. These documents, indeed, can help archivists to reveal the sedimentation process of the archive itself and to preserve the authentic context of the documentary production. They also appear to be very useful for the community of researchers and scholars. This happens more frequently with oral archives which include 'non-conventional sources', thus bringing together audio documents, fieldworks notes, correspondence, slipcases, analogic compact cassettes or open reels. At the cross-road of two disciplines, Archival Science and Grey Literature, this paper aims to argue the applicability of the concept of grey literature to this wide range of documentary materials, by showing the experience of Archivio Vi.Vo., a regional project aiming at building a model for archiving, preserving, managing and disseminating audio documents},
KEYWORDS = {oral archives, infrastructures},
PAGES = {34-37},
URL = {https://iris.cnr.it/handle/20.500.14243/446737},
VOLUME = {22},
ISSN = {1386-2316},
ISBN = {978-90-77484-38-8},
CONFERENCE_NAME = {Twenty-Second International Conference on Grey Literature-Applications of Grey Literature for Science and Society},
CONFERENCE_PLACE = {Amsterdam},
BOOKTITLE = {THE GL-CONFERENCE SERIES. CONFERENCE PROCEEDINGS},
}
@INPROCEEDINGS{NAHLI_2021_INPROCEEDINGS_ND_394192,
AUTHOR = {Nahli, O. and Del Grosso, A. M.},
TITLE = {Creating Arabic Lexical Resources in TEI; A Schema for Discontinuous Morphology Encoding},
YEAR = {2021},
ABSTRACT = {An Arabic word can be described according to its lexical and morphological information. Lexical analysis consists in gathering both semantic information (meaning and translation) and syntactic properties (parts of speech). Morphological analysis, instead, identifies word patterns that group the words having the same syntactic, inflectional and semantic behaviour. Such descriptions constitute two different but complementary levels of study. This paper illustrates our work, aimed at creating an exhaustive resource consisting of two levels: lexical and morphological. The lexical level collects information extracted from the dictionary al=qāmūs al=muḥīṭ. The morphological level describes the word patterns. The two levels are autonomous but complementary. Each word described at the lexical level is linked to its corresponding pattern. The formalization of the word pattern makes it possible to enrich word descriptions with additional morphosyntactic and inflectional information. To obtain a digital systematic resource, we followed the guidelines provided by the Text Encoding Initiative (TEI). We adopted the TEI module devoted to encoding digital dictionaries and lexicons in order to formally represent the medieval primary source al=qāmūs al=muḥīṭ. We also used the TEI interpretation approach to encode the morphological word patterns keeping the two levels separate but at the same time allowing them to be linked},
KEYWORDS = {classical Arabic dictionary, digital lexicography, al=qamus al=muHiyT, word patterns, TEI},
PAGES = {178-187},
URL = {https://ieeexplore.ieee.org/stamp/stamp.jsp?tp=\&arnumber=9357273},
DOI = {10.1109/CiSt49399.2021.9357273},
PUBLISHER = {IEEE},
ISBN = {978-1-7281-6646-9},
CONFERENCE_NAME = {IEEE-CIST2020 DPWH},
CONFERENCE_PLACE = {Agadir - Essaouira, Morocco},
BOOKTITLE = {2020 6TH IEEE CONGRESS ON INFORMATION SCIENCE AND TECHNOLOGY (IEEE CIST'20)},
}
@INPROCEEDINGS{PANNITTO_2021_INPROCEEDINGS_PBCMMSN_400471,
AUTHOR = {Pannitto, L. and Busso, L. and Combei, C. R. and Messina, L. and Miaschi, A. and Sarti, G. and Nissim, M.},
TITLE = {Teaching NLP with Bracelets and Restaurant Menus: An Interactive Workshop for Italian Students},
YEAR = {2021},
ABSTRACT = {Although Natural Language Processing is at the core of many tools young people use in their everyday life, high school curricula (in Italy) do not include any computational linguistics education. This lack of exposure makes the use of such tools less responsible than it could be, and makes choosing computational linguistics as a university degree unlikely. To raise awareness, curiosity, and longer-term interest in young people, we have developed an interactive workshop designed to illustrate the basic principles of NLP and computational linguistics to high school Italian students aged between 13 and 18 years. The workshop takes the form of a game in which participants play the role of machines needing to solve some of the most common problems a computer faces in understanding language: from voice recognition to Markov chains to syntactic parsing. Participants are guided through the workshop with the help of instructors, who present the activities and explain core concepts from computational linguistics. The workshop was presented at numerous outlets in Italy between 2019 and 2020, both face-to-face and online},
KEYWORDS = {nlp, teaching},
PAGES = {160-170},
URL = {https://www.aclweb.org/anthology/2021.teachingnlp-1.26},
ISBN = {978-1-954085-36-7},
CONFERENCE_NAME = {5th Workshop on Teaching NLP},
BOOKTITLE = {Proceedings of the 5th Workshop on Teaching NLP},
}
@INPROCEEDINGS{PROIETTI_2021_INPROCEEDINGS_PC_441147,
AUTHOR = {Proietti, C. and Chiarella, D.},
TITLE = {Measuring bi-polarization with argument graphs},
YEAR = {2021},
ABSTRACT = {Multi-agent models play a significant role in testing hypotheses about the unfolding of opinion dynamics in complex social networks. The model of the Argument Communication Theory of Bi-polarization (ACTB), developed by Maes and Flache (2013), shows that simple circulation of arguments among individuals in a group can determine strong differentiation of opinions (bi-polarization effects) even with a small degree of homophily. The ACTB model and similar ones have nevertheless one limitation: given a topic of discussion, only direct pro and con arguments for it are considered. This does not allow to account for the topology of a more complex debate, where arguments may also interact indirectly with the topic at stake. This gap can be filled by using Quantitative Bipolar Argument Frameworks (QBAF). More specifically, by applying measures of argument strength for QBAFs in order to calculate the agents' opinion. In the present paper we generalize the ACTB measure of opinion strength to acyclic bipolar graphs and compare it with other measures from the literature. We then present a revised version of the ACTB model, where the agents' knowledge bases are structured as subgraphs of an underlying global knowledge base (described as a QBAF). We first test that the predictions of the ACTB model are confirmed when the underlying QBAF contains only direct pro and con arguments for a topic. We then explore more complex topologies of debate with two additional batches of simulations. Our first results show that changing the topology, while keeping the same number of pro and con arguments, has no significant impact on bi-polarization dynamics},
KEYWORDS = {bi-polarization, abstract argumentation, opinion dynamics, multi-agent modelling},
PAGES = {13},
URL = {https://ceur-ws.org/Vol-3086/},
CONFERENCE_NAME = {20th International Conference Italian Association for Artificial Intelligence-5th Workshop on Advances in Argumentation in Artificial Intelligence},
BOOKTITLE = {Advances in Argumentation in Artificial Intelligence 2021},
}
@INPROCEEDINGS{PUCCETTI_2021_INPROCEEDINGS_PMD_400473,
AUTHOR = {Puccetti, G. and Miaschi, A. and Dell'Orletta, F.},
TITLE = {How do BERT embeddings organize linguistic knowledge?},
YEAR = {2021},
ABSTRACT = {Several studies investigated the linguistic information implicitly encoded in Neural Language Models. Most of these works focused on quantifying the amount and type of information available within their internal representations and across their layers. In line with this scenario, we proposed a different study, based on Lasso regression, aimed at understanding how the information encoded by BERT sentence-level representations is arranged within its hidden units. Using a suite of several probing tasks, we showed the existence of a relationship between the implicit knowledge learned by the model and the number of individual units involved in the encodings of this competence. Moreover, we found that it is possible to identify groups of hidden units more relevant for specific linguistic properties},
KEYWORDS = {NLP, Interpretability, Deep Learning},
PAGES = {48-57},
URL = {https://www.aclweb.org/anthology/2021.deelio-1.6},
DOI = {10.18653/v1/2021.deelio-1.6},
ISBN = {978-1-954085-30-5},
CONFERENCE_NAME = {2nd Workshop on Knowledge Extraction and Integration for Deep Learning Architectures},
BOOKTITLE = {Proceedings of the 2nd Workshop on Knowledge Extraction and Integration for Deep Learning Architectures},
}
@INPROCEEDINGS{RICCUCCI_2021_INPROCEEDINGS_RDVC_420367,
AUTHOR = {Riccucci, M. and Del Grosso, A. M. and Valecchi, F. and Causarano, G.},
TITLE = {Testimoniare il Lager: l'informatica al servizio della memoria},
YEAR = {2021},
ABSTRACT = {Il contributo illustra il lavoro condotto in seno al progetto di ricerca Voci dall'inferno: le parole per dirlo, condotto e coordinato da Marina Riccucci (Università di Pisa) con il supporto del Dott. Angelo Mario Del Grosso (Università di Pisa) e della Prof.ssa Frida Valecchi. Nel caso specifico sarà dedicata particolare attenzione alla rappresentazione digitale XML-TEI di una testimonianza manoscritta inedita di una donna sopravvissuta alla deportazione in Lager, nonché allo sviluppo di un componente innovativo per l'elaborazione dei documenti digitali, integrato nell'applicazione web Memoriarchivio-software creato specificamente per Voci dall'inferno e che rappresenta un fondamentale strumento per archiviare e analizzare le risorse testuali oggetto d'analisi},
KEYWORDS = {italianistica digitale, codifica del testo, testimonianze, lager, lessico dantesco, XML-TEI, Saxon-js},
PAGES = {567-572},
URL = {http://amsacta.unibo.it/6712/1/AIUCD2021_BOA-versione3A.pdf#page=583},
DOI = {10.6092/unibo/amsacta/6712},
ISBN = {9788894253559},
CONFERENCE_NAME = {AIUCD 2021-DH per la società: e-guaglianza, partecipazione, diritti e valori nell'era digitale-DHs for society: e-quality, participation, rights and values in the Digital Age},
BOOKTITLE = {AIUCD 2021-DH per la società: e-guaglianza, partecipazione, diritti e valori nell'era digitale-DHs for society: e-quality, participation, rights and values in the Digital Age. Book of extended abstracts of the 10th national conference},
}
@INPROCEEDINGS{RUSSO_2021_INPROCEEDINGS_R_505402,
AUTHOR = {Russo, I.},
TITLE = {archer at SemEval-2021 task 1: Contextualising lexical complexity},
YEAR = {2021},
ABSTRACT = {Evaluating the complexity of a target word in a sentential context is the aim of the Lexical Complexity Prediction task at SemEval-2021. This paper presents the system created to assess single words lexical complexity, combining linguistic and psycholinguistic variables in a set of experiments involving random forest and XGboost regressors. Beyond encoding out-of-context information about the lemma, we implemented features based on pre-trained language models to model the target word’s in-context complexity},
KEYWORDS = {lexical complexity},
PAGES = {694-699},
URL = {https://iris.cnr.it/handle/20.500.14243/505402},
CONFERENCE_NAME = {15th International Workshop on Semantic Evaluation (SemEval-2021)},
BOOKTITLE = {Proceedings of the 15th International Workshop on Semantic Evaluation (SemEval-2021)},
}
@INPROCEEDINGS{SANNA_2021_INPROCEEDINGS_SCBN_387253,
AUTHOR = {Sanna, A. and Cinerari, R. and Boschetti, F. and Nahli, O.},
TITLE = {Digitizing and Encoding a Multilingual Literary Review: Commerce Numerique},
YEAR = {2021},
ABSTRACT = {Commerce was an important literary review founded in Paris by Princess Margherita Caetani, Prince Roffredo Caetani's wife. Born in America, she was polyglot and maecenas. Between 1924 and 1932 she surrounded herself with three prestigious collaborators: Paul Valéry, Léon-Paul Fargue, Valery Larbaud. The review promoted the translation of World and European literature in French, translating some of the most important authors like Joyce, T. S. Eliot, Pirandello, Ungaretti, Saint-John Perse, Rilke, Hofmannsthal. The aim of this project is to promote by digitizing the dissemination of the review, to develop studies and research concerning the Caetani family's cultural activities in Europe. All the volumes of the literary review Commerce have been scanned, acquired by OCR and encoded in TEI-XML. The cultural value of the operation is discussed and the work-flow to create the digital textual corpus is described in detail},
KEYWORDS = {Review Commerce, OCR, TEI encoding, literary review, digital resources},
PAGES = {204-207},
URL = {https://ieeexplore.ieee.org/document/9357208},
DOI = {10.1109/CIST49399.2021.9357208},
PUBLISHER = {IEEE},
ISBN = {978-1-7281-6646-9},
CONFERENCE_NAME = {IEEE-CIST2020 DPWH},
CONFERENCE_PLACE = {Agadir - Essaouira, Morocco},
BOOKTITLE = {2020 6TH IEEE CONGRESS ON INFORMATION SCIENCE AND TECHNOLOGY (IEEE CIST'20)},
}
@INPROCEEDINGS{SARTI_2021_INPROCEEDINGS_SBD_440173,
AUTHOR = {Sarti, G. and Brunato, D. and Dell'Orletta, F.},
TITLE = {That Looks Hard: Characterizing Linguistic Complexity in Humans and Language Models},
YEAR = {2021},
ABSTRACT = {This paper investigates the relationship between two complementary perspectives in the human assessment of sentence complexity and how they are modeled in a neural language model (NLM). The first perspective takes into account multiple online behavioral metrics obtained from eye-tracking recordings. The second one concerns the offline perception of complexity measured by explicit human judgments. Using a broad spectrum of linguistic features modeling lexical, morpho-syntactic, and syntactic properties of sentences, we perform a comprehensive analysis of linguistic phenomena associated with the two complexity viewpoints and report similarities and differences. We then show the effectiveness of linguistic features when explicitly leveraged by a regression model for predicting sentence complexity and compare its results with the ones obtained by a fine-tuned neural language model. We finally probe the NLM's linguistic competence before and after fine-tuning, highlighting how linguistic information encoded in representations changes when the model learns to predict complexity},
KEYWORDS = {linguistic complexity, eyetracking, human evaluation},
PAGES = {48-60},
URL = {https://aclanthology.org/2021.cmcl-1.5},
DOI = {10.18653/v1/2021.cmcl-1.5},
ISBN = {978-1-954085-35-0},
CONFERENCE_NAME = {Workshop on Cognitive Modeling and Computational Linguistics (CMCL 2021)},
BOOKTITLE = {Proceedings of the Workshop on Cognitive Modeling and Computational Linguistics},
}
@INPROCEEDINGS{SASSOLINI_2021_INPROCEEDINGS_SBDGM_401787,
AUTHOR = {Sassolini, E. and Biffi, M. and De Blasi, F. and Guadagnini, E. and Montemagni, S.},
TITLE = {La digitalizzazione del GDLI: un approccio linguistico per la corretta acquisizione del testo?},
YEAR = {2021},
ABSTRACT = {In questo articolo sono discussi metodi e strategie in via di elaborazione per la correzione (propedeutica alla successiva strutturazione) dei contenuti del Grande dizionario della lingua italiana (GDLI) fondato da Salvatore Battaglia, estratti da un formato digitale non standard. La presenza, in questo formato, di errori distribuiti di vario tipo ha condizionato la scelta dell'approccio all'estrazione e messo in luce tutte le difficoltà dell'operazione. Le sperimentazioni fatte sino a oggi portano a privilegiare una strategia di correzione multilivello, che procede scomponendo in sezioni distinte l'individuazione e la correzione degli errori, in modo da rendere gestibili interventi complessi di correzione semi-automatica, altrimenti improponibili, e consentire un loro raffinamento progressivo. Parallelamente alla definizione di regole di riconoscimento di struttura e formato, stiamo analizzando metodi e procedure in grado di migliorare la qualità dell'input e specializzare i moduli di estrazione per i singoli campi della voce a partire dal "lemma". Le finalità del lavoro sono duplici: l'estrazione e strutturazione dei contenuti e la produzione di un formato standard di rappresentazione dei dati. Si tratta di un percorso difficile perché il formato dei dati rende l'uso di strumenti reperibili in letteratura non applicabile. Solamente al termine del lavoro potremo capire se esistono le condizioni per trasformare l'approccio adottato in un protocollo di intervento replicabile},
KEYWORDS = {dizionari digitali, risorse linguistiche, estrazione dell'informazione, correzione del testo post OCR},
PAGES = {159-166},
URL = {https://aiucd2021.labcd.unipi.it/wp-content/uploads/2021/05/AIUCD2021_BOA-versione3A.pdf},
DOI = {10.6092/unibo/amsacta/6712},
ISBN = {9788894253559},
CONFERENCE_NAME = {AIUCD 2021-DH per la società: e-guaglianza, partecipazione, diritti e valori nell'era digitale},
}
@INPROCEEDINGS{TAXITARI_2021_INPROCEEDINGS_TCFMNP_423945,
AUTHOR = {Taxitari, L. and Cappa, C. and Ferro, M. and Marzi, C. and Nadalini, A. and Pirrelli, V.},
TITLE = {Using mobile technology for reading assessment},
YEAR = {2021},
ABSTRACT = {The enormous potential of Information and Communication Technologies (ICT) for addressing critical educational issues is generally acknowledged, but its use in the assessment of the complex skills of reading and understanding a text has been very limited to date. The paper contrasts traditional reading assessment protocols with ReadLet, an ICT platform with a tablet front-end, designed to support online monitoring of silent and oral reading abilities in early graders. ReadLet makes use of cloud computing and mobile technology for large-scale data collection and allows the time alignment of the child's reading behaviour with texts tagged using Natural Language Processing (NLP) tools. Initial findings replicate established benchmarks from the psycholinguistic literature on reading in both typically and atypically developing children, making the application a new ground-breaking approach in the evaluation of reading skills},
KEYWORDS = {reading assessment, reading research, mobile technology, NLP, cloud computing, special education needs},
PAGES = {1-6},
URL = {http://www.ieee.ma/cist20/component/content/?id=26\&Itemid=185},
ISBN = {9781728166469},
CONFERENCE_NAME = {6th IEEE Congress on Information Science \& Technology (IEEE CIST'20)},
BOOKTITLE = {Proceedings of the 6th IEEE Congress on Information Science and Technology (CiSt)},
}
@INPROCEEDINGS{VAGIONAKIS_2021_INPROCEEDINGS_VDBBDMM_449230,
AUTHOR = {Vagionakis, I. and Del Gratta, R. and Boschetti, F. and Baroni, P. and Del Grosso, A. M. and Mancinelli, T. and Monachini, M.},
TITLE = {'Cretan Institutional Inscriptions' Meets CLARIN-IT},
YEAR = {2021},
ABSTRACT = {This paper describes a project in the domain of Digital Epigraphy named 'Cretan Institutional Inscriptions' and developed at the Ca' Foscari University of Venice. The project is supported by CLARIN-IT as part of the actions addressed to initiatives, projects and events in the field of Humanities and Social Sciences. The main goal is to make the project visible through CLARIN channels with the hope that it will be a forerunner for other digital epigraphy projects in CLARIN. The article illustrates also the dockerization process applied to the 'Cretan Institutional Inscriptions' project, currently hosted on the CLARIN-IT servers},
KEYWORDS = {Digital Epigraphy, Digital Classics, Ancient Greek, Crete, Institutions, Text Encoding Initiative, TEI, EpiDoc, EpiDoc Front-End Services, EFES, Virtual Language Observatory, Dockerization, ILC4CLARIN, CLARIN-IT, CLARIN},
PAGES = {48-53},
URL = {https://office.clarin.eu/v/CE-2021-1923-CLARIN2021_ConferenceProceedings.pdf},
NOTE = {CLARIN document CE-2021-1923},
CONFERENCE_NAME = {CLARIN Annual Conference 2021},
BOOKTITLE = {Proceedings of CLARIN Annual Conference 2021 (Virtual Edition)},
EDITOR = {Monachini, M. and Eskevich, M.},
}
@INPROCEEDINGS{AIOLA_2021_INPROCEEDINGS_AADL_447062,
AUTHOR = {Aiola, C. and Andreini, G. and Di Donato, F. and Lombardo, T.},
TITLE = {Sharing Knowledge Digitally. The Muruca case study},
YEAR = {2021},
ABSTRACT = {In this poster we present the evolution of Muruca, a platform that has been conceived as a framework to allow Digital Humanities researchers and research teams to create, curate and share their own Digital Editions. The poster describes the main features of the framework, its evolution over the years in synergy with the researchers' needs and with the progress of technologies and policies, and the open challenges and opportunities of the framework in a European context},
KEYWORDS = {open culture, digital humanities, digital libraries, digital editions, electronic objects},
PAGES = {428-431},
URL = {https://aiucd2021.labcd.unipi.it/wp-content/uploads/2021/01/27_Aiola-AIUCD2021_presentation_46.pdf},
DOI = {10.6092/unibo/amsacta/6712},
ISBN = {9788894253559},
CONFERENCE_NAME = {AIUCD 2021-DH per la società: e-guaglianza, partecipazione, diritti e valori nell'era digitale},
}
@INPROCEEDINGS{BELLANDI_2021_INPROCEEDINGS_BGMPS_446104,
AUTHOR = {Bellandi, A. and Giovannetti, E. and Marchi, S. and Piccini, S. and Sciolette, F.},
TITLE = {Fostering the Collaborative Creation of Linguistic Linked Open Data with LexO, an open source Editor of Multilingual Lexicons and Terminologies},
YEAR = {2021},
ABSTRACT = {In the context of the Semantic Web and the linguistic linked open data paradigm, we propose LexO, a web editor of computational lexicons and terminologies based on the OntoLex-Lemon model},
KEYWORDS = {LexO, Linguistic Linked Open Data, Semantic Web, Computational Lexicography, Terminology, CLARIN},
PAGES = {436-439},
URL = {https://aiucd2021.labcd.unipi.it/book-of-abstracts/},
CONFERENCE_NAME = {AIUCD 2021-DH per la società: e-guaglianza, partecipazione, diritti e valori nell'era digitale},
BOOKTITLE = {DHs for society: e-quality, participation, rights and values in the Digital Age},
}
@INPROCEEDINGS{CARDILLO_2021_INPROCEEDINGS_CDS_448228,
AUTHOR = {Cardillo, F. A. and Di Ludovico, A. and Straccia, U.},
TITLE = {Mathematical investigation of Glyptic Iconographies: a new synthesis},
YEAR = {2021},
ABSTRACT = {The huge and long-lasting production of cylinder seals in ancient Western Asia is one of the most typical features which characterized its civilizations along almost three millennia. In the history of the past experiences of quantitative research on artefacts and visual languages of pre-classical Near and Middle East the cylinder seals have played a major role. This is probably due to the long life of these products, but also to their peculiar functions and to some technical issues, like, e.g., the physical constraints bound to the shape and dimensions of these objects. This paper presents an approach to Mesopotamian glyptic iconography which is, on one hand, the evolution of the application of long tested mathematical methods integrated with new ones, and, on the other hand, the possible starting point for new ways of approaching the interpretation and classification of the figurative languages represented in cylinder seals' carvings},
KEYWORDS = {Artificial intelligence, Computational archaeology, Fuzzy logic},
URL = {https://www.orientlab.net/icaane/12icaane/12icaane/proceedings.html},
ISBN = {978-3-447-11873-6},
CONFERENCE_NAME = {ICAANE 2021-12th International Congress on the Archaeology of the Ancient Near East},
BOOKTITLE = {Proceedings of the 12th International Congress on the Archaeology of the Ancient Near East},
}
@INPROCEEDINGS{CARDILLO_2021_INPROCEEDINGS_CS_448749,
AUTHOR = {Cardillo, F. A. and Straccia, U.},
TITLE = {Learning fuzzy concept inclusions from OWL real-valued data},
YEAR = {2021},
URL = {https://iris.cnr.it/handle/20.500.14243/448749},
}
@INPROCEEDINGS{MARINETTI_2021_INPROCEEDINGS_MMQBBDPRS_449219,
AUTHOR = {Marinetti, A. and Murano, F. and Quochi, V. and Ballerini, M. and Boschetti, F. and Del Grosso, A. M. and Piccini, S. and Rigobianco, L. and Solinas, P.},
TITLE = {Languages and Cultures of Ancient Italy. Historical Linguistics and Digital Models},
YEAR = {2021},
ABSTRACT = {The abstract accompanies a poster presenting an overview of the project "Languages and cultures of Ancient Italy", which had just started. The project brings together competences from Historical Linguistics, Computational Lexicography and Digital Humanities. The main objective of the project is to investigate the cultures of ancient Italy on the basis of their linguistic documentation (7th-1st c. B.C.) by means of digital tools specifically tailored for their peculiarities},
KEYWORDS = {digital epigraphy, computational lexicons, text-lexicon linking, restsprachen, digital models, digital humanities},
PAGES = {528-532},
URL = {https://amsacta.unibo.it/id/eprint/6712/},
ISBN = {9788894253559},
CONFERENCE_NAME = {10th National Conference of Associazione per l'Informatica Umanistica e la Cultura Digitale},
BOOKTITLE = {AIUCD 2021-Book of Extended Abstracts},
}
@INPROCEEDINGS{MARZI_2021_INPROCEEDINGS_MTFNP_426392,
AUTHOR = {Marzi, C. and Taxitari, L. and Ferro, M. and Nadalini, A. and Pirrelli, V.},
TITLE = {Valutare la lettura "in tempo reale": un esempio di integrazione tra linguistica computazionale e linguistica applicata},
YEAR = {2021},
ABSTRACT = {In anni recenti, linguistica computazionale e linguistica applicata hanno ampliato i loro rispettivi ambiti d'indagine, utilizzando l'ontologia formale della linguistica teorica e i modelli cognitivi della psicolinguistica per studiare le difficoltà che i parlanti incontrano nello svolgimento di "compiti" linguistici specifici. Nell'ambito della lettura, le tecnologie per il Trattamento Automatico del Linguaggio (TAL) si sono dimostrate capaci di classificare il livello di leggibilità di un testo, basandosi sulla distribuzione di alcuni parametri linguistici in testi pre-classificati per età dei lettori destinatari, o per grado di scolarità, o per livello di sviluppo cognitivo. Ad esempio, parole o frasi più lunghe, o parole più rare tendono a distribuirsi in testi di più difficile comprensione, o destinati a lettori più maturi. E' possibile così assegnare a un testo, o a ogni singola frase, un punteggio di leggibilità in funzione (inversa) della complessità lessicale, morfologica, sintattica o pragmatica dell'unità testuale analizzata. In Linguistica Applicata (LA) la valutazione della difficoltà di lettura ha seguito un approccio funzionale. Nel modello semplice di lettura, ad esempio, la capacità di leggere un testo è analizzata come il prodotto dell'interazione tra decodifica e comprensione. Attraverso l'osservazione di un campione di bambini impegnati nella lettura, è possibile valutare la loro fluenza in decodifica, gli errori di decodifica e comprensione, e l'efficacia di percorsi educativi personalizzati. La piattaforma ReadLet è stata sviluppata con l'obiettivo di integrare l'approccio classificatorio del TAL con quello funzionale della LA. Il bambino legge un breve testo visualizzato sullo schermo di un tablet, ad alta voce o in modalità silente. In entrambi i casi, al bambino viene chiesto di "tenere il segno" con il dito sullo schermo nel corso della lettura. 
La traccia tattile è registrata e allineata con il testo visualizzato sullo schermo mediante un algoritmo di convoluzione. Al contempo, il testo è annotato automaticamente per tratti linguistici. Alla fine della sessione di lettura silente, il bambino risponde ad alcune semplici domande sul contenuto del testo. I dati raccolti consentono di valutare le difficoltà (rallentamenti o errori) che il bambino incontra nella lettura, e di mettere in relazione "in tempo reale" queste difficoltà con aspetti linguistici specifici del testo. Un'analisi preliminare dei dati raccolti da ReadLet su oltre 400 allievi di alcune scuole elementari toscane e della Svizzera italiana, ha evidenziato il differente "passo" di lettura tra lettori con sviluppo tipico e atipico, e il peso che variabili come lunghezza, frequenza e lessicalità hanno su profili di lettura individuali e aggregati. La possibilità di "controllare" automaticamente la distribuzione di queste variabili nel testo e di correlarle con le difficoltà del singolo bambino consente, infine, di somministrare testi con livelli di difficoltà gradualmente crescenti, rendendo possibili percorsi personalizzati di potenziamento},
KEYWORDS = {reading assessment, reading strategies, NLP, ICT mobile technologies},
PAGES = {5},
URL = {https://iris.cnr.it/handle/20.500.14243/426392},
VOLUME = {2021},
CONFERENCE_NAME = {XXI Congresso Internazionale di AItLA},
BOOKTITLE = {FARE LINGUISTICA APPLICATA CON LE DIGITAL HUMANITIES},
}
@TECHREPORT{ALBANESI_2021_TECHREPORT_ABCPGS_446083,
AUTHOR = {Albanesi, D. and Bellandi, A. and Colombo, M. and Papini, M. and Giovannetti, E. and Sciolette, F.},
TITLE = {Traduco: l'Applicazione Web Linguistico-Computazionale per il Progetto di Traduzione del Talmud Babilonese-Rapporto tecnico 19},
YEAR = {2021},
ABSTRACT = {La presente relazione tecnico-scientifica descrive l'attività svolta da ILC-CNR nel contesto del Progetto Traduzione Talmud Babilonese nel periodo novembre 2020-aprile 2021. Le principali attività tecniche svolte sul sistema Traduco sono state la risoluzione di bug, l'implementazione di nuove funzionalità richieste e lo sviluppo di una nuova interfaccia grafica utente. Le attività di ricerca sono state condotte, in continuità a quelle descritte nel rapporto precedente, nella rappresentazione del lessico, della terminologia e della conoscenza del Talmud},
KEYWORDS = {Linguistica Computazionale, Traduzione di Testi Religiosi, Traduzione Assistita dal Calcolatore, Traduzione Collaborativa, Lessici elettronici, rappresentazione della conoscenza},
PAGES = {28},
URL = {https://iris.cnr.it/handle/20.500.14243/446083},
}
@TECHREPORT{ALBANESI_2021_TECHREPORT_ABCPGS_446085,
AUTHOR = {Albanesi, D. and Bellandi, A. and Colombo, M. and Papini, M. and Giovannetti, E. and Sciolette, F.},
TITLE = {Traduco: l'Applicazione Web Linguistico-Computazionale per il Progetto di Traduzione del Talmud Babilonese-Rapporto tecnico 20},
YEAR = {2021},
ABSTRACT = {La presente relazione tecnico-scientifica descrive l'attività svolta da ILC-CNR nel contesto del Progetto Traduzione Talmud Babilonese nel periodo maggio 2021-ottobre 2021. Le principali attività tecniche svolte sul sistema Traduco sono state la risoluzione di bug e l'implementazione di nuove funzionalità richieste. Parallelamente, sono proseguite le attività volte alla visualizzazione di risorse testuali e linguistiche tramite grafi e per la conversione e l'utilizzo del lessico computazionale PSC a supporto di ricerca "full-text" sul testo talmudico italiano},
KEYWORDS = {Traduzione Assistita dal Calcolatore, Traduzione Collaborativa, Lessici elettronici, rappresentazione della conoscenza, Linguistica Computazionale, traduzione di testi religiosi},
PAGES = {20},
URL = {https://iris.cnr.it/handle/20.500.14243/446085},
}
@TECHREPORT{ALBANESI_2021_TECHREPORT_AGPS_446086,
AUTHOR = {Albanesi, D. and Giovannetti, E. and Papini, M. and Sciolette, F.},
TITLE = {Traduco: l'Applicazione Web Linguistico-Computazionale per il Progetto di Traduzione del Talmud Babilonese-rapporto integrativo 3},
YEAR = {2021},
ABSTRACT = {La presente relazione tecnico-scientifica descrive l'attività svolta da ILC-CNR nel contesto delle attività di progetto previste dalla convenzione integrativa stipulata tra PTTB e ILC-CNR in data 10/07/2018 e condotte nel periodo febbraio 2020-gennaio 2021},
KEYWORDS = {Linguistica Computazionale, Traduzione di Testi Religiosi, Traduzione Assistita dal Calcolatore, Traduzione Collaborativa, Sviluppo front-end, lessici computazionali},
PAGES = {17},
URL = {https://iris.cnr.it/handle/20.500.14243/446086},
}
@TECHREPORT{ALRAHABI_2021_TECHREPORT_ABFPJBKG_394923,
AUTHOR = {Alrahabi, M. and Brando, C. and Frontini, F. and Provenier, A. and Jalabert, R. and Bordry, M. and Koskas, C. and Gawley, J.},
TITLE = {Guide d'annotation manuelle d'entités nommées dans des corpus littéraires},
YEAR = {2021},
ABSTRACT = {Guide d'annotation manuelle d'entités nommées dans des corpus littéraires Campagne d'annotation OBVIL 2019-2021},
KEYWORDS = {NER},
URL = {https://hal.archives-ouvertes.fr/hal-03156278},
}
@TECHREPORT{BANDINI_2021_TECHREPORT_BBN_461479,
AUTHOR = {Bandini, M. and Boschetti, F. and Nahli, O.},
TITLE = {How to encode the literary French journal Commerce using TEI},
YEAR = {2021},
ABSTRACT = {This technical report aims to show all the steps followed to encode the literary journal Commerce according to the TEI P5 Guidelines. Commerce is a literary French journal founded in 1924 by Paul Valéry, Léon-Paul Fargue, and Valery Larbaud, composed of 29 volumes published between 1924 and 1932. Each volume collects different literary material from various well-known and unknown writers as poems or novels which are all translations into French. In detail, with this paper we want to provide a guideline for the encoding of the volumes, showing all the tags and attributes which should be used and many examples taken from the XML of volumes number 5 and 6. This report is the result of work done in collaboration with the University of Pisa and the Institute for Computational Linguistics "A. Zampolli" CNR Pisa},
URL = {https://iris.cnr.it/handle/20.500.14243/461479},
}
@TECHREPORT{DIDONATO_2021_TECHREPORT_DDLKOTCCEMDT_433201,
AUTHOR = {Di Donato, F. and Dumouchel, S. and Lombardo, T. and Katsaloulis, I. and Ocansey Joshua, T. and Thiel, C. and Capelli, L. and Chen, Y. and Eskevich, M. and Moranville, Y. and De Santis, L. and Tóthczifra, E.},
TITLE = {TRIPLE Deliverable: D6.2 Report on Procedure to Follow to Be Part of the EOSC Catalogue},
YEAR = {2021},
ABSTRACT = {The 6.2 Deliverable presents the procedure to onboard the future GoTriple platform into the EOSC catalogue. This deliverable is supposed to guide the TRIPLE consortium in the purpose of adding a SSH discovery platform to the EOSC catalogue but it can also guide other service providers for their own purposes, especially services that are made with different components. Part 1 of this deliverable provides an overview of the GoTriple platform and the five innovative services that are integrated into it, e.g. ScaR, MEOH App, Visualisation components, Pundit, and Head Start. As those innovative services are independent tools, the perspectives, challenges and potential solutions of their onboarding into the EOSC catalogue are discussed in detail on a case-by-case basis. Part 2 contains the core information of this deliverable. First, an overview of the three main steps in the onboarding process (2.1.) provides the overall context of the task. Second, the timeline of all needed steps (already taken and planned closer to the end of the project) to define the final federation that will serve as GoTriple provider is outlined (2.2). Essentially, all project partners that are committed to continue their support of the developed service after the project will be identified as GoTriple providers in the EOSC portal, while the GoTriple discovery service will be part of the OPERAS Research Infrastructure's catalogue. Third, the details of the resource profile that are mandatory and optional, are listed according to the set of fields in the EOSC portal. Part 3 summarises the two main steps in the roadmap for integration which are planned to take place in September 2021 and March 2023. In conclusion, the authors highlight the fact that the EOSC development is an ongoing process, and therefore, the current report reflects the procedures and planning steps that are valid at this point of time and fit the current requirements},
KEYWORDS = {EOSC, GoTRIPLE},
URL = {https://zenodo.org/record/5702705#.YZYgApDMKHs},
}
@TECHREPORT{LAZZERI_2021_TECHREPORT_LTPAABBCCCCCCCDDDFFFGGGKLLMNOOPPPPRRRSSSSTTVVZ_442328,
AUTHOR = {Lazzeri, E. and Tanlongo, F. and Pavone, G. and Alpi, F. and Ansuini, A. and Bertazzon, E. and Bonaccorsi, D. and Cappelluti, F. and Casati, S. and Castelli, D. and Cippitani, R. and Colcelli, V. and Costantini, A. and Cozzini, S. and Degl'Innocenti, E. and Di Donato, F. and Di Giorgio, S. and Fava, I. and Fiore, S. and Forni, M. and Galimberti, G. and Giglia, E. and Giorgetti, A. and Kurapati, S. and Landoni, M. and Lavitrano, M. and Marras, C. and Niccolucci, F. and Occioni, M. and Osmenaj, E. and Paolini, G. and Pasquale, V. and Petrillo, C. and Pugliese, R. and Ripepi, E. and Rivoira, G. and Rossi, G. and Salon, S. and Sarretta, A. and Sartori, A. and Spiga, D. and Tamagno, D. and Tammaro, A. and Vellico, M. and Vignocchi, M. and Zane, D.},
TITLE = {Competence Centre ICDI per Open Science, FAIR, ed EOSC-Mission, strategia e piano d'azione},
YEAR = {2021},
ABSTRACT = {This document presents the mission and strategy of the Italian Competence Centre on Open Science, FAIR, and EOSC. The Competence Centre is an initiative born within the Italian Computing and Data Infrastructure (ICDI), a forum created by representatives of major Italian Research Infrastructures and e-Infrastructures, with the aim of promoting synergies at the national level, and optimising the Italian participation to European and global challenges in this field, including the European Open Science Cloud (EOSC), the European Data Infrastructure (EDI) and HPC. This working paper depicts the mission and objectives of the ICDI Competence Centre, a network of experts with various skills and competences that are supporting the national stakeholders on topics related to Open Science, FAIR principles application and participation to the EOSC. The different actors and roles are described in the document as well as the activities and services offered, and the added value each stakeholder can find in the Competence Centre. The tools and services provided, in particular the concept for the portal, through which the Centre will connect to the national landscape and users, are also presented. An English translation of this document is provided in Zenodo: Lazzeri, Emma, et al. (2021). ICDI Competence Centre for Open Science, FAIR and EOSC-Mission, Strategy and Action Plan. Zenodo. https://doi.org/10.5281/zenodo.5512638},
KEYWORDS = {EOSC, Competence Centre, ICDI, Open Science, FAIR, EDI, HPC},
PAGES = {13},
URL = {https://doi.org/10.32079/ISTI-TR-2022/022},
DOI = {10.32079/ISTI-TR-2022/022},
}
@TECHREPORT{SAYERS_2021_TECHREPORT_SSHAAABBBCECDDDDDFFGGGGHLLJJKKMMMMMNRPSASSSTYBCCLKRP_444079,
AUTHOR = {Sayers, D. and Sousa-Silva, R. and Höhn, S. and Ahmedi, L. and Allkivi-Metsoja, K. and Anastasiou, D. and Beňuš, Š. and Bowker, L. and Bytyçi, E. and Catala, A. and Çepani, A. and Chacón-Beltrán, R. and Dadi, S. and Dalipi, F. and Despotovic, V. and Doczekalska, A. and Drude, S. and Fort, K. and Fuchs, R. and Galinski, C. and Gobbo, F. and Gungor, T. and Guo, S. and Höckner, K. and Láncos, P. and Libal, T. and Jantunen, T. and Jones, D. and Klimova, B. and Korkmaz, E. and Maučec, M. S. and Melo, M. and Meunier, F. and Migge, B. and Mititelu, V. B. and Névéol, A. and Rossi, A. and Pareja-Lora, A. and Sanchez-Stockhammer, C. and Şahin, A. and Soltan, A. and Soria, C. and Shaikh, S. and Turchi, M. and Yildirim Yayilgan, S. and Bessa, M. and Cabral, L. and Coler, M. and Liebeskind, C. and Kernerman, I. and Rousi, R. and Prys, C.},
TITLE = {The Dawn of the Human-Machine Era: A forecast of new and emerging language technologies},
YEAR = {2021},
ABSTRACT = {New language technologies are coming, thanks to the huge and competing private investment fuelling rapid progress; we can either understand and foresee their effects, or be taken by surprise and spend our time trying to catch up. This report sketches out some transformative new technologies that are likely to fundamentally change our use of language. Some of these may feel unrealistically futuristic or far-fetched, but a central purpose of this report-and the wider LITHME network-is to illustrate that these are mostly just the logical development and maturation of technologies currently in prototype. But will everyone benefit from all these shiny new gadgets? Throughout this report we emphasise a range of groups who will be disadvantaged and issues of inequality. Important issues of security and privacy will accompany new language technologies. A further caution is to re-emphasise the current limitations of AI. Looking ahead, we see many intriguing opportunities and new capabilities, but a range of other uncertainties and inequalities. New devices will enable new ways to talk, to translate, to remember, and to learn. But advances in technology will reproduce existing inequalities among those who cannot afford these devices, among the world's smaller languages, and especially for sign language. Debates over privacy and security will flare and crackle with every new immersive gadget. We will move together into this curious new world with a mix of excitement and apprehension-reacting, debating, sharing and disagreeing as we always do. Plug in, as the human-machine era dawns},
KEYWORDS = {language technologies, human-machine communication},
URL = {https://doi.org/10.17011/jyx/reports/20210518/1},
DOI = {10.17011/jyx/reports/20210518/1},
}
@MISC{BARONI_2021_MISC_B_461443,
AUTHOR = {Baroni, P.},
TITLE = {DiPText-KC Web Site},
YEAR = {2021},
ABSTRACT = {Web Site of the CLARIN Knowledge Centre for Digital and Public Textual Scholarship, powered by WordPress, developed in English},
KEYWORDS = {CLARIN, Knowledge Centre, Digital and Public Textual Scholarship},
URL = {https://diptext-kc.clarin-it.it},
}
@MISC{BOSCHETTI_2021_MISC_BD_462933,
AUTHOR = {Boschetti, F. and Del Grosso, A. M.},
TITLE = {Problemi tecnici e questioni teoriche nella gestione degli archivi digitali di testi},
YEAR = {2021},
ABSTRACT = {Il seminario illustra alcune potenzialità offerte dalla rappresentazione digitale di testi d'interesse umanistico. Si prenderà spunto dall'archivio di testi latini conservato e fruibile dalla piattaforma Musisque Deoque per poi passare ad alcuni esempi di indagine condotti mediante il linguaggio di interrogazione XQuery},
KEYWORDS = {Digital Humanities, Filologia Digitale, Filologia Computazionale, MQDQ, Archivi Digitali di Testi, XML/TEI},
URL = {https://iris.cnr.it/handle/20.500.14243/462933},
}
@MISC{BROEDER_2021_MISC_B_441098,
AUTHOR = {Broeder, F. F. G. M.},
TITLE = {SSHOC Multilingual Data Stewardship Terminology},
YEAR = {2021},
ABSTRACT = {The SSHOC Multilingual Data Stewardship Terminology is a multilingual terminology that collects terms specific to the domain of Data Stewardship, as well as their definitions. A list of domain-specific terms was automatically extracted from a corpus pertaining to the domain of Data Stewardship and Curation, validated by domain experts, assigned a definition, and linked to other existing terminologies (Loterre Open Science Thesaurus, terms4FAIRskills, Linked Open Vocabularies, ISO terms and definitions). Each term-definition pair was then automatically translated into multiple languages (Dutch, French, German, Greek, Italian, Slovenian) by employing Deep-L. The Multilingual Data Stewardship Terminology thus consists of 210 concepts available in Dutch, French, German, Greek, Italian, Slovenian. This resource was created within the frame of the SSHOC (Social Sciences and Humanities Open Cloud) project (H2020-INFRAEOSC-2018-2-823782). It is the result of the work of Task 3.1.2 "extraction of terminology from technical documentation about standards and interoperability", as described in D3.9, carried out jointly by ILC-CNR and CLARIN ERIC},
URL = {https://iris.cnr.it/handle/20.500.14243/441098},
}
@MISC{DELGROSSO_2021_MISC_D_462935,
AUTHOR = {Del Grosso, A. M.},
TITLE = {How to leverage Domain-Driven Design to foster Digital Scholarly Editing and DSL},
YEAR = {2021},
ABSTRACT = {The field of digital scholarly editing is deemed to be particularly challenging from a software engineering point of view. Indeed, after decades of research activities, computational philology still lacks effective tools and efficient procedures organized in common interfaces, decoupled application services and domain-specific commodities. As a matter of fact, there is neither convergence on how to model software applications to meet philological requirements nor traditional philologists fully satisfied with the current digital solutions. By adopting the Domain Driven Design approach, we start our modeling activities by defining the problem space of our domain which, in turn, is broken into small components (called sub-domains) to progressively refine the ongoing digital models. In this way, together with the experts, we are able to identify the main capabilities of the field we want to model and strive to design coherent domain-specific solutions for such capabilities (bounded contexts)},
KEYWORDS = {Digital Humanities, Domain-Driven Design, Digital Philology, Euporia, Domain-Specific Languages},
URL = {https://easychair.org/cfp/EUPORIA2021},
CONFERENCE_NAME = {EUPORIA2021: Webinars in Theories and Practices of the Annotation through Domain-Specific Languages},
}
@MISC{DELGROSSO_2021_MISC_D_462934,
AUTHOR = {Del Grosso, A. M.},
TITLE = {Preparing the XML-TEI text for Euporia},
YEAR = {2021},
ABSTRACT = {Seminario introduttivo alla codifica XML/TEI per la rappresentazione digitale di testi d'interesse storico, letterario e umanistico},
KEYWORDS = {Digital Humanities, Euporia, Filologia Digitale, XML/TEI, CoPhiLab},
URL = {https://cophilab.ilc.cnr.it/euporia-2021/},
}
@MISC{DELGROSSO_2021_MISC_D_462936,
AUTHOR = {Del Grosso, A. M.},
TITLE = {La codifica testuale delle testimonianze inedite, manoscritte, audio e video},
YEAR = {2021},
ABSTRACT = {Il contributo intende illustrare gli aspetti più significativi della rappresentazione digitale delle testimonianze sia scritte sia orali, inquadrando la proposta in una prospettiva infrastrutturale e di sostenibilità delle risorse digitali prodotte},
KEYWORDS = {Digital Humanities, Informatica Umanistica, Archivi Digitali, Voci dall'Inferno, XML/TEI},
URL = {https://www.unipi.it/index.php/archivio/event/6081-voci-dall-inferno-le-testimonianze-dei-sopravvissuti-ai-lager},
CONFERENCE_NAME = {Voci dall'Inferno. Le testimonianze dei sopravvissuti ai Lager},
}
@MISC{DELGROSSO_2021_MISC_DT_462929,
AUTHOR = {Del Grosso, A. M. and Tessarolo, L.},
TITLE = {Lavori in corso: trasferimento di competenze per una re-ingegnerizzazione del sistema la "galassia MQDQ"},
YEAR = {2021},
ABSTRACT = {L'intervento illustra le attività in corso presso il centro VeDPH dell'Università Ca' Foscari di Venezia informate dal progetto di visiting scholar tra il dipartimento di Scienze Umane e l'Istituto di Linguistica Computazionale CNR-ILC volto alla reingegnerizzazione della tecnologia su cui poggiano i progetti della galassia Musisque Deoque (MQDQ)},
KEYWORDS = {Digital Humanities, Archivi Digitali Latini, MQDQ, XML/TEI, Filologia Co},
URL = {https://iris.cnr.it/handle/20.500.14243/462929},
CONFERENCE_NAME = {Biblioteche digitali di testi latini in Italia. Per un progetto di archivio comune},
}
@MISC{DIDONATO_2021_MISC_DL_431593,
AUTHOR = {Di Donato, F. and Lazzeri, E.},
TITLE = {Horizon Europe: L'Open Science e la nuova normalità},
YEAR = {2021},
ABSTRACT = {Nel programma quadro Horizon Europe, l'adozione dell'Open Science e delle sue pratiche è un requisito fondamentale. Questo evento, rivolto a ricercatori, tecnologi e personale di supporto alla ricerca, intende fornire gli elementi introduttivi per comprendere come rispondere in modo adeguato alle nuove richieste introdotte dalla Commissione europea. In particolare ci concentreremo sugli elementi fondamentali della comunicazione scientifica, sulla definizione di scienza aperta e dei suoi elementi fondanti, e su come l'Open Science sta cambiando il paradigma di valutazione della ricerca. Programma-Modulo 1. 0: Intro e warm-up-Modulo 1. 1: La valutazione della ricerca e l'Open Science-Modulo 1. 2: Comunicazione scientifica e Open Science-Domande-Modulo 1. 3: Open Science e Horizon Europe-Domande-Chiusura lavori},
KEYWORDS = {open science, Horizon Europe, valutazione},
URL = {https://doi.org/10.5281/zenodo.5604541},
DOI = {10.5281/zenodo.5604541},
}
@MISC{DIDONATO_2021_MISC_DL_431592,
AUTHOR = {Di Donato, F. and Lazzeri, E.},
TITLE = {Data Management},
YEAR = {2021},
ABSTRACT = {The Data Management course has been organised by AREA Science Park and tailored to their researchers and support research staff. The course is focused on FAIR data management and introduces to all aspects of Open Science and provides the skills, tools and standards required to embed Open Science in the research workflow. It has been structured in 4 on-line training modules, each one built on 20 mins sub-modules of frontal lessons and on several interactions. The structure of the 4 modules is the following: Module 1: An Introduction to Open Science and Open Data (2hrs) Module 2: Open Science in Horizon Europe, the FAIR principles and Open data (4 hrs) Module 3: Data Management Plans (3hrs) Module 4: Data Management Plans and Metadata schemas (3hrs) Materials of each module start with MX. 0. A readme file is associated with each module},
KEYWORDS = {open science, research data management},
URL = {https://doi.org/10.5281/zenodo.5575096},
DOI = {10.5281/zenodo.5575096},
}
@MISC{DIDONATO_2021_MISC_DL_440560,
AUTHOR = {Di Donato, F. and Lazzeri, E.},
TITLE = {Open Science e Research Data Management},
YEAR = {2021},
ABSTRACT = {Materiale didattico per il Corso di alta formazione ORMA (aprile-maggio 2021), durata: 10 ore},
URL = {https://iris.cnr.it/handle/20.500.14243/440560},
}
@MISC{ERJAVEC_2021_MISC_EOOLSGRPKBSVDDJHNCDVMLCAFMQVRMBSRDUPBKMBCDLR_446080,
AUTHOR = {Erjavec, T. and Ogrodniczuk, M. and Osenova, P. and Ljubešić, N. and Simov, K. and Grigorova, V. and Rudolf, M. and Pančur, A. and Kopp, M. and Barkarson, S. and Steingrímsson, S. and Van Der Pol, H. and Depoorter, G. and De Does, J. and Jongejan, B. and Haltrup Hansen, D. and Navarretta, C. and Calzada Pérez, M. and D De Macedo, L. and Van Heusden, R. and Marx, M. and Çöltekin, Ç. and Coole, M. and Agnoloni, T. and Frontini, F. and Montemagni, S. and Quochi, V. and Venturi, G. and Ruisi, M. and Marchetti, C. and Battistoni, R. and Sebők, M. and Ring, O. and Darģis, R. and Utka, A. and Petkevičius, M. and Briedienė, M. and Krilavičius, T. and Morkevičius, V. and Bartolini, R. and Cimino, A. and Diwersy, S. and Luxardo, G. and Rayson, P.},
TITLE = {Multilingual comparable corpora of parliamentary debates ParlaMint 2.1},
YEAR = {2021},
ABSTRACT = {ParlaMint 2.1 is a multilingual set of 17 comparable corpora containing parliamentary debates mostly starting in 2015 and extending to mid-2020, with each corpus being about 20 million words in size. The sessions in the corpora are marked as belonging to the COVID-19 period (after November 1st 2019), or being "reference" (before that date). The corpora have extensive metadata, including aspects of the parliament; the speakers (name, gender, MP status, party affiliation, party coalition/opposition); are structured into time-stamped terms, sessions and meetings; with speeches being marked by the speaker and their role (e.g. chair, regular speaker). The speeches also contain marked-up transcriber comments, such as gaps in the transcription, interruptions, applause, etc. Note that some corpora have further information, e.g. the year of birth of the speakers, links to their Wikipedia articles, their membership in various committees, etc. The corpora are encoded according to the Parla-CLARIN TEI recommendation (https://clarin-eric.github.io/parla-clarin/), but have been validated against the compatible, but much stricter ParlaMint schemas. This entry contains the ParlaMint TEI-encoded corpora with the derived plain text version of the corpus along with TSV metadata on the speeches. Also included is the 2.0 release of the data and scripts available at the GitHub repository of the ParlaMint project. Note that there also exists the linguistically marked-up version of the corpus, which is available at http://hdl.handle.net/11356/1431},
URL = {https://iris.cnr.it/handle/20.500.14243/446080},
}
@MISC{ERJAVEC_2021_MISC_EOOLSGRPKBSVDDJHNCDVMLCAFMQVRMBSRDUPBKMBCDLR_446076,
AUTHOR = {Erjavec, T. and Ogrodniczuk, M. and Osenova, P. and Ljubešić, N. and Simov, K. and Grigorova, V. and Rudolf, M. and Pančur, A. and Kopp, M. and Barkarson, S. and Steingrímsson, S. and Van Der Pol, H. and Depoorter, G. and De Does, J. and Jongejan, B. and Haltrup Hansen, D. and Navarretta, C. and Calzada Pérez, M. and D De Macedo, L. and Van Heusden, R. and Marx, M. and Çöltekin, Ç. and Coole, M. and Agnoloni, T. and Frontini, F. and Montemagni, S. and Quochi, V. and Venturi, G. and Ruisi, M. and Marchetti, C. and Battistoni, R. and Sebők, M. and Ring, O. and Darģis, R. and Utka, A. and Petkevičius, M. and Briedienė, M. and Krilavičius, T. and Morkevičius, V. and Bartolini, R. and Cimino, A. and Diwersy, S. and Luxardo, G. and Rayson, P.},
TITLE = {Linguistically annotated multilingual comparable corpora of parliamentary debates ParlaMint.ana 2.1},
YEAR = {2021},
ABSTRACT = {ParlaMint 2.1 is a multilingual set of 17 comparable corpora containing parliamentary debates mostly starting in 2015 and extending to mid-2020, with each corpus being about 20 million words in size. The sessions in the corpora are marked as belonging to the COVID-19 period (from November 1st 2019), or being "reference" (before that date). The corpora have extensive metadata, including aspects of the parliament; the speakers (name, gender, MP status, party affiliation, party coalition/opposition); are structured into time-stamped terms, sessions and meetings; with speeches being marked by the speaker and their role (e.g. chair, regular speaker). The speeches also contain marked-up transcriber comments, such as gaps in the transcription, interruptions, applause, etc. Note that some corpora have further information, e.g. the year of birth of the speakers, links to their Wikipedia articles, their membership in various committees, etc. The corpora are encoded according to the Parla-CLARIN TEI recommendation (https://clarin-eric.github.io/parla-clarin/), but have been validated against the compatible, but much stricter ParlaMint schemas. This entry contains the linguistically marked-up version of the corpus, while the text version is available at http://hdl.handle.net/11356/1432. The ParlaMint.ana linguistic annotation includes tokenization, sentence segmentation, lemmatisation, Universal Dependencies part-of-speech, morphological features, and syntactic dependencies, and the 4-class CoNLL-2003 named entities. Some corpora also have further linguistic annotations, such as PoS tagging or named entities according to language-specific schemes, with their corpus TEI headers giving further details on the annotation vocabularies and tools},
KEYWORDS = {covid-19, ParlaCLARIN, CLARIN, linguistic annotation, pos-tagging, Named Entity Recognition, linguistic dependency annotation, UD, dibattiti parlamentari, parlamenti, discorso politico},
URL = {https://iris.cnr.it/handle/20.500.14243/446076},
}
@MISC{FRONTINI_2021_MISC_F_399153,
AUTHOR = {Frontini, M. E.},
TITLE = {SSHOC'ing drama in the cloud},
YEAR = {2021},
ABSTRACT = {At LIBER 2021 Online Conference, CLARIN and SSHOC presented a webinar showcasing how SSH researchers can benefit from the resources and services offered by SSH research infrastructures in order to produce and exploit highly encoded historical textual data. After the webinar, the participants were able to successfully guide and advise SSH researchers (with a particular focus on literature studies) in their choice amongst existing resources and tools, based on their research question},
URL = {https://iris.cnr.it/handle/20.500.14243/399153},
}
@MISC{GIGLIA_2021_MISC_GLD_431590,
AUTHOR = {Giglia, E. and Lazzeri, E. and Di Donato, F.},
TITLE = {Scienza aperta e gestione dei dati per le scienze umane e del patrimonio culturale},
YEAR = {2021},
ABSTRACT = {Corso tenuto per gli istituti CNR di area umanistica, maggio-giugno 2021. Modulo1: Open Science, perché serve; il diritto d'autore; come siamo arrivati alla comunicazione scientifica attuale Modulo 2: Open Access e politiche europee Modulo 3: Gestione dei dati e dati FAIR Modulo 4: Data management plan ed esempi concreti Moduli 5-8: presentazione delle infrastrutture di ricerca, CLARIN, DARIAH, OPERAS, ERHIS, Parthenos, Ariadne},
KEYWORDS = {open science, fair data, humanities},
URL = {https://zenodo.org/record/5497914#.YjCP05PMJfU},
}
@MISC{GUADAGNINI_2021_MISC_G_447012,
AUTHOR = {Guadagnini, E.},
TITLE = {Hélène Miesse, Un laboratorio di carte. Il linguaggio della politica nel «carteggio» di Francesco Guicciardini},
YEAR = {2021},
KEYWORDS = {Guicciardini, lessico, politica},
PAGES = {206-212},
URL = {https://iris.cnr.it/handle/20.500.14243/447012},
VOLUME = {85},
ISSN = {0035-1458},
}
@MISC{GUADAGNINI_2021_MISC_G_447010,
AUTHOR = {Guadagnini, E.},
TITLE = {Marco Tullio Cicerone (attr.), Rettorica nova},
YEAR = {2021},
ABSTRACT = {Scheda relativa alla "Rettorica nova", presente nella lista dei libri posseduti da Leonardo},
KEYWORDS = {Leonardo, Cicerone, Retorica},
PAGES = {187-189},
URL = {https://bibliotecadileonardo.museogalileo.it/index.php/esplora/scheda/La%20biblioteca/61572},
PUBLISHER = {Giunti (Firenze, ITA)},
ISBN = {9788809897786},
CONFERENCE_PLACE = {Firenze},
EDITOR = {Vecce, C.},
}
@MISC{LAZZERI_2021_MISC_LTPAABBCCCCCCCDDDFFFGGGKLLMNOOPPPPRRRSSSSTTVVZ_435530,
AUTHOR = {Lazzeri, E. and Tanlongo, F. and Pavone, G. and Alpi, F. and Ansuini, A. and Bertazzon, E. and Bonaccorsi, D. and Cappelluti, F. and Casati, S. and Castelli, D. and Cippitani, R. and Colcelli, V. and Costantini, A. and Cozzini, S. and Degl'Innocenti, E. and Di Donato, F. and Di Giorgio, S. and Fava, I. and Fiore, S. and Forni, M. and Galimberti, G. and Giglia, E. and Giorgetti, A. and Kurapati, S. and Landoni, M. and Lavitrano, M. and Marras, C. and Niccolucci, F. and Occioni, M. and Osmenaj, E. and Paolini, G. and Pasquale, V. and Petrillo, C. and Pugliese, R. and Ripepi, E. and Rivoira, G. and Rossi, G. and Salon, S. and Sarretta, A. and Sartori, A. and Spiga, D. and Tamagno, D. and Tammaro, A. M. and Vellico, M. and Vignocchi, M. and Zane, D.},
TITLE = {ICDI Competence Centre for Open Science, FAIR and EOSC-Mission, Strategy and Action Plan},
YEAR = {2021},
ABSTRACT = {This document presents the mission and strategy of the Italian Competence Centre on Open Science, FAIR, and EOSC. The Competence Centre is an initiative born within the Italian Computing and Data Infrastructure (ICDI), a forum created by representatives of major Italian Research Infrastructures and e-Infrastructures, with the aim of promoting synergies at the national level, and optimising the Italian participation to European and global challenges in this field, including the European Open Science Cloud (EOSC), the European Data Infrastructure (EDI) and HPC. This working paper depicts the mission and objectives of the ICDI Competence Centre, a network of experts with various skills and competencies that are supporting the national stakeholders on topics related to Open Science, FAIR principles application and participation to the EOSC. The different actors and roles are described in the document as well as the activities and services offered, and the added value each stakeholder can find in the Competence Centre. The tools and services provided, in particular the concept for the portal, through which the Centre will connect to the national landscape and users, are also presented. This record is the English translation of the original Italian (2021). Competence Centre ICDI per Open Science, FAIR, ed EOSC-Mission, Strategia e piano d'azione. Zenodo},
KEYWORDS = {EOSC, Competence Centre, ICDI, Open Science, FAIR, EDI, HPC},
URL = {https://doi.org/10.5281/zenodo.5071055},
DOI = {10.5281/zenodo.5071055},
ISBN = {9786526304839},
}
@MISC{LAZZERI_2021_MISC_LTPAABBCCCCCCCDDDFFFGGGKLLMNOOPPPPRRRSSSSTTVVZ_442324,
AUTHOR = {Lazzeri, E. and Tanlongo, F. and Pavone, G. and Alpi, F. and Ansuini, A. and Bertazzon, E. and Bonaccorsi, D. and Cappelluti, F. and Casati, S. and Castelli, D. and Cippitani, R. and Colcelli, V. and Costantini, A. and Cozzini, S. and Degl'Innocenti, E. and Di Donato, F. and Di Giorgio, S. and Fava, I. and Fiore, S. and Forni, M. and Galimberti, G. and Giglia, E. and Giorgetti, A. and Kurapati, S. and Landoni, M. and Lavitrano, M. and Marras, C. and Niccolucci, F. and Occioni, M. and Osmenaj, E. and Paolini, G. and Pasquale, V. and Petrillo, C. and Pugliese, R. and Ripepi, E. and Rivoira, G. and Rossi, G. and Salon, S. and Sarretta, A. and Sartori, A. and Spiga, D. and Tamagno, D. and Tammaro, A. and Vellico, M. and Vignocchi, M. and Zane, D.},
TITLE = {ICDI Competence Centre for Open Science, FAIR and EOSC-Mission, strategy and action plan},
YEAR = {2021},
ABSTRACT = {This document presents the mission and strategy of the Italian Competence Centre on Open Science, FAIR, and EOSC. The Competence Centre is an initiative born within the Italian Computing and Data Infrastructure (ICDI), a forum created by representatives of major Italian Research Infrastructures and e-Infrastructures, with the aim of promoting synergies at the national level, and optimising the Italian participation to European and global challenges in this field, including the European Open Science Cloud (EOSC), the European Data Infrastructure (EDI) and HPC. This working paper depicts the mission and objectives of the ICDI Competence Centre, a network of experts with various skills and competencies that are supporting the national stakeholders on topics related to Open Science, FAIR principles application and participation to the EOSC. The different actors and roles are described in the document as well as the activities and services offered, and the added value each stakeholder can find in the Competence Centre. The tools and services provided, in particular the concept for the portal, through which the Centre will connect to the national landscape and users, are also presented. This record is the English translation of the original Italian (2021). Competence Centre ICDI per Open Science, FAIR, ed EOSC-Mission, Strategia e piano d'azione. Zenodo. https://doi.org/10.5281/zenodo.5071055},
KEYWORDS = {EOSC, Competence Centre, ICDI, Open Science, FAIR, EDI, HPC},
PAGES = {7},
URL = {https://doi.org/10.32079/ISTI-TR-2021/023},
DOI = {10.32079/ISTI-TR-2021/023},
}
@MISC{MATHIAK_2021_MISC_MBJNHTDDJJWHFACABCJKP_431676,
AUTHOR = {Mathiak, Brigitte and Juty, Nick and Heger, Tina and Donato, D. and Di Donato, F. and Jeschke, Jonathan and Widmann, Heinrich and Flügel, Annalena and Culina, Antica and Bardi, A. and Colomb, Julien and Kraker, Peter},
TITLE = {Stocktaking GO FAIR Discovery IN-Use cases, infrastructure (0.95)},
YEAR = {2021},
ABSTRACT = {In order to build a better ecosystem for data discovery tools the Data Discovery Implementation Group of GO Fair (https://www.go-fair.org/implementation-networks/overview/discovery) collected use cases between 2019 and 2020 from a variety of sources. We also detail the 'Actors' for these use cases and the 'Source' providing links, whenever possible. Since we found over a hundred individual use cases, we decided to cluster them to provide a better overview. The clustering, as well as the results of a small survey among data infrastructure specialists to find how they rate the importance of the clusters are detailed in the documentation to this dataset, a draft of which can currently be found here. The code and data to produce the figures in the documentation are available as R code in the GO_FAIR_Discovery_Use_case-master.zip file. The use cases themselves are available as Excel sheet and csv},
KEYWORDS = {discovery, gofair},
URL = {https://doi.org/10.5281/zenodo.5211196},
DOI = {10.5281/zenodo.5211196},
}
@MISC{PROVOST_2021_MISC_P_475250,
AUTHOR = {Provost, L. M.},
TITLE = {TRIPLE Training activities on Open Science and the EOSC},
YEAR = {2021},
ABSTRACT = {In the last years, Open Science made a significant headway in European research policy and advocacy. Alongside the benefits of working towards enabling “open by default” in all disciplines, this momentum led to a complex, increasingly crowded and multidimensional landscape of Open Science enablers, infrastructures and policies. Questions of what exactly are we talking about when talking about the EOSC, how to navigate the latest generation of discovery services or whether to find no author-facing-fee OA funding schemes became recurrent points of discussions even among those who are actively involved in implementing certain aspects of the European OS roadmap. TRIPLE is a H2020 project with a primary aim of developing a discovery platform for SSH. Within TRIPLE, we found it important to dedicate a specific task force to pave the way towards exchange and a shared understanding of the latest European Open Science advancements, filtered by the TRIPLE project perspective. Despite the original intention to address our events only to Consortium members, we decided to open them to the community and to focus on topics which have relevance for specific TRIPLE’s activities and tasks (i.e. the EOSC onboarding), and on services and solutions which are of interest to the whole community (i.e. Open Research Europe, and the EOSC state-of-the-art and objectives). The presentation will specifically focus on: the synergies that have been implemented with the main RIs in the SSH field (OPERAS, CLARIN, CESSDA, DARIAH) and with training coordinators communities (EOSC Skills and Training Working Group, OpenAIRE CoP of Training coordinators, SSHOC Training community, ICDI Competence Center) the strategies adopted to a) provide support to TRIPLE members on Open Science and the EOSC via adequate training; b) engage new potential interested audiences in TRIPLE’s events; c) produce FAIR training materials, to ensure their reusability by the general public},
KEYWORDS = {TRIPLE, Training, Open Science, Horizon 2020},
URL = {https://iris.cnr.it/handle/20.500.14243/475250},
DOI = {10.5281/ZENODO.5544032},
CONFERENCE_NAME = {Open Science FAIR 2021},
}
@MISC{SALVATORI_2021_MISC_SBD_446344,
AUTHOR = {Salvatori, E. and Boschetti, F. and Del Grosso, A. M.},
TITLE = {A un anno da AIUCD2021},
YEAR = {2021},
KEYWORDS = {Digital Humanities, AIUCD},
PAGES = {1--4},
URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-85127630558\&origin=inward},
VOLUME = {2021},
DOI = {10.6092/issn.2532-8816/14209},
ISSN = {2532-8816},
}
@MISC{TESSAROLO_2021_MISC_TDB_455961,
  title    = {florilegiasyriaca},
  author   = {Tessarolo, L. and Del Grosso, A. M. and Boschetti, F.},
  year     = {2021},
  url      = {https://www.florilegiasyriaca.eu/},
  keywords = {ERC, Digital Humanities, Digital Philology, FLOS, DSL-based DSE},
  abstract = {Il portale di produzione e fruizione delle edizioni dei testi critici restituiti al pubblico durante il lavoro del team del progetto ERC 758732-FLOS},
}
@MISC{ZENZARO_2021_MISC_ZBD_420370,
AUTHOR = {Zenzaro, S. and Boschetti, F. and Del Grosso, A. M.},
TITLE = {Domain Specific Languages on editing papyri: the GreekSchools case study},
YEAR = {2021},
ABSTRACT = {Within the ERC AdG 885222-GreekSchools we aim to manage the edit of multiple papyrologic texts: diplomatic and literary editions and the corresponding apparatuses and their translations. To endow scholars with automatic consistency and coherence of editorial choices and to support the whole editing process, we leverage Domain Specific Languages (DSLs): a formal language definition in a bounded domain. Digital text editing can be handled in multiple ways depending on the editorial purpose. We identify four possible editing approaches to digital textual scholarship: (1) word processor; (2) structured text (e.g. XML); (3) GUI-centric; (4) domain specific language (DSL). Each of them has pros and cons. In particular we analyse five dimensions: familiarity, compactness, completeness, data elaboration support, and the need of technical training. With familiarity we refer to how much the scholar can avoid shifting his established working paradigm/environment. Compactness is the ratio between quantity of information and formalisation size. Completeness refers to the information the content represents. The capability to extract or deduce information from the data is addressed by data elaboration support. Finally, we consider important to evaluate the amount of technical training for text editing. For example, structured texts grant completeness of information, while requiring extensive technical training. In this context only the DSL approach encompasses all these dimensions while the other approaches compromises on some of them. We propose a DSL-based editor that will support and improve the editing workflow in the context of the ERC project},
KEYWORDS = {Digital Humanities, Digital Papyrology, GreekSchools, Computational philology},
URL = {https://www.clarin.eu/content/clarin-bazaar-2021#data-curation-using-nlp},
CONFERENCE_NAME = {CLARIN Annual Conference 2021},
}
@MISC{ZENZARO_2021_MISC_ZDB_420374,
  title    = {CophiEditor A collaborative web platform for the creation of scholarly digital editions},
  author   = {Zenzaro, S. and Del Grosso, A. M. and Boschetti, F.},
  year     = {2021},
  url      = {https://iris.cnr.it/handle/20.500.14243/420374},
  keywords = {Digital Humanities, Digital papyrology, GreekSchools},
  abstract = {Relazione di avanzamento della piattaforma per il progetto GreekSchools},
}
@ARTICLE{ACERNESE_2020_ARTICLE_AAAAAAAAAAAABBBBBBBBBBBBBBBBBBBBBBBBBBBBBBBBBBBBBBBBBBBCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCDDDDDDDDDDDDDDDDDDDDDDDDEEEFFFFFFFFFFFFFFFFGGGGGGGGGGGGGGGGGGGGHHHHHHHHHHHIIIIJJJKKKKKKKKLLLLLLLLLLLLLMMMMMMMMMMMMMMMMMMMMMMMMMMMMMMMNNNNNNNNNOOPPPPPPPPPPPPPPPPPPPPPPPPPPPPPPPRRRRRRRRRRRRRRRRSSSSSSSSSSSSSSSSSSSSSTTTTTTTTTVVVVVVVVVVVVVVWWWZZZ_516176,
  title    = {The advanced Virgo longitudinal control system for the O2 observing run},
  author   = {Acernese, F. and Agathos, M. and Aiello, L. and Allocca, A. and Aloy, M. A. and Amato, A. and Antier, S. and Arene, M. and Arnaud, N. and Ascenzi, S. and Astone, P. and Aubin, F. and Babak, S. and Bacon, P. and Badaracco, F. and Bader, M. K. M. and Baird, J. and Baldaccini, F. and Ballardin, G. and Barbieri, C. and Barone, F. and Barsuglia, M. and Barta, D. and Basti, A. and Bawaj, M. and Bazzan, M. and Bejger, M. and Belahcene, I. and Bernuzzi, S. and Bersanetti, D. and Bertolini, A. and Bischi, M. and Bitossi, M. and Bizouard, M. A. and Bloemen, S. and Bobba, F. and Boer, M. and Bogaert, G. and Bondu, F. and Bonnand, R. and Boom, B. A. and Boschi, V. and Bouffanais, Y. and Bozzi, A. and Bradaschia, C. and Branchesi, M. and Breschi, M. and Briant, T. and Brighenti, F. and Brillet, A. and Brooks, J. and Bulik, T. and Bulten, H. J. and Buskulic, D. and Buy, C. and Cagnoli, G. and Calloni, E. and Canepa, M. and Carapella, G. and Carbognani, F. and Carullo, G. and Casanueva Diaz, J. and Casentini, C. and Caudill, S. and Cavalier, F. and Cavalieri, R. and Cella, G. and Cerda Duran, P. and Cesarini, E. and Chaibi, O. and Chassande Mottin, E. and Chincarini, A. and Chiummo, A. and Christensen, N. and Chua, S. and Ciani, G. and Cieslar, M. and Ciolfi, R. and Cipriano, F. and Cirone, A. and Cleva, F. and Coccia, E. and Cohadon, P. F. and Cohen, D. and Colpi, M. and Conti, L. and Cordero Carrion, I. and Corezzi, S. and Corre, D. and Cortese, S. and Coulon, J. P. and Croquette, M. and Cuoco, E. and Dangelo, B. and D'Antonio, S. and Dattilo, V. and Davier, M. and Degallaix, J. and De Laurentis, M. and Deleglise, S. and Del Pozzo, W. and De Pietri, R. and De Rosa, R. and De Rossi, C. and Dietrich, T. and Di Fiore, L. and Di Giorgio, C. and Di Giovanni, F. and Di Giovanni, M. and Di Girolamo, T. and Di Lieto, A. and Di Pace, S. and Di Palma, I. and Di Renzo, F. and Drago, M. and Ducoin, J. G. and Durante, O. and Eisenmann, M. and Errico, L. and Estevez, D.
              and Fafone, V. and Farinon, S. and Feng, F. and Ferrante, I. and Fidecaro, F. and Fiori, I. and Fiorucci, D. and Fittipaldi, R. and Fiumara, V. and Flaminio, R. and Font, J. A. and Fournier, J. D. and Frasca, S. and Frasconi, F. and Frey, V. and Fronze, G. and Gammaitoni, L. and Garufi, F. and Gemme, G. and Genin, E. and Gennai, A. and Ghosh, A. and Giacomazzo, B. and Gonzalez Castro, J. M. and Gosselin, M. and Gouaty, R. and Grado, A. and Granata, M. and Greco, G. and Grimaldi, A. and Grimm, S. J. and Groot, P. and Gruning, P. and Guidi, G. M. and Guo, Y. and Gupta, P. and Halim, O. and Harder, T. and Harms, J. and Heidmann, A. and Heitmann, H. and Hello, P. and Hemming, G. and Hinderer, T. and Hofman, D. and Huet, D. and Hui, V. and Idzkowski, B. and Iess, A. and Intini, G. and Isac, J. M. and Jacqmin, T. and Jaranowski, P. and Jonker, R. J. G. and Katsanevas, S. and Kefelian, F. and Khan, I. and Khetan, N. and Koekoek, G. and Koley, S. and Krolak, A. and Kutynia, A. and Laghi, D. and Lartaux Vollard, A. and Lazzaro, C. and Leaci, P. and Leroy, N. and Letendre, N. and Linde, F. and Llorens Monteagudo, M. and Longo, A. and Lorenzini, M. and Loriette, V. and Losurdo, G. and Lumaca, D. and Macquet, A. and Majorana, E. and Maksimovic, I. and Man, N. and Mangano, V. and Mantovani, M. and Mapelli, M. and Marchesoni, F. and Marion, F. and Marquina, A. and Marsat, S. and Martelli, F. and Martinez, V. and Masserot, A. and Mastrogiovanni, S. and Meidam, J. and Mejuto Villa, E. and Mereni, L. and Merzougui, M. and Messina, F. and Metzdorff, R. and Miani, A. and Michel, C. and Milano, L. and Miller, A. and Minazzoli, O. and Minenkov, Y. and Montani, M. and Morawski, F. and Mours, B. and Muciaccia, F. and Nagar, A. and Nardecchia, I. and Naticchioni, L. and Neilson, J. and Nelemans, G. and Nguyen, C. and Nichols, D. and Nissanke, S. and Nocera, F. and Obergaulinger, M. and Oganesyan, G. and Pagano, G. and Pagliaroli, G. and Palomba, C. and Pang, P. T. H. and Pannarale, F.
              and Paoletti, F. and Paoli, A. and Pascucci, D. and Pasqualetti, A. and Passaquieti, R. and Passuello, D. and Patil, M. and Patricelli, B. and Pedurand, R. and Perego, A. and Perigois, C. and Perreca, A. and Piccinni, O. J. and Pichot, M. and Piergiovanni, F. and Pierro, V. and Pillant, G. and Pinard, L. and Pinto, I. M. and Plastino, W. and Poggiani, R. and Popolizio, P. and Porter, E. K. and Prodi, G. A. and Punturo, M. and Puppo, P. and Raaijmakers, G. and Radulescu, N. and Rapagnani, P. and Razzano, M. and Regimbau, T. and Rei, L. and Rettegno, P. and Ricci, F. and Riemenschneider, G. and Robinet, F. and Rocchi, A. and Rolland, L. and Romanelli, M. and Romano, R. and Rosinska, D. and Ruggi, P. and Salafia, O. S. and Salconi, L. and Samajdar, A. and Sanchis Gual, N. and Santos, E. and Sassolas, B. and Sauter, O. and Schmidt, P. and Sentenac, D. and Sequino, V. and Sharma, A. and Sieniawska, M. and Singh, N. and Singhal, A. and Sorrentino, F. and Spera, M. and Stachie, C. and Steer, D. A. and Stratta, G. and Sur, A. and Swinkels, B. L. and Tacca, M. and Tiwari, S. and Tonelli, M. and Torres Forne, A. and Travasso, F. and Tringali, M. C. and Trovato, A. and Trozzo, L. and Tsang, K. W. and Valentini, M. and Van Bakel, N. and Van Beuzekom, M. and Van Den Brand, J. F. J. and Van Den Broeck, C. and Van Der Schaaf, L. and Vardaro, M. and Vasuth, M. and Vedovato, G. and Verkindt, D. and Vetrano, F. and Vicere, A. and Vinet, J. Y. and Vocca, H. and Walet, R. and Was, M. and Williamson, A. R. and Zadrozny, A. and Zelenova, T. and Zendri, J. P.},
  journal  = {ASTROPARTICLE PHYSICS},
  volume   = {116},
  year     = {2020},
  doi      = {10.1016/j.astropartphys.2019.07.005},
  issn     = {0927-6505},
  url      = {https://iris.cnr.it/handle/20.500.14243/516176},
  keywords = {Control loops, Gravitational wave detectors, Interferometer, Suspended optical cavities},
  abstract = {Following a successful period of data-taking between 2006 and 2011, the Virgo gravitational-wave detector was taken offline for a major upgrade. The changes made to the instrument significantly increased the complexity of the control systems and meant that an extended period of commissioning was required to reach a sensitivity appropriate for science data-taking. This commissioning period was completed in July of 2017 and the second-generation Advanced Virgo detector went on to join the Advanced LIGO detectors in the O2 science run in August of the same year. The upgraded detector was approximately twice as sensitive to binary neutron star mergers as the first-generation instrument. During the August 2017 science run, Advanced Virgo detected its first gravitational wave signal, with the binary black hole merger, GW170729. This paper describes the control of the longitudinal degrees of freedom in the Advanced Virgo instrument during the O2 science run and the process that brought the detector from an uncontrolled, non-resonant state to its target working point},
}
@ARTICLE{ALZETTA_2020_ARTICLE_ADMV_446043,
AUTHOR = {Alzetta, C. and Dell'Orletta, F. and Montemagni, S. and Venturi, G.},
TITLE = {Linguistically-driven Selection of Difficult-to-Parse Dependency Structures},
YEAR = {2020},
ABSTRACT = {The paper illustrates a novel methodology meeting a twofold goal, namely quantifying the reliability of automatically generated dependency relations without using gold data on the one hand, and identifying which are the linguistic constructions negatively affecting the parser performance on the other hand. These represent objectives typically investigated in different lines of research, with different methods and techniques. Our methodology, at the crossroads of these perspectives, allows not only to quantify the parsing reliability of individual dependency types but also to identify and weight the contextual properties making relation instances more or less difficult to parse. The proposed methodology was tested in two different and complementary experiments, aimed at assessing the degree of parsing difficulty across (a) different dependency relation types, and (b) different instances of the same relation. The results show that the proposed methodology is able to identify difficult-to-parse dependency relations without relying on gold data and by taking into account a variety of intertwined linguistic factors. These findings pave the way to novel applications of the methodology, both in the direction of defining new evaluation metrics based purely on automatically parsed data and towards the automatic creation of challenge sets},
KEYWORDS = {Linguistic Complexity, Syntactic Parsing, Evaluation metrics},
PAGES = {37--60},
URL = {https://journals.openedition.org/ijcol/719},
VOLUME = {6},
NUMBER = {2},
DOI = {10.4000/ijcol.719},
ISSN = {2499-4553},
JOURNAL = {IJCOL},
}
@ARTICLE{AMIEL_2020_ARTICLE_AFLR_529601,
AUTHOR = {Amiel, P. and Frontini, F. and Lacour, P. Y. and Robin, A.},
TITLE = {Pratiques de gestion des données de la recherche : une nécessaire acculturation des chercheurs aux enjeux de la science ouverte ?},
YEAR = {2020},
ABSTRACT = {The article presents the results of an exploratory survey, conducted in June 2018 in the Montpellier’s basin by the CommonData Research Program, on the researchers’ management practices of research data. The principles objectives were to see if research data management is the result of an elaborated and strategic plan, to verify the ability or inability of researchers to qualify legally their explored, collected or produced datasets in order to determine their management in regard of the current Open Science politics and, at last, to observe the property feeling improved by researchers toward the datas they contribute to produce, which comes up with the broader question of the personal and/or institutional dimension of research’s work and its consequences in the awarding of property},
KEYWORDS = {research data, management, property, sharing, dissemination, valorization, public domain, open science, données de la recherche, gestion, propriété, partage, diffusion, valorisation, domaine public, science ouverte},
PAGES = {147--168},
URL = {https://iris.cnr.it/handle/20.500.14243/529601},
NUMBER = {10},
DOI = {10.4000/cdst.2061},
ISSN = {1967-0311},
JOURNAL = {CAHIERS DROIT, SCIENCES \& TECHNOLOGIES},
}
@ARTICLE{BOSCHETTI_2020_ARTICLE_BD_446357,
AUTHOR = {Boschetti, F. and Del Grosso, A. M.},
TITLE = {L'annotazione di testi storico-letterari al tempo dei social media},
YEAR = {2020},
ABSTRACT = {The annotation of historical and literary texts is approached differently by traditional philologists and digital philologists. The former are concentrated on the detailed study of a given text (close reading) while the latter are focused on the study of large quantities of texts (distant reading). A structured and collaborative annotation makes it possible both to add information to particular passages of individual texts, as in a traditional linear comment, and to connect data from entire textual collections through rigorous protocols. However, the standards developed by digital philologists are not highly appreciated by traditional academics, since the effort necessary to apply the proposed technologies allegedly diverts researchers' attention from the object of study. As opposed to this objection, we intend to highlight that it is indeed possible to maintain the precision requisite for the application of computational tools to digital resources without renouncing the annotation practices established in traditional contexts. In support of the method, we report a number of case studies of digital scientific editions whose goals include both reconstructing respective texts and encouraging the dissemination of contents and public participation in the academic debate. In particular, we will discuss the following projects: a) the stylistic annotation of three different editions of Giacomo Leopardi's translation of the Batracomiomachia; b) the scientific edition of Bellini's letters; c) the multi-level annotated edition of Bassani; and d) the comparison of Umberto Eco's variants of his Il nome della rosa},
KEYWORDS = {digital philology, collaborative annotation, communities, digital scholarly edition, formalisation},
PAGES = {65--99},
URL = {https://czasopisma.marszalek.com.pl/images/pliki/iw/11_1/iw11103.pdf},
VOLUME = {11},
NUMBER = {1},
DOI = {10.15804/IW.2020.11.1.03},
ISSN = {2084-4514},
JOURNAL = {ITALICA WRATISLAVIENSIA},
}
@ARTICLE{BUONGIOVANN_2020_ARTICLE_BGBD_401391,
AUTHOR = {Buongiovanni, C. and Gracci, F. and Brunato, D. and Dell'Orletta, F.},
TITLE = {Lost in Text: A Cross-Genre Analysis of Linguistic Phenomena within Text},
YEAR = {2020},
ABSTRACT = {Moving from the assumption that formal, rather than content features, can be used to detect differences and similarities among textual genres and registers, this paper presents a new approach to linguistic profiling—a well-established methodological framework to study language variation—which is applied to detect significant variations within the internal structure of a text. We test this approach on the Italian language using a wide spectrum of linguistic features automatically extracted from parsed corpora representative of four main genres and two levels of complexity for each, and we show that it is possible to model the degree of stylistic variance within texts according to genre and language complexity},
KEYWORDS = {natural language processing, computational stylometry},
URL = {https://www.ai-lc.it/wp-content/uploads/2021/03/IJCOL_6_1_3_buongiovanni_et_al.pdf},
VOLUME = {6},
NUMBER = {1},
ISSN = {2499-4553},
JOURNAL = {IJCOL},
}
@ARTICLE{CHINELLO_2020_ARTICLE_CPFGRZDB_401387,
AUTHOR = {Chinello, A. and Parma, F. and Frigerio, F. and Galli, C. M. and Richichi, V. and Zappa, L. E. and Dell'Orletta, F. and Boschetti, F.},
TITLE = {Food semantics on pro-anorexia websites in Italy},
YEAR = {2020},
ABSTRACT = {Introduction. The term pro-ana (pro-anorexia) means the spread of restrictive eating behaviors and anorectic advices in virtual spaces written by teenagers. The purpose of this pilot study consists in a qualitative and quantitative analysis of foods contained in a linguistic corpus made up of users' comments on pro-ana websites. Method. The corpus of pro-ana websites was analyzed through the T2K tool based on word-frequency processing. Results. The results show conversations regarding beverages, products of vegetable origin (fruit, vegetables) and low-calorie foods, with a tendency to limit the fear linked to the choice of high-calorie foods through reassuring and reconcilable language labels ("light", "sugar free"). Conclusions. These findings specify the food semantics on pro-ana websites associated to an anorectic vocabulary with restrictive diets. The results could be used to characterize the most common food as risk factors within the eating disorders framework},
KEYWORDS = {pro-ana, anorexia, language, food, natural language processing},
PAGES = {297--300},
URL = {https://iris.cnr.it/handle/20.500.14243/401387},
VOLUME = {55},
NUMBER = {5},
ISSN = {0035-6484},
JOURNAL = {RIVISTA DI PSICHIATRIA (TESTO STAMP.)},
}
@ARTICLE{DEROSIS_2020_ARTICLE_DGZVF_384935,
AUTHOR = {De Rosis, S. and Guidotti, E. and Zuccarino, S. and Venturi, G. and Ferre, F.},
TITLE = {Waiting time information in the Italian NHS: A citizen perspective},
YEAR = {2020},
ABSTRACT = {Public involvement in the management and communication of waiting times is known to support initiatives to reduce waiting times, as well as increase fairness and promote transparency and accountability. In order to improve transparency and communication to citizens, Italy recently updated the National Regulatory Plan for Waiting Lists (2019-2021), which calls for the disclosure of waiting time information on healthcare provider webpages. This study analyses waiting time information for outpatient visits and digital services available on the institutional website pages of 144 public healthcare organisations in nine regions and two autonomous provinces of Italy. Web pages were analysed both in terms of the available information/services, using a grid, and in terms of the quality of the text using an advanced readability assessment tool (READ-IT). This information was complemented and validated by regional healthcare key informants during research-specific workshops. Waiting time information disclosure, digital services and text readability varied both within and between the regional healthcare systems and organisations. The types and characteristics of waiting time information and statistics vary considerably with a negative impact on their use for benchmarking and their readability and usability for booking purposes. Overall, communication weaknesses due to low harmonization and clarity of information can undermine efforts in effectively informing and involving the public through online waiting time data disclosure. (C) 2020 The Author(s). Published by Elsevier B.V.},
KEYWORDS = {Waiting times, Healthcare, Online information, Readability, Italy},
PAGES = {796--804},
URL = {https://www.sciencedirect.com/science/article/pii/S0168851020301111?via%3Dihub},
VOLUME = {124},
NUMBER = {8},
DOI = {10.1016/j.healthpol.2020.05.012},
ISSN = {0168-8510},
JOURNAL = {HEALTH POLICY},
}
@ARTICLE{DUMOUCHEL_2020_ARTICLE_DBBCDEFGGGMPDPT_378105,
AUTHOR = {Dumouchel, S. and Blotière, E. and Breitfuss, G. and Chen, Y. and Di Donato, F. and Eskevich, M. and Forbes, P. and Georgiadis, H. and Gingold, A. and Gorgaini, E. and Moranville, Y. and Pohle, S. and De Paoli, S. and Petitfils, C. and Tothczifra, E.},
TITLE = {GOTRIPLE: A User-Centric Process to Develop a Discovery Platform},
YEAR = {2020},
ABSTRACT = {Social sciences and humanities (SSH) research is divided across a wide array of disciplines, sub-disciplines and languages. While this specialization makes it possible to investigate the extensive variety of SSH topics, it also leads to a fragmentation that prevents SSH research from reaching its full potential. The TRIPLE project brings answers to these issues by developing an innovative discovery platform for SSH data, researchers' projects and profiles. Having started in October 2019, the project has already three main achievements that are presented in this paper: (1) the definition of main features of the GOTRIPLE platform; (2) its interoperability; (3) its multilingual, multicultural and interdisciplinary vocation. These results have been achieved thanks to different methodologies such as a co-design process, market analysis and benchmarking, monitoring and co-building. These preliminary results highlight the need for respecting diversity of practices and communities through coordination and harmonization},
KEYWORDS = {user-centric approach, user research, social sciences and humanities, open science, European Open Science Cloud (EOSC), FAIR principle, discovery, research data},
PAGES = {24},
URL = {https://www.mdpi.com/2078-2489/11/12/563},
VOLUME = {11},
NUMBER = {12},
EID = {563},
DOI = {10.3390/info11120563},
ISSN = {2078-2489},
JOURNAL = {INFORMATION},
}
@ARTICLE{FERRO_2020_ARTICLE_FDVBCLMDHGBGDDPPVBSABLACFBRIMDTCSMDSSB_518413,
AUTHOR = {Ferro, M. and Di Lorenzo, G. and Vartolomei, M. D. and Bruzzese, D. and Cantiello, F. and Lucarelli, G. and Musi, G. and Di Stasi, S. and Hurle, R. and Guazzoni, G. and Busetto, G. M. and Gabriele, A. and Del Giudice, F. and Damiano, R. and Perri, F. and Perdona, S. and Verze, P. and Borghesi, M. and Schiavina, R. and Almeida, G. L. and Bove, P. and Lima, E. and Autorino, R. and Crisan, N. and Farhan, A. R. A. and Battaglia, M. and Russo, G. I. and Ieluzzi, V. and Morgia, G. and De Placido, P. and Terracciano, D. and Cimmino, A. and Scafuri, L. and Mirone, V. and De Cobelli, O. and Shariat, S. and Sonpavde, G. and Buonerba, C.},
TITLE = {Absolute basophil count is associated with time to recurrence in patients with high-grade T1 bladder cancer receiving bacillus Calmette–Guérin after transurethral resection of the bladder tumor},
YEAR = {2020},
ABSTRACT = {Background: Basophils, eosinophils and monocytes may be involved in BCG-induced immune responses and be associated with outcomes of bladder cancer patients receiving intravesical BCG. Our objective was to explore the association of baseline counts of basophils, eosinophils and monocytes with outcomes of patients with high-grade T1 bladder cancer receiving a standard course of intravesical BCG. Methods: We retrospectively reviewed medical records of patients with primary T1 HG/G3 bladder cancer. After re-TURBT, patients were treated with a 6-week course of intravesical BCG induction followed by intravesical BCG every week for 3\ weeks given at 3, 6, 12, 18, 24, 30 and 36\ months from initiation of therapy. The analysis of potential risk factors for recurrence, muscle invasion and cancer-specific and overall survival was performed using univariable Cox regression models. Those factors that presented, at univariate analysis, an association with the event at a liberal p $<$ 0.1, have been selected for the development of a multivariable model. Results: A total of 1045 patients with primary T1 HG/G3 were included. A total of 678 (64.9\%) recurrences, 303 (29.0\%) progressions and 150 (14.3\%) deaths were observed during follow-up. Multivariate analysis showed that logarithmic transformation of basophils count was associated with a 30\% increment in the hazard of recurrence per unit increase of logarithmic basophils count (HR 1.30; 95\% confidence interval 1.09–1.54; p = 0.0026). Basophil count modeled by quartiles was also significantly associated with time to recurrence [second vs. lower quartile HR 1.42 (1.12–1.79); p = 0.003, third vs. lower quartile HR 1.26 (1.01–1.57); p = 0.041; upper vs. lower quartile HR 1.36 (1.1–1.68); p = 0.005]. The limitations of a retrospective study are applicable. Conclusion: Baseline basophil count may predict recurrence in BCG-treated HG/G3 T1 bladder cancer patients. External validation is warranted},
KEYWORDS = {Basophils, BCG, Bladder cancer},
PAGES = {143--150},
URL = {https://link.springer.com/article/10.1007/s00345-019-02754-2},
VOLUME = {38},
NUMBER = {1},
DOI = {10.1007/s00345-019-02754-2},
ISSN = {0724-4983},
JOURNAL = {WORLD JOURNAL OF UROLOGY},
}
@ARTICLE{GIOVANNETTI_2020_ARTICLE_GBDDMPP_400775,
AUTHOR = {Giovannetti, E. and Bellandi, A. and Dattilo, D. and Del Grosso, A. M. and Marchi, S. and Pecchioli, A. and Piccini, S.},
TITLE = {The Terminology of the Babylonian Talmud: Extraction, Representation and Use in the Context of Computational Linguistics},
YEAR = {2020},
ABSTRACT = {A formal digital structuring of the terminology of the Talmud is being carried out in the context of the Project for the Translation of the Babylonian Talmud in Italian. The terminological resource was encoded in the form of a multi-language Explanatory Combinatorial Dictionary (Hebrew-Aramaic-Italian) according to the principles of the Meaning-Text Theory. The construction of such a resource was supported by text processing and computational linguistics techniques aimed at automatically extracting terms from the Italian translation of the Talmud and aligning them with the corresponding Hebrew/Aramaic source terms. The paper describes the process that was set up for the construction of the terminological resource with the ultimate goal of illustrating the advantages of the adoption of a formal linguistic model. The terminological resource aims, indeed, to be a useful tool to deepen the characteristics of the languages of the Talmud, to help translators in their work and more generally scholars in their study of the Talmud itself},
KEYWORDS = {Babylonian Talmud, Computational Linguistics, Explanatory and Combinatorial Lexicology},
PAGES = {61--74},
URL = {http://aisg.cise.unipi.it/Materia-giudaica-2020/006_Giovannettipp61-74.pdf},
VOLUME = {XXV},
DOI = {10.1400/283235},
ISSN = {2282-4499},
JOURNAL = {MATERIA GIUDAICA},
}
@ARTICLE{GUADAGNINI_2020_ARTICLE_G_409997,
AUTHOR = {Guadagnini, E.},
TITLE = {Alessandro, la 'cautela' e altri latinismi: un esercizio traduttologico su un estratto della tradizione latino-romanza del "Secretum secretorum" (SS/B)},
YEAR = {2020},
ABSTRACT = {This paper takes into consideration several translation and linguistic issues concerning the Secretum secretorum and its various Romance versions, including the Franco-Italian Amaestramens (ms. Paris BnF fr. 821). Romance inflections of Latin the words cautela, custodia, munimen, providentia, and salus are considered as well},
KEYWORDS = {Secretum secretorum, Traductology, Lexicology, Latinism},
PAGES = {243--278},
URL = {https://www.francigena-unipd.com/index.php/francigena/article/view/50},
VOLUME = {6},
DOI = {10.25430/2420-9767/V6-239-278},
ISSN = {2420-9767},
JOURNAL = {FRANCIGENA},
}
@ARTICLE{KHALFI_2020_ARTICLE_KZN_380998,
AUTHOR = {Khalfi, M. and Zarghili, A. and Nahli, O.},
TITLE = {A New Rich Lexical Resource For Classical Arabic},
YEAR = {2020},
ABSTRACT = {Currently, large lexical resources are getting a high potential relevance for information systems and need of Lexical resources in Natural Language Processing (NLP) fields is paramount. To contribute meet these needs, we build a lexical resource from the famous dictionary al=qāmūs al=muḥīṭ (AQAM). Using a rule based approach, we have designed a system that allows extracting morpho-syntactical, semantics and lexical information from the famous dictionary. So, we obtained a digitized and structured version of AQAM, enriched by morpho-syntactical and lexical explicit information. In addition, the obtained resource is enriched by English translations of lemma and accompanying senses using a bilingual English-Arabic dictionary. Then we present an overview of an experiment alignment of the section of the letter "bā" on Princeton's WordNet (PWN) and Suggested Upper Merged Ontology (SUMO). This experience turned out to be interesting because it revealed that mapping an Arabic lexical resource on an English resource shows commonality between the two languages, but it allows especially to emphasize the non-equivalences between them. All obtained resources are represented in XML format and distributed under free license},
KEYWORDS = {Al Qamus Al Muhit, Information Extraction, Arabic Lexicon, Machine-readable dictionary, Arabic Lexical Resource},
PAGES = {3863--3884},
URL = {https://ijact.in/index.php/j/article/view/594/571},
VOLUME = {IX},
NUMBER = {10},
ISSN = {2320-0790},
JOURNAL = {COMPUSOFT: AN INTERNATIONAL JOURNAL OF ADVANCED COMPUTER TECHNOLOGY},
}
% NOTE(review): PAGES = {14} looks like a page count rather than a range; the URL and DOI suggest article no. 320 - confirm.
@ARTICLE{MARZI_2020_ARTICLE_M_409499,
AUTHOR = {Marzi, C.},
TITLE = {Modeling Word Learning and Processing with Recurrent Neural Networks},
YEAR = {2020},
ABSTRACT = {The paper focuses on what two different types of Recurrent Neural Networks, namely a recurrent Long Short-Term Memory and a recurrent variant of self-organizing memories, a Temporal Self-Organizing Map, can tell us about speakers' learning and processing a set of fully inflected verb forms selected from the top-frequency paradigms of Italian and German. Both architectures, due to the re-entrant layer of temporal connectivity, can develop a strong sensitivity to sequential patterns that are highly attested in the training data. The main goal is to evaluate learning and processing dynamics of verb inflection data in the two neural networks by focusing on the effects of morphological structure on word production and word recognition, as well as on word generalization for untrained verb forms. For both models, results show that production and recognition, as well as generalization, are facilitated for verb forms in regular paradigms. However, the two models are differently influenced by structural effects, with the Temporal Self-Organizing Map more prone to adaptively find a balance between processing issues of learnability and generalization, on the one side, and discriminability on the other side},
KEYWORDS = {word-learning, serial word processing, recurrent neural networks, long short-term memories, temporal self-organizing memories},
PAGES = {14},
URL = {https://www.mdpi.com/2078-2489/11/6/320},
VOLUME = {11},
NUMBER = {6},
DOI = {10.3390/info11060320},
ISSN = {2078-2489},
JOURNAL = {INFORMATION},
}
@ARTICLE{MARZI_2020_ARTICLE_M_407424,
AUTHOR = {Marzi, C.},
TITLE = {Modelling the interaction of regularity and morphological structure: the case of Russian verb inflection},
YEAR = {2020},
ABSTRACT = {The main focus of this paper is to investigate how aspects of morphological regularity may have an impact on early stages of word processing, prior to full lexical access. Here I explore the interaction of regularity and morphological structure by using a computational simulation of the process of learning Russian verb forms, without any morpho-syntactic or morpho-semantic additional information. With a recurrent variant of self-organising memories, namely a Temporal Self-Organising Map, or TSOM, experimental results allow an investigation of the impact of incremental learning and online processing principles on paradigm organisation, by assessing the differential impact of several aspects of regularity, ranging from formal transparency and predictability to allomorphy, on the processing/learning behaviour in a connectionist framework. The proposed analysis suggests a performance-oriented account of inflectional regularity in morphology, whereby perception of morphological structure is not the by-product of the design of the human word processor, with rules separated from exceptions, but rather an emergent property of the dynamic self-organisation of stored lexical representations, dependent on the adaptive processing history of inflected word forms, intrinsically graded and probabilistic},
KEYWORDS = {morphological complexity, discriminative learning, recurrent neural networks, self-organisation, Russian verb inflection},
PAGES = {131--156},
URL = {https://www.mulino.it/riviste/issn/1720-9331},
VOLUME = {XIX},
NUMBER = {1},
DOI = {10.1418/97534},
ISSN = {1720-9331},
JOURNAL = {LINGUE E LINGUAGGIO},
}
@ARTICLE{MASINI_2020_ARTICLE_MP_424255,
AUTHOR = {Masini, F. and Pirrelli, V.},
TITLE = {L'evidenza morfologica nell'era digitale: per un'integrazione di teoria e computazione},
YEAR = {2020},
ABSTRACT = {This article proposes a research perspective on morphological and lexical data based on an integrated approach that merges linguistic theory and computational analyses of a large quantity of textual data. Starting from a description of the units and processes of morphology, and of the issues they raise, we discuss to what extent these theoretical notions can be translated into the algorithmic procedures of Natural Language Processing (NLP) and what resources and methods are nowadays available to make morphological and lexical knowledge explicit within texts. At the same time, we explore the repercussions that the application of computational (but also psycho-/neuro-linguistic) techniques may have on our theoretical representations and on their plausibility},
KEYWORDS = {morphology, lexicon, categories, Natural Language Processing, Italian},
PAGES = {77--126},
URL = {https://iris.cnr.it/handle/20.500.14243/424255},
VOLUME = {VI},
ISSN = {0393-1226},
JOURNAL = {QUADERNI DI SEMANTICA},
}
@ARTICLE{NICOLOSI_2020_ARTICLE_NMN_405360,
AUTHOR = {Nicolosi, A. and Monachini, M. and Nava, B.},
TITLE = {CLARIN-IT and the Definition of a Digital Critical Edition for Ancient Greek Poetry},
YEAR = {2020},
ABSTRACT = {Ancient Greek studies, and Classics in general, is a perfect field of investigation in Digital Humanities. Indeed, DH approaches could become a means of building models for complex realities, analyzing them with computational methods and sharing the results with a broader public. Ancient texts have a complex tradition, which includes many witnesses (texts that handed down other texts) and different typologies of supports (papyri, manuscripts, and epigraphs). These texts are the basis of all European Literatures and it is crucial to spread their knowledge, in a reliable and easy way. Our project on ancient Greek fragmentary poetry (DEA-Digital Edition of Archilochus: New models and tools for authoring, editing and indexing an ancient Greek fragmentary author), growing out of the existing experience, tries to define a TEI-based digital critical edition combined with NLP techniques and semantic web technologies. Our goal is to provide a complete and reliable tool for scholars, suitable for critical studies in Classics, and a user-friendly environment also for non-specialist users. The project represents one of the attempts within the context of CLARIN-IT to contribute to the wider impact of CLARIN on the specific Italian community interested in Digital Classics. It is intended to improve services in fostering new knowledge in SSH digital research and sustaining the existing one},
KEYWORDS = {Digital edition, Ancient Greek, research infrastructures, digital humanities, digital classics},
PAGES = {85--93},
URL = {https://ep.liu.se/ecp/172/011/ecp20172011.pdf},
VOLUME = {172},
DOI = {10.3384/ecp2020172011},
ISSN = {1650-3740},
JOURNAL = {LINKÖPING ELECTRONIC CONFERENCE PROCEEDINGS (ONLINE)},
}
@ARTICLE{PROIETTI_2020_ARTICLE_PS_405489,
AUTHOR = {Proietti, C. and Smid, J.},
TITLE = {Mereology and time travel},
YEAR = {2020},
ABSTRACT = {Core principles of mereology have been questioned by appealing to time travel scenarios. This paper questions the methodology of employing time travel scenarios to argue against mereology. We show some time travel scenarios are structurally equivalent to more standard ones not involving time travel; and that the three main theories about persistence through time (i.e., endurantism, perdurantism, and stage theory) can each solve both the time travel scenario as well as the structurally similar classical scenario. Time travel scenarios that are not similar to more standard arguments are instead problematic because they are open to different, incompatible interpretations. We conclude that compared to the classical arguments against mereological principles, time travel scenarios do not add anything new},
KEYWORDS = {Mereology, Time travel, Methodology, Parthood, Multilocation},
PAGES = {2245--2260},
URL = {https://link.springer.com/article/10.1007/s11098-019-01308-x},
VOLUME = {177},
NUMBER = {8},
DOI = {10.1007/s11098-019-01308-x},
ISSN = {0031-8116},
JOURNAL = {PHILOSOPHICAL STUDIES},
}
@ARTICLE{TAYLOR_2020_ARTICLE_TD_417367,
AUTHOR = {Taylor, C. and Del Fante, D.},
TITLE = {Comparing across languages in corpus and discourse analysis: some issues and approaches},
YEAR = {2020},
ABSTRACT = {Corpus-assisted discourse studies is, by its nature, interdisciplinary. However, this need to reach across borders becomes even more salient when we study discourses across languages, and this represents a natural intersection with translation studies. The aim of this paper is to reflect on the issue of comparison in cross-linguistic corpus-assisted discourse studies, positing a series of key questions including: How do we compare across or within corpora containing different languages? How do we identify meaningful language units for comparison in this context? How do we know that we are comparing like with like? Using a series of case studies, we start by addressing how we can approach comparison at the lexical level. We then move on to consider methods which allow us to abstract above the lexical level using three case studies which illustrate the use of semantic fields, discourse frames and rhetorical features. By presenting some issues and partial solutions regarding comparison across and within multilingual corpora, we hope to initiate a productive discussion in which we will also be able to collectively enrich and inform this set of resources},
KEYWORDS = {corpus linguistics, discourse analysis, critical discourse analysis, comparative discourse analysis, cross-linguistic comparison},
URL = {http://www.scopus.com/inward/record.url?eid=2-s2.0-85097898230&partnerID=MN8TOARS},
DOI = {10.7202/1073635AR},
JOURNAL = {META},
}
% NOTE(review): the last AUTHOR name ("Morini E, S. M.") looks garbled, possibly two authors fused into one; confirm against the publisher record before correcting.
@ARTICLE{VENTURI_2020_ARTICLE_VDMM_426118,
AUTHOR = {Venturi, G. and Dell'Orletta, F. and Montemagni, S. and Morini E, S. M.},
TITLE = {Metodi e Tecniche di Trattamento Automatico della Lingua per l'Estrazione di Conoscenza dalla Documentazione Scolastica},
YEAR = {2020},
ABSTRACT = {Il contributo riguarda la creazione di un sistema integrato di "knowledge management", per la gestione e condivisione della conoscenza prodotta e utilizzata dalla scuola},
KEYWORDS = {Estrazione di informazione, Documenti scolastici, Indicizzazione, Terminology extraction},
PAGES = {49--68},
URL = {https://iris.cnr.it/handle/20.500.14243/426118},
VOLUME = {2},
DOI = {10.3280/CAD2020-002005},
ISSN = {1122-5165},
JOURNAL = {CADMO},
}
@ARTICLE{VERTECCHI_2020_ARTICLE_VADMV_426114,
AUTHOR = {Vertecchi, B. and Agrusti, F. and Dell'Orletta, F. and Montemagni, S. and Venturi, G.},
TITLE = {Verba et Acta. Un esperimento per promuovere l'evoluzione delle competenze linguistiche degli studenti degli istituti professionali},
YEAR = {2020},
ABSTRACT = {Ricerche in corso. Verba et Acta. Un esperimento per promuovere l'evoluzione delle competenze linguistiche degli studenti degli istituti professionali},
KEYWORDS = {Evoluzione competenze linguistiche, Annotazione linguistica, Previsione dello sviluppo delle competenze di scrittura},
PAGES = {109--117},
URL = {https://iris.cnr.it/handle/20.500.14243/426114},
NUMBER = {1},
DOI = {10.3280/CAD2020-001008},
ISSN = {1122-5165},
JOURNAL = {CADMO},
}
@INCOLLECTION{BURGASSI_2020_INCOLLECTION_B_532791,
AUTHOR = {Burgassi, C.},
TITLE = {Une image ovidienne et son succès linguistique. Quelques réflexions autour du « chaos »},
YEAR = {2020},
ABSTRACT = {L’article vise à contribuer à l’étude de l’influence des adaptations des fables d’Ovide sur les langues vernaculaires au niveau de la sémantique lexicale. L’analyse linguistique, développée à partir des traductions italiennes des Métamorphoses du Moyen Âge à la Renaissance tardive, porte en particulier sur la relation entre l’image ovidienne du phénomène du Chaos (figuré au tout début du chef-d’oeuvre d’Ovide) et le sens du mot correspondant en italien (caos en tant que “confusion”)},
KEYWORDS = {Ovide, littérature italienne du Moyen Âge, langue italienne médiévale, lexicologie, histoire des mots, histoire des idées, réception de l’Antiquité, le chaos},
PAGES = {237--253},
URL = {https://iris.cnr.it/handle/20.500.14243/532791},
DOI = {10.15122/isbn.978-2-406-10508-4.p.0237},
PUBLISHER = {Editions Classiques Garnier (Paris, FRA)},
ISBN = {978-2-406-10506-0},
BOOKTITLE = {Traire de latin et espondre. Études sur la réception médiévale d’Ovide},
EDITOR = {Baker, C. and Cavagna, M. and Guadagnini, E.},
}
@INCOLLECTION{BURGASSI_2020_INCOLLECTION_B_532544,
AUTHOR = {Burgassi, C.},
TITLE = {«Parole di conforto». Tappe storiche di una concorrenza lessicale},
YEAR = {2020},
ABSTRACT = {Il contributo traccia la storia della concorrenza lessicale sinonimica tra "confortare" ed "esortare" in italiano. Dall'analisi della fase linguistica medievale, risulta che l'area semantica coperta da "confortare" comprendeva anche il significato modernamente veicolato da "esortare". La progressiva affermazione di quest'ultimo vocabolo nell'italiano, come recupero dotto dal latino, ha verosimilmente innescato un riassestamento di valori lessico-semantici del suo concorrente onomasiologico "confortare", fino alla definizione dell'assetto odierno},
KEYWORDS = {Concorrenza lessicale, onomasiologia, semantica storica},
PAGES = {61--78},
URL = {https://iris.cnr.it/handle/20.500.14243/532544},
PUBLISHER = {ETS (Pisa)},
ISBN = {9788846757968},
CONFERENCE_PLACE = {Pisa},
BOOKTITLE = {Studi di filologia offerti dagli allievi a Claudio Ciociola},
}
@INCOLLECTION{GUADAGNINI_2020_INCOLLECTION_G_421521,
AUTHOR = {Guadagnini, E.},
TITLE = {Les Métamorphoses d'Ovide et le Moyen Âge italien: une esquisse du cadre général},
YEAR = {2020},
ABSTRACT = {Cette contribution propose un cadre d'ensemble de la réception des Métamorphoses ovidiennes dans la production vernaculaire italienne du Moyen Âge (XII-XIV siècles). Trois typologies de réception sont isolées: le poème en tant que source de contenus, le poème en tant que source textuelle et les traductions du poème. Une attention particulière est accordée à la tradition manuscrite des oeuvres citées, ainsi qu'à la recherche des sources vraisemblablement employées par les auteurs},
KEYWORDS = {Volgarizzamenti, eredità dei classici, Ovidio, Filologia romanza},
PAGES = {209--236},
URL = {https://classiques-garnier.com/traire-de-latin-et-espondre-etudes-sur-la-reception-medievale-d-ovide.html},
PUBLISHER = {Editions Classiques Garnier (Paris, FRA)},
ISBN = {9782406105077},
CONFERENCE_PLACE = {Paris},
BOOKTITLE = {« Traire de latin et espondre ». Études sur la réception médiévale d'Ovide},
EDITOR = {Baker, C. and Cavagna, M. and Guadagnini, E.},
}
@INCOLLECTION{MARZI_2020_INCOLLECTION_MBBP_408279,
AUTHOR = {Marzi, C. and Blevins, J. P. and Booij, G. and Pirrelli, V.},
TITLE = {Inflection at the morphology-syntax interface},
YEAR = {2020},
ABSTRACT = {What is inflection? Is it part of language morphology, syntax or both? What are the basic units of inflection and how do speakers acquire and process them? How do they vary across languages? Are some inflection systems somewhat more complex than others, and does inflectional complexity affect the way speakers process words? This chapter addresses these and other related issues from an interdisciplinary perspective. Our main goal is to map out the place of inflection in our current understanding of the grammar architecture. In doing that, we will embark on an interdisciplinary tour, which will touch upon theoretical, psychological, typological, historical and computational issues in morphology, with a view to looking for points of methodological and substantial convergence from a rather heterogeneous array of scientific approaches and theoretical perspectives. The main upshot is that we can learn more from this than just an additive medley of domain-specific results. In the end, a cross-domain survey can help us look at traditional issues in a surprisingly novel light},
KEYWORDS = {inflection, paradigmatic relations, word processing, word learning, inflectional complexity, family size, entropy},
PAGES = {228--294},
URL = {https://www.degruyter.com/view/book/9783110440577/10.1515/9783110440577-007.xml},
DOI = {10.1515/9783110440577-007},
PUBLISHER = {De Gruyter Saur (Berlin/Munich, DEU)},
ISBN = {9783110440577},
CONFERENCE_PLACE = {Berlin/Munich},
BOOKTITLE = {Word Knowledge and Word Usage. A Cross-Disciplinary Guide to the Mental Lexicon},
EDITOR = {Pirrelli, V. and Plag, I. and Dressler, W. U.},
}
@INCOLLECTION{PANCKHURST_2020_INCOLLECTION_PF_529606,
AUTHOR = {Panckhurst, R. and Frontini, F.},
TITLE = {Evolving interactional practices of emoji in text messages},
YEAR = {2020},
ABSTRACT = {In this article, we examine the usage of emoji in the 88milSMS corpus. After differentiating between emoji and emoticons, we situate the context, indicate general statistics and mention press interest. Next, we address linguistic issues: are emoji used more often in addition (either redundantly or necessarily, sometimes as “softeners” (adoucisseurs, Détrie \& Verine 2015) or for lexical replacement, denoting a reference/referential function (Referenzfunktion, Dürscheid \& Siever 2017)? Concerning emoji insertion positioning, which is the most popular and what does this mean? Other researchers refer to “the emoji code” (Danesi 2016; Evans 2017), and emoji classifications have been proposed, including references to syntactic, semantic (Barbieri, Ronzano \& Saggion 2016), semiotic, phatic and emotive/sentiment (Novak et al. 2015) levels. Are these satisfactory or do we need to redefine levels, contexts and potential ambiguity? Part-of-speech tagging (POS) and NLP software are then used to annotate SMS containing emoji within 88milSMS in order to investigate the immediate grammatical environment. This allows us to conduct contextual analysis relating to syntactic linguistic functions of emoji. Finally, results from two questionnaires are explored: 1. sociolinguistic factors (age, gender) of the SMS donors having used emoji in 88milSMS; 2. Comparison of SMS emoji usage with other instant messaging applications and social networks via a user-orientated questionnaire (Rascol 2017)},
KEYWORDS = {emoji, computer mediated communication, corpus},
PAGES = {81--104},
URL = {https://doi.org/10.1515/9781501510113-005},
DOI = {10.1515/9781501510113-005},
PUBLISHER = {De Gruyter Mouton},
ISBN = {978-1-5015-1011-3},
BOOKTITLE = {Visualizing Digital Discourse: Interactional, Institutional and Ideological Perspectives},
}
@INCOLLECTION{PIRRELLI_2020_INCOLLECTION_PMFCBM_408278,
AUTHOR = {Pirrelli, V. and Marzi, C. and Ferro, M. and Cardillo, F. A. and Baayen, R. H. and Milin, P.},
TITLE = {Psycho-computational modelling of the mental lexicon},
YEAR = {2020},
ABSTRACT = {Over the last decades, a growing body of evidence on the mechanisms governing lexical storage, access, acquisition and processing has questioned traditional models of language architecture and word usage based on the hypothesis of a direct correspondence between modular components of grammar competence (lexicon vs. rules), processing correlates (memory vs. computation) and neuro-anatomical localizations (prefrontal vs. temporo-parietal perisylvian areas of the left hemisphere). In the present chapter, we explore the empirical and theoretical consequences of a distributed, integrative model of the mental lexicon, whereby words are seen as emergent properties of the functional interaction between basic, language-independent processing principles and the language-specific nature and organization of the input. From this perspective, language learning appears to be inextricably related to the way language is processed and internalized by the speakers, and key to an interdisciplinary understanding of such a way, in line with Tomaso Poggio's suggestion that the development of a cognitive skill is causally and ontogenetically prior to its execution (and sits "on top of it"). In particular, we discuss conditions, potential and prospects of the epistemological continuity between psycholinguistic and computational modelling of word learning, and illustrate the yet largely untapped potential of their integration. We use David Marr's hierarchy to clarify the complementarity of the two viewpoints. Psycholinguistic models are informative about how speakers learn to use language (interfacing Marr's levels 1 and 2). When we move from the psycholinguistic analysis of the functional operations involved in language learning to an algorithmic description of how they are computed, computer simulations can help us explore the relation between speakers' behavior and general learning principles in more detail. In the end, psycho-computational models can be instrumental to bridge Marr's levels 2 and 3, bringing us closer to understanding the nature of word knowledge in the brain},
KEYWORDS = {mental lexicon, word storage and processing, psycholinguistics, computational linguistics, connectionist models, discriminative learning},
PAGES = {23--82},
URL = {https://www.degruyter.com/view/book/9783110440577/10.1515/9783110440577-002.xml},
DOI = {10.1515/9783110440577-002},
PUBLISHER = {De Gruyter Saur (Berlin/Munich, DEU)},
ISBN = {9783110440577},
CONFERENCE_PLACE = {Berlin/Munich},
BOOKTITLE = {Word Knowledge and Word Usage. A Cross-Disciplinary Guide to the Mental Lexicon},
EDITOR = {Pirrelli, V. and Plag, I. and Dressler, W. U.},
}
@INCOLLECTION{PIRRELLI_2020_INCOLLECTION_PPD_405086,
AUTHOR = {Pirrelli, V. and Plag, I. and Dressler, W. U.},
TITLE = {Word knowledge in a cross-disciplinary world},
YEAR = {2020},
ABSTRACT = {This editorial project stemmed from a 4-year period of intense interdisciplinary research networking funded by the European Science Foundation within the framework of the NetWordS project (09-RNP-089). The project mission was to bring together experts of various research fields (from brain sciences and computing to cognition and linguistics) and of different theoretical inclinations, to advance the current awareness of theoretical, typological, psycholinguistic, computational and neurophysiological evidence on the structure and processing of words, with a view to promoting novel methods of research and assessment for grammar architecture and language usage. The unprecedented cross-disciplinary fertilization prompted by a wide range of scientific and educational initiatives (three international workshops, two summer schools, one main conference and over a hundred grants supporting short visits and multilateral exchanges) persuaded us to pursue this effort beyond the project lifespan, spawning the idea of an interdisciplinary handbook, where a wide range of central topics on word knowledge and usage are dealt with by teams of authors with common interests and different backgrounds. Unsurprisingly (with the benefit of the hindsight), the project turned out to be more challenging and time-consuming than initially planned. Cross-boundary talking and mutual understanding are neither short-term, nor immediately rewarding efforts, but part of a long-sighted, strategic vision, where stamina, motivation and planning ahead play a prominent role. We believe that this book, published as an open access volume, significantly sharpens the current understanding of issues of word knowledge and usage, and has a real potential for promoting novel research paradigms, and bringing up a new generation of language scholars},
KEYWORDS = {interdisciplinarity, word knowledge, word usage, language units, statistical and computer modeling, levels of understanding, between-level mapping, linking hypotheses, scale effects},
PAGES = {1--20},
URL = {https://doi.org/10.1515/9783110440577},
DOI = {10.1515/9783110440577},
PUBLISHER = {De Gruyter Saur (Berlin/Munich, DEU)},
ISBN = {9783110440577},
CONFERENCE_PLACE = {Berlin/Munich},
BOOKTITLE = {Word Knowledge and Word Usage. A Cross-Disciplinary Guide to the Mental Lexicon},
}
@EDITORIAL{BAKER_2020_EDITORIAL_BCG_421524,
AUTHOR = {Baker, C. and Cavagna, M. and Guadagnini, E.},
TITLE = {«Traire de latin et espondre». Études sur la réception médiévale d'Ovide},
YEAR = {2020},
ABSTRACT = {Les contributions à ce volume explorent la réception médiévale d'Ovide dans les domaines latin, catalan, français et italien. Elles invitent à nuancer l'opposition entre latin et vernaculaire au profit d'une vision plus complexe des rapports entre texte, traduction et glose},
KEYWORDS = {Ovide, mythologie classique, littérature du Moyen Âge, réception de l'Antiquité, traduction et commentaire, allégorie, L'Ovide moralisé},
URL = {https://classiques-garnier.com/traire-de-latin-et-espondre-etudes-sur-la-reception-medievale-d-ovide.html},
PUBLISHER = {Editions Classiques Garnier (Paris, FRA)},
ISBN = {978-2-406-10506-0},
CONFERENCE_PLACE = {Paris},
}
@EDITORIAL{BEERMANN_2020_EDITORIAL_BBSS_444081,
AUTHOR = {Beermann, D. and Besacier, L. and Sakti, S. and Soria, C.},
TITLE = {Proceedings of the 1st Joint SLTU and CCURL Workshop (SLTU-CCURL 2020)},
YEAR = {2020},
ABSTRACT = {Proceedings of the 1st Joint SLTU and CCURL Workshop (SLTU-CCURL 2020)},
KEYWORDS = {less-resourced languages, NLP, language resources},
URL = {https://aclanthology.org/events/lrec-2020/#2020-sltu-1},
ISBN = {979-10-95546-35-1},
}
@EDITORIAL{BROEDER_2020_EDITORIAL_BEM_420393,
AUTHOR = {Broeder, D. and Eskevich, M. and Monachini, M.},
TITLE = {Proceedings of the Workshop about Language Resources for the SSH Cloud},
YEAR = {2020},
ABSTRACT = {This workshop was envisaged to focus on the goals and aims of realising the SSHOC part of the EOSC, where SSH data, language processing tools, and services are made available, adjusted and accessible for users across SSH domain. It provides a forum to discuss common requirements, challenges and opportunities for developing, enhancing, integrating tools and services for managing and processing SSH research data. Such SSH scenarios based implementations of currently existing language tools and services demonstrate their multidisciplinary usability and stimulate further multidisciplinary collaboration across the various subfields of SSH and beyond, which will increase the potential for societal impact},
KEYWORDS = {Social Science and Humanities Open Cloud, EOSC, Language Resource Infrastructure},
PAGES = {1--46},
URL = {https://aclanthology.org/2020.lr4sshoc-1},
PUBLISHER = {European Language Resources Association ELRA (Paris, FRA)},
ISBN = {979-10-95546-43-6},
CONFERENCE_PLACE = {Paris},
}
@EDITORIAL{PIRRELLI_2020_EDITORIAL_PPD_408986,
AUTHOR = {Pirrelli, V. and Plag, I. and Dressler, W. U.},
TITLE = {Word knowledge and word usage: a cross-disciplinary guide to the mental lexicon},
YEAR = {2020},
ABSTRACT = {This editorial project stemmed from a 4-year period of intense interdisciplinary research networking funded by the European Science Foundation within the framework of the NetWordS project (09-RNP-089)},
KEYWORDS = {interdisciplinarity, word knowledge, word usage, language units, statistical and computer modeling, levels of understanding, between-level mapping, linking hypotheses, scale effects},
PAGES = {1--717},
URL = {https://doi.org/10.1515/9783110440577},
VOLUME = {337},
DOI = {10.1515/9783110440577},
PUBLISHER = {De Gruyter Saur (Berlin/Munich, DEU)},
ISBN = {978-3-11-051748-4},
CONFERENCE_PLACE = {Berlin/Munich},
}
@INPROCEEDINGS{AHMADI_2020_INPROCEEDINGS_AMNKMPDWBPTOKLVSGTSMRALKLKOFCLASSUZSOKRSPG_404924,
AUTHOR = {Ahmadi, S. and McCrae, J. P. and Nimb, S. and Khan, F. and Monachini, M. and Pedersen, B. S. and Declerck, T. and Wissik, T. and Bellandi, A. and Pisani, I. and Troelsgård, T. and Olsen, S. and Krek, S. and Lipp, V. and Váradi, T. and Simon, L. and Gyorffy, A. and Tiberius, C. and Schoonheim, T. and Ben Moshe, Y. and Rudich, M. and Abu Ahmad, R. and Lonke, D. and Kovalenko, K. and Langemets, M. and Kallas, J. and Dereza, O. and Fransen, T. and Cillessen, D. and Lindemann, D. and Alonso, M. and Salgado, A. and Sancho, J. L. and Ureña-Ruiz, R. and Porta Zamorano, J. and Simov, K. and Osenova, P. and Kancheva, Z. and Radev, I. and Stankovic, R. and Perdih, A. and Gabrovsek, D.},
TITLE = {A multilingual evaluation dataset for monolingual word sense alignment},
YEAR = {2020},
ABSTRACT = {Aligning senses across resources and languages is a challenging task with beneficial applications in the field of natural language processing and electronic lexicography. In this paper, we describe our efforts in manually aligning monolingual dictionaries. The alignment is carried out at sense-level for various resources in 15 languages. Moreover, senses are annotated with possible semantic relationships such as broadness, narrowness, relatedness, and equivalence. In comparison to previous datasets for this task, this dataset covers a wide range of languages and resources and focuses on the more challenging task of linking general-purpose language. We believe that our data will pave the way for further advances in alignment and evaluation of word senses by creating new solutions, particularly those notoriously requiring data such as neural networks. Our resources are publicly available at https://github.com/elexis-eu/MWSA},
KEYWORDS = {lexical semantic resources, sense alignment, lexicography, language resource},
URL = {https://iris.cnr.it/handle/20.500.14243/404924},
ISBN = {979-10-95546-34-4},
CONFERENCE_NAME = {Proceedings of the 12th Conference on Language Resources and Evaluation (LREC 2020)},
BOOKTITLE = {Proceedings of the 12th Language Resources and Evaluation Conference-LREC 2020},
}
@INPROCEEDINGS{ALZETTA_2020_INPROCEEDINGS_ADMOSV_423610,
AUTHOR = {Alzetta, C. and Dell'Orletta, F. and Montemagni, S. and Osenova, P. and Simov, K. and Venturi, G.},
TITLE = {Quantitative linguistic investigations across universal dependencies treebanks},
YEAR = {2020},
ABSTRACT = {The paper illustrates a case study aimed at identifying cross-lingual quantitative trends in the distribution of dependency relations in treebanks for typologically different languages. Preliminary results show interesting differences rooted either in language-specific peculiarities or cross-lingual annotation inconsistencies, with a potential impact on different application scenarios},
KEYWORDS = {Universal Dependencies Treebanks, Cross-linguistic analysis, Typology},
PAGES = {1--7},
URL = {http://ceur-ws.org/Vol-2769/paper_59.pdf},
VOLUME = {2769},
ISBN = {979-12-80136-28-2},
CONFERENCE_NAME = {7th Italian Conference on Computational Linguistics (CLiC-it)},
}
@INPROCEEDINGS{ALZETTA_2020_INPROCEEDINGS_AGKPT_493643,
  AUTHOR          = {Alzetta, C. and Galluccio, I. and Koceva, F. and Passalacqua, S. and Torre, I.},
  TITLE           = {Digging into prerequisite annotation},
  YEAR            = {2020},
  ABSTRACT        = {Intelligent textbooks are often engineered with an explicit representation of their concepts and prerequisite relations (PR). PR identification is hence crucial for intelligent textbooks but still presents some challenges, also when performed by human experts. This may cause PR-annotated datasets to be inconsistent and compromise the accuracy of automatic creation of enhanced learning materials. This paper investigates possible reasons for PR disagreement and the nature of PR itself, with the aim of contributing to the development of shared strategies for PR annotation, analysis and modelling in textbooks},
  KEYWORDS        = {Agreement, Annotation, Prerequisite relation},
  PAGES           = {29-34},
  URL             = {https://iris.cnr.it/handle/20.500.14243/493643},
  VOLUME          = {2674},
  PUBLISHER       = {CEUR-WS},
  CONFERENCE_NAME = {2nd International Workshop on Intelligent Textbooks, iTextbooks 2020},
  BOOKTITLE       = {CEUR Workshop Proceedings of the 2nd International Workshop on Intelligent Textbooks, iTextbooks 2020},
}
@INPROCEEDINGS{ALZETTA_2020_INPROCEEDINGS_AMDKFTI_421771,
AUTHOR = {Alzetta, C. and Miaschi, A. and Dell'Orletta, F. and Koceva, F. and Torre, I.},
TITLE = {PRELEARN @ EVALITA 2020: Overview of the Prerequisite Relation Learning Task for Italian},
YEAR = {2020},
ABSTRACT = {The Prerequisite Relation Learning (PRELEARN) task is the EVALITA 2020 shared task on concept prerequisite learning, which consists of classifying prerequisite relations between pairs of concepts distinguishing between prerequisite pairs and non-prerequisite pairs. Four sub-tasks were defined: two of them define different types of features that participants are allowed to use when training their model, while the other two define the classification scenarios where the proposed models would be tested. In total, 14 runs were submitted by 3 teams comprising 9 total individual participants},
KEYWORDS = {nlp, prerequisite learning, shared task},
URL = {http://ceur-ws.org/Vol-2765/paper164.pdf},
CONFERENCE_NAME = {Seventh Evaluation Campaign of Natural Language Processing and Speech Tools for Italian (EVALITA)},
BOOKTITLE = {Proceedings of the Seventh Evaluation Campaign of Natural Language Processing and Speech Tools for Italian (EVALITA)},
}
@INPROCEEDINGS{BACCO_2020_INPROCEEDINGS_BBDF_370407,
AUTHOR = {Bacco, F. and Brunori, G. and Dell'Orletta, F. and Ferrari, A.},
TITLE = {Using NLP to support terminology extraction and domain scoping: report on the H2020 DESIRA project},
YEAR = {2020},
ABSTRACT = {The ongoing phenomenon of digitisation is changing social and work life, with tangible effects on the socio-economic context. Understanding the impact, opportunities, and threats of digital transformation requires the identification of viewpoints from a large diversity of stakeholders, from policy makers to domain experts, and from engineers to common citizens. The DESIRA (Digitisation: Economic and Social Impacts in Rural Areas) EU H2020 project considers rural areas, with a strong focus on agricultural and forestry activities, and aims at assessing the impact of digital technologies in those domains by involving a large number of stakeholders, all across Europe, around 20 focal questions. Given the involvement of stakeholders with diverse background and skills, a primary goal of the project is to develop domain-specific and interactive reference taxonomies (i.e., structured classifications of terms) to facilitate common understanding of technologies in use in each domain at today. The taxonomies, which aims at easing the learning of the meaning of technical and domain-specific terms, are going to be exploited by the stakeholders in 20 Living Labs built around the focal questions. This report paper focuses on the semi-automatic development of the taxonomies through natural language processing (NLP) techniques based on context-specific term extraction. Furthermore, we crawl Wikipedia to enrich the taxonomies with additional categories and definitions. We plan to validate the taxonomies through field studies within the Living Labs},
KEYWORDS = {NLP, Wikipedia, Socio-economic impact, Taxonomy, Knowledge graph, Terminology extraction, Domain scoping},
PAGES = {1-5},
URL = {http://ceur-ws.org/Vol-2584/},
PUBLISHER = {CEUR-WS.org (Aachen, DEU)},
CONFERENCE_NAME = {Third Workshop on Natural Language Processing for Requirements Engineering},
CONFERENCE_PLACE = {Aachen},
}
@INPROCEEDINGS{BACCO_2020_INPROCEEDINGS_BCPMD_401373,
AUTHOR = {Bacco, L. and Cimino, A. and Paulon, L. and Merone, M. and Dell'Orletta, F.},
TITLE = {A Machine Learning approach for Sentiment Analysis for Italian Reviews in Healthcare},
YEAR = {2020},
ABSTRACT = {In this paper, we present our approach to the task of binary sentiment classification for Italian reviews in healthcare domain. We first collected a new dataset for such domain. Then, we compared the results obtained by two different systems, one including a Support Vector Machine and one with BERT. For the first one, we linguistic pre-processed the dataset to extract hand-crafted features exploited by the classifier. For the second one, we oversampled the dataset to achieve better results. Our results show that the SVM-based system, without the worry of having to oversample, has better performance than the BERT-based one, achieving an F1-score of 91.21\%},
KEYWORDS = {natural language processing, sentiment analysis},
URL = {https://iris.cnr.it/handle/20.500.14243/401373},
CONFERENCE_NAME = {Seventh Italian Conference on Computational Linguistics (CLiC-it 2020)},
}
@INPROCEEDINGS{BELLANDI_2020_INPROCEEDINGS_BG_411285,
AUTHOR = {Bellandi, A. and Giovannetti, E.},
TITLE = {Involving Lexicographers in the LLOD Cloud with LexO, an Easy-to-use Editor of Lemon Lexical Resources},
YEAR = {2020},
ABSTRACT = {In this contribution, we show LexO, a user-friendly web collaborative editor of lexical resources based on the lemon model. LexO has been developed in the context of Digital Humanities projects, in which a key point in the design of an editor was the ease of use by lexicographers with no skill in Linked Data or Semantic Web technologies. Though the tool already allows creating a lemon lexicon from scratch and lets a team of users work on it collaboratively, many developments are possible. The involvement of the LLOD community appears now crucial both to find new users and application fields where to test it, and, even more importantly, to understand in which way it should evolve},
KEYWORDS = {lexO, lexical resources editor, semantic web, llod},
PAGES = {70-74},
URL = {https://www.aclweb.org/anthology/2020.ldl-1.10.pdf},
PUBLISHER = {European Language Resources Association ELRA (Paris, FRA)},
ISBN = {979-10-95546-36-8},
CONFERENCE_NAME = {7th Workshop on Linked Data in Linguistics (LDL-2020)},
CONFERENCE_PLACE = {Paris},
BOOKTITLE = {Proceedings of the 7th Workshop on Linked Data in Linguistics (LDL-2020)},
EDITOR = {Ionov, M. and McCrae, J. P. and Chiarcos, C. and Declerck, T. and Bosque Gil, J. and Gracia, J.},
}
@INPROCEEDINGS{BOSCHETTI_2020_INPROCEEDINGS_BDMBMR_443457,
AUTHOR = {Boschetti, F. and Del Gratta, R. and Monachini, M. and Buzzoni, M. and Monella, P. and Rosselli Del Turco, R.},
TITLE = {"Tea for two": the Archive of the Italian Latinity of the Middle Ages meets the CLARIN infrastructure},
YEAR = {2020},
ABSTRACT = {This paper presents the Archive of the Italian Latinity of the Middle Ages (ALIM) and focuses, particularly, on its structure and metadata for its integration into the ILC4CLARIN repository. Access to this archive of Latin texts produced in Italy during the Middle Ages is of great importance in providing CLARIN-IT and the CLARIN community, at large, with critically reliable texts for the use of philologists, historians of literature, historians of institutions, culture and science of the Middle Ages},
KEYWORDS = {Latin resources, CLARIN, corpus, repository},
PAGES = {121-125},
URL = {https://office.clarin.eu/v/CE-2020-1738-CLARIN2020_ConferenceProceedings.pdf},
ISSN = {2773-2177},
CONFERENCE_NAME = {CLARIN Annual Conference 2020},
BOOKTITLE = {CLARIN Annual Conference 2020},
}
@INPROCEEDINGS{BROEDER_2020_INPROCEEDINGS_BEM_420395,
AUTHOR = {Broeder, D. and Eskevich, M. and Monachini, M.},
TITLE = {LR4SSHOC: The Future of Language Resources in the Context of the Social Sciences and Humanities Open Cloud},
YEAR = {2020},
ABSTRACT = {This paper outlines the future of language resources and identifies their potential contribution for creating and sustaining the social sciences and humanities (SSH) component of the European Open Science Cloud (EOSC)},
KEYWORDS = {EOSC, Social Science and Humanities Open Cloud},
PAGES = {33-36},
URL = {https://aclanthology.org/2020.lr4sshoc-1.6},
ISBN = {979-10-95546-43-6},
CONFERENCE_NAME = {LREC},
BOOKTITLE = {Proceedings of the Workshop about Language Resources for the SSH Cloud},
EDITOR = {Broeder, D. and Eskevich, M. and Monachini, M.},
}
@INPROCEEDINGS{BRUNATO_2020_INPROCEEDINGS_BCDMVZ_423611,
AUTHOR = {Brunato, D. and Chesi, C. and Dell'Orletta, F. and Montemagni, S. and Venturi, G. and Zamparelli, R.},
TITLE = {AcCompl-it @ EVALITA2020: Overview of the acceptability \& complexity evaluation task for Italian},
YEAR = {2020},
ABSTRACT = {The Acceptability and Complexity evaluation task for Italian (AcCompl-it) was aimed at developing and evaluating methods to classify Italian sentences according to Acceptability and Complexity. It consists of two independent tasks asking participants to predict either the acceptability or the complexity rate (or both) of a given set of sentences previously scored by native speakers on a 1-to-7 points Likert scale. In this paper, we introduce the datasets distributed to the participants, we describe the different approaches of the participating systems and provide a first analysis of the obtained results},
KEYWORDS = {Shared Task, Linguistic Complexity, Acceptability},
PAGES = {1-8},
URL = {http://ceur-ws.org/Vol-2765/paper163.pdf},
VOLUME = {2765},
CONFERENCE_NAME = {EVALITA '20, Evaluation of NLP and Speech Tools for Italian},
}
@INPROCEEDINGS{BRUNATO_2020_INPROCEEDINGS_BCDMV_384930,
  AUTHOR           = {Brunato, D. and Cimino, A. and Dell'Orletta, F. and Montemagni, S. and Venturi, G.},
  TITLE            = {Profiling-UD: a Tool for Linguistic Profiling of Texts},
  YEAR             = {2020},
  ABSTRACT         = {In this paper, we introduce Profiling-UD, a new text analysis tool inspired to the principles of linguistic profiling that can support language variation research from different perspectives. It allows the extraction of more than 130 features, spanning across different levels of linguistic description. Beyond the large number of features that can be monitored, a main novelty of Profiling-UD is that it has been specifically devised to be multilingual since it is based on the Universal Dependencies framework. In the second part of the paper, we demonstrate the effectiveness of these features in a number of theoretical and applicative studies in which they were successfully used for text and author profiling},
  KEYWORDS         = {Computational Language Variation Analysis, Linguistic Profiling, Universal Dependencies},
  PAGES            = {7145-7151},
  URL              = {http://www.lrec-conf.org/proceedings/lrec2020/pdf/2020.lrec-1.883.pdf},
  PUBLISHER        = {European Language Resources Association ELRA (Paris, FRA)},
  ISBN             = {979-10-95546-34-4},
  CONFERENCE_NAME  = {Conference on Language Resources and Evaluation (LREC)},
  CONFERENCE_PLACE = {Paris},
  BOOKTITLE        = {Proceedings of the 12th Language Resources and Evaluation Conference-LREC 2020},
}
@INPROCEEDINGS{CALAMAI_2020_INPROCEEDINGS_CPMSBB_446743,
AUTHOR = {Calamai, S. and Pretto, N. and Monachini, M. and Stamuli, M. F. and Bianchi, S. and Bonazzoli, P.},
TITLE = {Building a Home for Italian Audio Archives},
YEAR = {2020},
ABSTRACT = {Audio and audiovisual archives are at the crossroads of different fields of knowledge, yet they require common solutions for both their long-term preservation and their description, availability, use and reuse. Archivio Vi.Vo. is an Italian project financed by the Tuscany Region, aiming to (i) explore methods for long-term preservation and secure access to oral sources and (ii) develop an infrastructure under the CLARIN-IT umbrella offering several services for scholars from different domains interested in oral sources. This paper describes the project's infrastructure and its methodology through a case study on the Caterina Bueno's audio archive},
KEYWORDS = {oral archives, infrastructures},
PAGES = {112-116},
URL = {https://iris.cnr.it/handle/20.500.14243/446743},
ISSN = {2773-2177},
CONFERENCE_NAME = {CLARIN Annual Conference 2020},
BOOKTITLE = {CLARIN2020 Annual Conference Proceedings},
}
@INPROCEEDINGS{CIMINO_2020_INPROCEEDINGS_CDN_400929,
AUTHOR = {Cimino, A. and Dell'Orletta, F. and Nissim, M.},
TITLE = {TAG-it@EVALITA2020: Overview of the Topic, Age, and Gender prediction task for Italian},
YEAR = {2020},
ABSTRACT = {The Topic, Age, and Gender (TAG-it) prediction task in Italian was organised in the context of EVALITA 2020, using forum posts as textual evidence for profiling their authors. The task was articulated in two separate subtasks: one where all three dimensions (topic, gender, age) were to be predicted at once; the other where training and test sets were drawn from different forum topics and gender or age had to be predicted separately. Teams tackled the problems both with classical machine learning methods as well as neural models. Using the training-data to fine-tuning a BERT-based monolingual model for Italian proved eventually as the most successful strategy in both subtasks. We observe that topic and gender are easier to predict than age. The higher results for gender obtained in this shared task with respect to a comparable challenge at EVALITA 2018 might be due to the larger evidence per author provided at this edition, as well as to the availability of pre-trained large models for fine-tuning, which have shown improvement on very many NLP tasks},
KEYWORDS = {natural language processing, linguistic profiling},
URL = {https://iris.cnr.it/handle/20.500.14243/400929},
CONFERENCE_NAME = {Seventh Evaluation Campaign of Natural Language Processing and Speech Tools for Italian (EVALITA)},
}
@INPROCEEDINGS{DEMATTEI_2020_INPROCEEDINGS_DCDN_401393,
AUTHOR = {De Mattei, L. and Cafagna, M. and Dell'Orletta, F. and Nissim, M.},
TITLE = {Invisible to People but not to Machines: Evaluation of Style-aware Headline Generation in Absence of Reliable Human Judgment},
YEAR = {2020},
ABSTRACT = {We automatically generate headlines that are expected to comply with the specific styles of two different Italian newspapers. Through a data alignment strategy and different training/testing settings, we aim at decoupling content from style and preserve the latter in generation. In order to evaluate the generated headlines' quality in terms of their specific newspaper-compliance, we devise a fine-grained evaluation strategy based on automatic classification. We observe that our models do indeed learn newspaper-specific style. Importantly, we also observe that humans aren't reliable judges for this task, since although familiar with the newspapers, they are not able to discern their specific styles even in the original human-written headlines. The utility of automatic evaluation goes therefore beyond saving the costs and hurdles of manual annotation, and deserves particular care in its design},
KEYWORDS = {Natural Language Generation, Stylistic variations, Evaluation},
URL = {http://www.lrec-conf.org/proceedings/lrec2020/pdf/2020.lrec-1.828.pdf},
CONFERENCE_NAME = {12th Edition of International Conference on Language Resources and Evaluation (LREC 2020)},
}
@INPROCEEDINGS{DEMATTEI_2020_INPROCEEDINGS_DCDNG_400923,
AUTHOR = {De Mattei, L. and Cafagna, M. and Dell'Orletta, F. and Nissim, M. and Gatt, A.},
TITLE = {CHANGE-IT@EVALITA 2020: Change Headlines, Adapt News, GEnerate},
YEAR = {2020},
ABSTRACT = {We propose a generation task for Italian—more specifically, a style transfer task for headlines of Italian newspapers. This is the first shared task on generation included in the EVALITA evaluation framework. Indeed, one of the reasons to have this task is to stimulate more research on generation within the Italian community. With this aim in mind, we release to the participating teams not only training data, but also a baseline sequence to sequence model that performs the task in order to help everyone get started, even when not accustomed to Natural Language Generation (NLG) approaches. Contextually, we explore the complex issue of automatic evaluation of generated text, which is receiving particular attention in the NLG community},
KEYWORDS = {Natural Language Generation, Style transfer},
URL = {https://iris.cnr.it/handle/20.500.14243/400923},
CONFERENCE_NAME = {Seventh Evaluation Campaign of Natural Language Processing and Speech Tools for Italian (EVALITA)},
}
@INPROCEEDINGS{DEMATTEI_2020_INPROCEEDINGS_DCDNG_401384,
AUTHOR = {De Mattei, L. and Cafagna, M. and Dell'Orletta, F. and Nissim, M. and Guerini, M.},
TITLE = {GePpeTto Carves Italian into a Language Model},
YEAR = {2020},
ABSTRACT = {In the last few years, pre-trained neural architectures have provided impressive improvements across several NLP tasks. Still, generative language models are available mainly for English. We develop GePpeTto, the first generative language model for Italian, built using the GPT-2 architecture. We provide a thorough analysis of GePpeTto's quality by means of both an automatic and a human-based evaluation. The automatic assessment consists in (i) calculating perplexity across different genres and (ii) a profiling analysis over GePpeTto's writing characteristics. We find that GePpeTto's production is a sort of bonsai version of human production, with shorter but yet complex sentences. Human evaluation is performed over a sentence completion task, where GePpeTto's output is judged as natural more often than not, and much closer to the original human texts than to a simpler language model which we take as baseline},
KEYWORDS = {natural language generation},
URL = {https://iris.cnr.it/handle/20.500.14243/401384},
CONFERENCE_NAME = {Seventh Italian Conference on Computational Linguistics (CLiC-it 2020)},
}
@INPROCEEDINGS{DEMATTEI_2020_INPROCEEDINGS_DCLDNG_400921,
AUTHOR = {De Mattei, L. and Cafagna, M. and Lai, H. and Dell'Orletta, F. and Nissim, M. and Gatt, A.},
TITLE = {On the interaction of automatic evaluation and task framing in headline style transfer},
YEAR = {2020},
ABSTRACT = {An ongoing debate in the NLG community concerns the best way to evaluate systems, with human evaluation often being considered the most reliable method, compared to corpus-based metrics. However, tasks involving subtle textual differences, such as style transfer, tend to be hard for humans to perform. In this paper, we propose an evaluation method for this task based on purposely-trained classifiers, showing that it better reflects system differences than traditional metrics such as BLEU and ROUGE},
URL = {https://iris.cnr.it/handle/20.500.14243/400921},
}
@INPROCEEDINGS{DEMATTEI_2020_INPROCEEDINGS_DDIMPR_421769,
AUTHOR = {De Mattei, L. and De Martino, G. and Iovine, A. and Miaschi, A. and Polignano, M. and Rambelli, G.},
TITLE = {ATE\_ABSITA @ EVALITA2020: Overview of the Aspect Term Extraction and Aspect-based Sentiment Analysis Task},
YEAR = {2020},
ABSTRACT = {Over the last years, the rise of novel sentiment analysis techniques to assess aspect-based opinions on product reviews has become a key component for providing valuable insights to both consumers and businesses. To this extent, we propose ATE\_ABSITA: the EVALITA 2020 shared task on Aspect Term Extraction and Aspect-Based Sentiment Analysis. In particular, we approach the task as a cascade of three subtasks: Aspect Term Extraction (ATE), Aspect-based Sentiment Analysis (ABSA) and Sentiment Analysis (SA). Therefore, we invited participants to submit systems designed to automatically identify the "aspect terms" in each review and to predict the sentiment expressed for each aspect, along with the sentiment of the entire review. The task received broad interest, with 27 teams registered and more than 45 participants. However, only three teams submitted their working systems. The results obtained underline the task's difficulty, but they also show how it is possible to deal with it using innovative approaches and models. Indeed, two of them are based on large pre-trained language models as typical in the current state of the art for the English language},
KEYWORDS = {nlp, sentiment analysis, shared task},
URL = {http://ceur-ws.org/Vol-2765/paper153.pdf},
CONFERENCE_NAME = {Seventh Evaluation Campaign of Natural Language Processing and Speech Tools for Italian (EVALITA)},
BOOKTITLE = {Proceedings of the Seventh Evaluation Campaign of Natural Language Processing and Speech Tools for Italian (EVALITA)},
}
@INPROCEEDINGS{DELGRATTA_2020_INPROCEEDINGS_DBBS_443439,
  AUTHOR          = {Del Gratta, R. and Boschetti, F. and Bambaci, L. and Sarnari, F.},
  TITLE           = {Approaching document analysis with a formal model},
  YEAR            = {2020},
  ABSTRACT        = {We introduce a formal approach to document and text analysis. The method proposed herein results in a mathematical and physical model/framework which can formalize different challenges in research fields such as computational linguistics, digital philology, and software engineering, principally if applied to document and text analysis. We examine texts and documents from an evolutionary perspective, where both corruption and correction are involved. We describe document evolution via fiber bundles formalism},
  KEYWORDS        = {Formal model, document analysis, evolutionary approach},
  PAGES           = {208-214},
  URL             = {https://ieeexplore.ieee.org/stamp/stamp.jsp?tp=\&arnumber=9357202\&tag=1},
  DOI             = {10.1109/CIST49399.2021.9357202},
  CONFERENCE_NAME = {6th International IEEE Colloquium on Information Science and Technology},
  BOOKTITLE       = {6th International IEEE Colloquium on Information Science and Technology},
}
@INPROCEEDINGS{DELGROSSO_2020_INPROCEEDINGS_DGM_411284,
  AUTHOR          = {Del Grosso, A. M. and Giovannetti, E. and Marchi, S.},
  TITLE           = {Enriching a Multilingual Terminology Exploiting Parallel Texts: An Experiment on the Italian Translation of the Babylonian Talmud},
  YEAR            = {2020},
  ABSTRACT        = {Parallel texts can represent an extremely useful source of information in a number of text and linguistic processing tasks. In this work we show an experiment conducted on the Italian translation of the Babylonian Talmud, a text we have analyzed and processed to support in the construction of a multilingual Hebrew/Aramaic/Italian terminological resource. The approach we adopted comprised: i) the TEI encoding of the text, ii) the automatic extraction of the Italian terms, iii) the addition of Hebrew/Aramaic terms via word-by-word alignment, iv) the revision of the obtained results},
  KEYWORDS        = {multilingual terminology, parallel text, text alignment, babylonian talmud},
  PAGES           = {119-124},
  URL             = {http://amsacta.unibo.it/6316/1/AIUCD_2020_volume_FINAL.pdf},
  DOI             = {10.6092/unibo/amsacta/6316},
  ISBN            = {978-88-942535-4-2},
  CONFERENCE_NAME = {IX Convegno Annuale AIUCD},
  BOOKTITLE       = {Atti del IX Convegno Annuale AIUCD. La svolta inevitabile: sfide e prospettive per l'Informatica Umanistica},
}
@INPROCEEDINGS{DIDONATO_2020_INPROCEEDINGS_DMEPMD_404326,
  AUTHOR           = {Di Donato, F. and Monachini, M. and Eskevich, M. and Pohle, S. and Moranville, Y. and Dumouchel, S.},
  TITLE            = {Social Sciences and Humanities Pathway. Towards the European Open Science Cloud},
  YEAR             = {2020},
  ABSTRACT         = {The paper describes a journey which starts from various social sciences and humanities (SSH) Research Infrastructures (RI) in Europe and arrives at the comprehensive "ecosystem of infrastructures", namely the European Open Science Cloud (EOSC). We highlight how the SSH Open Science infrastructures contribute to the goal of establishing the EOSC. First, through the example of OPERAS, the European Research Infrastructure for Open Scholarly Communication in the SSH, to see how its services are conceived to be part of the EOSC and to address the communities' needs. The next two sections highlight collaboration practices between partners in Europe to build the SSH component of the EOSC and a SSH discovery platform, as a service of OPERAS and the EOSC. The last two sections focus on an implementation network dedicated to SSH data fairification},
  KEYWORDS         = {EOSC, Open science, SSH, Infrastructures},
  PAGES            = {5-9},
  URL              = {https://www.aclweb.org/anthology/2020.lr4sshoc-1.2.pdf},
  PUBLISHER        = {European Language Resources Association ELRA (Paris, FRA)},
  ISBN             = {979-10-95546-43-6},
  CONFERENCE_NAME  = {Language Resources and Evaluation Conference (LREC 2020)},
  CONFERENCE_PLACE = {Paris},
  BOOKTITLE        = {Proceedings of the Workshop about Language Resources for the SSH Cloud},
  EDITOR           = {Broeder, D. and Eskevich, M. and Monachini, M.},
}
@INPROCEEDINGS{DUVAL_2020_INPROCEEDINGS_DG_424499,
  AUTHOR   = {Duval, F. and Guadagnini, E.},
  TITLE    = {La rappresentazione lessicale del teatro antico nel Medioevo francese e italiano: per una lessicologia storica tra "transferts culturels" e comparatismo},
  YEAR     = {2020},
  ABSTRACT = {Studio della ricezione italiana e francese medievale del lessico e dei concetti del teatro classico},
  URL      = {https://iris.cnr.it/handle/20.500.14243/424499},
  ISBN     = {9782503587714},
}
@INPROCEEDINGS{FAVARO_2020_INPROCEEDINGS_FBM_533916,
AUTHOR = {Favaro, M. and Biffi, M. and Montemagni, S.},
TITLE = {Risorse linguistiche di varietà storiche di italiano: Il progetto TrAVaSI},
YEAR = {2020},
ABSTRACT = {Questo contributo si propone di presentare il progetto TrAVaSI (Trattamento Automatico di Varietà Storiche di Italiano), il cui obiettivo è la creazione di risorse per il trattamento automatico di varietà storiche della lingua italiana, in particolare lessici diacronici e corpora arricchiti con annotazione linguistica da utilizzare per lo sviluppo e/o la specializzazione di strumenti di annotazione. Il contributo illustra gli obiettivi, i primi risultati conseguiti e le prospettive di sviluppo},
KEYWORDS = {Language Resources, Historical Varieties of Italian, Linguistic Annotation},
PAGES = {178-186},
URL = {https://doi.org/10.4000/books.aaccademia.8515},
DOI = {10.4000/books.aaccademia.8515},
PUBLISHER = {Accademia University Press (Torino, ITA)},
ISBN = {979-12-80136-33-6},
CONFERENCE_NAME = {CLiC-it 2020-Italian Conference on Computational Linguistics},
CONFERENCE_PLACE = {Torino},
BOOKTITLE = {Proceedings of the Seventh Italian Conference on Computational Linguistics},
EDITOR = {Monti, J. and Dell'Orletta, F. and Tamburini, F.},
}
@INPROCEEDINGS{FERRO_2020_INPROCEEDINGS_FGC_423948,
  AUTHOR           = {Ferro, M. and Giulivi, S. and Cappa, C.},
  TITLE            = {The AEREST reading database},
  YEAR             = {2020},
  ABSTRACT         = {Aerest is a reading assessment protocol for the concurrent evaluation of a child's decoding and comprehension skills. Reading data complying with the Aerest protocol were automatically collected and structured with the ReadLet web-based platform in a pilot study, to form the Aerest Reading Database. The content, structure and potential of the database are described here, together with the main directions of current and future developments},
  KEYWORDS         = {reading database, reading efficiency, decoding, comprehension, multimodal analysis},
  PAGES            = {1-6},
  URL              = {http://www.scopus.com/record/display.url?eid=2-s2.0-85097912116\&origin=inward},
  VOLUME           = {2769},
  PUBLISHER        = {Accademia University Press (Torino, ITA)},
  ISBN             = {9791280136282},
  CONFERENCE_NAME  = {7th Italian Conference on Computational Linguistics (CLIC-IT'20)},
  CONFERENCE_PLACE = {Torino},
}
@INPROCEEDINGS{IAVARONE_2020_INPROCEEDINGS_ID_400968,
  AUTHOR          = {Iavarone, B. and Dell'Orletta, F.},
  TITLE           = {Predicting movie-elicited emotions from dialogue in screenplay text: A study on "Forrest Gump"},
  YEAR            = {2020},
  ABSTRACT        = {We present a new dataset of sentences extracted from the movie Forrest Gump, annotated with the emotions perceived by a group of subjects while watching the movie. We run experiments to predict these emotions using two classifiers, one based on a Support Vector Machine with linguistic and lexical features, the other based on BERT. The experiments showed that contextual embeddings are effective in predicting human-perceived emotions},
  KEYWORDS        = {natural language processing, affective computing},
  URL             = {https://iris.cnr.it/handle/20.500.14243/400968},
  CONFERENCE_NAME = {Seventh Italian Conference on Computational Linguistics (CLiC-it 2020)},
}
@INPROCEEDINGS{KHAN_2020_INPROCEEDINGS_K_407585,
  AUTHOR   = {Khan, F.},
  TITLE    = {Representing Temporal Information in Lexical Linked Data Resources},
  YEAR     = {2020},
  ABSTRACT = {The increasing recognition of the utility of Linked Data as a means of publishing lexical resources has helped to underline the need for RDF-based data models with the flexibility and expressivity to be able to represent the most salient kinds of information contained in such resources as structured data; this includes, notably, information relating to time and the temporal dimension. In this article we describe a perdurantist approach to modelling diachronic lexical information which builds upon work which we have previously presented and which is based on the ontolex-lemon vocabulary. We present two extended examples, one taken from the Oxford English Dictionary, the other from a work on etymology, to show how our approach can handle different kinds of temporal information often found in lexical resources},
  URL      = {https://iris.cnr.it/handle/20.500.14243/407585},
  ISBN     = {979-10-95546-36-8},
}
@INPROCEEDINGS{KHAN_2020_INPROCEEDINGS_KRSBKT_404921,
AUTHOR = {Khan, F. and Romary, L. and Salgado, A. and Bowers, J. and Khemakhem, M. and Tasovac, T.},
TITLE = {Modelling Etymology in LMF/TEI: The Grande Dicionário Houaiss da Língua Portuguesa Dictionary as a Use Case},
YEAR = {2020},
ABSTRACT = {In this article, we will introduce two of the new parts of the new multi-part version of the Lexical Markup Framework (LMF) ISO standard, namely Part 3 of the standard (ISO 24613-3), which deals with etymological and diachronic data, and Part 4 (ISO 24613-4), which consists of a TEI serialisation of all of the prior parts of the model. We will demonstrate the use of both standards by describing the LMF encoding of a small number of examples taken from a sample conversion of the reference Portuguese dictionary Grande Dicionário Houaiss da Língua Portuguesa, part of a broader experiment comprising the analysis of different, heterogeneously encoded, Portuguese lexical resources. We present the examples in the Unified Modelling Language (UML) and also in a couple of cases in TEI},
URL = {https://iris.cnr.it/handle/20.500.14243/404921},
ISBN = {979-10-95546-36-8},
}
@INPROCEEDINGS{LENCI_2020_INPROCEEDINGS_LMBDDDDMCPVL_384922,
AUTHOR = {Lenci, A. and Montemagni, S. and Boschetti, F. and De Felice, I. and Dei Rossi, S. and Dell'Orletta, F. and Di Giorgio, M. and Miliani, M. and Passaro, L. C. and Puddu, A. and Venturi, G. and Labanca, N.},
TITLE = {Voices of the Great War: A Richly Annotated Corpus of Italian Texts on the First World War},
YEAR = {2020},
ABSTRACT = {Voci della Grande Guerra ("Voices of the Great War") is the first large corpus of Italian historical texts dating back to the period of First World War. This corpus differs from other existing resources in several respects. First, from the linguistic point of view it gives account of the wide range of varieties in which Italian was articulated in that period, namely from a diastratic (educated vs. uneducated writers), diaphasic (low/informal vs. high/formal registers) and diatopic (regional varieties, dialects) points of view. From the historical perspective, through a collection of texts belonging to different genres it represents different views on the war and the various styles of narrating war events and experiences. The final corpus is balanced along various dimensions, corresponding to the textual genre, the language variety used, the author type and the typology of conveyed contents. The corpus is annotated with lemmas, part-of-speech, terminology, and named entities. Significant corpus samples representative of the different "voices" have also been enriched with meta-linguistic and syntactic information. The layer of syntactic annotation forms the first nucleus of an Italian historical treebank complying with the Universal Dependencies standard. The paper illustrates the final resource, the methodology and tools used to build it, and the Web Interface for navigating it},
KEYWORDS = {Historical Corpora, Linguistic and Meta-linguistic Annotation, Information Extraction},
PAGES = {911-918},
URL = {https://www.aclweb.org/anthology/2020.lrec-1.114.pdf},
PUBLISHER = {European Language Resources Association ELRA (Paris, FRA)},
ISBN = {979-10-95546-34-4},
CONFERENCE_NAME = {Conference on Language Resources and Evaluation (LREC)},
CONFERENCE_PLACE = {Paris},
}
@INPROCEEDINGS{MARZI_2020_INPROCEEDINGS_MRNTP_382398,
AUTHOR = {Marzi, C. and Rodella, A. and Nadalini, A. and Taxitari, L. and Pirrelli, V.},
TITLE = {Does finger-tracking point to child reading strategies?},
YEAR = {2020},
ABSTRACT = {The movement of a child's index finger that points to a printed text while (s)he is reading may provide a proxy for the child's eye movements and attention focus. We validated this correlation by showing a quantitative analysis of patterns of "finger-tracking" of Italian early graders engaged in reading a text displayed on a tablet. A web application interfaced with the tablet monitors the reading behaviour by modelling the way the child points to the text while reading. The analysis found significant developmental trends in reading strategies, marking an interesting contrast between typically developing and atypically developing readers},
KEYWORDS = {reading assessment, reading strategies, mobile technology, special education needs},
PAGES = {1-7},
URL = {http://ceur-ws.org/Vol-2769/paper_60.pdf},
VOLUME = {2769},
PUBLISHER = {CEUR-WS.org (Aachen, DEU)},
CONFERENCE_NAME = {Italian Conference on Computational Linguistics 2020},
CONFERENCE_PLACE = {Aachen},
BOOKTITLE = {Proceedings of the Seventh Italian Conference on Computational Linguistics},
}
@INPROCEEDINGS{MATTEI_2020_INPROCEEDINGS_MBD_400967,
AUTHOR = {Mattei, A. and Brunato, D. and Dell'Orletta, F.},
TITLE = {The Style of a Successful Story: a Computational Study on the Fanfiction Genre},
YEAR = {2020},
ABSTRACT = {This paper presents a new corpus for the Italian language representative of the fan-fiction genre. It comprises about 55k user-generated stories inspired to the original fantasy saga "Harry Potter" and published on a popular website. The corpus is large enough to support data-driven investigations in many directions, from more traditional studies on language variation aimed at characterizing this genre with respect to more traditional ones, to emerging topics in computational social science such as the identification of factors involved in the success of a story. The latter is the focus of the presented case-study, in which a wide set of multi-level linguistic features has been automatically extracted from a subset of the corpus and analysed in order to detect the ones which significantly discriminate successful from unsuccessful stories},
KEYWORDS = {natural language processing, Computational Sociolinguistics, stylistic analysis},
URL = {https://iris.cnr.it/handle/20.500.14243/400967},
CONFERENCE_NAME = {Seventh Italian Conference on Computational Linguistics (CLiC-it 2020)},
}
@INPROCEEDINGS{MIASCHI_2020_INPROCEEDINGS_MABDV_421767,
AUTHOR = {Miaschi, A. and Alzetta, C. and Brunato, D. P. and Dell'Orletta, F. and Venturi, G.},
TITLE = {Is Neural Language Model Perplexity Related to Readability?},
YEAR = {2020},
ABSTRACT = {This paper explores the relationship between Neural Language Model (NLM) perplexity and sentence readability. Starting from the evidence that NLMs implicitly acquire sophisticated linguistic knowledge from a huge amount of training data, our goal is to investigate whether perplexity is affected by linguistic features used to automatically assess sentence readability and if there is a correlation between the two metrics. Our findings suggest that this correlation is actually quite weak and the two metrics are affected by different linguistic phenomena},
KEYWORDS = {nlp, neural language models, readability},
URL = {http://ceur-ws.org/Vol-2769/paper_57.pdf},
ISBN = {979-12-80136-28-2},
CONFERENCE_NAME = {Seventh Italian Conference on Computational Linguistics},
BOOKTITLE = {Proceedings of the Seventh Italian Conference on Computational Linguistics},
}
@INPROCEEDINGS{MIASCHI_2020_INPROCEEDINGS_MBDV_379646,
AUTHOR = {Miaschi, A. and Brunato, D. and Dell'Orletta, F. and Venturi, G.},
TITLE = {Linguistic Profiling of a Neural Language Model},
YEAR = {2020},
ABSTRACT = {In this paper we investigate the linguistic knowledge learned by a Neural Language Model (NLM) before and after a fine-tuning process and how this knowledge affects its predictions during several classification problems. We use a wide set of probing tasks, each of which corresponds to a distinct sentence-level feature extracted from different levels of linguistic annotation. We show that BERT is able to encode a wide range of linguistic characteristics, but it tends to lose this information when trained on specific downstream tasks. We also find that BERT's capacity to encode different kind of linguistic properties has a positive influence on its predictions: the more it stores readable linguistic information of a sentence, the higher will be its capacity of predicting the expected label assigned to that sentence},
KEYWORDS = {Linguistic Profiling, Neural Language Model, Interpretability},
PAGES = {745-756},
URL = {https://www.aclweb.org/anthology/2020.coling-main.65/},
DOI = {10.18653/v1/2020.coling-main.65},
ISBN = {978-1-952148-27-9},
CONFERENCE_NAME = {International Conference on Computational Linguistics (COLING)},
BOOKTITLE = {International Conference on Computational Linguistics (COLING)},
}
@INPROCEEDINGS{MIASCHI_2020_INPROCEEDINGS_MDBDSSV_384933,
AUTHOR = {Miaschi, A. and Davidson, S. and Brunato, D. P. and Dell'Orletta, F. and Sagae, K. and Sanchez Gutierrez, C. H. and Venturi, G.},
TITLE = {Tracking the Evolution of Written Language Competence in L2 Spanish Learners},
YEAR = {2020},
ABSTRACT = {In this paper we present an NLP-based approach for tracking the evolution of written language competence in L2 Spanish learners using a wide range of linguistic features automatically extracted from students' written productions. Beyond reporting classification results for different scenarios, we explore the connection between the most predictive features and the teaching curriculum, finding that our set of linguistic features often reflects the explicit instruction that students receive during each course},
KEYWORDS = {Evolution of Language Competence, Natural Language Processing, Linguistic Profiling},
PAGES = {92-101},
URL = {https://www.aclweb.org/anthology/2020.bea-1.9.pdf},
DOI = {10.18653/v1/2020.bea-1.9},
PUBLISHER = {Association for Computational Linguistics (Stroudsburg, USA)},
ISBN = {978-1-941643-83-9},
CONFERENCE_NAME = {15th Workshop on Innovative Use of NLP for Building Educational Applications},
CONFERENCE_PLACE = {Stroudsburg},
BOOKTITLE = {Proceedings of 15th Workshop on Innovative Use of NLP for Building Educational Applications},
}
@INPROCEEDINGS{MIASCHI_2020_INPROCEEDINGS_MD_421763,
AUTHOR = {Miaschi, A. and Dell'Orletta, F.},
TITLE = {Contextual and Non-Contextual Word Embeddings: an in-depth Linguistic Investigation},
YEAR = {2020},
ABSTRACT = {In this paper we present a comparison between the linguistic knowledge encoded in the internal representations of a contextual Language Model (BERT) and a contextual-independent one (Word2vec). We use a wide set of probing tasks, each of which corresponds to a distinct sentence-level feature extracted from different levels of linguistic annotation. We show that, although BERT is capable of understanding the full context of each word in an input sequence, the implicit knowledge encoded in its aggregated sentence representations is still comparable to that of a contextual-independent model. We also find that BERT is able to encode sentence-level properties even within single-word embeddings, obtaining comparable or even superior results than those obtained with sentence representations},
KEYWORDS = {nlp, interpretability, representation learning},
PAGES = {110-119},
URL = {https://www.aclweb.org/anthology/2020.repl4nlp-1.15},
DOI = {10.18653/v1/2020.repl4nlp-1.15},
ISBN = {978-1-952148-15-6},
CONFERENCE_NAME = {5th Workshop on Representation Learning for NLP},
BOOKTITLE = {Proceedings of the 5th Workshop on Representation Learning for NLP},
}
@INPROCEEDINGS{MIASCHI_2020_INPROCEEDINGS_MSBDV_421765,
AUTHOR = {Miaschi, A. and Sarti, G. and Brunato, D. P. and Dell'Orletta, F. and Venturi, G.},
TITLE = {Italian Transformers Under the Linguistic Lens},
YEAR = {2020},
ABSTRACT = {In this paper we present an in-depth investigation of the linguistic knowledge encoded by the transformer models currently available for the Italian language. In particular, we investigate whether and how using different architectures of probing models affects the performance of Italian transformers in encoding a wide spectrum of linguistic features. Moreover, we explore how this implicit knowledge varies according to different textual genres},
KEYWORDS = {nlp, neural language models, interpretability},
URL = {http://ceur-ws.org/Vol-2769/paper_56.pdf},
ISBN = {979-12-80136-28-2},
CONFERENCE_NAME = {Seventh Italian Conference on Computational Linguistics (CLiC-it)},
BOOKTITLE = {Proceedings of the Seventh Italian Conference on Computational Linguistics (CLiC-it)},
}
@INPROCEEDINGS{MONTEMAGNI_2020_INPROCEEDINGS_M_426632,
AUTHOR = {Montemagni, S.},
TITLE = {Strategie linguistiche della divulgazione scientifica: una prospettiva linguistico-computazionale},
YEAR = {2020},
ABSTRACT = {La ricostruzione delle strategie linguistiche della divulgazione scientifica viene affrontata in questo studio a partire dall'analisi di corpora condotta con l'ausilio di metodi e tecniche di Trattamento Automatico della Lingua (TAL). Dall'analisi contrastiva di corpora arricchiti con annotazione linguistica e selezionati come rappresentativi di diverse varietà d'uso della lingua della comunicazione scientifica emerge che la lingua della divulgazione presenta marcate tendenze lessicali, morfo-sintattiche e sintattiche che la contraddistinguono rispetto ad altre varietà della lingua della scienza rappresentate dalla manualistica e dalla letteratura specialistica. Differenze significative risultano anche dal confronto tra varietà della lingua della divulgazione scientifica, relative a domini diversi (astronomia vs linguistica). In particolare, i risultati raggiunti dimostrano che le strategie linguistiche della divulgazione scientifica non sono circoscritte al versante lessicale e terminologico, ma coinvolgono anche la struttura morfo-sintattica e sintattica sottostante al testo con differenze significative anche tra domini diversi. Per quanto la lingua della divulgazione presenti i tratti peculiari della lingua della scienza in misura ridotta, è interessante rilevare che essa non è comunque assimilabile alla lingua comune rappresentata in questa sede dal linguaggio giornalistico e dalla narrativa},
KEYWORDS = {Trattamento Automatico della Lingua, Monitoraggio Linguistico, Lingua della Scienza, Divulgazione Scientifica},
PAGES = {79-104},
URL = {https://www.societadilinguisticaitaliana.net/wp-content/uploads/2020/06/eBookAtti_SLI_3_2020.pdf},
VOLUME = {3 NUOVA SERIE},
PUBLISHER = {Officinaventuno (Milano, ITA)},
ISBN = {978-88-97657-39-2},
CONFERENCE_NAME = {La linguistica della divulgazione, la divulgazione della linguistica-Atti del IV Convegno Interannuale SLI nuova serie},
CONFERENCE_PLACE = {Milano},
BOOKTITLE = {La linguistica della divulgazione, la divulgazione della linguistica},
EDITOR = {Grandi, N. and Masini, F.},
}
@INPROCEEDINGS{PICCINI_2020_INPROCEEDINGS_PBA_404488,
AUTHOR = {Piccini, S. and Bellandi, A. and Abrate, M.},
TITLE = {Diaterm: un modèle pour représenter l'évolution diachronique des terminologies dans le web sémantique},
YEAR = {2020},
ABSTRACT = {La présente contribution vise à illustrer Diaterm, un modèle à trois niveaux consacré à la représentation formelle de l'évolution diachronique des concepts et des termes dans un domaine donné. L'approche adoptée est basée sur la réification des relations N-aires. De surcroît, un ensemble de règles SWRL a été conçu permettant d'effectuer des tâches de raisonnement et d'automatiser l'attribution des informations temporelles. Diaterm a été adopté pour représenter formellement l'évolution diachronique de la terminologie de Saussure telle qu'elle émerge dans les oeuvres du Maître genevois},
URL = {https://iris.cnr.it/handle/20.500.14243/404488},
ISBN = {978-2-919732-80-7},
}
@INPROCEEDINGS{PROIETTI_2020_INPROCEEDINGS_PY_459221,
AUTHOR = {Proietti, C. and Yusteginel, A.},
TITLE = {Persuasive Argumentation and Epistemic Attitudes},
YEAR = {2020},
ABSTRACT = {This paper studies the relation between persuasive argumentation and the speaker's epistemic attitude. Dung-style abstract argumentation and dynamic epistemic logic provide the necessary tools to characterize the notion of persuasion. Within abstract argumentation, persuasive argumentation has been previously studied from a game-theoretic perspective. These approaches are blind to the fact that, in real-life situations, the epistemic attitude of the speaker determines which set of arguments will be disclosed by her in the context of a persuasive dialogue. This work is a first step to fill this gap. For this purpose we extend one of the logics of Schwarzentruber et al. with dynamic operators, designed to capture communicative phenomena. A complete axiomatization for the new logic via reduction axioms is provided. Within the new framework, a distinction between actual persuasion and persuasion from the speaker's perspective is made. Finally, we explore the relationship between the two notions},
URL = {https://iris.cnr.it/handle/20.500.14243/459221},
DOI = {10.1007/978-3-030-38808-9_7},
ISBN = {978-3-030-38807-2},
}
@INPROCEEDINGS{PROIETTI_2020_INPROCEEDINGS_PY_404079,
AUTHOR = {Proietti, C. and Yusteginel, A.},
TITLE = {Persuasive Argumentation and Epistemic Attitudes},
YEAR = {2020},
ABSTRACT = {This paper studies the relation between persuasive argumentation and the speaker's epistemic attitude. Dung-style abstract argumentation and dynamic epistemic logic provide the necessary tools to characterize the notion of persuasion. Within abstract argumentation, persuasive argumentation has been previously studied from a game-theoretic perspective. These approaches are blind to the fact that, in real-life situations, the epistemic attitude of the speaker determines which set of arguments will be disclosed by her in the context of a persuasive dialogue. This work is a first step to fill this gap. For this purpose we extend one of the logics of Schwarzentruber et al. with dynamic operators, designed to capture communicative phenomena. A complete axiomatization for the new logic via reduction axioms is provided. Within the new framework, a distinction between actual persuasion and persuasion from the speaker's perspective is made. Finally, we explore the relationship between the two notions},
KEYWORDS = {Argumentation frameworks, dynamic epistemic logic, persuasion, argument labellings},
PAGES = {104-123},
URL = {https://doi.org/10.1007/978-3-030-38808-9_7},
VOLUME = {12005},
DOI = {10.1007/978-3-030-38808-9_7},
PUBLISHER = {Springer},
ISBN = {978-3-030-38808-9},
CONFERENCE_NAME = {Second International Workshop, DaLí 2019},
BOOKTITLE = {Dynamic Logic. New Trends and Applications Second International Workshop, DaLí 2019, Porto, Portugal, October 7-11, 2019, Proceedings},
EDITOR = {Barbosa, L. S. and Baltag, A.},
}
@INPROCEEDINGS{RAVELLI_2020_INPROCEEDINGS_ROD_400965,
AUTHOR = {Ravelli, A. A. and Origlia, A. and Dell'Orletta, F.},
TITLE = {Exploring Attention in a Multimodal Corpus of Guided Tours},
YEAR = {2020},
ABSTRACT = {This paper explores the possibility to annotate engagement as an extra-linguistic information in a multimodal corpus of guided tours in cultural sites. Engagement has been annotated in terms of gain or loss of perceived attention from the audience, and this information has been aligned to the transcription of the speech from the guide. A preliminary analysis suggests that the level of engagement correlates with some specific linguistic features, opening up to possible future exploitation},
KEYWORDS = {Multimodal Corpus, natural language processing, engagement},
URL = {https://iris.cnr.it/handle/20.500.14243/400965},
CONFERENCE_NAME = {Seventh Italian Conference on Computational Linguistics (CLiC-it 2020)},
}
@INPROCEEDINGS{RICCI_2020_INPROCEEDINGS_RMBSD_385311,
AUTHOR = {Ricci, L. and Melighetti, F. and Boschetti, F. and Salvatori, E. and Del Grosso, A. M.},
TITLE = {DH as an Ideal Educational Environment: the Ethnographic Museum of La Spezia},
YEAR = {2020},
ABSTRACT = {The authors present the outcomes of an educational experimentation that took place in the academic year 2018-2019 at the degree course in Informatica Umanistica at the University of Pisa. The first objective of the project concerned the digitization of a corpus of postcards from the period of the First World War owned by the ethnographic Museum of La Spezia "G. Podenzana". The aims of the work are not only the historical study of the corpus, but also the organization of a public history project with the Museum},
KEYWORDS = {digital humanities},
PAGES = {222-226},
URL = {http://amsacta.unibo.it/id/eprint/6316},
DOI = {10.6092/unibo/amsacta/6316},
ISBN = {978-88-942535-4-2},
CONFERENCE_NAME = {La svolta inevitabile: sfide e prospettive per l'Informatica Umanistica},
BOOKTITLE = {Quaderni di Umanistica Digitale},
EDITOR = {Marras, C. and Passarotti, M. and Franzini, G. and Litta, E.},
}
@INPROCEEDINGS{RUSSO_2020_INPROCEEDINGS_R_505941,
AUTHOR = {Russo, I.},
TITLE = {Sadness and Fear: Classification of Fake News Spreaders Content on Twitter},
YEAR = {2020},
ABSTRACT = {The vast amount of accurate and inaccurate information circulating on the internet requires computational methodologies to detect low-quality content. This kind of content often constitutes fake news, as in the PAN@CLEF 2020 competition Profiling Fake News Spreaders on Twitter. This competition asks for systems that identify possible fake news spreaders on social media as a first step to prevent fake news from being propagated among online users. In this paper, the methodology used for this classification task is reported. Preprocessing of the data and the features extracted to classify fake news spreaders is explained. A regression-as-classification approach that enables the representation of being a fake news spreader as a gradable one is proposed. The performance (accuracy) on the training and the test set with the different sets of features is reported},
KEYWORDS = {emotion analysis, fake news},
URL = {https://iris.cnr.it/handle/20.500.14243/505941},
BOOKTITLE = {Proc. Work. Notes CLEF Conf. Labs Eval. Forum},
}
@INPROCEEDINGS{RUSSO_2020_INPROCEEDINGS_R_505921,
AUTHOR = {Russo, I.},
TITLE = {Guessing the age of acquisition of Italian lemmas through linear regression},
YEAR = {2020},
ABSTRACT = {The age of acquisition of a word is a psycholinguistic variable concerning the age at which a word is typically learned. It correlates with other psycholinguistic variables such as familiarity, concreteness, and imageability. Existing datasets for multiple languages also include linguistic variables such as the length and the frequency of lemmas in different corpora. There are substantial sets of normative values for English, but for other languages, such as Italian, the coverage is scarce. In this paper, a set of regression experiments investigates whether it is possible to guess the age of acquisition of Italian lemmas that have not been previously rated by humans. An intrinsic evaluation is proposed, correlating estimated Italian lemmas’ AoA with English lemmas’ AoA. An extrinsic evaluation—using AoA values as features for the classification of literary excerpts labeled by age appropriateness—shows how essential is lexical coverage for this task},
KEYWORDS = {lexical complexity, computational psycholinguistics},
PAGES = {43-48},
URL = {https://aclanthology.org/volumes/2020.cmcl-1/},
ISBN = {978-1-952148-68-2},
CONFERENCE_NAME = {Workshop on Cognitive Modeling and Computational Linguistics},
BOOKTITLE = {Proceedings of the Workshop on Cognitive Modeling and Computational Linguistics},
}
@INPROCEEDINGS{SANGUINETTI_2020_INPROCEEDINGS_SCDFSBCPR_506041,
AUTHOR = {Sanguinetti, M. and Comandini, G. and Di Nuovo, E. and Frenda, S. and Stranisci, M. and Bosco, C. and Caselli, T. and Patti, V. and Russo, I.},
TITLE = {HaSpeeDe 2 @ EVALITA2020: Overview of the EVALITA 2020 Hate Speech Detection Task},
YEAR = {2020},
ABSTRACT = {The Hate Speech Detection (HaSpeeDe 2) task is the second edition of a shared task on the detection of hateful content in Italian Twitter messages. HaSpeeDe 2 is composed of a Main task (hate speech detection) and two Pilot tasks (stereotype and nominal utterance detection). Systems were challenged along two dimensions: (i) time, with test data coming from a different time period than the training data, and (ii) domain, with test data coming from the news domain (i.e., news headlines). Overall, 14 teams participated in the Main task, the best systems achieved a macro F1-score of 0.8088 and 0.7744 on the in-domain and the out-of-domain test sets, respectively; 6 teams submitted their results for Pilot task 1 (stereotype detection), the best systems achieved a macro F1-score of 0.7719 and 0.7203 on in-domain and out-of-domain test sets. We did not receive any submission for Pilot task 2},
KEYWORDS = {hate speech},
URL = {https://iris.cnr.it/handle/20.500.14243/506041},
BOOKTITLE = {Evaluation Campaign of Natural Language Processing and Speech Tools for Italian},
}
@INPROCEEDINGS{SASSOLINI_2020_INPROCEEDINGS_SB_401784,
AUTHOR = {Sassolini, E. and Biffi, M.},
TITLE = {Strategie e metodi per il recupero di dizionari storici},
YEAR = {2020},
ABSTRACT = {The article describes ongoing work on the digitization of an authoritative and historically important Italian dictionary, namely Il Grande Dizionario della Lingua Italiana (GDLI) of S. Battaglia, with a focus on the stages of the conversion of this text into structured digital data. We report on the preliminary results of a collaboration between the Accademia della Crusca and Istituto di Linguistica Computazionale "A. Zampolli", which aims to extract the contents of the GDLI to convert them into structured digital data for human use, and/or to be integrated with other language resources, both dictionaries and corpora. The extraction process is articulated on the one hand in the definition of data extraction procedures, on the other hand in the adoption of strategies aimed at supporting the correction of errors},
KEYWORDS = {Archivi digitali, recupero e conservazione, estrazione dell'informazione},
PAGES = {235-239},
URL = {https://iris.cnr.it/handle/20.500.14243/401784},
DOI = {10.6092/unibo/amsacta/6316},
ISBN = {978-88-942535-4-2},
CONFERENCE_NAME = {IX Convegno annuale AIUCD: LA SVOLTA INEVITABILE: SFIDE E PROSPETTIVE PER L'INFORMATICA UMANISTICA},
}
@INPROCEEDINGS{TAXITARI_2020_INPROCEEDINGS_TCFMNP_501841,
AUTHOR = {Taxitari, L. and Cappa, C. and Ferro, M. and Marzi, C. and Nadalini, A. and Pirrelli, V.},
TITLE = {Using mobile technology for reading assessment},
YEAR = {2020},
ABSTRACT = {The enormous potential of Information and Communication Technologies (ICT) for addressing critical educational issues is generally acknowledged, but its use in the assessment of the complex skills of reading and understanding a text has been very limited to date. The paper contrasts traditional reading assessment protocols with ReadLet, an ICT platform with a tablet front-end, designed to support online monitoring of silent and oral reading abilities in early graders. ReadLet makes use of cloud computing and mobile technology for large-scale data collection and allows the time alignment of the child’s reading behaviour with texts tagged using Natural Language Processing (NLP) tools. Initial findings replicate established benchmarks from the psycholinguistic literature on reading in both typically and atypically developing children, making the application a new ground-breaking approach in the evaluation of reading skills},
KEYWORDS = {reading assessment, reading research, mobile technology, NLP, cloud computing, special education needs},
PAGES = {302-307},
URL = {https://ieeexplore.ieee.org/stamp/stamp.jsp?arnumber=9357173},
VOLUME = {2020-JUNE},
DOI = {10.1109/CiSt49399.2021.9357173},
ISBN = {978-1-7281-6646-9},
CONFERENCE_NAME = {6th IEEE Congress on Information Science and Technology (CiSt)},
BOOKTITLE = {Proceedings of the 6th IEEE Congress on Information Science and Technology (CiSt)},
}
@INPROCEEDINGS{BIANCHI_2020_INPROCEEDINGS_BCMPS_446736,
AUTHOR = {Bianchi, S. and Calamai, S. and Monachini, M. and Pretto, N. and Stamuli, M.},
TITLE = {The grey-side of audio archives},
YEAR = {2020},
ABSTRACT = {Archives often include documents that can hardly be considered publications or grey literature as such, yet they maintain their documentary value and play a role of primary sources for the specialists. These documents, indeed, can help archivists to reveal the sedimentation process of the archive itself and to preserve the authentic context of the documentary production. They also appear to be very useful for the community of researchers and scholars. This happens more frequently with oral archives which include 'non-conventional sources', thus bringing together audio documents, fieldworks notes, correspondence, slipcases, analogic compact cassettes or open reels. At the cross-road of two disciplines, Archival Science and Grey Literature, this paper aims to argue the applicability of the concept of grey literature to this wide range of documentary materials, by showing the experience of Archivio Vi.Vo, a regional project aiming at building a model for archiving, preserving, managing and disseminating audio documents},
KEYWORDS = {archivi orali},
URL = {https://iris.cnr.it/handle/20.500.14243/446736},
VOLUME = {2020-NOVEMBER},
ISSN = {1386-2316},
CONFERENCE_NAME = {GL2020 22nd International Conference on Grey Literature},
}
@INPROCEEDINGS{DONATO_2020_INPROCEEDINGS_DDPS_378119,
AUTHOR = {Donato, D. and Di Donato, F. and Pohle, S.},
TITLE = {GOTRIPLE: Building an innovative discovery platform for the social sciences and humanities},
YEAR = {2020},
ABSTRACT = {The proposed poster presents the goals of the TRIPLE project and the ways the project is addressing them both through the work of its 8 intertwined work packages, and via the collaboration with existing research infrastructures in SSH, i.e. mainly CESSDA, CLARIN and DARIAH},
KEYWORDS = {GOTRIPLE, discovery, EOSC},
URL = {https://www.clarin.eu/sites/default/files/clarin2020_bazaar_didonato_triple.pdf},
CONFERENCE_NAME = {Clarin Annual Conference 2020},
}
@INPROCEEDINGS{PANCKHURST_2020_INPROCEEDINGS_PF_422985,
AUTHOR = {Panckhurst, R. and Frontini, F.},
TITLE = {An internationally FAIR Mediated Digital Discourse Corpus: towards scientific and pedagogical reuse},
YEAR = {2020},
ABSTRACT = {In this paper, the authors present a French Mediated Digital Discourse corpus, (88milSMS http://88milsms.huma-num.fr https://hdl.handle.net/11403/comere/cmr-88milsms). Efforts were undertaken over the years to ensure its publication according to the best practices and standards of the community, thus guaranteeing compliance with FAIR principles and CLARIN recommendations with pertinent scientific and pedagogical reuse},
KEYWORDS = {FAIR data, SMS corpus},
URL = {https://www.clarin.eu/clarin-annual-conference-2020-abstracts},
CONFERENCE_NAME = {CLARIN Annual Conference 2020 (5-7 October). Virtual Edition},
BOOKTITLE = {Proceedings of CLARIN Annual Conference 2020 (5-7 October). Virtual Edition},
EDITOR = {Navarretta, C. and Eskevich, M.},
}
@INPROCEEDINGS{PIRRELLI_2020_INPROCEEDINGS_PCCDFGMNT_427657,
AUTHOR = {Pirrelli, V. and Cappa, C. and Crepaldi, D. and Del Pinto, V. and Ferro, M. and Giulivi, S. and Marzi, C. and Nadalini, A. and Taxitari, L.},
TITLE = {Tracking the pace of reading with finger movements},
YEAR = {2020},
ABSTRACT = {Recent experimental evidence in visual perception analysis shows that eye and finger movements strongly correlate during scene exploration, at both individual and group levels. A familiar context which exploits this synergistic behaviour is when children learn to read, with the practice of finger-pointing to text as a support for their attention focus, directional movement and voice-print match. Using a tablet to display short texts, we collected evidence on the finger-pointing behaviour of 3rd-6th Italian graders engaged in both silent and oral reading. "Finger-tracking" data, sampled by the tablet and aligned with the text, made it possible to time a child's reading pace at word and sentence level. Results are shown to replicate established benchmarks in the reading literature, such as the difference in reading pace between age-matched typical and atypical readers as a function of word frequency and length, and neighbourhood entropy and Old20. Atypical readers show increasing difficulty with longer words, with a steeper time increment for word length > 6, integrating previous evidence. In addition, neighbourhood density plays a sparse facilitative role in atypical reading, with no significant interaction with neighbourhood entropy, pointing to a non trivial developmental interplay between sublexical reading and the richness of the Italian orthographic-phonological lexicon. Despite their different dynamics, optical and tactile strategies for text exploration prove to be highly congruent: this suggests that finger-tracking can be used as an ecological proxy for eye-tracking in reading assessment},
KEYWORDS = {Reading, Finger tracking, Mental Lexicon, Word frequency, Word Length, Neighbourhood entropy},
PAGES = {1},
URL = {https://osf.io/hr62g/},
CONFERENCE_NAME = {Words in the World International Conference},
BOOKTITLE = {Words in the World book of abstracts},
}
% NOTE(review): INSTITUTION is taken from the abstract ("ILC-CNR"); confirm the preferred institutional name.
@TECHREPORT{ALBANESI_2020_TECHREPORT_ABCGMPPS_427138,
AUTHOR = {Albanesi, D. and Bellandi, A. and Colombo, M. and Giovannetti, E. and Marchi, S. and Papini, M. and Piccini, S. and Sciolette, F.},
TITLE = {Traduco: l'Applicazione Web Linguistico-Computazionale per il Progetto di Traduzione del Talmud Babilonese-Rapporto tecnico 17},
YEAR = {2020},
ABSTRACT = {La presente relazione tecnico-scientifica descrive l'attività svolta da ILC-CNR nel contesto del Progetto Traduzione Talmud Babilonese nel periodo novembre 2019-aprile 2020. Le principali attività tecniche svolte sul sistema Traduco sono state la risoluzione di bug, l'implementazione di nuove funzionalità richieste e lo sviluppo di una nuova interfaccia grafica utente. Le attività di ricerca sono state condotte, in continuità a quelle descritte nel rapporto precedente, nella rappresentazione della terminologia e della conoscenza del Talmud},
KEYWORDS = {Linguistica Computazionale, Traduzione di Testi Religiosi, Traduzione Assistita dal Calcolatore, Traduzione Collaborativa, Lessici elettronici, rappresentazione della conoscenza},
PAGES = {34},
URL = {https://iris.cnr.it/handle/20.500.14243/427138},
INSTITUTION = {ILC-CNR},
}
% NOTE(review): INSTITUTION is taken from the abstract ("ILC-CNR"); confirm the preferred institutional name.
@TECHREPORT{ALBANESI_2020_TECHREPORT_ABCGMPS_427139,
AUTHOR = {Albanesi, D. and Bellandi, A. and Colombo, M. and Giovannetti, E. and Marchi, S. and Papini, M. and Sciolette, F.},
TITLE = {Traduco: l'Applicazione Web Linguistico-Computazionale per il Progetto di Traduzione del Talmud Babilonese-Rapporto tecnico 18},
YEAR = {2020},
ABSTRACT = {La presente relazione tecnico-scientifica descrive l'attività svolta da ILC-CNR nel contesto del Progetto Traduzione Talmud Babilonese nel periodo maggio 2020-ottobre 2020. Le principali attività tecniche svolte sul sistema Traduco sono state la risoluzione di bug, l'implementazione di nuove funzionalità richieste e lo sviluppo di una nuova interfaccia grafica utente. Le attività di ricerca sono state condotte, in continuità a quelle descritte nel rapporto precedente, nella rappresentazione del lessico, della terminologia e della conoscenza del Talmud},
KEYWORDS = {Linguistica Computazionale, Traduzione di Testi Religiosi, Traduzione Assistita dal Calcolatore, Traduzione Collaborativa, Lessici elettronici, rappresentazione della conoscenza},
PAGES = {35},
URL = {https://iris.cnr.it/handle/20.500.14243/427139},
INSTITUTION = {ILC-CNR},
}
% NOTE(review): INSTITUTION is taken from the abstract ("ILC-CNR"); confirm the preferred institutional name.
@TECHREPORT{ALBANESI_2020_TECHREPORT_ABDGP_427143,
AUTHOR = {Albanesi, D. and Bellandi, A. and Del Grosso, A. M. and Giovannetti, E. and Papini, M.},
TITLE = {Traduco: l'Applicazione Web Linguistico-Computazionale per il Progetto di Traduzione del Talmud Babilonese-rapporto integrativo 2},
YEAR = {2020},
ABSTRACT = {La presente relazione tecnico-scientifica descrive l'attività svolta da ILC-CNR nel contesto delle attività di progetto previste dalla convenzione integrativa stipulata tra PTTB e ILC-CNR in data 10/07/2018 e condotte nel periodo febbraio 2019-gennaio 2020},
KEYWORDS = {Linguistica Computazionale, Traduzione di Testi Religiosi, Traduzione Assistita dal Calcolatore, Traduzione Collaborativa, Allineamento di Testi, Sviluppo front-end},
PAGES = {9},
URL = {https://iris.cnr.it/handle/20.500.14243/427143},
INSTITUTION = {ILC-CNR},
}
% NOTE(review): INSTITUTION is taken from the abstract ("CNR-ILC"); confirm the preferred institutional name.
@TECHREPORT{BARTOLINI_2020_TECHREPORT_BQMA_398626,
AUTHOR = {Bartolini, R. and Quochi, V. and Monachini, M. and Affé, F.},
TITLE = {Relazione di fine progetto "PIM-Piattaforma Integrata Monitoraggio"},
YEAR = {2020},
ABSTRACT = {Il documento presenta l'attività svolta dal CNR-ILC nel ruolo di subcontraente di COMDATA per la realizzazione di moduli di trattamento automatico del linguaggio e la consulenza per l'integrazione di metodi di clustering automatico di documenti nella Digital Library del progetto PIM},
KEYWORDS = {accesso intelligente al testo, digital library, natural language processing},
PAGES = {156},
URL = {https://iris.cnr.it/handle/20.500.14243/398626},
INSTITUTION = {CNR-ILC},
}
@TECHREPORT{BREITFUSS_2020_TECHREPORT_BBDBBDF_378624,
AUTHOR = {Breitfuss, G. and Barreiros, C. and Dumouchel, S. and Blotière, E. and Bouillard, M. and Di Donato, F. and Forbes, P.},
TITLE = {TRIPLE Deliverable: D7.1 Report on Stakeholder and Opportunity Analysis},
YEAR = {2020},
ABSTRACT = {In the present report on Stakeholder-and Opportunity Analysis (D7.1), we provide the foundation for TRIPLE's exploitation strategy and TRIPLE's business model. By applying a broad mix of methods and tools we gained insights into relevant stakeholders, existing competition, the business environment, a first strategic orientation and derived recommendation for the future project work. From stakeholder analysis, we gained information about the stakeholder roles and needs as well as indications on their power and interest. Out of that data, we derived management strategies for specific stakeholder groups. The results are presented in an informative overview table and in a Power-Interest matrix. From our conducted environment analysis (PESTLE) we got rich information on each of the six categories. All detected factors were briefly described, classified as positive or negative and summarised in a table. The results were further processed in the finally conducted SWOT analysis. In order to get a broad overview of the competitive environment twenty-six scholarly communication platforms were evaluated through web-based research. The analysis covers an overview of offered features and functions, organisational insights, strengths \& weaknesses as well as impressions on usability and user experience. Looking at the products and services provided by the competitors, we recognize that the planned feature-set for TRIPLE platform represents unique features that will distinguish TRIPLE from the competition. Attention needs to be paid on a number of agile platforms which constantly release innovative (e.g. AI-powered) features. To complement the vantage points gained from the web-based competitor analysis an interview study with general Open Science Experts and executives from existing Open Science platforms was conducted. The interview results show that despite the many platforms and services available, there are still unoccupied market niches and underrepresented user groups. Finally, the conducted SWOT analysis shows first insights on how we can use our strength to balance our threats and weaknesses, to minimize risks, and to take the greatest possible advantage of chances for success},
URL = {https://iris.cnr.it/handle/20.500.14243/378624},
}
% arXiv preprint: the identifier in EPRINT is the one carried by the URL field.
@TECHREPORT{CARDILLO_2020_TECHREPORT_CS_384740,
AUTHOR = {Cardillo, F. and Straccia, U.},
TITLE = {Fuzzy OWL-BOOST: Learning Fuzzy Concept Inclusions via Real-Valued Boosting},
YEAR = {2020},
ABSTRACT = {OWL ontologies are nowadays a quite popular way to describe structured knowledge in terms of classes, relations among classes and class instances. In this paper, given a target class T of an OWL ontology, we address the problem of learning fuzzy concept inclusion axioms that describe sufficient conditions for being an individual instance of T. To do so, we present Fuzzy OWL-BOOST that relies on the Real AdaBoost boosting algorithm adapted to the (fuzzy) OWL case. We illustrate its effectiveness by means of an experimentation. An interesting feature is that the learned rules can be represented directly into Fuzzy OWL 2. As a consequence, any Fuzzy OWL 2 reasoner can then be used to automatically determine/classify (and to which degree) whether an individual belongs to the target class T},
KEYWORDS = {Fuzzy Logic, Description Logics, OWL 2, Machine Learning, AdaBoost},
PAGES = {1-26},
URL = {https://arxiv.org/abs/2008.05297},
EPRINT = {2008.05297},
ARCHIVEPREFIX = {arXiv},
}
@TECHREPORT{DIDONATO_2020_TECHREPORT_DLBCDEGGMMOTT_378120,
AUTHOR = {Di Donato, F. and Lombardo, T. and Breitfuss, G. and Chen, Y. and Dumouchel, S. and Eskevich, M. and Gingold, A. and Gorgaini, E. and Monachini, M. and Moranville, Y. and Ocansey, J. T. and Thiel, C. and Tóthczifra, E.},
TITLE = {TRIPLE D 6.1-Report on the General Interoperability Requirements},
YEAR = {2020},
ABSTRACT = {TRIPLE-Transforming Research Through Innovative Practices for Linked Interdisciplinary Exploration is a EU funded project under the INFRAEOSC-02-2019-Prototyping new innovative services topic, which started in October 2019 and will end in March 2023. Its main objective is to design and develop a discovery platform for SSH, called GOTRIPLE. This deliverable is the main outcome of Task 6.1 which started at M4 at ends at M36, whose aim is to deal with the definition and the set-up of general TRIPLE's interoperability requirements, considering all the components which are composing the TRIPLE ecosystem (data, resources and tools). As preliminary results, we thus present here a general overview of the main EOSC interoperability requirements and specifications, both coming from a mapping of the EOSC Working Groups outputs, and of the most relevant results of EOSC related projects related to TRIPLE. We also attempt to provide TRIPLE's answers, proposals and solutions to the above mentioned requirements. The final picture presents different levels of precision, which depends on the fluidity of the EOSC definition on the one hand, and on the consequent fact that some implications are still unclear, and a discussion on the measures to address EOSC requirements is still on-going. While tackling interoperability, we introduce TRIPLE in its context in order to locate the GOTRIPLE platform in the EOSC frame, and more specifically in the SSH cluster of the EOSC (section 1). Section 2 defines the general interoperability requirements, starting with the software (2.2) and then presents an analysis of the main outputs released by the EOSC Working groups (2.3), taking into consideration as a general reference, the EOSC Interoperability Framework, and, more specifically, the FAIR and Architecture WGs documents (2.3.2, 2.3.4). These are the main guiding references for the design and realization of the EOSC, considering specifically interoperability. Section 2.3.3 illustrates how TRIPLE is translating into practice the FAIR requirements, while section 2.3.5 is focused on TRIPLE current decisions regarding the integration of the TRIPLE solution into the EOSC. To present an enriched scenario, the section includes as well a brief overview of other relevant outputs released by the EOSC WGs (Landscape, RoP, Sustainability and Skills and Training) (2.3.6). With the aim to provide a comprehensive analysis of the EOSC interoperability requirements, the WP6 partners have analyzed relevant deliverables produced by the main EOSC related projects as preparatory activity. The analysis was useful to understand the EOSC environment and its evolution in terms of interoperability and at the same time to understand which external deliverables have to be taken into consideration for the overall project development in TRIPLE. Section 3 includes a synthesis of this work, which is fully presented in Annex I. Section 4-Conclusions and Outlook, outlines TRIPLE's the next steps to achieve interoperability and the strategies that will be adopted},
KEYWORDS = {TRIPLE, GOTRIPLE, EOSC},
URL = {https://zenodo.org/record/4322806},
}
@MISC{BLOTIRE_2020_MISC_BDBBCDFPP_381974,
AUTHOR = {Blotière, E. and Dumouchel, S. and Barbot, L. and Breitfuss, G. and Chen, Y. and Di Donato, F. and Forbes, P. and Petitfils, C. and Pohle, S.},
TITLE = {TRIPLE project: building a discovery platform to enhance collaboration},
YEAR = {2020},
ABSTRACT = {Social Sciences and Humanities research is divided across a wide array of disciplines, sub-disciplines and languages. While this specialisation makes it possible to investigate the extensive variety of SSH topics, it also leads to a fragmentation that prevents SSH research from reaching its full potential. Use and reuse of research is suboptimal, interdisciplinary collaboration possibilities are often missed partially because of missing standards and referential keys between disciplines. Often, the reuse of data may paradoxically complicate a relevant sorting of data and a trust relationship between researchers. As a result, societal, economic and academic impacts are limited. Conceptually, there is a wealth of transdisciplinary collaborations, but in practice there is a need to help researchers and research institutions to connect them and support them, to prepare the research data for these overarching approaches and to make them findable and usable. The TRIPLE (Targeting Researchers through Innovative Practices and Linked Exploration) project is a practical answer to the above issues, as it aims at designing and developing the European discovery platform dedicated to Social Sciences and Humanities resources. Funded under the European Commission program INFRAEOSC-02-2019 "Prototyping new innovative services", thanks to a consortium of 19 partners, TRIPLE will develop a full multilingual and multicultural solution for the discovery and the reuse of Social Sciences and Humanities resources. The project started in October 2019 for a duration of 42 months thanks to European funding of 5.6 million EUR},
URL = {https://iris.cnr.it/handle/20.500.14243/381974},
}
@MISC{BOSCHETTI_2020_MISC_BD_462909,
AUTHOR = {Boschetti, F. and Del Grosso, A. M.},
TITLE = {Textual markup (typographic, structural, semantic: HTML, CSS, XML)},
YEAR = {2020},
ABSTRACT = {Lezione tenuta nel contesto della Summer School organizzata nel 2020 dal centro Venice Centre for Digital and Public Humanities (VeDPH)},
KEYWORDS = {Digital Humanities, Public Humanities, XML/TEI, Digital Scholarly Edition, VeDPH},
URL = {https://vedph.github.io/summercamp/},
}
% Two-day workshop on Git and GitHub for collaborative digital scholarly editions (2020).
@MISC{DELGROSSO_2020_MISC_D_462915,
  AUTHOR   = {Del Grosso, A. M.},
  TITLE    = {Git per edizioni digitali collaborative su GitHub},
  YEAR     = {2020},
  ABSTRACT = {This workshop will cover the basic functionalities of the software Git and the platform GitHub. Two days, each day divided into two parts of three hours each. Morning sessions: presentation of Git topics/features (theory and practice) Afternoon sessions: hands-on exercises (developing a dynamic and collaborative digital scholarly edition) Total hours for the workshop 12 hours. Objectives of the workshop: Learning the most relevant features regarding Git tool with references to GitHub platform. Git is a "distributed" Version Control System. It is able to handle the history of the changes made to tracked resources over a time period. Git allows users to manage the evolution of collaborative documents and to revisit and/or revert the content of these documents to a particular older state. GitHub is a development platform where it is possible to host and review Git repositories, and many more functionalities. First day topics: Introduction to systems for version control Preliminaries about command line environment Installing Git and testing the correctness of the local installation Git design model and the basic work-flow Local version control: git init, git status, git add, git commit, git log Local files: git rm, git mv Second day topics: Git help: git help and man pages Remote basics: GitHub, git remote, git push, git fetch, git pull Searching and examination: git diff, git grep Advanced log options Branching system: git branch, git checkout, git merge Handling the commit history: git rebase, git reset},
  KEYWORDS = {git, github, Digital Scholarly Edition, Filologia Collaborativa, Filologia Digitale},
  URL      = {https://www.unive.it/data/33113/2/43767},
}
% Webinar lecture on markup languages for digital philology and critical apparatuses (2020).
@MISC{DELGROSSO_2020_MISC_D_462904,
  AUTHOR   = {Del Grosso, A. M.},
  TITLE    = {Dalla Recensio all'Emendatio Digitale. Teoria, metodi e applicazioni della filologia digitale},
  YEAR     = {2020},
  ABSTRACT = {Presentazione svolta nel contesto del ciclo di webinars di informatica umanistica a cura di G. Ferrante e A. Mazzucchi intitolato "La tecnologia informatica applicata alle scienze filologiche e librarie". Il seminario, inserito nel corso di Alta Formazione in Storia e Filologia del Manoscritto e del Libro Antico della Scuola Superiore Meridionale (Girolamini), introduce in 5 ore di lezione all'uso dei linguaggi di markup per la rappresentazione e conservazione digitale di risorse filologiche e di apparati critici},
  KEYWORDS = {Digital Humanities, Filologia Digitale, XML/TEI, Digital Scholarly Edition, Apparati Critici Digitali},
  URL      = {https://iris.cnr.it/handle/20.500.14243/462904},
}
@MISC{DELGROSSO_2020_MISC_DPCDFG_462924,
AUTHOR = {Del Grosso, A. M. and Piccini, S. and Cosenza, G. and D'Ottavi, G. and Fadda, E. and Gambarara, D.},
TITLE = {Saussure General Linguistics Project: Beyond the Course. A Knowledge Site for Rethinking Saussure's General Linguistics},
YEAR = {2020},
ABSTRACT = {The project is primarily committed to establish a standard scholarly edition of Saussure's General Linguistics related texts, making use of a consistent philological methodology, i.e. aware of the profoundly different textualities of the available sources, that is: autograph unfinished notes for a book, didactic materials (students' notes and Saussure's), and an edited volume},
KEYWORDS = {Digital Humanities, Digital Scholarly Edition, Saussure's manuscripts, Filologia Digitale, Filologia computazionale},
URL = {https://github.com/saussure-team/general-linguistics-project},
}
% Workshop presentation of the TRIPLE discovery platform (2020).
@MISC{DONATO_2020_MISC_DD_385055,
  AUTHOR   = {Donato, D. and Di Donato, F.},
  TITLE    = {TRIPLE. A European Discovery Platform for SSH},
  YEAR     = {2020},
  ABSTRACT = {TRIPLE presentation at the workshop "Prospecting a FAIR continuum for SSH data and publications"},
  URL      = {https://iris.cnr.it/handle/20.500.14243/385055},
}
@MISC{FRONTINI_2020_MISC_F_384006,
AUTHOR = {Frontini, F.},
TITLE = {Dans les coulisses des infrastructures européennes en SHS. Rôle et opportunités pour les acteurs de la recherche (ingénieurs et chercheurs)},
YEAR = {2020},
ABSTRACT = {La composante technologique prend une dimension de jour en jour plus importante en LLASHS. Les projets de recherche sont de plus en plus nombreux à mobiliser de gros volumes de données exigeant des services adaptés garants de formes de méthodologies augmentées (exploitation, interopérabilité, accessibilité, archivage). Afin de partager les savoirs et de garantir l'interopérabilité et la préservation à long terme de ces ressources et services, de grandes infrastructures informatiques se mettent en place aux niveaux national et international. Dans cette présentation, vous allez découvrir le panorama, en la matière, des e-infrastructures et des grands projets européens à caractère infrastructurel, avec un accent particulier sur les technologies utilisées, les principaux services offerts, et les aspects les plus intéressants en termes de synergie entre approches et disciplines différentes. La présentation portera sur des ERICs (European Research Infrastructure Consortium) établis, comme CLARIN et DARIAH, et sur des projets récents ou en cours de développement, comme PARTHENOS, SSHOC, ELEXIS et TRIPLE. Concernant les aspects techniques, on abordera les questions liées au dépôt, au stockage, à l'identification (single sign on), aux formats et choix des métadonnées et de modélisation formelle, à la recherche fédérée des sources. Nous soulignerons en particulier l'interaction de ces projets avec les infrastructures nationales, notamment Huma-Num, ainsi qu'avec la récemment constituée European Open Science Cloud (EOSC). La présentation aura une visée pratique, avec l'objectif de fournir des indications concrètes aux acteurs de la recherche (chercheurs, ingénieurs.) qui souhaitent participer à ces initiatives et aux groupes de travail qui les animent, ou plus largement favoriser l'accès des chercheurs français aux nombreux services et opportunités offerts},
KEYWORDS = {Infrastrutture di ricerca, Scienze umane e sociali},
URL = {https://ja-mate2020.sciencesconf.org/data/pages/Resume_Frontini_Nov.pdf},
CONFERENCE_NAME = {Journées annuelles du réseau Mate-shs (JA2020)},
}
% Symposium presentation on designing a FAIR data discovery ecosystem (2020).
@MISC{KRAKER_2020_MISC_KMJDCB_385056,
  AUTHOR          = {Kraker, P. and Mathiak, B. and Juty, N. and Di Donato, F. and Culina, A. and Bardi, A.},
  TITLE           = {Designing a FAIR data discovery ecosystem},
  YEAR            = {2020},
  ABSTRACT        = {The presentation is focused on the design of a FAIR data discovery ecosystem, with a particular focus on user interfaces and other user-facing services. Specifically, it explores the following topics:-Creation and further development of FAIR and open infrastructures enabling interoperable, cross-domain reuse and continued innovation-User involvement and participatory design to increase usability and usefulness of the developed solutions},
  KEYWORDS        = {Discovery, FAIR},
  URL             = {https://conference.codata.org/FAIRconvergence2020/sessions/206/},
  CONFERENCE_NAME = {International FAIR Convergence Symposium 2020},
}
@MISC{PROIETTI_2020_MISC_PS_411390,
AUTHOR = {Proietti, C. and Smets, S.},
TITLE = {The wisdom and madness of crowds: argumentation, information exchange and social interaction},
YEAR = {2020},
KEYWORDS = {formal argumentation, logic, social sciences},
PAGES = {15-16},
URL = {https://iris.cnr.it/handle/20.500.14243/411390},
VOLUME = {14 (3)},
ISSN = {1757-0522},
}
@MISC{ROSSELLIDELTURCO_2020_MISC_RCDDMMSZ_462886,
AUTHOR = {Rosselli Del Turco, R. and Cacioli, G. and Del Grosso, A. M. and Di Pietro, C. and Martignano, C. and Memaj, J. and Spinelli, F. and Zenzaro, S.},
TITLE = {EVT-Edition Visualization Technology 2 (v. beta 2)},
YEAR = {2020},
ABSTRACT = {EVT (Edition Visualization Technology) is a software for creating and browsing digital editions of manuscripts based on text encoded according to the TEI XML (http://www.tei-c.org/) schemas and Guidelines. This tool was born as part of the [Digital Vercelli Book] (http://vbd.humnet.unipi.it/) project in order to allow the creation of a digital edition of the Vercelli Book, a parchment codex of the late tenth century, now preserved in the Archivio e Biblioteca Capitolare of Vercelli and regarded as one of the four most important manuscripts of the Anglo-Saxon period as regards the transmission of poetic texts in the Old English language. To ensure that it will be working on all the most recent web browsers, and for as long as possible on the World Wide Web itself, EVT is built on open and standard web technologies such as HTML, CSS and JavaScript. Specific features, such as the image viewer, are entrusted to the most effective and stable ones (e.g. Openseadragon in the case of the image viewer), again chosen among the open source and best supported ones to reduce the risk of future incompatibilities. The general architecture of the software, in any case, is modular, so that any component which may cause trouble or turn out to be not completely up to the task can be replaced easily. This version is based on the AngularJS programming framework and implements the MVC (Model-View-Controller) design pattern},
KEYWORDS = {edizioni scientifiche digitali, filologia digitale, critica testuale, filologia di testi medievali, edizioni diplomatiche, web-publishing, XML/TEI, HTML5, CSS, AngularJS, visualization software, manuscript viewer},
URL = {http://evt.labcd.unipi.it/},
}
@ARTICLE{ALZETTA_2019_ARTICLE_ADMV_403586,
AUTHOR = {Alzetta, C. and Dell'Orletta, F. and Montemagni, S. and Venturi, G.},
TITLE = {Inferring Quantitative Typological Trends from Multilingual Treebanks. A Case Study},
YEAR = {2019},
ABSTRACT = {In the past decades, linguistic typology went through a renewing phase that involved a significant change in the research questions and methods of the discipline, which is now interested in fine-grained features underlying language diversity. In this paper, we propose a novel approach to address the newly defined needs of linguistic typology by extracting qualitative and quantitative information about a wide range of features from multilingual annotated corpora based on Natural Language Processing methods and techniques. We tested our method in a case study focusing on word order variation in two widely investigated constructions, VERB-SUBJ(ect) and NOUN-ADJ(ective), with a specific view to structural and functional factors underlying the preference for one or the other order, both intra- and cross-linguistically, and their interaction. Preliminary experiments have been carried out aimed at acquiring typological evidence from a selection of linguistically annotated treebanks for three different languages, namely Italian, Spanish and English. Our results show the effectiveness of the method in letting similarities and differences also emerge from typologically close languages},
KEYWORDS = {language typology, multilingual annotated corpora, linguistic knowledge extraction and modelling, word order variation},
PAGES = {209-242},
URL = {https://www.rivisteweb.it/doi/10.1418/95391},
VOLUME = {18 (2)},
DOI = {10.1418/95391},
ISSN = {1720-9331},
JOURNAL = {LINGUE E LINGUAGGIO},
}
% Journal article comparing technology-foresight expert forecasts with realized outcomes (2019).
@ARTICLE{APREDA_2019_ARTICLE_ABDF_392529,
  AUTHOR   = {Apreda, R. and Bonaccorsi, A. and Dell'Orletta, F. and Fantoni, G.},
  TITLE    = {Expert forecast and realized outcomes in technology foresight},
  YEAR     = {2019},
  ABSTRACT = {Contrary to what happens in forecasting, in which the repetitive nature of events lends itself to the ex post validation of expert judgments, it is usually very difficult to compare directly the forecast of technology foresight studies with realized outcomes. When the comparison is feasible, therefore, there is large opportunity for learning and methodological refinement. The authors of this study had the opportunity to re-examine the findings of a technology foresight exercise on the medical device industry with realized technological performance, five years later. Among the findings of the comparison exercise, intriguing false positive as well as false negative cases have been identified. The paper suggests that these cases are due to specific cognitive and motivational biases of experts and examines the way in which they are at work in the foresight process. It argues that these biases are due to the inability of experts to reason systematically in abstract (or "functional") terms during the whole foresight process. It also suggests a methodology to mitigate the biases and to manage the emergence of false positives and false negatives},
  KEYWORDS = {Expert forecast, Medical device industry, Cognitive biases, Abstract reasoning, Failure mode analysis, Functional analysis},
  PAGES    = {277-288},
  URL      = {https://iris.cnr.it/handle/20.500.14243/392529},
  VOLUME   = {141},
  DOI      = {10.1016/j.techfore.2018.12.006},
  ISSN     = {0040-1625},
  JOURNAL  = {TECHNOLOGICAL FORECASTING AND SOCIAL CHANGE},
}
@ARTICLE{BAMBACI_2019_ARTICLE_BBD_520083,
AUTHOR = {Bambaci, L. and Boschetti, F. and Del Gratta, R.},
TITLE = {Qohelet Euporia: a Domain specific Language for the Encoding of the critical Apparatus},
YEAR = {2019},
ABSTRACT = {Encoding multilingual variant readings is timeconsuming and error-prone. The guidelines provided by the Text Encoding Initiative (TEI) ensure data interchange, but the TEIXML verbosity risks to distract annotators with a traditional background in philological studies from their critical activity. We illustrate how a Domain Specific Language (DSL) facilitates both the manual annotation of the critical apparatus and the data interchange. Our case study is based on the multilingual tradition of the biblical book of Qohelet, which has been annotated through the annotation tool based on DSLs named Euporia},
KEYWORDS = {digital philology, biblical studies, digital scholarly editing, textual criticism},
PAGES = {26-37},
URL = {http://dx.doi.org/10.57675/IMIST.PRSM/ijist-v3i5.136},
VOLUME = {3 (5)},
DOI = {10.57675/IMIST.PRSM/ijist-v3i5.136},
ISSN = {2550-5114},
JOURNAL = {INTERNATIONAL JOURNAL OF INFORMATION SCIENCE AND TECHNOLOGY},
}
% NOTE(review): same work as BURGASSI_2019_ARTICLE_BG_474483 (identical DOI); PAGES and VOLUME are copied from that record. Consider merging the two records.
@ARTICLE{BURGASSI_2019_ARTICLE_BG_393447,
AUTHOR = {Burgassi, C. and Guadagnini, E.},
TITLE = {Il campione dei 'moderni'. Note sul Morgante nel Vocabolario degli Accademici della Crusca (1612, 1623)},
YEAR = {2019},
ABSTRACT = {Il saggio analizza la presenza di Luigi Pulci, e in particolare del Morgante, nelle prime due impressioni del Vocabolario della Crusca (1612, 1623). Un primo paragrafo, di Cosimo Burgassi, fornisce le coordinate per inquadrare la presenza nel Vocabolario degli 'autori moderni': fra questi, si rileva come Pulci goda di largo credito nell'ambiente fiorentino coevo e immediatamente precedente alla compilazione della prima Crusca. Il secondo paragrafo, di Elisa Guadagnini, presenta i dati raccolti dallo spoglio completo delle citazioni pulciane nella prima e nella seconda impressione del Vocabolario: la loro interpretazione consente di individuare la specificità del ruolo assunto dal Morgante nelle due opere lessicografiche. Particolarmente interessante è la differenza osservabile tra la prima e la seconda edizione del Vocabolario, che 'ritorna' al Morgante per implementare il lessico latamente tecnico (nella fattispecie, i nomi di animale). Un breve paragrafo conclusivo riassume le risultanze dello studio},
KEYWORDS = {Luigi Pulci, Morgante, Vocabolario della Crusca, Lessicografia italiana, Firenze nel Rinascimento, Storia della lingua italiana},
PAGES = {186-196},
URL = {https://doi.org/10.1080/00751634.2019.1587233},
VOLUME = {74 (2)},
DOI = {10.1080/00751634.2019.1587233},
ISSN = {1748-6181},
JOURNAL = {ITALIAN STUDIES},
}
% NOTE(review): same work as BURGASSI_2019_ARTICLE_BG_393447 (identical DOI). Consider merging the two records.
@ARTICLE{BURGASSI_2019_ARTICLE_BG_474483,
AUTHOR = {Burgassi, C. and Guadagnini, E.},
TITLE = {Il campione dei ‘moderni’. Note sul Morgante nel Vocabolario degli Accademici della Crusca (1612, 1623)},
YEAR = {2019},
PAGES = {186-196},
URL = {https://iris.cnr.it/handle/20.500.14243/474483},
VOLUME = {74 (2)},
DOI = {10.1080/00751634.2019.1587233},
ISSN = {0075-1634},
JOURNAL = {ITALIAN STUDIES},
}
@ARTICLE{CONNOR_2019_ARTICLE_CVCR_387101,
AUTHOR = {Connor, R. and Vadicamo, L. and Cardillo, F. A. and Rabitti, F.},
TITLE = {Supermetric search},
YEAR = {2019},
ABSTRACT = {Metric search is concerned with the efficient evaluation of queries in metric spaces. In general, a large space of objects is arranged in such a way that, when a further object is presented as a query, those objects most similar to the query can be efficiently found. Most mechanisms rely upon the triangle inequality property of the metric governing the space. The triangle inequality property is equivalent to a finite embedding property, which states that any three points of the space can be isometrically embedded in two-dimensional Euclidean space. In this paper, we examine a class of semimetric space which is finitely four-embeddable in three-dimensional Euclidean space. In mathematics this property has been extensively studied and is generally known as the four-point property. All spaces with the four-point property are metric spaces, but they also have some stronger geometric guarantees. We coin the term supermetric space as, in terms of metric search, they are significantly more tractable. Supermetric spaces include all those governed by Euclidean, Cosine, Jensen-Shannon and Triangular distances, and are thus commonly used within many domains. In previous work we have given a generic mathematical basis for the supermetric property and shown how it can improve indexing performance for a given exact search structure. Here we present a full investigation into its use within a variety of different hyperplane partition indexing structures, and go on to show some more of its flexibility by examining a search structure whose partition and exclusion conditions are tailored, at each node, to suit the individual reference points and data set present there. Among the results given, we show a new best performance for exact search using a well-known benchmark. (C) 2018 Elsevier Ltd. All rights reserved},
KEYWORDS = {Similarity search, Metric space, Supermetric space, Metric indexing, Four-point property, Hilbert Exclusion},
PAGES = {108-123},
URL = {https://www.sciencedirect.com/science/article/pii/S0306437917301588?via%3Dihub},
VOLUME = {80},
DOI = {10.1016/j.is.2018.01.002},
ISSN = {0306-4379},
JOURNAL = {INFORMATION SYSTEMS},
}
@ARTICLE{DELGROSSO_2019_ARTICLE_DCCDGMSS_411280,
AUTHOR = {Del Grosso, A. M. and Capizzi, E. and Cristofaro, S. and De Luca, M. R. and Giovannetti, E. and Marchi, S. and Seminara, G. and Spampinato, D.},
TITLE = {Bellini's Correspondence: a Digital Scholarly Edition for a Multimedia Museum},
YEAR = {2019},
ABSTRACT = {Within the "Museo Virtuale della Musica BellinInRete" project, a corpus of letters, written by the renowned composer Vincenzo Bellini (1801-1835) from Catania, will be encoded and made publicly available. This contribution aims at illustrating the part of the project regarding the implementation of the prototype for the metadata and text encoding, indexing and visualisation of Bellini's correspondence. The encoding scheme has been defined according to the latest guidelines of the Text Encoding Initiative and it has been instantiated on a sample of letters. Contextually, a first environment has been implemented by customizing two open source tools: Edition Visualization Technology and Omega Scholarly platform. The main objective of the digital edition is to engage general public with the cultural heritage held by the Belliniano Civic Museum of Catania. This wide access to Bellini's correspondence has been conceived preserving the scholarly transcriptions of the letters edited by Seminara within her most recent critical edition (Olschki, 2017). The digital edition of the corpus takes care of handling the correspondence metadata by means of the correspDesc TEI tagset. Finally, Bellini's letters will be accessible via the Web platform as well as integrated into a forthcoming interactive and multimedia tour hosted at the museum},
KEYWORDS = {digital scholarly edition, correspondence, Digital and Computational Philology, Software Design, Vincenzo Bellini, Music, Multimedia Museum},
PAGES = {23-47},
URL = {https://umanisticadigitale.unibo.it/article/view/9162/9918},
VOLUME = {7},
DOI = {10.6092/issn.2532-8816/9162},
ISSN = {2532-8816},
JOURNAL = {UMANISTICA DIGITALE},
}
@ARTICLE{DELLORLETTA_2019_ARTICLE_DGMMRSV_403580,
AUTHOR = {Dell'Orletta, F. and Greco, S. and Montemagni, S. and Morini, E. and Rossi, F. and Sagri, M. and Venturi, G.},
TITLE = {Le parole del miglioramento. Come le scuole descrivono il cambiamento},
YEAR = {2019},
ABSTRACT = {Il presente contributo intende illustrare i risultati di una ricerca condotta con l'uso di strumenti di trattamento automatico del linguaggio (Natural Language Processing: nlp) su quanto dichiarato dalle scuole in circa 2500 Piani di Miglioramento (modello indire) con l'obiettivo di comprendere le scelte strategiche in un'ottica di miglioramento continuo. Il disegno d'analisi permette di restituire sia una visione complessiva dei Piani di Miglioramento che approfondimenti qualitativi di confronto tra tipologie di scuola e aree geografiche e relativi a tematiche strategiche quali formazione e innovazione},
KEYWORDS = {Piano di Miglioramento, Natural Language Processing, Formazione, Innovazione},
PAGES = {47-68},
URL = {https://www.rivistainfanzia.it/pvw/app/default/pvw_sito.php?sede_codice=1PWPSE01\&page=2432193},
VOLUME = {1/2019},
ISSN = {1971-3711},
JOURNAL = {PSICOLOGIA DELL'EDUCAZIONE},
}
@ARTICLE{DELLAGALA_2019_ARTICLE_DCDPV_403584,
AUTHOR = {Della Gala, V. and Chiriatti, G. and Dell'Orletta, F. and Pettenati, M. C. and Venturi, G.},
TITLE = {Analytics dei testi riflessivi scritti dai docenti neoassunti nel portfolio digitale},
YEAR = {2019},
ABSTRACT = {Presentiamo i risultati preliminari e l'analisi svolta su circa 50.000 testi scritti dai docenti neo nominati in ruolo per riflettere su due attività didattiche svolte con gli studenti, nel contesto del percorso dell'anno di formazione e prova 2016/17. Il percorso prevede attività in presenza e attività a distanza completate sul portfolio digitale, ospitato nell'ambiente online gestito dall'Indire. Nell'ambito del monitoraggio della formazione, con il fine di ottimizzare gli strumenti e il supporto fornito, abbiamo interrogato i dati testuali prodotti dai docenti nell'interazione con l'ambiente per capire se i testi presentassero evidenze riconducibili alle scritture riflessive. Obiettivi dell'indagine sono stati la definizione di uno schema per la classificazione dei testi sulla base del livello di riflessività evidenziato e l'impiego di strumenti di Trattamento Automatico del Linguaggio (TAL) per l'analisi dell'intero corpus testuale prodotto dai docenti. Descriveremo il contesto scientifico e progettuale, le caratteristiche dei dati analizzati, come questo abbia determinato il disegno d'indagine; descriveremo inoltre la sua implementazione e dunque le procedure, gli strumenti e le metriche adottate o elaborate per rappresentare il contenuto dei dati; infine discuteremo i primi risultati e alcuni vantaggi e limiti dell'approccio adottato},
KEYWORDS = {Teacher professional development, Natural Language Processing, Reflective writing, Linguistic Profiling, Document Classification},
PAGES = {187-204},
URL = {https://ojs.pensamultimedia.it/index.php/sird/article/view/3454/3360},
VOLUME = {SPECIAL ISSUE},
DOI = {10.7346/SIRD-2S2019-P189},
ISSN = {2038-9744},
JOURNAL = {GIORNALE ITALIANO DELLA RICERCA EDUCATIVA (ONLINE)},
}
@ARTICLE{GERBAUDO_2019_ARTICLE_GMA_493651,
AUTHOR = {Gerbaudo, P. and Marogna, F. and Alzetta, C.},
TITLE = {When “Positive Posting” Attracts Voters: User Engagement and Emotions in the 2017 UK Election Campaign on Facebook},
YEAR = {2019},
ABSTRACT = {Social media are widely held to have played an important role in the 2017 UK general elections. But it is not altogether clear how exactly they contributed to the communication battle between Labour and the Conservatives. This article analyses the posts and comments on the official Facebook pages of the Labour Party and the Conservative Party and their respective leaders, Jeremy Corbyn and Theresa May. We look at the relationship between topics, emotions, and user engagement. Labour clearly outperformed the Tories, with Corbyn’s personal page having 10 times the interactions of May’s. We retrieve part of the reason for this success in the “positive posting” strategy adopted by Labour and the way it helped to attract user engagement. While the Conservative Party focused on negative issues such as Brexit, terrorism, and national security, Labour focused on positive issues, such as the promise of higher social spending and appeals to the grassroots, generating far higher levels of engagement. Overall, positive topic tended to fare better than more negative and controversial issues, such as security and Brexit. Our findings thus suggest the need for a more balanced understanding of the relationship between content, emotions, and user engagement on social media, moving beyond simplistic views of social media politics as necessarily biased in favor of aggressive and negative campaigning},
KEYWORDS = {2017 UK national elections, Corbyn, Facebook, Labour, online campaigning, social media},
URL = {https://iris.cnr.it/handle/20.500.14243/493651},
VOLUME = {5 (4)},
DOI = {10.1177/2056305119881695},
ISSN = {2056-3051},
JOURNAL = {SOCIAL MEDIA SOCIETY},
}
@ARTICLE{GOGGI_2019_ARTICLE_GPBMBC_360573,
AUTHOR = {Goggi, S. and Pardelli, G. and Bartolini, R. and Monachini, M. and Biagioni, S. and Carlesi, C.},
TITLE = {Semantic Query Analysis from the Global Science Gateway},
YEAR = {2019},
ABSTRACT = {Nowadays web portals play an essential role in searching and retrieving information in the several fields of knowledge: they are ever more technologically advanced and designed for supporting the storage of a huge amount of information in natural language originating from the queries launched by users worldwide. Given this scenario, we focused on building a corpus constituted by the query logs registered by the GreyGuide: Repository and Portal to Good Practices and Resources in Grey Literature and received by the WorldWideScience.org (The Global Science Gateway) portal: the aim is to retrieve information related to social media which as of today represent a considerable source of data more and more widely used for research ends},
KEYWORDS = {Information Extraction, Query Log, WorldWideScience Alliance, Information gateways, Social Media},
PAGES = {147-155},
URL = {https://iris.cnr.it/handle/20.500.14243/360573},
VOLUME = {15 (3)},
ISSN = {1574-1796},
JOURNAL = {THE GREY JOURNAL},
}
@ARTICLE{GOMEZCHAVEZ_2019_ARTICLE_GRCZBB_345428,
AUTHOR = {Gomez Chavez, A. and Ranieri, A. and Chiarella, D. and Zereik, E. and Babić, A. and Birk, A.},
TITLE = {CADDY Underwater Stereo-Vision Dataset for Human-Robot Interaction (HRI) in the Context of Diver Activities},
YEAR = {2019},
ABSTRACT = {In this article, we present a novel underwater dataset collected from several field trials within the EU FP7 project "Cognitive autonomous diving buddy (CADDY)", where an Autonomous Underwater Vehicle (AUV) was used to interact with divers and monitor their activities. To our knowledge, this is one of the first efforts to collect a large public dataset in underwater environments with the purpose of studying and boosting object classification, segmentation and human pose estimation tasks. The first part of the dataset contains stereo camera recordings (≈10 K) of divers performing hand gestures to communicate with an AUV in different environmental conditions. The gestures can be used to test the robustness of visual detection and classification algorithms in underwater conditions, e.g., under color attenuation and light backscatter. The second part includes stereo footage (≈12.7 K) of divers free-swimming in front of the AUV, along with synchronized measurements from Inertial Measurement Units (IMU) located throughout the diver's suit (DiverNet), which serve as ground-truth for human pose and tracking methods. In both cases, these rectified images allow the investigation of 3D representation and reasoning pipelines from low-texture targets commonly present in underwater scenarios. This work describes the recording platform, sensor calibration procedure plus the data format and the software utilities provided to use the dataset},
KEYWORDS = {dataset, underwater imaging, image processing, marine robotics, field robotics, human-robot interaction, stereo vision, object classification, human pose estimation},
PAGES = {1-14},
URL = {https://www.mdpi.com/2077-1312/7/1/16},
VOLUME = {7 (1)},
DOI = {10.3390/jmse7010016},
ISSN = {2077-1312},
JOURNAL = {JOURNAL OF MARINE SCIENCE AND ENGINEERING},
}
@ARTICLE{MAREMMANI_2019_ARTICLE_MMOSPBPDBRCC_510092,
AUTHOR = {Maremmani, C. and Monastero, R. and Orlandi, G. and Salvadori, S. and Pieroni, A. and Baschi, R. and Pecori, A. and Dolciotti, C. and Berchina, G. and Rovini, E. and Cuddemi, F. and Cavallo, F.},
TITLE = {Objective assessment of blinking and facial expressions in Parkinson's disease using vertical electrooculogram and facial surface electromyography},
YEAR = {2019},
ABSTRACT = {Objective: Hypomimia is a common and early symptom of Parkinson’s disease (PD), which reduces the ability of PD patients to manifest emotions. Currently, it is visually evaluated by the neurologist during neurological examinations for PD diagnosis, as described in task 3.2 of the Movement Disorder Society—Unified Parkinson’s Disease Rating Scale (MDS-UPDRS). Since such an evaluation is semi-quantitative and affected by inter-variability, this paper aims to measure the physiological parameters related to eye blink and facial expressions extracted from a vertical electro-oculogram (VEOG) and facial surface electromyography (fsEMG) to differentiate PD patients from healthy control subjects (HCs). Approach: The spontaneous eye blink rate-minute (sEBR), its maximum amplitude (BMP), and facial cutaneous muscle activity were measured in 24 PD patients and 24 HCs while the subjects looked at a visual-tester composed of three main parts: static vision, dynamic vision and reading silently. Specificity and sensitivity for each parameter were calculated. Main results: The VEOG and the fsEMG allowed the identification of some parameters related to eye blink and facial expressions (i.e. sEBR, BMP, frontal and peribuccal muscular activities), being able to distinguish between PD patients and HCs with high sensitivity and specificity. Significance: The demonstration that the combination of parameters related to eye blink and facial expressions can discriminate (with high accuracy) between PD patients versus HCs, thus resulting in a useful tool to support the neurologist in objective assessment of hypomimia for improving PD diagnosis},
KEYWORDS = {Parkinson’s disease, vertical electro-oculogram, facial surface emg, spontaneous eye blink rate},
URL = {https://pubmed.ncbi.nlm.nih.gov/31018181/},
VOLUME = {40 (6)},
DOI = {10.1088/1361-6579/ab1c05},
ISSN = {0967-3334},
JOURNAL = {PHYSIOLOGICAL MEASUREMENT},
}
@ARTICLE{MARZI_2019_ARTICLE_MFP_392957,
AUTHOR = {Marzi, C. and Ferro, M. and Pirrelli, V.},
TITLE = {A processing-oriented investigation of inflectional complexity},
YEAR = {2019},
ABSTRACT = {Due to the typological diversity of their inflectional processes, some languages are intuitively more difficult than other languages. Yet, finding a single measure to quantitatively assess the comparative complexity of an inflectional system proves an exceedingly difficult endeavor. In this paper we propose to investigate the issue from a processing-oriented standpoint, using data processed by a type of recurrent neural network to quantitatively model the dynamic of word processing and learning in different input conditions. We evaluate the relative complexity of a set of typologically different inflectional systems (Greek, Italian, Spanish, German, English and Standard Modern Arabic) by training a Temporal Self-Organizing Map (TSOM), a recurrent variant of Kohonen's Self-Organizing Maps, on a fixed set of verb forms from top-frequency verb paradigms, with no information about the morphosemantic and morphosyntactic content conveyed by the forms. After training, the behavior of each language-specific TSOM is assessed on different tasks, looking at self-organizing patterns of temporal connectivity and functional responses. Our simulations show that word processing is facilitated by maximally contrastive inflectional systems, where verb forms exhibit the earliest possible point of lexical discrimination. Conversely, word learning is favored by a maximally generalizable system, where forms are inferred from the smallest possible number of their paradigm companions. Based on evidence from the literature and our own data, we conjecture that the resulting balance is the outcome of the interaction between form frequency and morphological regularity. Big families of stem-sharing, regularly inflected forms are the productive core of an inflectional system. Such a core is easier to learn but slower to discriminate. In contrast, less predictable verb forms, based on alternating and possibly suppletive stems, are easier to process but are learned by rote. 
Inflection systems thus strike a balance between these conflicting processing and communicative requirements, while staying within tight learnability bounds, in line with Ackermann and Malouf's Low Conditional Entropy Conjecture. Our quantitative investigation supports a discriminative view of morphological inflection as a collective, emergent system, whose global self-organization rests on a surprisingly small handful of language-independent principles of word coactivation and competition},
KEYWORDS = {Morphological complexity, Discriminative learning, Recurrent neural networks (RNNs), self-organization, emergence, processing uncertainty, stem-family size},
PAGES = {1-23},
URL = {https://www.frontiersin.org/articles/10.3389/fcomm.2019.00048/full},
VOLUME = {4 (48)},
DOI = {10.3389/fcomm.2019.00048},
ISSN = {2297-900X},
JOURNAL = {FRONTIERS IN COMMUNICATION},
}
@ARTICLE{PICCINI_2019_ARTICLE_P_519771,
AUTHOR = {Piccini, S.},
TITLE = {Questions d'accentologie lituanienne: l'hypothèse d'une isoglosse balto-germanique},
YEAR = {2019},
ABSTRACT = {L'article part d'une analyse critique de l'ouvrage de Jasanoff "The Prehistory of the Balto-Slavic Accent" pour explorer les parallèles entre les systèmes prosodiques des langues baltes et germaniques. En s'appuyant notamment sur les travaux d'Antanas Baranauskas (1882), revisités par Saussure et mis en perspective par Jasanoff, il met en lumière une hypothèse selon laquelle ces deux branches proto-indo-européennes auraient partagé des relations étroites},
KEYWORDS = {accentologie lituanienne, loi de Saussure, isoglosse balto-germanique},
PAGES = {241-256},
URL = {https://iris.cnr.it/handle/20.500.14243/519771},
VOLUME = {72},
ISSN = {0068-516X},
JOURNAL = {CAHIERS FERDINAND DE SAUSSURE},
}
@ARTICLE{SAROGNI_2019_ARTICLE_SPSADGCBPADSCTBFM_390441,
AUTHOR = {Sarogni, P. and Palumbo, O. and Servadio, A. and Astigiano, S. and D'Alessio, B. and Gatti, V. and Cukrov, D. and Baldari, S. and Pallotta, M. M. and Aretini, P. and Dell'Orletta, F. and Soddu, S. and Carella, M. and Toietta, G. and Barbieri, O. and Fontanini, G. and Musio, A.},
TITLE = {Overexpression of the cohesin-core subunit SMC1A contributes to colorectal cancer development},
YEAR = {2019},
ABSTRACT = {Background: Cancer cells are characterized by chromosomal instability (CIN) and it is thought that errors in pathways involved in faithful chromosome segregation play a pivotal role in the genesis of CIN. Cohesin forms a large protein ring that binds DNA strands by encircling them. In addition to this central role in chromosome segregation, cohesin is also needed for DNA repair, gene transcription regulation and chromatin architecture. Though mutations in both cohesin and cohesin-regulator genes have been identified in many human cancers, the contribution of cohesin to cancer development is still under debate. Methods: Normal mucosa, early adenoma, and carcinoma samples deriving from 16 subjects affected by colorectal cancer (CRC) were analyzed by OncoScan for scoring both chromosome gains and losses (CNVs) and loss of heterozygosity (LOH). Then the expression of SMC1A was analyzed by immunochemistry in 66 subjects affected by CRC. The effects of SMC1A overexpression and mutated SMC1A were analyzed in vivo using immunocompromised mouse models. Finally, we measured global gene expression profiles in induced-tumors by RNA-seq. Results: Here we showed that SMC1A cohesin core gene was present as extra-copies, mutated, and overexpressed in human colorectal carcinomas. We then demonstrated that cohesin overexpression led to the development of aggressive cancers in immunocompromised mice through gene expression dysregulation. Conclusion: Collectively, these results support a role of defective cohesin in the development of human colorectal cancer},
KEYWORDS = {Cohesin, SMC1A, Chromosome instability, Gene expression dysregulation, Human colorectal cancer development},
PAGES = {16},
URL = {https://iris.cnr.it/handle/20.500.14243/390441},
VOLUME = {38},
DOI = {10.1186/s13046-019-1116-0},
ISSN = {1756-9966},
JOURNAL = {JOURNAL OF EXPERIMENTAL \& CLINICAL CANCER RESEARCH (ONLINE)},
}
@ARTICLE{SAURI_2019_ARTICLE_SMRB_365830,
AUTHOR = {Sauri, R. and Mahon, L. and Russo, I. and Bitinis, M.},
TITLE = {Cross-dictionary linking at sense level with a double-layer classifier},
YEAR = {2019},
ABSTRACT = {We present a system for linking dictionaries at the sense level, which is part of a wider programme aiming to extend current lexical resources and to create new ones by automatic means. One of the main challenges of the sense linking task is the existence of non one-to-one mappings among senses. Our system handles this issue by addressing the task as a binary classification problem using standard Machine Learning methods, where each sense pair is classified independently from the others. In addition, it implements a second, statistically-based classification layer to also model the dependence existing among sense pairs, namely, the fact that a sense in one dictionary that is already linked to a sense in the other dictionary has a lower probability of being linked to a further sense. The resulting double-layer classifier achieves global Precision and Recall scores of 0.91 and 0.80, respectively},
KEYWORDS = {Word sense linking, word sense mapping, lexical translation, lexical resources, language data construction, multilingual data},
URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-85068085716\&origin=inward},
VOLUME = {70},
DOI = {10.4230/OASIcs.LDK.2019.20},
ISSN = {2190-6807},
JOURNAL = {OPEN ACCESS SERIES IN INFORMATICS},
}
@ARTICLE{SPRUGNOLI_2019_ARTICLE_SPBD_366835,
AUTHOR = {Sprugnoli, R. and Pardelli, G. and Boschetti, F. and Del Gratta, R.},
TITLE = {Un'Analisi Multidimensionale della Ricerca Italiana nel Campo delle Digital Humanities e della Linguistica Computazionale},
YEAR = {2019},
ABSTRACT = {This article proposes the first comparative study of four years of Italian conferences in the fields of Digital Humanities and Computational Linguistics. More specifically, we created a corpus consisting of the contributions presented in the AIUCD and CLiC-it conferences between 2014 and 2017 to which we applied a multidimensional analysis taking into consideration: (i) the study of collaborations between authors using social networks analysis techniques, (ii) the automatic extraction of terminology and information and (iii) the examination of citational practices. By combining both qualitative and quantitative methods of investigation, this paper aims to shed light on convergences and discrepancies between two research areas that historically have common origins},
KEYWORDS = {Digital Humanities, Computational Linguistics, Comparative study},
PAGES = {59-89},
URL = {https://umanisticadigitale.unibo.it/article/view/8581},
VOLUME = {5},
DOI = {10.6092/issn.2532-8816/8581},
ISSN = {2532-8816},
JOURNAL = {UMANISTICA DIGITALE},
}
@ARTICLE{STEFANINI_2019_ARTICLE_SNM_395106,
AUTHOR = {Stefanini, A. E. and Nicolosi, A. and Monachini, M.},
TITLE = {A Mock-up for the Development of a Digital Edition for Ancient Greek Fragmentary Poetry: Results of Its Evaluation},
YEAR = {2019},
ABSTRACT = {Ancient Greek poetry is an essential part of the western cultural heritage; thus, it is important that people have access to its texts and whatever relates to their understanding in a reliable and easy way. Whenever user evaluation is concerned, mock-ups are used by designers to acquire feedback from users. A mock-up is defined as a model of the final product, and may be used for demonstration, evaluation and other purposes. The authors prototyped a mock-up for focusing on the requirements of a scholarly digital edition of Archilochus. This was put under evaluation to assess its usability: it was submitted to extensive use and testing by a sample of prospective users, to better focus on the requirements from a product's perspective. Experimentation involved a group of university students, attending a Greek Philology course at Parma University. More than half of the respondents considered the mock-up a useful study support. The evaluation also pointed out that the mock-up had to be revised, so as to guarantee better cognitive simplicity of the user interface},
KEYWORDS = {Ancient Greek Poetry, Digital Edition, Greek Philology, Digital Humanities, Digital Philology, Didactics, Evaluation},
PAGES = {41-57},
URL = {https://www.igi-global.com/article/a-mock-up-for-the-development-of-a-digital-edition-for-ancient-greek-fragmentary-poetry/237162},
VOLUME = {8 (2)},
DOI = {10.4018/IJACDT.2019070103},
JOURNAL = {INTERNATIONAL JOURNAL OF ART, CULTURE AND DESIGN TECHNOLOGIES},
}
@BOOK{FIER_2019_BOOK_FLABDDDDDEGHKLMMNNNNNNOOQRSSTVVV_407479,
AUTHOR = {Fišer, D. and Lenardič, J. and Auziņa, I. and Bernstein Ratner, N. and De Smedt, K. and Dobrovoljc, K. and Dodé, R. and Domeij, R. and Dyvik, H. and Erjavec, T. and Gerassimenko, O. and Hajič, J. and Křen, M. and Ljubešić, N. and Macwhinney, B. and Monachini, M. and Nava, B. and Navarretta, C. and Nedyalkova, A. and Nielsen, K. and Noémi Vadászlaak, M. and Nylund Skog, S. and Offersgaard, L. and Osenova, P. and Quochi, V. and Reinsone, S. and Skadiņa, I. and Simov, K. and Tichý, O. and Vadász, N. and Váradi, T. and Vider, K.},
TITLE = {Tour de CLARIN Two},
YEAR = {2019},
ABSTRACT = {The second volume of Tour de CLARIN is organized into two parts. In Part 1, we present the seven countries which have been featured: Estonia, Latvia, Denmark, Italy, Slovenia, Hungary, and Bulgaria. In this part, each country is presented with five chapters: an introduction to the consortium, their members and their work; a description of one of their key resources; a presentation of an outstanding tool; an account of a successful event for the researchers and students in their network; and an interview with a renowned researcher from the digital humanities or social sciences who has successfully used the consortium infrastructure in their research},
KEYWORDS = {CLARIN, CLARIN Consortia, CLARIN resources},
PAGES = {1-87},
URL = {https://doi.org/10.5281/zenodo.3754164},
DOI = {10.5281/zenodo.3754164},
PUBLISHER = {CLARIN-Common language resources technology infrastructure (Utrecht, NLD)},
ISBN = {9789082990911},
CONFERENCE_PLACE = {Utrecht},
EDITOR = {Fišer, D. and Lenardič, J.},
}
@INCOLLECTION{ADORNI_2019_INCOLLECTION_AAKPT_493649,
AUTHOR = {Adorni, G. and Alzetta, C. and Koceva, F. and Passalacqua, S. and Torre, I.},
TITLE = {Towards the identification of propaedeutic relations in textbooks},
YEAR = {2019},
ABSTRACT = {As well-known, structuring knowledge and digital content has a tremendous potential to enhance meaningful learning. A straightforward approach is representing key concepts of the subject matter and organizing them in a knowledge structure by means of semantic relations. This results in hypergraphs with typed n-ary relationships, including the so-called prerequisite or propaedeutic relations among concepts. While extracting the whole concept graph from a textbook is our final goal, the focus of this paper is the identification of the propaedeutic relations among concepts. To this aim, we employ a method based on burst analysis and co-occurrence which recognizes, by means of temporal reasoning, prerequisite relations among concepts that share intense periods in the text. The experimental evaluation shows promising results for the extraction of propaedeutic relations without the support of external knowledge},
KEYWORDS = {Knowledge structure, Relation extraction, Temporal reasoning},
PAGES = {1-13},
URL = {https://iris.cnr.it/handle/20.500.14243/493649},
VOLUME = {11625},
DOI = {10.1007/978-3-030-23204-7_1},
PUBLISHER = {Springer Verlag},
ISBN = {9783030232030},
BOOKTITLE = {Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)},
}
@INCOLLECTION{BELLANDI_2019_INCOLLECTION_BMK_407485,
AUTHOR = {Bellandi, A. and Monachini, M. and Khan, F.},
TITLE = {LexO: Where Lexicography Meets the Semantic Web},
YEAR = {2019},
ABSTRACT = {LexO is a collaborative web editor used for the creation and management of (multilingual) lexical and terminological resources as linked data resources. The editor makes use of Semantic Web technologies (which enrich web data with semantic information in order to make them machine readable) and the linked data publishing paradigm in order to ensure that lexical resources can be more easily shared and reused by the scientific community},
KEYWORDS = {Semantic Web technologies, multilingual lexical resources, collaborative web editor},
PAGES = {43-47},
URL = {https://iris.cnr.it/handle/20.500.14243/407485},
BOOKTITLE = {Tour de CLARIN Volume Two},
EDITOR = {Fiser, D. and Lenardic, J.},
}
@INCOLLECTION{BOSCHETTI_2019_INCOLLECTION_B_378928,
AUTHOR = {Boschetti, F.},
TITLE = {Semantic Analysis and Thematic Annotation},
YEAR = {2019},
ABSTRACT = {This contribution aims at investigating some methods, resources and tools devoted to the semantic analysis and the thematic annotation. The first part, devoted to the paradigmatic axis, describes available lexico-semantic resources for the classical languages, which belong to accomplished or on-going projects. The second part of the contribution, devoted to the syntagmatic axis, is focused on the semantic and thematic annotation of classical and biblical texts. The top-down approach to the annotation of themes and motifs in the Memorata Poetis Project is illustrated and pros and cons are discussed. Finally, the bottom-up approach of Euporia is discussed. In this approach, folksonomies are created by the annotators, and the labels are grouped and organized in ontologies a posteriori, during an incremental process of revision},
URL = {https://iris.cnr.it/handle/20.500.14243/378928},
DOI = {10.1515/9783110599572-018},
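PUBLISHER = {De Gruyter Saur},
ISBN = {978-3-11-059678-6},
BOOKTITLE = {Digital Classical Philology: Ancient Greek and Latin in the Digital Revolution},
EDITOR = {Berti, M.},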
}
@INCOLLECTION{GIOVANNETTI_2019_INCOLLECTION_G_396546,
AUTHOR = {Giovannetti, E.},
TITLE = {Traduzione Talmud Babilonese},
YEAR = {2019},
ABSTRACT = {Traduzione Talmud Babilonese è un progetto di ricerca che ha come obiettivo la traduzione in lingua italiana del Talmud Babilonese, un testo fondamentale della cultura ebraica non solo in campo religioso ma che tocca anche ogni aspetto della conoscenza umana, dalla giurisprudenza alla scienza, dalla filosofia alla vita di tutti i giorni},
KEYWORDS = {traduzione assistita dal calcolatore, talmud babilonese},
PAGES = {126},
URL = {https://iris.cnr.it/handle/20.500.14243/396546},
DOI = {10.36173/PLURIMI-2019-1},
PUBLISHER = {CNR EDIZIONI (ROMA, ITA)},
ISBN = {9788880803775},
CONFERENCE_PLACE = {ROMA},
BOOKTITLE = {Linguaggi, ricerca, comunicazione. Focus CNR},
EDITOR = {Cadeddu, M. E. and Marras, C.},
}
@INCOLLECTION{MONACHINI_2019_INCOLLECTION_MQ_407476,
AUTHOR = {Monachini, M. and Quochi, V.},
TITLE = {Tour de CLARIN: Italy},
YEAR = {2019},
ABSTRACT = {Il Tour de CLARIN è un'iniziativa di CLARIN ERIC che mira a evidenziare periodicamente importanti attività di coinvolgimento degli utenti di un particolare consorzio nazionale CLARIN. Dopo aver visitato 11 paesi, a febbraio e marzo 2019 il Tour de CLARIN si ferma in Italia per visitare CLARIN-IT. La tappa italiana del Tour de CLARIN è iniziata con un post sul blog di CLARIN che ha presentato il consorzio italiano: "Tour de CLARIN: Italia" (01/03/2019)},
KEYWORDS = {CLARIN, CLARIN Consortia},
PAGES = {40-42},
URL = {https://office.clarin.eu/v/CE-2019-1537-Tour-de-CLARIN-volume-II-2019.pdf},
DOI = {10.5281/zenodo.3754164},
PUBLISHER = {CLARIN-Common language resources technology infrastructure (Utrecht, NLD)},
ISSN = {2019-1537},
ISBN = {9789082990911},
CONFERENCE_PLACE = {Utrecht},
BOOKTITLE = {Tour de CLARIN Volume Two},
EDITOR = {Fiser, D. and Lenardic, J.},
}
@INCOLLECTION{PROIETTI_2019_INCOLLECTION_PC_404086,
AUTHOR = {Proietti, C. and Ciuni, R.},
TITLE = {Future contingents, Supervaluationism, and relative truth},
YEAR = {2019},
ABSTRACT = {The problem of future contingents is one of the most ancient and debated puzzles in Western philosophy, and Supervaluationism is, today, one of the most prominent solutions to the problem. Recently, John MacFarlane has carried a well-known criticism to Supervaluationism and put forward a new solution of the problem of future contingents, which is known as Double Time Reference Theory. Here, we compare DTRT with Supervaluationist semantics, and we show that the success of MacFarlane's criticism crucially depends on the expressivity of the language adopted. Once a reasonable expressive power is granted, however, MacFarlane's criticism no longer applies},
KEYWORDS = {Future contingents, supervaluationism, modal logic},
PAGES = {69-88},
URL = {http://www.edizioniets.com/scheda.asp?n=9788846755193},
PUBLISHER = {ETS (Pisa, ITA)},
ISBN = {9788846755193},
CONFERENCE_PLACE = {Pisa},
BOOKTITLE = {THIRD PISA COLLOQUIUM IN LOGIC, LANGUAGE AND EPISTEMOLOGY. Essays in Honour of Mauro Mariani and Carlo Marletti},
EDITOR = {Bellotti, L. and Gili, L. and Moriconi, E. and Turbanti, G.},
}
@INCOLLECTION{PROIETTI_2019_INCOLLECTION_PC_404035,
AUTHOR = {Proietti, C. and Ciuni, R.},
TITLE = {TRL semantics and Burgess' formula},
YEAR = {2019},
ABSTRACT = {The problem of future contingents is one of the most ancient and debated puzzles in Western philosophy, and Supervaluationism is, today, one of the most prominent solutions to the problem. Recently, John MacFarlane has carried a well-known criticism to Supervaluationism (and all other standard approaches to future contingents) and put forward a new solution of the problem of future contingents, which is known as Double Time Reference Theory (DTRT). Here, we compare DTRT with Supervaluationist semantics, and we show that the success of MacFarlane's criticism crucially depends on the expressivity of the language adopted. Once a reasonable expressive power is granted, however, MacFarlane's criticism no longer applies},
KEYWORDS = {temporal logic, Burgess formula},
URL = {https://iris.cnr.it/handle/20.500.14243/404035},
BOOKTITLE = {Logic and Philosophy of Time: Themes from Prior. Volume 2-Themes from Prior},
EDITOR = {Blackburn, P. and Hasle, P. and Ohrstrom, P.},
}
@INCOLLECTION{RUSSO_2019_INCOLLECTION_RMCM_410113,
AUTHOR = {Russo, I. and Marconi, L. and Cutugno, P. and Monachini, M.},
TITLE = {Le parole sono ponti: risorse digitali per l'integrazione in contesti multilingue},
YEAR = {2019},
ABSTRACT = {Nel presente lavoro esporremo due esperienze inerenti all'uso e alla produzione di risorse linguistiche multilingui, svolte da alcuni ricercatori dell'Istituto di Linguistica Computazionale "Antonio Zampolli" (ilc) del cnr. Più nello specifico verrà descritta la realizzazione di un glossario nell'ambito del progetto Ascolto Accoglienza Azioni Offresi (aaa Offresi) e l'uso sperimentale di ImagAct (Moneglia et alii 2012)-una risorsa lessicale multilingue sui verbi d'azione-in una scuola primaria caratterizzata da una forte presenza di alunni stranieri. Il fine della ricerca è quello di favorire l'emergere delle competenze metalinguistiche degli apprendenti, valorizzando la diversità linguistica e culturale},
KEYWORDS = {Multilingual lexical resources, L2 teaching, Translanguaging, Public administration terminology},
PAGES = {127-136},
URL = {https://iris.cnr.it/handle/20.500.14243/410113},
DOI = {10.36173/PLURIMI-2019-1/09},
PUBLISHER = {Consiglio Nazionale delle Ricerche (Roma, ITA)},
ISBN = {9788880803775},
CONFERENCE_PLACE = {Roma},
BOOKTITLE = {Linguaggi, ricerca, comunicazione. Focus CNR},
EDITOR = {Cadeddu, M. E. and Marras, C.},
}
@INCOLLECTION{SORIA_2019_INCOLLECTION_S_428726,
AUTHOR = {Soria, C.},
TITLE = {Uguali opportunità linguistiche digitali: un sogno?},
YEAR = {2019},
ABSTRACT = {Una riflessione sulle opportunità offerte dalle nuove tecnologie digitali per le lingue minoritarie},
URL = {https://iris.cnr.it/handle/20.500.14243/428726},
ISBN = {978-88-8443-849-2},
}
@EDITORIAL{LEONARDI_2019_EDITORIAL_LSLMABBCDFGGLLMMNRVVZMABDI_390952,
AUTHOR = {Leonardi, L. D. and Squillacioti, D. and Larson, P. C. and Mosti, C. and Artale, E. and Barbieri, L. and Beretta, A. and Cerullo, S. and Dotto, D. and Falini, I. and Giuliani, M. and Guadagnini, E. and Lorenzi Biondi, C. and Luti, M. and Maggiore, M. and Malandrino, A. and Natale, S. and Ravani, S. and Vaccaro, G. and Verlato, Z. and Zarra, G. and Malatesta, M. C. C. and Arcidiacono, S. S. I. and Boccellari, A. S. I. and Degl'Innocenti Svil, I. and Ioriofili Svil, I.},
TITLE = {TESORO DELLA LINGUA ITALIANA DELLE ORIGINI-Edizione online: www.vocabolario.org (ISSN 2240-5216)-Versione dicembre 2019},
YEAR = {2019},
ABSTRACT = {A pdf copy of the «Tesoro della Lingua Italiana delle Origini» (TLIO), a dictionary of early Italian in progress, published online, as it was at the end of December 2019 (37,071 entries). TLIO is the first section of the Italian Historical Dictionary which is the mission of the OVI Institute},
KEYWORDS = {Lessico, Lessicografia, Lingua italiana},
PAGES = {15796},
URL = {http://tlio.ovi.cnr.it/TLIO},
ISSN = {2240-5216},
}
@EDITORIAL{CHINELLO_2019_EDITORIAL_CFB_378956,
AUTHOR = {Chinello, A. and Faraci, G. and Boschetti, F.},
TITLE = {Nuovi contributi della ricerca sui disturbi del comportamento alimentare},
YEAR = {2019},
ABSTRACT = {Introduzione metodologica ai contenuti del volume avente per tema i disturbi del comportamento alimentare in relazione alla gravidanza. Lo studio coinvolge esperti di psicologia cognitiva, psicologia clinica e linguistica computazionale},
URL = {https://iris.cnr.it/handle/20.500.14243/378956},
ISBN = {9788891781154},
}
@INPROCEEDINGS{ALBANESI_2019_INPROCEEDINGS_AD_365034,
AUTHOR = {Albanesi, D. and Del Gratta, R.},
TITLE = {OpeNER and PANACEA: Web Services for the CLARIN Research Infrastructure},
YEAR = {2019},
ABSTRACT = {This paper describes the necessary steps for the integration of OpeNER and PANACEA Web Services within the CLARIN research infrastructure. The original Web Services are wrapped into a framework and re-implemented as REST APIs to be further exploited through both Language Resource Switchboard and WebLicht and made available for the CLARIN community},
KEYWORDS = {CLARIN-IT, Interoperabilità, Resea},
PAGES = {19-23},
URL = {https://office.clarin.eu/v/CE-2019-1512_CLARIN2019_ConferenceProceedings.pdf},
CONFERENCE_NAME = {CLARIN Annual Conference 2019},
BOOKTITLE = {CLARIN Annual Conference 2019},
}
@INPROCEEDINGS{ALZETTA_2019_INPROCEEDINGS_ADMV_403587,
AUTHOR = {Alzetta, C. and Dell'Orletta, F. and Montemagni, S. and Venturi, G.},
TITLE = {Dissecting Treebanks to Uncover Typological Trends. A Multilingual Comparative Approach},
YEAR = {2019},
ABSTRACT = {Over the last years, linguistic typology started attracting the interest of the community working on cross- and multi-lingual NLP as a way to tackle the bottleneck deriving from the lack of annotated data for many languages. Typological information is mostly acquired from publicly accessible typological databases, manually constructed by linguists. As reported in Ponti et al. (2018), despite the abundant information contained in them for many languages, these resources suffer from two main shortcomings, i.e. their limited coverage and the discrete nature of features (only "the majority value rather than the full range of possible values and their corresponding frequencies" is reported). Corpus-based studies can help to automatically acquire quantitative typological evidence which might be exploited for polyglot NLP. Recently, the availability of corpora annotated following a cross-linguistically consistent annotation scheme such as the one developed in the Universal Dependencies project is prompting new comparative linguistic studies aimed to identify similarities as well as idiosyncrasies among typologically different languages (Nivre, 2015). The line of research described here is aimed at acquiring quantitative typological evidence from UD treebanks through a multilingual contrastive approach},
KEYWORDS = {Natural Language Processing, Linguistic Typology},
PAGES = {1-3},
URL = {https://typology-and-nlp.github.io/2019/assets/2019/papers/5.pdf},
ISBN = {978-1-950737-29-1},
CONFERENCE_NAME = {1st TyP-NLP: The Workshop on Typology for Polyglot NLP, ACL workshop},
}
@INPROCEEDINGS{ALZETTA_2019_INPROCEEDINGS_AMADKPT_390427,
AUTHOR = {Alzetta, C. and Miaschi, A. and Adorni, G. and Dell'Orletta, F. and Koceva, F. and Passalacqua, S. and Torre, I.},
TITLE = {Prerequisite or not prerequisite? That's the problem! An NLP-based Approach for Concept Prerequisites Learning},
YEAR = {2019},
ABSTRACT = {This paper presents a method for prerequisite learning classification between educational concepts. The proposed system was developed by adapting a classification algorithm designed for sequencing Learning Objects to the task of ordering concepts from a computer science textbook. In order to apply the system to the new task, for each concept we automatically created a learning unit from the textbook using two criteria based on concept occurrences and burst intervals. Results are promising and suggest that further improvements could highly benefit the results},
URL = {https://iris.cnr.it/handle/20.500.14243/390427},
ISBN = {9791280136008},
}
@INPROCEEDINGS{BELLANDI_2019_INPROCEEDINGS_BKM_393377,
AUTHOR = {Bellandi, A. and Khan, F. and Monachini, M.},
TITLE = {Enhancing Lexicography by Means of the Linked Data Paradigm: LexO for CLARIN},
YEAR = {2019},
ABSTRACT = {This paper presents a collaborative web editor for easily building and managing lexical and terminological resources based on the OntoLex-Lemon model. The tool allows information to be easily manually curated by humans. Our primary objective is to enable lexicographers, scholars and humanists, especially those who do not have technical skills and expertise in the Semantic Web and Linked Data technologies, to create lexical resources ex novo even if they are not familiar with the underlying technical details. This is fundamental for collecting reliable, fine-grained, and explicit information, thus allowing the adoption of new technological advances in the Semantic Web by the Digital Humanities},
URL = {https://iris.cnr.it/handle/20.500.14243/393377},
}
@INPROCEEDINGS{BOSCHETTI_2019_INPROCEEDINGS_BPV_392228,
AUTHOR = {Boschetti, F. and Pardelli, G. and Venturi, G.},
TITLE = {Nove Anni di jTEI: What's New?},
YEAR = {2019},
ABSTRACT = {This paper illustrates methods and tools to study the development of research topics in the TEI community across the years. For this purpose, automatic terminology extraction technologies were exploited},
KEYWORDS = {Natural Language Processing, Digital Humanities},
PAGES = {1-6},
URL = {http://ceur-ws.org/Vol-2481},
PUBLISHER = {CEUR-WS.org (Aachen, DEU)},
CONFERENCE_NAME = {CLiC-it 2019-Sesta Conferenza Italiana di Linguistica Computazionale},
CONFERENCE_PLACE = {Aachen},
BOOKTITLE = {CLiC-it 2019 Italian Conference on Computational Linguistics},
EDITOR = {Bernardi, R. and Navigli, R. and Semeraro, G.},
}
@INPROCEEDINGS{BUONGIOVANNI_2019_INPROCEEDINGS_BGBD_390429,
AUTHOR = {Buongiovanni, C. and Gracci, F. and Brunato, D. and Dell'Orletta, F.},
TITLE = {Lost in text. A cross-genre analysis of linguistic phenomena within text},
YEAR = {2019},
ABSTRACT = {Moving from the assumption that formal, rather than content features, can be used to detect differences and similarities among textual genres and registers, this paper presents a new approach to the linguistic profiling methodology, which focuses on the internal parts of a text. A case study is presented showing that it is possible to model the degree of variance within texts representative of four traditional genres and two levels of complexity for each},
URL = {https://iris.cnr.it/handle/20.500.14243/390429},
ISBN = {9791280136008},
}
@INPROCEEDINGS{CERNIGLIA_2019_INPROCEEDINGS_CCCMMDF_388357,
AUTHOR = {Cerniglia, A. and Chiarella, D. and Cutugno, P. and Marconi, L. and Magrini, A. and Di Feo, G. and Ferretti, M.},
TITLE = {QUESTIONNAIRE ANALYSIS TO DEFINE THE MOST SUITABLE SURVEY FOR PORT-NOISE INVESTIGATION},
YEAR = {2019},
ABSTRACT = {The high level of noise pollution affecting the areas between ports and logistic platforms represents a problem that can be faced from different points of view. Acoustic monitoring, mapping, short-term measurements, port and road traffic flows analyses can give useful indications on the strategies to be proposed for a better management of the problem. A survey campaign through the preparation of questionnaires to be submitted to the population exposed to noise in the back-port areas will help to better understand the subjective point of view. The paper analyses a sample of questions suitable for the specific research, chosen as part of the wide database of questionnaires internationally proposed for subjective investigations. The preliminary results of a first data collection campaign are considered to verify the adequacy of the number, the type of questions, and the type of sample noise used for the survey. The questionnaire will be optimized to be distributed in the TRIPLO project (TRansports and Innovative sustainable connections between Ports and LOgistic platforms). The results of this survey will be the starting point for the linguistic investigation carried out in combination with the acoustic monitoring, to improve understanding the connections between personal feeling and technical aspects},
KEYWORDS = {port noise, acoustic monitoring, subjective survey, psychoacoustics},
URL = {https://iris.cnr.it/handle/20.500.14243/388357},
ISBN = {978-1-9991810-0-0},
CONFERENCE_NAME = {26th International Congress on Sound \& Vibration},
}
@INPROCEEDINGS{CHIRIATTI_2019_INPROCEEDINGS_CBDV_380338,
AUTHOR = {Chiriatti, G. and Brunato, D. and Dell'Orletta, F. and Venturi, G.},
TITLE = {What makes a review helpful? Predicting the helpfulness of Italian tripadvisor reviews},
YEAR = {2019},
ABSTRACT = {In this paper we introduce a classification system devoted to predict the helpfulness of Italian online reviews. It is based on a wide set of features reflecting the different factors involved and tested on different categories of TripAdvisor reviews. For this purpose, we collected the first Italian corpus of online reviews enriched with metadata related to their helpfulness and we carried out an in-depth analysis of the most predictive features},
KEYWORDS = {Natural Language Processing, Document Classification, Linguistic Profiling},
PAGES = {1-6},
URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-85074834351\&origin=inward},
VOLUME = {2481},
CONFERENCE_NAME = {6th Italian Conference on Computational Linguistics (CLiC-it)},
}
@INPROCEEDINGS{CUTUGNO_2019_INPROCEEDINGS_CFM_388356,
AUTHOR = {Cutugno, P. and Ferretti, M. and Marconi, L.},
TITLE = {Construcción, exploración y análisis en un corpus de producciones escolares},
YEAR = {2019},
ABSTRACT = {La metodología desarrollada para la extracción de conocimiento a partir de datos lingüísticos, requiere primero la existencia y/o la realización de una base de conocimiento, corpus, sobre la que elaborar el análisis estadístico y lingüístico. La creación de corpus estructurados que contengan los trabajos producidos por estudiantes y la inserción de datos en estructuras informativas accesibles, que también contienen los formularios con el consentimiento informado de los padres para la recogida, análisis y publicación de los datos y las autorizaciones necesarias, es ciertamente un elemento clave del método. El uso de nuevas tecnologías por parte de los jóvenes tanto en el ámbito extracurricular como en el escolar puede favorecer la creación de un "Repositorio de producciones escolares de los estudiantes". Por un lado, el repositorio podría proporcionar una base de información completa sobre la cual llevar a cabo análisis psicológicos, sociológicos y lingüísticos por parte de todos aquellos involucrados en la educación y/o el bienestar de los estudiantes, que podría llegar a ser con la revisión y selección de los datos por parte de los docentes, una base de información a la que los propios niños podrían acceder para reutilizar los materiales existentes, actualizar y/o crear nuevos materiales y luego generar nuevos conocimientos. Los corpus además tienen una función fundamental para reconocer, analizar y clasificar un fenómeno lingüístico dado, para llevar a cabo estudios sobre la evolución del lenguaje, para contribuir a la construcción de herramientas de análisis lingüístico mediante la recopilación de información a partir de datos empíricos},
URL = {https://iris.cnr.it/handle/20.500.14243/388356},
ISBN = {978-959-7174-36-3},
}
@INPROCEEDINGS{CUTUGNO_2019_INPROCEEDINGS_CMFC_349195,
AUTHOR = {Cutugno, P. and Marconi, L. and Ferretti, M. and Chiarella, D.},
TITLE = {Estudios lingüísticos en antologías narrativas sobre la experiencia del viaje},
YEAR = {2019},
ABSTRACT = {Las antologías "Partire: Antologia narrativa di geografia emozionale" y "Partire: Antologia illustrata per eterni viaggiatori" fueron elaboradas por el CTS: Centro turístico Studentesco e Giovanile, en 2009, 2010, 2011 y 2013. Las cuatro obras relacionan historias, imágenes y pequeñas frases referidas con un "viaje de los sueños", que contiene el lugar y por qué ese viaje es el de los deseos. Cada obra contiene imágenes o historias relacionadas con temas específicos en los que se coloca cada narración; para cada una de las ediciones se lanzó un concurso para estimular la participación en la redacción de las narraciones de jóvenes italianos entre dieciocho y treinta y cinco años sobre el tema del viaje. En otro artículo previamente producido, fueron analizados los componentes gramaticales de las contribuciones escritas. Los objetivos fueron identificar las posibles diferencias de las partes del discurso en los textos que componen los distintos volúmenes y, al mismo tiempo, tratar de establecer para los diversos textos, dentro de qué gama de valores se coloca la relación entre sustantivos y verbos. El análisis cualitativo y cuantitativo de las palabras más frecuentes permitió monitorear cómo algunos de los relatos de viaje se convierten en reflexiones introspectivas cambiando el enfoque de los que escriben del viaje en el mundo a los que lo hacen sobre el viaje de la vida y viceversa},
KEYWORDS = {viaggio, analisi linguistica, linguistica computazionale},
PAGES = {117-120},
URL = {https://iris.cnr.it/handle/20.500.14243/349195},
ISBN = {9789597174363},
CONFERENCE_NAME = {XVI° Simposio Internacional de Comunicación Social},
}
@INPROCEEDINGS{DOMINUTTI_2019_INPROCEEDINGS_DPDMQ_390432,
AUTHOR = {Dominutti, E. and Pifferi, L. and Dell'Orletta, F. and Montemagni, S. and Quochi, V.},
TITLE = {Building an Italian written-spoken parallel corpus: A pilot study},
YEAR = {2019},
ABSTRACT = {This paper presents a pilot study towards the creation of a monolingual written-spoken parallel corpus in Italian, featuring two main novelties in the general landscape of spoken corpora: the alignment with the written counterpart of the same content and the spoken variety dealt with, represented by transcriptions of radio news broadcasting},
URL = {https://iris.cnr.it/handle/20.500.14243/390432},
ISBN = {9791280136008},
}
@INPROCEEDINGS{FERRETTI_2019_INPROCEEDINGS_FMVMC_388354,
AUTHOR = {Ferretti, M. and Morgavi, G. and Veruggio, G. and Marconi, L. and Cutugno, P.},
TITLE = {A semantic approach to outline anthropomorphic characteristics for a robot caregiver},
YEAR = {2019},
ABSTRACT = {During the last few years, due to the ageing of the population, many scientists have developed ICT tools to offer elderly people an independent life at home as long as possible. Most of these researchers focused their efforts on problem-solving without adequate care to the agreeability and/or the acceptability of these ICT objects for their users. These resulting artefacts will hardly be used in real life by the users for which they have been developed. In this paper, we will present an experiment done on 202 elderly people over 65 on the acceptability and the likeness features a caregiver robot must have. Starting from a classification of 25 different real robot pictures and the associated questionnaire on the quality of eighteen adjectives describing the first and the last robot selected, our work tried, using a linguistic-hermeneutic approach, to better understand the hidden and implicit motivations that lead to the acceptance or the rejection of a robot and found some interesting results for appealing or unpleasant features for caregiver robot design},
URL = {https://iris.cnr.it/handle/20.500.14243/388354},
ISBN = {978-959-7174-36-3},
}
@INPROCEEDINGS{FIEROMONTE_2019_INPROCEEDINGS_FBDV_380336,
AUTHOR = {Fieromonte, M. and Brunato, D. and Dell'Orletta, F. and Venturi, G.},
TITLE = {Italian and English sentence simplification: How many differences?},
YEAR = {2019},
ABSTRACT = {The paper proposes a cross-linguistic analysis of two parallel monolingual corpora conceived for automatic text simplification in two languages, Italian and English. The aim is to find similarities and differences in the process of simplification in two typologically different languages. To carry out the comparison, 1,000 sentences were extracted from the two corpora and annotated with a scheme previously used to annotate simplification phenomena},
KEYWORDS = {Natural Language Processing, Automatic Text Simplification},
PAGES = {1-6},
URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-85074816689\&origin=inward},
VOLUME = {2481},
CONFERENCE_NAME = {6th Italian Conference on Computational Linguistics (CLiC-it)},
}
@INPROCEEDINGS{GOGGI_2019_INPROCEEDINGS_GPBMBC_349126,
AUTHOR = {Goggi, S. and Pardelli, G. and Bartolini, R. and Monachini, M. and Biagioni, S. and Carlesi, C.},
TITLE = {Semantic query analysis from the global science gateway},
YEAR = {2019},
ABSTRACT = {We focused on building a corpus constituted by the query logs registered by the GreyGuide: Repository and Portal to Good Practices and Resources in Grey Literature and received by the WorldWideScience.org (The Global Science Gateway) portal},
KEYWORDS = {Information Extraction, Terminology},
PAGES = {105-113},
URL = {https://iris.cnr.it/handle/20.500.14243/349126},
ISSN = {1386-2316},
ISBN = {978-90-77484-33-3},
CONFERENCE_NAME = {GL20-Twentieth International Conference on Grey Literature: Research Data Fuels and Sustains Grey Literature},
BOOKTITLE = {THE GL-CONFERENCE SERIES. CONFERENCE PROCEEDINGS},
EDITOR = {Farace, D. and Frantzen, J.},
}
@INPROCEEDINGS{GRECO_2019_INPROCEEDINGS_GMLSV_376289,
AUTHOR = {Greco, A. and Marzi, C. and Lanata, A. and Scilingo, E. and Vanello, N.},
TITLE = {Combining Electrodermal Activity and Speech Analysis towards a more Accurate Emotion Recognition System},
YEAR = {2019},
ABSTRACT = {Current research in the emotion recognition field is exploring the possibility of merging the information from physiological signals, behavioural data, and speech. Electrodermal activity (EDA) is amongst the main psychophysiological arousal indicators. Nonetheless, it is quite difficult to be analyzed in ecological scenarios, like, for instance, when the subject is speaking. On the other hand, speech carries relevant information of subject emotional state and its potential in the field of affective computing is still to be fully exploited. In this work, we aim at exploring the possibility of merging the information from electrodermal activity (EDA) and speech to improve the recognition of human arousal level during the pronunciation of single affective words. Unlike the majority of studies in the literature, we focus on speakers' arousal rather than the emotion conveyed by the spoken word. Specifically, a support vector machine with recursive feature elimination strategy (SVM-RFE) is trained and tested on three datasets, i.e. using the two channels (i.e., speech and EDA) separately and then jointly. The results show that the merging of EDA and speech information significantly improves the marginal classifier (11.64%). The six selected features by the RFE procedure will be used for the development of a future multivariate model of emotions},
KEYWORDS = {emotion recognition, feature selection, pattern classification, physiology, psychology, support vector machines, human arousal level, single affective words, EDA, electrodermal activity, speech analysis, emotion recognition system, speech processing},
PAGES = {229-232},
URL = {http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=\&arnumber=8857745\&isnumber=8856280},
VOLUME = {41ST ANNUAL INTERNATIONAL CONFERENCE OF THE IEEE ENGINEERING IN MEDICINE AND BIOLOGY SOCIETY (EMBC)},
DOI = {10.1109/EMBC.2019.8857745},
ISBN = {978-1-5386-1311-5},
CONFERENCE_NAME = {41st Annual International Conference of the IEEE Engineering in Medicine and Biology Society (EMBC)},
BOOKTITLE = {Proceedings on the IEEE Engineering in medicine and biology annual conference},
}
@INPROCEEDINGS{MAGRINI_2019_INPROCEEDINGS_MDCMCCF_388355,
AUTHOR = {Magrini, A. and Di Feo, G. and Cerniglia, A. and Marconi, L. and Cutugno, P. and Chiarella, D. and Ferretti, M.},
TITLE = {INDAGINE SOGGETTIVA FINALIZZATA ALLA VALUTAZIONE DEL DISTURBO DA RUMORE NELLE ZONE RETROPORTUALI},
YEAR = {2019},
ABSTRACT = {Vengono presentati alcuni risultati preliminari di una ricerca sulla percezione del rumore in zone retroportuali, che si inserisce nelle azioni previste nell'ambito del progetto TRIPLO (Programma Interreg Italia-Francia Marittimo 2014-2020). Le valutazioni riguardano le prime fasi di realizzazione e somministrazione di un questionario preliminare, realizzato su piattaforma web, e delle relative risposte: attraverso questo strumento si vogliono mettere in relazione rumori e percezione soggettiva, mediante l'uso di termini linguistici ritenuti più appropriati dai soggetti intervistati},
KEYWORDS = {port noise, acoustic monitoring, subjective survey, psychoacoustics},
PAGES = {2},
URL = {https://iris.cnr.it/handle/20.500.14243/388355},
ISBN = {978-88-88942-59-9},
CONFERENCE_NAME = {46° Convegno Nazionale Associazione Italiana di Acustica},
}
@INPROCEEDINGS{MARZI_2019_INPROCEEDINGS_MGSV_412028,
AUTHOR = {Marzi, C. and Greco, A. and Scilingo, E. and Vanello, N.},
TITLE = {Electrodermal activity and speech features as predictors for arousal level changes after affective word pronunciation},
YEAR = {2019},
ABSTRACT = {This work explores the possibility of estimating subject arousal through the analysis of speech and electrodermal activity (EDA). One critical issue to be clarified is the reliability of EDA signal during speech production. To accomplish this task, a relation among EDA, speech activity and subject arousal during isolated affective word pronunciation task, will be investigated. The results show that significant information on subject arousal can be still obtained by analyzing EDA during speech. In fact, a significant relationship between EDA features and self-reported arousal can be observed. In addition, a quantitative linear model relating EDA- and speech-related features could be identified. These preliminary results indicate how the analysis of concurrent acquisition of EDA and speech deserves further attention and could offer a valid approach for the prediction of subject arousal during speech production, as a method for validating self-assessment ratings},
KEYWORDS = {electrodermal activity, regression model, word pronunciation, arousal, speech},
PAGES = {93-96},
URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-85086605454\&origin=inward},
VOLUME = {11},
ISBN = {978-88-6453-961-4},
CONFERENCE_NAME = {11th international workshop on Models and Analysis of Vocal Emissions for Biomedical Applications},
BOOKTITLE = {Models and Analysis of Vocal Emissions for Biomedical Applications},
EDITOR = {Manfredi, C.},
}
@INPROCEEDINGS{MASLENNIKOVA_2019_INPROCEEDINGS_MLCD_390425,
AUTHOR = {Maslennikova, A. and Labruna, P. and Cimino, A. and Dell'Orletta, F.},
TITLE = {Quanti anni hai? Age identification for Italian},
YEAR = {2019},
ABSTRACT = {We present the first work to our knowledge on automatic age identification for Italian texts. For this work we built a dataset consisting of more than 2.400.000 posts extracted from publicly available forums and containing authorship attribution metadata, such as age and gender. We developed an age classifier and performed a set of experiments with the aim of evaluating the possibility of assigning the correct age of an user and which information is useful to tackle this task: lexical or linguistic information spanning across different levels of linguistic descriptions. The performed experiments show the importance of lexical information in age classification, but also that exists writing style that relates to the age of an user},
URL = {https://iris.cnr.it/handle/20.500.14243/390425},
ISBN = {9791280136008},
}
@INPROCEEDINGS{MCCRAE_2019_INPROCEEDINGS_MKKDTMA_389214,
AUTHOR = {McCrae, J. P. and Khan, F. and Kernerman, I. and Declerck, T. and Tiberius, C. and Monachini, M. and Ahmadi, S.},
TITLE = {The ELEXIS Interface for Interoperable Lexical Resources},
YEAR = {2019},
ABSTRACT = {ELEXIS is a project that aims to create a European network of lexical resources, and one of the key challenges for this is the development of an interoperable interface for different lexical resources so that further tools may improve the data. This paper describes this interface and in particular describes the five methods of entrance into the infrastructure, through retrodigitization, by conversion to TEI-Lex0, by the TEILex0 format, by the OntoLex format or through the REST interface described in this paper. The interface has the role of allowing dictionaries to be ingested into the ELEXIS system, so that they can be linked to each other, used by NLP tools and made available through tools to Sketch Engine and Lexonomy. Most importantly, these dictionaries will all be linked to each other through the Dictionary Matrix, a collection of linked dictionaries that will be created by the project. There are five principal ways that a dictionary maybe entered into the Matrix Dictionary: either through retrodigitization; by conversion to TEI Lex-0 by means of the forthcoming ELEXIS conversion tool; by directly providing TEI Lex-0 data; by providing data in a compatible format (including OntoLex); or by implementing the REST interface described in this paper},
URL = {https://iris.cnr.it/handle/20.500.14243/389214},
}
@INPROCEEDINGS{MIASCHI_2019_INPROCEEDINGS_MACD_390439,
AUTHOR = {Miaschi, A. and Alzetta, C. and Cardillo, F. A. and Dell'Orletta, F.},
TITLE = {Linguistically-Driven Strategy for Concept Prerequisites Learning on Italian},
YEAR = {2019},
ABSTRACT = {We present a new concept prerequisite learning method for Learning Object (LO) ordering that exploits only linguistic features extracted from textual educational resources. The method was tested in a cross- and in-domain scenario both for Italian and English. Additionally, we performed experiments based on a incremental training strategy to study the impact of the training set size on the classifier performances. The paper also introduces ITA-PREREQ, to the best of our knowledge the first Italian dataset annotated with prerequisite relations between pairs of educational concepts, and describe the automatic strategy devised to build it},
KEYWORDS = {Concept Prerequisites Learning},
PAGES = {285-295},
URL = {https://iris.cnr.it/handle/20.500.14243/390439},
CONFERENCE_NAME = {14th Workshop on Innovative Use of NLP for Building Educational Applications},
BOOKTITLE = {Proceedings of the Fourteenth Workshop on Innovative Use of NLP for Building Educational Applications},
}
@INPROCEEDINGS{NICOLOSI_2019_INPROCEEDINGS_NMN_407455,
AUTHOR = {Nicolosi, A. and Monachini, M. and Nava, B.},
TITLE = {CLARIN-IT and the Definition of a Digital Critical Edition for Ancient Greek Poetry: a New Project for Ancient Fragmentary Texts with a Complex Tradition},
YEAR = {2019},
ABSTRACT = {Ancient Greek studies, and Classics in general, is a perfect field to demonstrate how Digital Humanities could become the humanist way of building models for complex realities, analysing them with computational methods and communicating the results to a broader public. Ancient texts have a complex tradition, which includes many witnesses (texts that handed down other texts) and different typology of supports (papyri, manuscripts and also epigraphy). These texts are fundamental for our cultural Heritage, since they are the basis of all European Literatures, and it is crucial to spread their knowledge, in a reliable and easy way. Our project on ancient Greek fragmentary poetry (DEA-Digital Edition of Archilochus: New models and tools for authoring, editing and indexing an ancient Greek fragmentary author) develops and grows out of existing experiences and tries to define a new digital and critical edition which includes the use of Semantic Web and Linked Open Data. Our goal is to provide a complete and reliable tool for scholars, suitable for critical study in the field, and also user friendly and useful for non-specialist users. The project represents one of the attempts within the context of CLARIN-IT to contribute to the wider impact of CLARIN on the specific Italian community interested in Digital Classics and may improve services in fostering new (and sustaining existing) knowledge in SSH digital research},
KEYWORDS = {Digital Classics, Digital Edition, Ancient Greek},
PAGES = {150--154},
URL = {https://office.clarin.eu/v/CE-2019-1512_CLARIN2019_ConferenceProceedings.pdf},
CONFERENCE_NAME = {CLARIN Annual Conference 2019},
}
@INPROCEEDINGS{PASSALACQUA_2019_INPROCEEDINGS_PKATA_493645,
AUTHOR = {Passalacqua, S. and Koceva, F. and Alzetta, C. and Torre, I. and Adorni, G.},
TITLE = {Visualisation analysis for exploring prerequisite relations in textbooks},
YEAR = {2019},
ABSTRACT = {Building automatic strategies for organising knowledge contained in textbooks has a tremendous potential to enhance meaningful learning. Automatic identification of prerequisite relation (PR) between concepts in a textbook is a well-known way for knowledge structuring, yet it is still an open issue. Our research contributes for better understanding and exploring the phenomenon of PR in textbooks, by providing a collection of visualisation techniques for PR exploration and analysis, that we used for the design of and then the refinement of our algorithm for PR extraction},
KEYWORDS = {Information visualisation, Knowledge structuring, Prerequisite relation},
PAGES = {18--21},
URL = {https://iris.cnr.it/handle/20.500.14243/493645},
VOLUME = {2384},
PUBLISHER = {CEUR-WS},
CONFERENCE_NAME = {1st Workshop on Intelligent Textbooks, iText 2019},
BOOKTITLE = {CEUR Workshop Proceedings of the 1st International Workshop on Intelligent Textbooks},
}
@INPROCEEDINGS{PROIETTI_2019_INPROCEEDINGS_PGSV_404076,
AUTHOR = {Proietti, C. and Grossi, D. and Smets, S. and Velázquez-Quesada, F.},
TITLE = {Bipolar Argumentation Frameworks, Modal Logic and Semantic Paradoxes},
YEAR = {2019},
ABSTRACT = {Bipolar Argumentation Frameworks (BAF) are a natural extension of Dung's Argumentation Frameworks (AF) where a relation of support between arguments is added to the standard attack relation. Despite their interest, BAF present several difficulties and their semantics are quite complex. This paper provides a definition of semantic concepts for BAF in terms of fixpoints of the functions of neutrality and defense, thus preserving most of the fundamental properties of Dung's AF. From this angle it becomes easy to show that propositional dynamic logic provides an adequate language to talk about BAF. Finally, we illustrate how this framework allows to encode the structure of the referential discourse involved in semantic paradoxes such as the Liar. It turns out that such paradoxes can be seen as BAF without a stable extension},
KEYWORDS = {abstract argumentation, bipolar argumentation frameworks, modal logic, semantic paradoxes},
PAGES = {214--229},
URL = {https://iris.cnr.it/handle/20.500.14243/404076},
VOLUME = {11813},
ISBN = {9783662602911},
CONFERENCE_NAME = {7th International Workshop on Logic, Rationality, and Interaction, LORI 2019},
BOOKTITLE = {Logic, Rationality, and Interaction -- 7th International Workshop, LORI 2019, Proceedings},
EDITOR = {Blackburn, P. and Lorini, E. and Guo, M.},
}
@INPROCEEDINGS{RORBERI_2019_INPROCEEDINGS_RM_386352,
AUTHOR = {Rorberi, S. and Marzi, C.},
TITLE = {Modelling the interaction of regularity and morphological structure: the case of Russian verb inflection},
YEAR = {2019},
ABSTRACT = {Modelling complex inflection systems, such as conjugation in Modern Greek, Italian or Russian, requires careful consideration of a number of factors, ranging from pervasive stem allomorphy to the identification of the appropriate inflection class and the inferential predictability of morpho-phonological processes. Descriptive approaches have taken different views on how to account for degrees of morphological (ir)regularity, while making different predictions about the way speakers process regular and irregular forms in highly-inflecting languages. In the present paper, we assess the psycholinguistic implications of two radically different approaches to the description of the Russian verb system: a more traditional approach dating back to Jakobson (1948), and a Words and Paradigm approach (Brown 1998). Based on recent fMRI evidence (Slioussar et al. 2014) and original results of a neural network simulation with recurrent self-organising maps (Ferro et al. 2011; Marzi et al. 2014; Pirrelli et al. 2015; Marzi et al. 2016), we suggest that both approaches are prima facie compatible with Russian data, while being in contrast with Pinker's claim that the regular-irregular distinction is an epiphenomenon of the storage-processing dichotomy in the human language faculty (Pinker \& Ullman 2002). We argue that this evidence lends support to integrative models of the mental lexicon (Marzi \& Pirrelli 2015), accounting for a graded interaction between regularity and morphological structure},
KEYWORDS = {Inflectional complexity, Russian verb system, perception of morphological structure, recurrent self-organising neural network},
PAGES = {107--110},
URL = {http://drehu.linguist.univ-paris-diderot.fr/ismo-2019/?fichier=programme},
VOLUME = {2019},
CONFERENCE_NAME = {International Symposium of Morphology (ISMo) 2019},
BOOKTITLE = {International Symposium of Morphology},
EDITOR = {Crysmann, B. and Villoing, F.},
}
@INPROCEEDINGS{SASSOLINI_2019_INPROCEEDINGS_SFBMM_389211,
AUTHOR = {Sassolini, E. and Khan, A. F. and Biffi, M. and Monachini, M. and Montemagni, S.},
TITLE = {Converting and structuring a digital historical dictionary of Italian: a case study},
YEAR = {2019},
ABSTRACT = {The paper describes ongoing work on the digitization of an authoritative historical Italian dictionary, namely Il Grande Dizionario della Lingua Italiana (GDLI), with a specific view to creating the prerequisites for advanced human-oriented querying. After discussing the general approach taken to extract and structure the GDLI contents, in the paper we report the encouraging results of a case study carried out against two volumes which have been selected for the different conversion issues raised. Dictionary content extraction and structuring is being carried out through an iterative process based on hand coded patterns: starting from the recognition of the entry headword, a series of truth conditions are tested which allow the building and progressive structuring, in successive steps, of the whole lexical entry. We also started to design the representation of extracted and structured entries in a standard format, encoded in TEI. An outline of an example entry is also provided and illustrated in order to show what the end result will look like},
URL = {https://iris.cnr.it/handle/20.500.14243/389211},
}
@INPROCEEDINGS{ANDREINI_2019_INPROCEEDINGS_ADP_381978,
AUTHOR = {Andreini, G. and Di Donato, F. and Pezzini, S.},
TITLE = {How we designed Galassia Ariosto},
YEAR = {2019},
ABSTRACT = {In the poster we will present the User Experience work we did for the digital library Galassia Ariosto (www.galassiaariosto.sns.it). Galassia Ariosto is one of the main outputs of the ERC AdG "Looking at Words through images" (2013-2017) led by Lina Bolzoni of the CTL research lab at Scuola Normale Superiore di Pisa. The CTL team has always been interested in studying the relations between text and images and that's what Galassia Ariosto is about: an in-depth study of the relations between the text of Orlando furioso (and other chivalric poems) and the illustrations sets that were produced to enrich the text. The project dealt with Ariosto's Orlando Furioso editions, starting from the 1516 first printed edition which soon became a "best seller". In the following years Venetian editors wanted to create some more appealing editions and started adding illustrations to the text: those illustrations were engraved in wooden blocks and placed alongside the moveable types to layout the pages. These were a visual description of what's written in the text and were the first books with images ever produced. Soon this became an editorial standard and the illustrations of the Orlando furioso became very complex and detailed, and this type of illustrations were introduced in other chivalric poems like La Gerusalemme Liberata, Orlando Innamorato, Tredici canti del Floridoro and many more. Net7 was involved in the design and implementation of the digital archive where all data and information are stored and made accessible on the web: A back-end system that allows the team to do their research, inserting images, texts, comments, entities and building relations between all those elements, including portions of images and texts. A front-end user interface to make all this work public and accessible to the world. 
The main challenges of the project were: to make all this complex data and relations easy to browse and understand; to create an attractive UI that involves the user; to create different ways to access the content of the archive targeted to different groups of users (personas). In the project, we adopted a UX based methodology and approach. After the first user testing, the discovery process has been conceived considering 3 main macro-typologies of target users: - the domain expert (member of the research team). She knows what the DL contains, and needs to directly access single "leafs". She uses the advanced search feature, which filters results helping them through the autocomplete. - a skilled scholar, who has not precise knowledge of what the DL contains. She enters the platform from the full index of Works (Opere). - and the "culture enthusiast" (which include students, teachers, and culture lovers), who browse the highly specialized content of the archive through stories which connect texts and images through storytelling (Percorsi). The result is a rich platform strongly oriented to different user needs, with different access points},
URL = {https://iris.cnr.it/handle/20.500.14243/381978},
}
@INPROCEEDINGS{BELLANDI_2019_INPROCEEDINGS_BK_389215,
AUTHOR = {Bellandi, A. and Khan, F.},
TITLE = {Lexicography and the Semantic Web: A Demo with LexO},
YEAR = {2019},
ABSTRACT = {The purpose of this contribution is to present LexO, the first version of a collaborative web editor for easily building and managing of lexical and terminological resources in the context of the Semantic Web. The adoption of Semantic Web technologies and the Linked Data paradigm has been driven by the need to ensure the construction of resources that are interoperable and can be shared and reused by the scientific community. LexO's primary objective is to enable terminologists and lexicographers to create a resource ex novo this is by means of the adoption of a lexical model that allows the association of detailed and structured lexical information (Bellandi et al., 2018); (Khan et al., 2016) to ontological concepts. In this respect, the lemon lexical model (McCrae et al., 2012), later renamed OntoLex-lemon (McCrae et al., 2017), is currently regarded as the de facto standard for enriching Semantic Web ontologies with lexical information. LexO can provide a support for creating, managing, publishing lexical and terminological resources as Linked Open Data, that is typically a complex task, especially for those who have not yet mastered Semantic Web-based standards and technologies, such as RDF and OWL. However, the long-term ambition of LexO would be to make a deeper contribution to e-lexicography},
URL = {https://iris.cnr.it/handle/20.500.14243/389215},
}
@INPROCEEDINGS{BOHBOT_2019_INPROCEEDINGS_BFKKR_389213,
AUTHOR = {Bohbot, H. and Frontini, F. and Khan, F. and Khemakhem, M. and Romary, L.},
TITLE = {Nénufar: Modelling a Diachronic Collection of Dictionary Editions as a Computational Lexical Resource},
YEAR = {2019},
ABSTRACT = {The Petit Larousse Illustré (PLI) is a monolingual French dictionary which has been published every year since the 1906 edition, and which is therefore a fundamental record of the evolution of the French language. As a consequence of the pre-1948 editions of the PLI entering the public domain in 2018 the Nénufar (Nouvelle édition numérique de fac-similés de référence) project was launched at the Praxiling laboratory in Montpellier with the aim of digitizing and making these editions available electronically. The project is still ongoing; various selected editions from each decade are going to be fully digitized (so far the 1906, 1924 and 1925 editions have been completed), and changes backtracked and dated to the specific year. Nénufar's primary aim is to make the editions available and searchable via an advanced search interface which will not only enable the selective querying of text by lemma and type of content (definitions, examples, ...), but crucially also detect and study changes by comparing different editions. In order to do so, a specific web interface has been put in place. Alongside the digitized text, the Nénufar website contains high quality scans for each page. In compliance with current open data best practices (Wilkinson et al., 2016), the project also aims to make the source data available separately from the querying interface both for research and for long-term preservation. (A similar project which presents data and scans from subsequent editions of the same legacy dictionary has been carried out by the team behind the Swedish Academy's Wordlist; see Holmer, Malmgren, and Martens (2016) and http://spraakdata.gu.se/saolhist/.) The primary encoding format is TEI-XML; however in our case the TEI encoding is closely inspired by the latest version of the TEI-Lex0 (Bański et al., 2017, Romary \& Tasovac, 2018) guidelines for encoding lexicographic resources, which are based upon TEI. 
The choice of a TEI based approach allows the Nénufar project to align itself to other pre-existing initiatives and tools. By aligning ourselves to TEI-Lex0 we will be able to make use of digitisation tools such as Grobid (Khemakhem et al., 2017) which have TEI-Lex0 as their native format and which have already been tested and used within the Nénufar project to speed up the digitization of new editions. In addition we will be able to make use of ongoing initiatives to convert TEI-Lex0 datasets to RDF using the W3C recommendation for publishing lexicons as Linked Data, namely OntoLex-Lemon (McCrae et al., 2017; Bosque-Gil et al., 2016) which will allow for the publication of the Nénufar dataset as an LOD graph. The LOD version of the Nénufar dataset, now currently being developed, will be queryable from the available SPARQL endpoint and contain all available editions as one single graph, allowing for expert users to perform complex queries that could detect systematic changes in the dataset. The LOD version is particularly adapted to be linked to other datasets; more recent editions, once added, could also be of interest for NLP applications},
URL = {https://iris.cnr.it/handle/20.500.14243/389213},
}
@INPROCEEDINGS{DELGROSSO_2019_INPROCEEDINGS_DCCSS_410270,
AUTHOR = {Del Grosso, A. M. and Capizzi, E. and Cristofaro, S. and Seminara, G. and Spampinato, D.},
TITLE = {Promoting Bellini's legacy and the Italian opera by scholarly digital editing his own correspondence},
YEAR = {2019},
ABSTRACT = {This contribution aims at illustrating the ongoing work towards the digital scholarly editing, long-term preservation, web publishing and computational exploiting of 41 letters, written by the renowned composer Vincenzo Bellini. The correspondence is kept at the Belliniano Civic Museum of Catania and is being encoded in XML according to the last TEI guidelines. The edition will be made accessible both via web -- exploiting the Edition Visualization Technology (EVT) -- as well as integrated into an interactive and multimedia tour within the museum. The digital edition is based on the recently published transcriptions made by Seminara. The encoding scheme has been defined according to the edition requirements, the TEI best practices and the Music Encoding Initiative (MEI) guidelines -- where the musical context must be specified. Our initiative has some elements of innovation that distinguish it from similar projects, such as the Van Gogh letter project or the DALF project. For instance, we encode the circumstance that the letters themselves have also the purpose of acting as envelopes. In fact, they are folded on themselves and postmarks and wax seals are sometimes affixed on them. The edition takes care of handling the correspondence metadata by means of the correspDesc TEI tagset, thus providing the opportunity to exploit the correspSearch API. This approach has allowed us to enrich the encoding of the document both in its logical and physical structure and in indexing letters by sender, recipient, date, and places. The museum context and the educational purposes have even led us to the definitions of some lists of named entities. Within these resources we have adopted the Semantic Web and LOD paradigm by encoding external references to authoritative repositories such as RISM and DBpedia. Finally, we implemented some useful EVT extensions to automatically handle hotspots and to show critical notes that accompany the text},
KEYWORDS = {TEI, DSE, Vincenzo Bellini, Digital Correspondence},
URL = {https://gams.uni-graz.at/o:tei2019.118},
DOI = {10.5281/zenodo.3461673},
CONFERENCE_NAME = {What is text, really? TEI and beyond (TEI 2019)},
BOOKTITLE = {What is text, really? TEI and beyond},
EDITOR = {Vogeler, G.},
}
@INPROCEEDINGS{DIDONATO_2019_INPROCEEDINGS_D_381979,
AUTHOR = {Di Donato, F.},
TITLE = {Filosofia digitale e uso pubblico della ragione: il paradigma della scienza aperta},
YEAR = {2019},
ABSTRACT = {Il paradigma della scienza aperta, che si è affermato negli ultimi anni, sta diventando uno standard per la comunicazione scientifica a livello europeo e internazionale, come riconosciuto dalle policy della Commissione Europea e dal Plan pubblicato nell'ottobre di quest'anno. Esso implica una trasformazione metodologica nel modo di fare ricerca, trasformazione che si fonda sull'uso delle tecnologie digitali, che sono considerate non solo come un mezzo al servizio della ricerca vera e propria, ma piuttosto come parte essenziale del modo di fare scienza. Il presente contributo intende mettere in luce come tale impostazione abbia importanti basi filosofiche e soffermarvisi, a partire dalle seguenti domande. Quali sono i concetti e le teorie filosofiche a fondamento dell'open science? Come tali concetti introducono un radicale cambio di paradigma nella tradizionale metodologia di ricerca nelle scienze umane? E in che modo la filosofia è in grado di acquisire un ruolo determinante nell'informare i processi della ricerca, sia nelle scienze umane e sociali e sia nelle cosiddette scienze "dure"? Infine, ci si concentrerà sull'analisi di workflow open science specificatamente nell'ambito dell'umanistica digitale, per proporre esempi concreti di tale approccio},
URL = {https://iris.cnr.it/handle/20.500.14243/381979},
}
@INPROCEEDINGS{MONACHINI_2019_INPROCEEDINGS_MSC_405364,
AUTHOR = {Monachini, M. and Stamuli, M. F. and Calamai, S.},
TITLE = {Folk in Tuscany: the Caterina Bueno sound archive},
YEAR = {2019},
ABSTRACT = {Caterina Bueno's sound archive is composed of 476 carriers (audio reels and compact cassettes), corresponding to nearly 714 hours of recording and was digitised during the PAR-FAS project Gra.fo (Grammo-foni. Le soffitte della voce, UNISI \& SNS, http://sns.grafo.it). It was located at two different owners': part of it was stored at Caterina's heirs' house, while the rest was kept by the former culture counsellor of the Municipality of San Marcello Pistoiese, in the Montagna Pistoiese, where a multi-media library was supposed to be set up. Unfortunately, disagreements and misunderstandings between the two parties have so far made the archive fragmented and inaccessible to the community. Both owners, independently, have turned to Silvia Calamai for the reassembly of the whole archive in the digital domain, in respect of the artist's wishes. After digitising, the carriers were returned to their owners, who helped in finding an arrangement for the sound archive, which can be divided according to the following categories: field-research (investigations carried out in the Tuscan countryside from the late 50s to the end of the artist's life); live performances (recordings of concerts and events); performances' rehearsals (recordings of rehearsals with musicians). In 2019 Regione Toscana decided to support the project of cataloguing and disseminating Caterina Bueno Archive and the following partners were involved: Università degli Studi di Siena (Silvia Calamai), Soprintendenza Archivistica e Bibliografica della Toscana (Maria Francesca Stamuli), CLARIN-IT (Monica Monachini), and Unione dei comuni del Casentino (Pierangelo Bonazzoli). Archivio Vi.Vo. will thus constitute a pilot study within CLARIN-IT to experiment methods and offer services to disciplines interested in oral sources. The ILC4CLARIN Italian node offers archiving preservation access and tools for linguistic data of a written type; within Archivio Vi.Vo. 
the repository will be improved through experimental approach to conservation, management and access to audio and audio-video data and metadata. Archivio Vi.Vo. will develop a model which can be replicated on other audio-visual archives, even outside the context of Tuscany. The experimental activity will aim to adopt the model and high-performance computing and archiving services of the new GARR network infrastructure, built along the Cloud paradigm. This model will be disseminated both to the scientific community interested in accessing these data, and to the general public who enjoy ethnomusical materials produced in the territory},
KEYWORDS = {long-term preservation, oral archives, infrastructures, conservation, access, metadata},
URL = {https://www.clarin.eu/sites/default/files/clarin2019_bazaar_calamai-stmuli-monachini.pdf},
CONFERENCE_NAME = {CLARIN 2019 Annual Conference},
BOOKTITLE = {CLARIN Annual Conference 2019 Abstracts},
}
@INPROCEEDINGS{MORGAVI_2019_INPROCEEDINGS_MNMCFFC_388910,
AUTHOR = {Morgavi, G. and Nerino, R. and Marconi, L. and Cutugno, P. and Ferraris, C. and Ferretti, M. and Cinini, A.},
TITLE = {NINFA iNtelligent Integrated Network For Aged people},
YEAR = {2019},
ABSTRACT = {Contesto: Il progressivo invecchiamento della popolazione, con conseguente aumento delle patologie croniche e neurodegenerative, porterà ad affrontare importanti sfide legate alla sostenibilità economica per la cura, l'assistenza e l'inclusione sociale delle persone anziane. Attualmente, circa il 20\% della popolazione europea ha più di 65 anni. Le stime indicano una progressione al 29\% entro il 2050, con un picco significativo di ultraottantenni (13\%). Solitudine e paura sono sentimenti comuni nell'anziano, così come l'aumento della fragilità legata a fattori fisici, motori, e cognitivi. Per minimizzare queste criticità, soluzioni ICT (Information and Communication Technology) specifiche possono rappresentare un grande beneficio per l'anziano fragile, permettendo di rilevare alterazioni nella funzionalità motoria, cognitiva e verbale che possono ridurne l'indipendenza nella quotidianità. In questo contesto, NINFA si propone di individuare nuovi strumenti per migliorare la qualità della vita e l'autonomia dell'anziano in ambiente domestico, e per prevenire criticità attraverso l'analisi delle capacità fisiche e cognitive. Principali obiettivi: - Valutazione dell'impatto delle tecnologie ICT su comunità di anziani - Valutazione dell'accettabilità e dell'usabilità di robot e interfacce uomo-macchina naturali nel supporto al monitoraggio, al benessere ed alla socializzazione della popolazione anziana - Analisi del linguaggio: la produzione verbale viene utilizzata per monitorare l'evoluzione del linguaggio, rilevare l'insorgenza di deficit cognitivi e le alterazioni dello stato neurologico e di benessere nell'anziano - Analisi della funzionalità motorio-cognitiva: il movimento del corpo durante l'esecuzione di task motori ed exergames dedicati viene utilizzato per monitorare e valutare automaticamente le alterazioni motorio-cognitive nell'anziano},
URL = {https://iris.cnr.it/handle/20.500.14243/388910},
}
@INPROCEEDINGS{PARDELLI_2019_INPROCEEDINGS_PGB_358828,
AUTHOR = {Pardelli, G. and Goggi, S. and Boschetti, F.},
TITLE = {Strolling around the dawn of Digital Humanities},
YEAR = {2019},
ABSTRACT = {Nelle ricerche umanistiche l'impiego dell'elaboratore elettronico prende il via nella seconda metà del ventesimo secolo favorendo l'uso di metodi statistici sia nello studio di opere letterarie che nello studio delle lingue, promuovendo un sodalizio interdisciplinare che è arrivato ai giorni nostri senza interruzione. In questo contributo tentiamo di fissare alcuni momenti salienti del processo che ha visto la nascita comune della Linguistica Computazionale e delle Digital Humanities nonché i loro alterni allontanamenti e ricongiungimenti},
KEYWORDS = {Digital Humanities (DH), Computational Linguistics (CL), History},
PAGES = {261--264},
URL = {http://aiucd2019.uniud.it/book-of-abstracts/},
CONFERENCE_NAME = {8th Annual Conference AIUCD 2019. Teaching and research in Digital Humanities' era},
}
@INPROCEEDINGS{ROSSELLIDELTURCO_2019_INPROCEEDINGS_RMDCDZ_406307,
AUTHOR = {Rosselli Del Turco, R. and Martignano, C. and Di Pietro, C. and Cacioli, G. and Del Grosso, A. M. and Zenzaro, S.},
TITLE = {DSE Visualisation with EVT: Simplicity is Complex},
YEAR = {2019},
ABSTRACT = {Edition Visualization Technology (EVT) is an open source tool to produce digital scholarly editions on the basis of TEI XML-encoded documents. Born to serve the goals of a single project, the Digital Vercelli Book, it has been developed in such a way as to become a general purpose tool. Several DSE projects are using it to publish digital editions, in fact many researchers have found in EVT the perfect tool for their needs: it is easy to configure and deploy, it is fully customizable, it includes several useful research tools out of the box},
KEYWORDS = {Digital Philology, Digital Scholarly Editing},
URL = {https://doi.org/10.34894/B6T1YD},
DOI = {10.34894/B6T1YD},
CONFERENCE_NAME = {Complexities},
BOOKTITLE = {Complexities},
EDITOR = {Pierazzo, E. and Ciotti, F.},
}
@INPROCEEDINGS{SALVATORI_2019_INPROCEEDINGS_SBD_346963,
AUTHOR = {Salvatori, E. and Boschetti, F. and Del Grosso, A. M.},
TITLE = {From collaborative transcription to interdisciplinary education: the postcards of the Great War case},
YEAR = {2019},
KEYWORDS = {Digital Public History, Collaborative Philology, Text Encoding, Digital Philology, Web Application, Educational, Digital Textual Scholarship},
PAGES = {211--215},
URL = {http://amsacta.unibo.it/6361/},
DOI = {10.6092/unibo/amsacta/6361},
ISBN = {978-88-942535-3-5},
CONFERENCE_NAME = {Didattica e ricerca al tempo delle Digital Humanities / Teaching and research in Digital Humanities' era},
BOOKTITLE = {Didattica e ricerca al tempo delle Digital Humanities / Teaching and research in Digital Humanities' era. Ottavo Convegno Annuale 8th Annual Conference AIUCD 2019 (Udine, 23-25 gennaio 2019) Book of Abstracts},
EDITOR = {Allegrezza, S.},
}
@TECHREPORT{AHMADI_2019_TECHREPORT_AADKKKJMMRTTZ_351830,
AUTHOR = {Ahmadi, S. and Arcan, M. and Declerck, T. and Kernerman, I. and Khan, F. and Krek, S. and McCrae, J. and Měchura, M. and Monachini, M. and Roche, C. and Tiberius, C. and Troelsgård, T. and Zaytseva, K.},
TITLE = {D2.1. Interface for Interoperable Lexical Resources},
YEAR = {2019},
ABSTRACT = {ELEXIS Deliverable D2.1. Interface for Interoperable Lexical Resources},
URL = {https://iris.cnr.it/handle/20.500.14243/351830},
}
@TECHREPORT{ALBANESI_2019_TECHREPORT_ABDGMP_404158,
AUTHOR = {Albanesi, D. and Bellandi, A. and Del Grosso, A. M. and Giovannetti, E. and Marchi, S. and Piccini, S.},
TITLE = {Traduco: l'Applicazione Web Linguistico-Computazionale per il Progetto di Traduzione del Talmud Babilonese-Rapporto tecnico 16},
YEAR = {2019},
ABSTRACT = {La presente relazione tecnico-scientifica descrive l'attività svolta da ILC-CNR nel contesto del Progetto Traduzione Talmud Babilonese nel periodo giugno 2019-ottobre 2019. Le due principali attività tecniche svolte sul sistema Traduco sono la risoluzione di bug e l'implementazione di nuove funzionalità. Queste due attività sono strettamente correlate: di fatto, l'introduzione di nuove funzionalità può implicare l'introduzione di nuovi bug all'interno del sistema. Le attività di ricerca sono state condotte, in continuità a quelle descritte nel rapporto precedente, nella rappresentazione della terminologia e della conoscenza del Talmud},
KEYWORDS = {Linguistica Computazionale, Traduzione di Testi Religiosi, Traduzione Assistita dal Calcolatore, Traduzione Collaborativa, Lessici elettronici, rappresentazione della conoscenza},
URL = {https://iris.cnr.it/handle/20.500.14243/404158},
}
@TECHREPORT{ALBANESI_2019_TECHREPORT_ABDGMP_411289,
AUTHOR = {Albanesi, D. and Bellandi, A. and Del Grosso, A. M. and Giovannetti, E. and Marchi, S. and Piccini, S.},
TITLE = {Traduco: l'Applicazione Web Linguistico-Computazionale per il Progetto di Traduzione del Talmud Babilonese-Rapporto tecnico 15},
YEAR = {2019},
ABSTRACT = {La presente relazione tecnico-scientifica descrive l'attività svolta da ILC-CNR nel contesto del Progetto Traduzione Talmud Babilonese nel periodo dicembre 2018-maggio 2019. Le due principali attività tecniche svolte sul sistema Traduco sono la risoluzione di bug e l'implementazione di nuove funzionalità. Queste due attività sono strettamente correlate: di fatto, l'introduzione di nuove funzionalità può implicare l'introduzione di nuovi bug all'interno del sistema. Le attività di ricerca sono state condotte, in continuità a quelle descritte nel rapporto precedente, nella rappresentazione della terminologia e della conoscenza del Talmud},
KEYWORDS = {Linguistica Computazionale, Traduzione di Testi Religiosi, Traduzione Assistita dal Calcolatore, Traduzione Collaborativa, Lessici elettronici, rappresentazione della conoscenza},
URL = {https://iris.cnr.it/handle/20.500.14243/411289},
}
@TECHREPORT{ALBANESI_2019_TECHREPORT_ABGD_427142,
AUTHOR = {Albanesi, D. and Bellandi, A. and Giovannetti, E. and Del Grosso, A. M.},
TITLE = {Traduco: l'Applicazione Web Linguistico-Computazionale per il Progetto di Traduzione del Talmud Babilonese-rapporto integrativo 1},
YEAR = {2019},
ABSTRACT = {La presente relazione tecnico-scientifica descrive l'attività svolta da ILC-CNR nel contesto delle attività di progetto previste dalla convenzione integrativa stipulata tra PTTB e ILC-CNR in data 10/07/2018 e condotte nel periodo dicembre 2017-gennaio 2019},
KEYWORDS = {Linguistica Computazionale, Traduzione di Testi Religiosi, Traduzione Assistita dal Calcolatore, Traduzione Collaborativa, Allineamento di Testi},
PAGES = {5},
URL = {https://iris.cnr.it/handle/20.500.14243/427142},
}
@TECHREPORT{ROCCHICCIOLI_2019_TECHREPORT_RPRVCBCCSP_388338,
AUTHOR = {Rocchiccioli, S. and Pelosi, G. and Rial, M. and Vozzi, F. and Caselli, C. and Benvenuti, C. and Carpita, D. and Campolo, J. and Sbrana, S. and Parodi, O.},
TITLE = {SMARTool-Periodic Technical Report-PART B (Period 2)},
YEAR = {2019},
ABSTRACT = {The period between M19 and M36 (01/07/2017 to 31/12/2018) has been dedicated to complete and report activities required in order to achieve the objectives of WP1, WP2 and WP3 and achieve MS1, MS2, MS3, MS4, MS5, MS7, MS9 and MS10 according to the new deadline set in the deviations to the DoA following implementation of the R1 mitigation plan (see WP1 for details)-accepted by the PO during the Interim Review of September 2017 and included in the Amendment to the DoA},
URL = {https://iris.cnr.it/handle/20.500.14243/388338},
}
@TECHREPORT{TASOVAC_2019_TECHREPORT_TMK_352225,
AUTHOR = {Tasovac, T. and Monachini, M. and Khan, F.},
TITLE = {5.1 ELEXIS SKILLSET REPORT},
YEAR = {2019},
ABSTRACT = {ELEXIS PROJECT DELIVERABLE ELEXIS SKILLSET REPORT},
URL = {https://iris.cnr.it/handle/20.500.14243/352225},
}
@MISC{BOSCHETTI_2019_MISC_BD_405214,
AUTHOR = {Boschetti, F. and Del Grosso, A. M.},
TITLE = {Digital Philology},
YEAR = {2019},
ABSTRACT = {Session outline: 1) Introduction 1a) Computational Linguistics and Digital Philology 1b) Collaboration vs Cooperation 1c) Defining Data Types and APIs for Scholarly Editing 1d) The Hermeneutical circle 2) Digital Ecdotics 2a) Representation of Textual Phenomena by TEI-XML 2b) Representation of Textual Phenomena by Domain-Specific Languages 2c) Visual Presentation of Encoded Data 2d) Stemma Codicum and Alignment of Variants 2e) Querying Encoded Data 3) Digital Hermeneutics 3a) Linguistic and Stylistic Analyses 3b) Thematic Analysis 3c) Interdisciplinary Approaches to Philological Issues 3d) Semantic Querying 4) Conclusion 4a) Putting All Together 4b) Further Perspectives Seminar readings - Boschetti, Federico, e Angelo Mario Del Grosso. 2015. «TeiCoPhiLib: A Library of Components for the Domain of Collaborative Philology». Journal of the Text Encoding Initiative, n. 8. https://doi.org/10.4000/jtei.1285 - Burnard, Lou. 2014. WHAT IS THE TEXT ENCODING INITIATIVE?. OpenEdition Press. http://books.openedition.org/oep/426 - Schmidt, Desmond. 2010. «The inadequacy of embedded markup for cultural heritage texts». Literary and Linguistic Computing 25 (3): 337-56. https://doi.org/10.1093/llc/fqq007 Further reading - Berti, Monica, Bridget Almas, David Dubin, Greta Franzini, Simona Stoyanova, e Gregory Ralph Crane. 2014. «The Linked Fragment: TEI and the Encoding of Text Reuses of Lost Authors». JTEI 8. https://doi.org/10.4000/jtei.1218 - Bozzi, Andrea. 2014. «Computer-assisted Scholarly Editing of Manuscript Sources». In New publication cultures in the humanities: exploring the paradigm shift, P. Davidhazi (ed.), 99-115. Amsterdam: Amsterdam University Press. http://www.oapen.org/record/515678 - Driscoll, Matthew James, e Elena Pierazzo, (eds) 2016. Digital Scholarly Editing: Theories and Practices. Vol. 4. Digital Humanities Series. Open Book Publishers. Chapters 2-4. http://www.openbookpublishers.com/product/483/digital-scholarly-editing-theories-and-practices/eec262cdd3121ebd5eb2bf78581594f2},
KEYWORDS = {digital philology, digital humanities},
URL = {https://github.com/SunoikisisDC/SunoikisisDC-2018-2019/wiki/Summer2019-Session2},
VOLUME = {4},
ISSN = {2018-2019},
}
@MISC{CARDAMONE_2019_MISC_CD_385314,
AUTHOR = {Cardamone, R. D. and Del Grosso, A. M.},
TITLE = {L'edizione digitale: una risorsa per tutti},
YEAR = {2019},
ABSTRACT = {Presentazione dell'edizione digitale degli statuti quattrocenteschi di Monterosso al Mare completa di immagini, trascrizione e traduzione},
KEYWORDS = {digital humanities, digital scholarly edition},
URL = {https://www.cfs.unipi.it/2019/11/27/gli-statuti-quattrocenteschi-di-monterosso-restituiti-alla-comunita/},
}
@MISC{CARDILLO_2019_MISC_CS_360743,
AUTHOR = {Cardillo, F. and Straccia, U.},
TITLE = {Towards Ontology-based Explainable Classification of Rare Events},
YEAR = {2019},
ABSTRACT = {Rare events (e.g. major floods, violent conflicts) are events that have potentially widespread and/or disastrous impact on society. The overall goal is to build a framework capable to classify, predict and explain such rare events. To do so, we envisage the usage of a mixture of sub-symbolic Machine Learning (ML) and Ontology-based Statistical Relational Learning (OSRL) techniques to generate rare events classifiers and predictors, which additionally may be mapped into natural language to ease human interpretability of the decision process},
KEYWORDS = {Ontologies Explainable Classification of Rare Events, Statistical Relational Machine Learning},
PAGES = {1-2},
URL = {https://hal.archives-ouvertes.fr/hal-02104520},
}
@MISC{DELGRATTA_2019_MISC_D_459061,
AUTHOR = {Del Gratta, R.},
TITLE = {Licenses and Licensing},
YEAR = {2019},
ABSTRACT = {Presentazione sull'importanza delle licenze nella ricerca in generale e specificatamente nella Linguistica Computazionale},
KEYWORDS = {Licenze, Open Data},
URL = {https://iris.cnr.it/handle/20.500.14243/459061},
CONFERENCE_NAME = {Seminario Formativo su "Questioni Legali e Risorse e Tecnologie Linguistiche" presso l'ILC-CNR},
}
@MISC{DELGROSSO_2019_MISC_D_406308,
AUTHOR = {Del Grosso, A. M.},
TITLE = {Multilingual Word-by-word alignment. Methodology and some preliminary outcomes towards the construction of multilingual Lexicon within the "Traduzione del Talmud Babilonese" project},
YEAR = {2019},
ABSTRACT = {Textual scholars have been exploiting for long time multilingual resources in their daily work to better understand the primary sources they inquire. Bitexts are parallel texts which turn out to be useful in a number of cross-linguistic and comparative processing tasks. This talk will show the workflow adopted within the research activities conducted on the Italian translation of the Babylonian Talmud. More specifically, I will illustrate the ongoing work towards the construction of a multilingual Hebrew/Aramaic/Italian terminological resource by means of stochastic generative approaches to word-by-word text alignment. The related literature discusses plenty of techniques concerning this topic. The alignment tool I developed is grounded on generative models (i. e., IBM and HMM models), which are a collection of non-supervised machine learning algorithms, to calculate the probability of linking two words in a multilingual term pair. From a technical standpoint, beside the adopted models, which are based on an alignment function and on an unsupervised training procedure devoted to estimating the unknown probability distributions, other machine learning approaches to word alignment exist that encompass discriminative techniques, which are based on a target function and on a supervised learning process exploiting labeled training data set. The implemented models were widely adopted in the literary domain, as they are able to profitably handle interpretative bitexts modeling also deletion, insertion, transposition phenomena without having an extant labeled data set. The workflow I will present encompasses four distinct phases: 1) The encoding of the parallel text, which has been carried out according to the last TEI recommendations. In particular, the linking-target approach described within the Module 16 of the guidelines was used. 
2) The semi-automatic extraction of the Italian terms, which has been carried out by means of linguistic analysis technologies available at the Institute of Computational Linguistics (ILC-CNR). These tools include a stochastic component for terminology extraction. 3) The addition of Hebrew/Aramaic terms to the Italian extracted ones via word-by-word alignment to automatically process the three main ancient languages appearing in the Talmud, namely mishnaic Hebrew, biblical Hebrew and babylonian Aramaic. 4) Finally, the revision of the obtained results through an ad-hoc implemented web-based application. This final step is devoted to build a ground truth and/or a gold training set allowing us to perform a complete validation process of the alignment outcomes. For the time being, 219.000 tokens have been analyzed, extracted from four tractates of the Babylonian Talmud which were translated so far.},
KEYWORDS = {bilingual word alignment, translation},
URL = {http://www.ens-lyon.fr/evenement/recherche/machine-learning-donnees-textuelles-et-recherche-en-sciences-humaines-et},
CONFERENCE_NAME = {Machine learning, données textuelles et recherche en sciences humaines et sociales},
}
@MISC{DELGROSSO_2019_MISC_D_406309,
AUTHOR = {Del Grosso, A. M.},
TITLE = {Verso la definizione e l'implementazione di una piattaforma orientata allo studio critico del testo},
YEAR = {2019},
ABSTRACT = {Il contributo illustra le caratteristiche della piattaforma in sviluppo presso ILC per lo studio scientifico del testo e in parte impiegata per la realizzazione dell'edizione digitale delle lettere di Bellini},
KEYWORDS = {BelliniInRete, Digital Scholarly Editing, Digital Philology, Computational Philology},
URL = {https://iris.cnr.it/handle/20.500.14243/406309},
CONFERENCE_NAME = {Il progetto BellinInRete digital correspondence. Per un'edizione critica digitale delle lettere di Vincenzo Bellini},
}
@MISC{DELGROSSO_2019_MISC_D_409152,
AUTHOR = {Del Grosso, A. M.},
TITLE = {Introduzione sistema git per edizioni collaborative},
YEAR = {2019},
ABSTRACT = {Il sistema più diffuso per il controllo di versione per risorse elettroniche (VCS-Version Control System) è oggi "git", un sistema open source ad architettura distribuita tra i più utilizzati per lo sviluppo di grandi progetti collaborativi, come ad esempio il kernel di Linux. La prima parte del seminario introdurrà il modello generale e i principi di progettazione che sottendono l'ambiente di versionamento, come ad esempio lo stato delle risorse, il workflow di lavoro, l'ambiente in locale e quello in remoto. Verranno anche mostrati i comandi più importanti per un efficace utilizzo dello strumento, come la creazione di un repository, fare commit degli aggiornamenti e salvare le modifiche su un host remoto. L'obiettivo è quello di fornire ai partecipanti una prima panoramica sul funzionamento del sistema git facendo ampio uso dell'interfaccia a riga di comando da terminale. La seconda parte del seminario introdurrà la piattaforma github, uno dei più comuni host per la gestione remota e collaborativa di repository git. Sarà mostrata quindi sia la procedura per creare un account sulla piattaforma sia le modalità di gestione per un semplice progetto collaborativo di codifica di testi},
KEYWORDS = {git, github, summer school, digital humanities},
URL = {http://digitaltools.labcd.unipi.it/past-editions/program2019/},
}
@MISC{DELGROSSO_2019_MISC_D_385326,
AUTHOR = {Del Grosso, A. M.},
TITLE = {Visualizzatore immagini con tiling per software evt2js},
YEAR = {2019},
ABSTRACT = {Sviluppo componente web per la visualizzazione ottimizzata delle immagini ad alta risoluzione in seno al progetto di visualizzazione di edizioni digitali scientifiche EVT. Nello specifico il visualizzatore è stato implementato per l'edizione digitale della vita di San Teobaldo. La fonte originale è conservata presso la Diocesi di Alba},
KEYWORDS = {digital scholarly edition, EVT, viewer},
URL = {https://www.visitmudi.it/EVT/},
}
@MISC{DELGROSSO_2019_MISC_D_385251,
AUTHOR = {Del Grosso, A. M.},
TITLE = {AliEval-Revisione allineamento di testi paralleli multilingua},
YEAR = {2019},
ABSTRACT = {Sistema per la revisione di testi paralleli allineati parola per parola},
KEYWORDS = {bitext alignment, digital humanities, talmud},
URL = {http://omega.ilc.cnr.it/dev/proofreader/},
}
@MISC{DELGROSSO_2019_MISC_DP_405213,
AUTHOR = {Del Grosso, A. M. and Piccini, S.},
TITLE = {Fixing the Movements of Thought in Text and Terminology: the Effectiveness of Scholarly Digital Tools on Saussure's Writings},
YEAR = {2019},
ABSTRACT = {The aim of this contribution is to present and discuss some recent activities, carried out by the Institute of Computational Linguistics (CNR-Pisa), devoted to representing in an explicit and formal way the diachronic evolution of concepts and terms occurring in Saussure's manuscripts. In the first part of the presentation, we will briefly outline some theoretical aspects concerning the diachronic standpoint in terminology and the "best practices" to be followed when modelling (diachronic) terminological resources. Then, some examples of terminological evolution will be provided, taken from the electronic lexicon Simple_FdS, built within the PRIN project "Per un'edizione digitale dei manoscritti di Ferdinand de Saussure" (2008-2011), based on the Generative Lexicon theory elaborated by Pustejovsky (1995). Terminological data will be shown in LexO, a Web-based and collaborative web editor, which allows for building lexical and termino-ontological resources, compliant with the Semantic Web technologies (RDF and OWL). In the second part of the talk, starting from the outcomes of the aforementioned project, we will present the scholarly digital platform aimed at describing and analysing text resources. The encoding approach follows the current de facto standard in representing textual resources, namely the Text Encoding Initiative (TEI) guidelines. In particular, we adopted the tag sets defined in the Module for Transcription of Primary Resources. An example will be illustrated on how to describe and visualize the process of writing in Saussure's manuscripts. The example was implemented exploiting the Omega framework as well as the Edition Visualization Technology (EVT).
In such a way, scholars have at their disposal a powerful tool for searching additions, deletions, substitutions, retracings, different hands, transpositions, marginal and interlinear notes, and all the other textual phenomena significant to understanding the "Movements of thought" which emerge in the handwritten pages},
KEYWORDS = {Saussure, Digital Humanities, Digital Scholarly Editing, Digital Philology, Computational Philology},
URL = {https://iris.cnr.it/handle/20.500.14243/405213},
CONFERENCE_NAME = {Philosophy of Language and Digital Humanities},
}
@MISC{DELGROSSO_2019_MISC_DP_405215,
AUTHOR = {Del Grosso, A. M. and Piccini, S.},
TITLE = {Approcci digitali e computazionali allo studio dei documenti manoscritti della tarda latinità: il caso Clavius},
YEAR = {2019},
ABSTRACT = {Introduzione alle digital humanities e alla lessicografia digitale con esempi e riferimenti tratti dal progetto Clavius on the Web},
KEYWORDS = {digital humanities, digital philology, digital lexicography},
URL = {https://www.dipartimentidieccellenza-dilef.unifi.it/vp-122-calendario-attivita-didattica-marzo-2019.html},
}
@MISC{DELGROSSO_2019_MISC_DS_426812,
AUTHOR = {Del Grosso, A. M. and Spampinato, D.},
TITLE = {Edizione digitale delle Lettere di Bellini},
YEAR = {2019},
ABSTRACT = {La codifica dell'edizione scientifica digitale è condotta seguendo le ultime linee guida della Text Encoding Initiative e istanziata su un campione rappresentativo di missive. L'edizione è accessibile via web con il software open source: Edition Visualization Technology; ma è anche stata progettata per essere integrata nel percorso museale interattivo e multimediale in allestimento, senza rinunciare al rigore scientifico della trascrizione delle lettere presente nella recente edizione critica},
KEYWORDS = {Digital Scholarly Edition, TEI, Vincenzo Bellini, Digital Correspondence},
URL = {http://licodemo.ilc.cnr.it/bellini-in-rete},
}
@MISC{FABIOCATERINO_2019_MISC_FBMDSD_405211,
AUTHOR = {Fabio Caterino, A. and Battaglino, G. and Marini, A. and Di Meglio, A. and Silvi, D. and Del Grosso, A. M.},
TITLE = {Letteratura e filologia come scienze esatte: per un nuovo statuto scientifico dell'umanista informatizzato},
YEAR = {2019},
ABSTRACT = {La leggenda vuole che fosse inciso all'entrata dell'accademia platonica il motto «ἀγεωμέτρητος μηδεὶς εἰσίτω». La geometria è qui intesa come la scienza stessa, quell'esattezza di calcolo indispensabile a cogliere determinate strutture armoniche all'interno dell'arte; strutture che, in fin dei conti, costituiscono la vera e propria ossatura del concetto di bello. Per meglio concepire il bello nella sua struttura è quindi necessario avere una capacità d'analisi matematica, geometrica. Oggi l'informatica sa venire incontro proprio alla necessità dell'umanista di rendere il suo lavoro più specifico e preciso, al fine di ottenere dal proprio lavoro migliori esegesi, migliori ricostruzioni testuali, migliori approcci critici utili a una fruizione più consapevole dello stesso testo letterario. Il panel vorrebbe quindi raccogliere ricerche e testimonianze di chi si occupa e preoccupa di applicare l'informatica agli studi filologici e letterari, con la volontà ultima di superare le barriere che contrappongono in modalità integralista gli studia humanitatis alle cosiddette scienze esatte. Esso nasce come estensione delle ricerche informatico-umanistiche condotte presso l'Università degli Studi del Molise dal gruppo di studi Eterodossie e dissenso nella letteratura italiana, ma vuole ovviamente aprirsi a chiunque creda-in maniera critica e ragionata-alla causa delle digital humanities},
KEYWORDS = {Digital Humanities},
URL = {https://www.italianisti.it/associazione/congressi-adi/letteratura-e-scienze},
CONFERENCE_NAME = {XXIII Congresso ADI-Associazione degli Italianisti},
}
@MISC{GIOVANNETTI_2019_MISC_GBDMPPS_411270,
AUTHOR = {Giovannetti, E. and Bellandi, A. and Del Grosso, A. M. and Marchi, S. and Pecchioli, A. and Piccini, S.},
TITLE = {La Terminologia del Talmud Babilonese: Estrazione, Rappresentazione e Uso nel Contesto della Linguistica Computazionale},
YEAR = {2019},
ABSTRACT = {Nel contesto del Progetto per la traduzione del Talmud babilonese in italiano (PTTB) si sta procedendo a una strutturazione digitale formale della terminologia. La risorsa terminologica è stata codificata sotto forma di un dizionario combinatorio ed esplicativo, multilingue (ebraico-aramaico-italiano) secondo i principi della teoria testo-senso. La costruzione di tale risorsa è stata supportata dall'elaborazione del testo e dalle tecniche linguistiche computazionali volte a estrarre automaticamente i termini dalla traduzione italiana del Talmud e ad allinearli con i corrispondenti termini in ebraico / aramaico. L'articolo descrive il processo avviato per la costruzione della risorsa terminologica con l'obiettivo finale di illustrare i vantaggi dell'adozione di un modello linguistico formale. La risorsa terminologica mira, infatti, a essere uno strumento utile per approfondire le caratteristiche delle lingue del Talmud, per aiutare i traduttori nel loro lavoro e più in generale l'ampia platea di studiosi del Talmud},
KEYWORDS = {terminologia, talmud, teoria testo-senso, estrazione terminologica, allineamento di testi},
URL = {https://iris.cnr.it/handle/20.500.14243/411270},
CONFERENCE_NAME = {AISG "Ebraismo fra peculiarità e interculturalità"},
}
@MISC{MONACHINI_2019_MISC_M_407557,
AUTHOR = {Monachini, M.},
TITLE = {Ricerche di alta qualità negli Studi umanistici: l'infrastruttura CLARIN-IT},
YEAR = {2019},
ABSTRACT = {Nella lezione a invito presso la Scuola di Dottorato di Ateneo al Corso di UMANESIMO E TECNOLOGIE vengono descritti il ruolo, i vantaggi e le opportunità offerte dalla infrastruttura di ricerca CLARIN. Una platea di giovani in formazione (che costituiranno i ricercatori del futuro) potrà approfondire la conoscenza degli strumenti della infrastruttura che consentono di coniugare studi umanistici ed approcci tecnologici, al fine di compiere ricerche di alta qualità},
KEYWORDS = {CLARIN, studi umanistici, tecnologie linguistiche},
URL = {https://iris.cnr.it/handle/20.500.14243/407557},
CONFERENCE_NAME = {Scuola di Dottorato di Ateneo Corso di UMANESIMO E TECNOLOGIE},
}
@MISC{MONACHINI_2019_MISC_M_404925,
AUTHOR = {Monachini, M.},
TITLE = {CLARIN-IT nella prospettiva delle Digital Humanities},
YEAR = {2019},
ABSTRACT = {Fornire una panoramica relativa alla infrastruttura europea CLARIN e la sua emanazione italiana CLARIN-IT rispondere ai quesiti relativi alla sua missione e ai suoi obiettivi e fare il punto sui vantaggi per la comunità a cui è diretto, ricercatori del settore delle scienze umane e sociali},
KEYWORDS = {digital public humanities, infrastrutture di ricerca},
URL = {https://iris.cnr.it/handle/20.500.14243/404925},
CONFERENCE_NAME = {Seminars in Digital Public Humanities},
}
@MISC{MONACHINI_2019_MISC_M_407575,
AUTHOR = {Monachini, M.},
TITLE = {Success stories of collaboration in Social Sciences and Humanities (between Italy and Slovenia)},
YEAR = {2019},
ABSTRACT = {The collaboration Italy-Slovenia in the sector of SSH revolves, since many years, around Digital methods for language, in particular, language resources and standards for language data; with the development of e-technology and explosion of data, the support to language studies goes through RI; another hot topic linked to the digital era is "word meaning" which involves a new type of lexicography; the even greater challenge, the concept of Open Science, sees the two countries together in the new big cluster project SSHOC, which aims to implement the EOSC vision and build the Open Cloud for the SSH sector},
KEYWORDS = {collaboration Italy Slovenija, Social Sciences and Humanities},
URL = {https://iris.cnr.it/handle/20.500.14243/407575},
CONFERENCE_NAME = {RESEARCH DAY ITALY-SLOVENIA Bilateral meeting Italy Slovenia on the role of research in the society},
}
@MISC{PICCINI_2019_MISC_P_404492,
AUTHOR = {Piccini, S.},
TITLE = {Saussure's course of lectures on Lithuanian from the notebooks of Charles Bally: a first overview},
YEAR = {2019},
ABSTRACT = {Il presente contributo è volto a presentare i risultati delle prime ricerche dedicate ai manoscritti di Bally relativi al Corso di lituano, tenuto da Saussure presso l'Università di Ginevra presumibilmente negli anni 1901-1902},
URL = {https://iris.cnr.it/handle/20.500.14243/404492},
}
@MISC{PICCINI_2019_MISC_PABGE_411275,
AUTHOR = {Piccini, S. and Abrate, M. and Bellandi, A. and Giovannetti, E.},
TITLE = {Rappresentazione e costruzione di risorse terminologiche diacroniche nell'era del web semantico},
YEAR = {2019},
ABSTRACT = {Con il presente contributo proponiamo un modello ed uno strumento volti a rappresentare formalmente, interrogare e visualizzare l'evoluzione diacronica di concetti e termini in un dato dominio, nel quadro del web semantico. Quest'ultimo sta attirando sempre più l'attenzione di lessicografi e terminologi computazionali, in quanto garantisce interoperabilità, facile accesso e riuso delle risorse lessicali/terminologiche all'interno di una comunità scientifica},
KEYWORDS = {terminologia, terminologia diacronica, web semantico, lemon, lexO},
URL = {http://www.assiterm91.it/wp-content/uploads/2020/03/Piccini.pdf},
CONFERENCE_NAME = {XXIX Convegno Ass. I. Term},
}
@MISC{PIRRELLI_2019_MISC_PV_408988,
AUTHOR = {Pirrelli, V.},
TITLE = {Investigating inflection as a complex system},
YEAR = {2019},
ABSTRACT = {From a cross-linguistic perspective, different inflection systems appear to apportion word processing costs differently, depending on when and where, in the full form, morpho-lexical and morpho-syntactic information is encoded. The resulting balance is the outcome of an interaction between form frequency and morphological productivity, responding to basic communicative requirements. Big families of stem-sharing inflected forms constitute the productive core of an inflection system. This core is easy to learn, as it requires memorization of one stem only, with all inflected forms being redundantly built upon it. Unsurprisingly, generalizable paradigms are less sensitive to token frequency effects, and tend to be located in the long, low-frequency tail of the Zipfian distribution of word forms. In contrast, the head of the Zipfian distribution mostly contains small families of alternating and possibly suppletive stems, which, however shorter, morpho-phonologically simpler and easier to process, require high token frequency to be learned and resist pressure towards regularization},
KEYWORDS = {Morphological paradigms, Mental Lexicon, Inflectional morphology},
PAGES = {23-24},
URL = {https://iris.cnr.it/handle/20.500.14243/408988},
CONFERENCE_NAME = {International Symposium of Morphology (ISMo) 2019},
}
@ARTICLE{BELLANDI_2018_ARTICLE_BGW_348535,
AUTHOR = {Bellandi, A. and Giovannetti, E. and Weingart, A.},
TITLE = {Multilingual and Multiword Phenomena in a lemon Old Occitan Medico-Botanical Lexicon},
YEAR = {2018},
ABSTRACT = {This article illustrates the progresses made in representing a multilingual and multi-alphabetical Old Occitan medico-botanical lexicon in the context of the project Dictionnaire de Termes Médico-botaniques de l'Ancien Occitan (DiTMAO). The chosen lexical model of reference is lemon, which has been extended accordingly to some specific linguistic and lexical features of the lexicon. In particular, issues and solutions about the modeling of multilingual and multiword phenomena are discussed, as the way they are managed through LexO, a web editor developed in the context of the project},
URL = {https://iris.cnr.it/handle/20.500.14243/348535},
DOI = {10.3390/info9030052},
ISSN = {2078-2489},
JOURNAL = {INFORMATION},
}
@ARTICLE{CARDILLO_2018_ARTICLE_CFMP_355603,
AUTHOR = {Cardillo, F. and Ferro, M. and Marzi, C. and Pirrelli, V.},
TITLE = {Deep Learning of Inflection and the Cell-Filling Problem},
YEAR = {2018},
ABSTRACT = {Machine learning offers two basic strategies for morphology induction: lexical segmentation and surface word relation. The first approach assumes that words can be segmented into morphemes. Inferring a novel inflected form requires identification of morphemic constituents and a strategy for their recombination. The second approach dispenses with segmentation: lexical representations form part of a network of associatively related inflected forms. Production of a novel form consists in filling in one empty node in the network. Here, we present the results of a task of word inflection by a recurrent LSTM network that learns to fill in paradigm cells of incomplete verb paradigms. Although the task does not require morpheme segmentation, we show that accuracy in carrying out the inflection task is a function of the model's sensitivity to paradigm distribution and morphological structure},
KEYWORDS = {Deep Learning, LSTM, Cell-Filling Problem},
PAGES = {57-75},
URL = {https://publications.cnr.it/doc/396348},
VOLUME = {4},
NUMBER = {1},
ISSN = {2499-4553},
JOURNAL = {IJCOL},
}
@ARTICLE{CHIARELLA_2018_ARTICLE_CBBCRZMC_345326,
AUTHOR = {Chiarella, D. and Bibuli, M. and Bruzzone, G. and Caccia, M. and Ranieri, A. and Zereik, E. and Marconi, L. and Cutugno, P.},
TITLE = {A Novel Gesture-Based Language for Underwater Human-Robot Interaction},
YEAR = {2018},
ABSTRACT = {The underwater environment is characterized by hazardous conditions that make it difficult to manage and monitor even the simplest human operation. The introduction of a robot companion with the task of supporting and monitoring the divers during their activities and operations underwater can help to solve some of the problems that usually arise in this scenario. In this context, a proper communication between the diver and the robot is imperative for the success of the dive. However, the underwater environment poses a set of technical challenges which are not readily surmountable thus limiting the spectrum from which possibilities can be chosen. This paper presents the design and development of a gesture-based communication language which has been employed for the entire duration of the European project CADDY (Cognitive Autonomous Diving Buddy). This language, the Caddian, was built upon consolidated and standardized underwater gestures that are commonly used in recreational and professional diving. Its use and integration during field tests with a remotely operated underwater vehicle (ROV) is also shown},
KEYWORDS = {marine robotics, underwater human-robot interaction, gesture-based language, field trials},
PAGES = {19},
URL = {https://www.mdpi.com/2077-1312/6/3/91},
VOLUME = {6},
NUMBER = {3},
DOI = {10.3390/jmse6030091},
ISSN = {2077-1312},
JOURNAL = {JOURNAL OF MARINE SCIENCE AND ENGINEERING},
}
@ARTICLE{CHIARELLO_2018_ARTICLE_CCFD_392587,
AUTHOR = {Chiarello, F. and Cimino, A. and Fantoni, G. and Dell'Orletta, F.},
TITLE = {Automatic users extraction from patents},
YEAR = {2018},
ABSTRACT = {The purpose of the present research is to design a method capable of automatically detecting and extracting one of the multiple entities hidden in patents: the users of the invention},
KEYWORDS = {Patent analysis, Deep learning, Text mining},
PAGES = {28-38},
URL = {https://iris.cnr.it/handle/20.500.14243/392587},
VOLUME = {54},
DOI = {10.1016/j.wpi.2018.07.006},
ISSN = {0172-2190},
JOURNAL = {WORLD PATENT INFORMATION},
}
@ARTICLE{FERRO_2018_ARTICLE_FMP_356242,
AUTHOR = {Ferro, M. and Marzi, C. and Pirrelli, V.},
TITLE = {Discriminative word learning is sensitive to inflectional entropy},
YEAR = {2018},
ABSTRACT = {Psycholinguistic evidence based on inflectional and derivational word families has emphasised the combined role of Paradigm Entropy and Inflectional Entropy in human word processing. Although the way frequency distributions affect behavioural evidence is clear in broad outline, we still miss a clear algorithmic model of how such a complex interaction takes place and why. The main challenge is to understand how the local interaction of learning and processing principles in morphology can result in global effects that require knowledge of the overall distribution of stems and affixes in word families. We show that principles of discriminative learning can shed light on this issue. We simulate learning of verb inflection with a discriminative recurrent network of specialised processing units, whose level of temporal connectivity reflects the frequency distribution of input symbols in context. We analyse the temporal dynamic with which connection weights are adjusted during discriminative learning, to show that self-organised connections are optimally functional to word processing when the distribution of inflected forms in a paradigm (Paradigm Entropy) and the distribution of their inflectional affixes across paradigms (Inflectional Entropy) diverge minimally},
KEYWORDS = {discriminative learning, word processing, recurrent neural networks, relative entropy},
PAGES = {307-327},
URL = {https://www.rivisteweb.it/doi/10.1418/91871},
VOLUME = {XVII},
NUMBER = {2},
DOI = {10.1418/91871},
ISSN = {1720-9331},
JOURNAL = {LINGUE E LINGUAGGIO},
}
@ARTICLE{FONTANA_2018_ARTICLE_FCDRABCCCDDDFFFGLMMMMMMNPPSTVS_532964,
AUTHOR = {Fontana, P. and Costa, C. and Di Prisco, G. and Ruzzier, E. and Annoscia, D. and Battisti, A. and Caoduro, G. and Carpana, E. and Contessi, A. and Dal Lago, A. and Dall'Olio, R. and De Cristofaro, A. and Felicioli, A. and Floris, I. and Fontanesi, L. and Gardi, T. and Lodesani, M. and Malagnini, V. and Manias, L. and Manino, A. and Marzi, G. and Massa, B. and Mutinelli, F. and Nazzi, F. and Pennacchio, F. and Porporato, M. and Stoppa, G. and Tormen, N. and Valentini, M. and Segre, A.},
TITLE = {Appeal for biodiversity protection of native honey bee subspecies of Apis mellifera in Italy (San Michele all'Adige declaration)},
YEAR = {2018},
ABSTRACT = {Honey bees are pollinators that play a key-role in plant biodiversity conservation and crop production. This unique insect species has been managed in hives by beekeepers for millennia, even though such a peculiar animal production system never resulted in the domestication of the western honey bee. The western honey bee was originally distributed throughout most of Europe, Africa, the Middle East, part of the Arabian Peninsula and some parts of Central Asia. From Europe, the honey bee was introduced to America, Asia and Oceania. This adaptation to a range of environmental conditions, together with geological and climatic changes in past eras, has resulted in grouping of Apis mellifera into 31 subspecies. In the last 150 years, technological advances in beekeeping and globalisation have heavily endangered conservation of the native subspecies of A. mellifera in Europe, with an impact on honey bee production and health status. Evaluation of the impact of this phenomenon on the ecological equilibrium is still ongoing, but there is already scientific evidence of negative effects that this problem is having on beekeeping. This document sets forth the scientific arguments in support of the conservation of native subspecies, and lists the existing Italian legislation in terms of subspecies protection initiatives. It also lists the main factors that are contributing to loss of genetic diversity and of local adaptations. This document does not intend to oppose the actions of the beekeeping industry, but rather to contribute to a more global vision of the very serious problem of honey bee decline},
KEYWORDS = {Beekeeping, Biodiversity, Conservation, Genetic improvement, Honey bee, Subspecies},
PAGES = {257-271},
URL = {https://iris.cnr.it/handle/20.500.14243/532964},
VOLUME = {71 (2)},
ISSN = {1721-8861},
JOURNAL = {BULLETIN OF INSECTOLOGY},
}
@ARTICLE{GOGGI_2018_ARTICLE_GPRBM_371102,
AUTHOR = {Goggi, S. and Pardelli, G. and Russo, I. and Bartolini, R. and Monachini, M.},
TITLE = {Providing Access to Grey Literature: The CLARIN Infrastructure},
YEAR = {2018},
ABSTRACT = {"In the electronic age, the World Wide Web has played a major role in making scientific information accessible to a wide audience more rapidly and efficiently. This democratic approach to information dissemination in science is changing the way science is perceived and implemented in our daily lives" (Weintraub, 2000)},
KEYWORDS = {CLARIN-IT, CLARIN - European Research Infrastructure for Language Resources and Technology, Grey Literature},
PAGES = {87-93},
URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-85048643343\&origin=inward},
VOLUME = {14 (2)},
ISSN = {1574-1796},
JOURNAL = {THE GREY JOURNAL},
}
@ARTICLE{GUADAGNINI_2018_ARTICLE_G_348587,
AUTHOR = {Guadagnini, E.},
TITLE = {Gli alberi di Arcita: note su Teseida, XI 22-24},
YEAR = {2018},
ABSTRACT = {This essay deals with Teseida, XI, 22-24, where the trees cut for Arcita's pyre are listed. The first part presents a linguistic study examining the passage from a lexicological point of view; the second part proposes a study of Boccaccio's sources aiming at highlighting the connections between the Teseida and the 'Laurentian Thebaid' (that is, one of the copies of Statius' poem owned by Boccaccio = ms. Laur. Plut. 38 6)},
KEYWORDS = {Linguistica italiana, Filologia italiana, Lessico},
PAGES = {155-175},
URL = {https://iris.cnr.it/handle/20.500.14243/348587},
VOLUME = {46},
ISSN = {0585-4997},
JOURNAL = {STUDI SUL BOCCACCIO},
}
@ARTICLE{KHAN_2018_ARTICLE_K_348824,
AUTHOR = {Khan, A. F. A.},
TITLE = {Towards the Representation of Etymological Data on the Semantic Web},
YEAR = {2018},
ABSTRACT = {In this article, we look at the potential for a wide-coverage modelling of etymological information as linked data using the Resource Data Framework (RDF) data model. We begin with a discussion of some of the most typical features of etymological data and the challenges that these might pose to an RDF-based modelling. We then propose a new vocabulary for representing etymological data, the Ontolex-lemon Etymological Extension (lemonETY), based on the ontolex-lemon model. Each of the main elements of our new model is motivated with reference to the preceding discussion},
KEYWORDS = {linked data, ontolex-lemon, etymologies, historical linguistics},
URL = {https://www.mdpi.com/2078-2489/9/12/304/htm},
VOLUME = {9 (12)},
DOI = {10.3390/info9120304},
ISSN = {2078-2489},
JOURNAL = {INFORMATION},
}
@ARTICLE{PECCHIOLI_2018_ARTICLE_PABGM_343397,
AUTHOR = {Pecchioli, A. and Albanesi, D. and Bellandi, A. and Giovannetti, E. and Marchi, S.},
TITLE = {Annotazione Linguistica Automatica dell'Ebraico Mishnaico: Esperimenti sul Talmud Babilonese},
YEAR = {2018},
ABSTRACT = {The automatic linguistic analysis of ancient Hebrew represents a new research opportunity in the field of Jewish studies. In fact, very little has been produced, both in terms of linguistic resources and, above all, of tools for the analysis of ancient Hebrew. This article illustrates a work born within the Italian Translation of the Babylonian Talmud Project aimed at the construction of an automatic linguistic annotator of Mishnaic Hebrew},
KEYWORDS = {Babylonian Talmud, Natural Language Processing, Mishnaic Hebrew},
PAGES = {281-291},
URL = {http://aisg.cise.unipi.it/Materia-giudaica-2018/018-Pecchioli%20pp%20281-292B.pdf},
VOLUME = {XXIII},
ISSN = {2282-4499},
JOURNAL = {MATERIA GIUDAICA},
}
@ARTICLE{PROIETTI_2018_ARTICLE_PF_405491,
AUTHOR = {Proietti, C. and Franco, A.},
TITLE = {Social Norms and the Dominance of Low-Doers},
YEAR = {2018},
ABSTRACT = {Social norms play a fundamental role in holding groups together. The rationale behind most of them is to coordinate individual actions into a beneficial societal outcome. However, there are cases where pro social behavior within a community seems, to the contrary, to cause inefficiencies and suboptimal collective outcomes. An explanation for this is that individuals in a society are of different types and their type determines the norm of fairness they adopt. Not all such norms are bound to be beneficial at the societal level. When individuals of different types meet a clash of norms can arise. This, in turn, can determine an advantage for the "wrong" type. We show this by a game-theoretic analysis in a very simple setting. To test this result—as well as its possible remedies—we also devise a specific simulation model. Our model is written in NETLOGO and is a first attempt to study our problem within an artificial environment that simulates the evolution of a society over time},
KEYWORDS = {Agent-Based Model, Social Norms, Game Theory},
PAGES = {21},
URL = {https://iris.cnr.it/handle/20.500.14243/405491},
VOLUME = {21 (1)},
DOI = {10.18564/jasss.3524},
ISSN = {1460-7425},
JOURNAL = {JASSS},
}
@BOOK{BOSCHETTI_2018_BOOK_B_378963,
AUTHOR = {Boschetti, F.},
TITLE = {Copisti digitali e filologi computazionali},
YEAR = {2018},
ABSTRACT = {Metodi e tecniche per il trattamento automatico e semiautomatico di testi letterari con variantistica. Viene affrontato sia il tema dell'edizione critica digitale che il tema dell'analisi stilistica e linguistica (in particolare sintattica e semantica)},
URL = {https://iris.cnr.it/handle/20.500.14243/378963},
ISBN = {9788880802969},
}
@INCOLLECTION{AGNOLONI_2018_INCOLLECTION_AV_403573,
AUTHOR = {Agnoloni, T. and Venturi, G.},
TITLE = {Semantic processing of legal texts},
YEAR = {2018},
ABSTRACT = {The paper provides an overview of the field of semantic processing of legal texts, combining views and perspectives from the computational linguistic and Artificial Intelligence and Law (AI \& Law) communities. The last few years have seen a growing body of research and practice in the field of AI \& Law which addresses a range of topics: semantic and cross-language legal Information Retrieval, document classification, legal drafting, legal knowledge extraction, automated legal argumentation, as well as the construction of legal ontologies and their application. The increasing availability of legal corpora accessible as processable data is making viable their partially automated conversion into legal knowledge bases. In this context, it is of paramount importance the use of Natural Language Processing (NLP) techniques and tools that automate the process of knowledge extraction from legal texts. Accordingly, the paper aims at discussing how the two research communities can benefit from the interaction of the different perspectives: the legal artificial intelligence community can gain insight into state-of-the-art linguistic technologies, tools and resources, and the computational linguists can take advantage of the large and often multilingual legal resources (corpora as well as lexicons and ontologies) for training, domain adaptation and evaluation of current NLP technologies and tools. The authors will present an overview on semantic resources for legal texts annotation and processing. Different kind of resources (linguistic, lexical, conceptual, formal) will be introduced and their differences, methodological premises, intended use and possible integration will be highlighted. The peculiarities of the legal domain and legal language will be discussed in relation with the construction and use of legal semantic resources. 
The issue of multilingualism, multilingual and multi-legal system access to legal information will be also discussed showing how formalized lexical, linguistic and conceptual legal resources can support the task. How NLP tools and techniques can be fruitfully exploited to semantically process collections of legal texts will be introduced in the second part of the paper. In particular, the authors will show how they can be used to automatically extract the relevant knowledge contained in legal text corpora, to structure the extracted knowledge in semantic resources (such as domain-specific ontologies or thesauri), and to semantically annotate the texts with the extracted information to pave the way to content-based access and querying},
KEYWORDS = {Semantic Processing, Natural Language Processing, Ontology Learning, Legal Texts},
PAGES = {109-137},
URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-85061292435\&origin=inward},
DOI = {10.1515/9781614514664-006},
PUBLISHER = {Walter De Gruyter Inc (Boston/Berlin/Munich, USA)},
ISBN = {978-1-61451-669-9},
CONFERENCE_PLACE = {Boston/Berlin/Munich},
}
@INCOLLECTION{ARTALE_2018_INCOLLECTION_AG_343807,
AUTHOR = {Artale, E. and Guadagnini, E.},
TITLE = {«Ci è bisognato servirci di molti volgarizzamenti, e traslatamenti d'opere altrui»: i testi di traduzione nella prima Crusca},
YEAR = {2018},
ABSTRACT = {Il contributo tratta dei testi di traduzione nella prima impressione del Vocabolario della Crusca (1612), a partire dalla loro presenza nella 'Tavola dei citati' e dunque in quanto fonte lessicografica per le voci del vocabolario; viene approfondita l'analisi dei testi di traduzione di ambito medico. La conclusione cui si approda è che tali testi siano 'neutri' in relazione alla loro tipologia testuale e settoriale, e che non forniscano lessico 'marcato' né per ambito semantico né per la categoria di "voci antiche"},
KEYWORDS = {Lessicografia storica, Volgarizzamenti, Medicina medievale},
PAGES = {383-425},
URL = {https://iris.cnr.it/handle/20.500.14243/343807},
ISBN = {978-88-6292-873-1},
BOOKTITLE = {La Crusca e i testi. Lessicografia, tecniche editoriali e collezionismo librario intorno al Vocabolario del 1612},
EDITOR = {Belloni, Gino and Trovato, Paolo},
}
@INCOLLECTION{KHAN_2018_INCOLLECTION_KEM_345622,
AUTHOR = {Khan, F. and Díaz-Vera, J. E. and Monachini, M.},
TITLE = {Representing Meaning Change in Computational Lexical Resources: The Case of Shame and Embarrassment Terms in Old English},
YEAR = {2018},
ABSTRACT = {The inclusion of diachronic information detailing changes in the meanings of words over time can be extremely helpful in modelling broad coverage digital lexical resources but it is often crucial for lexical resources serving such fields as classical philology or historical linguistics where the diachronic aspects of a language are explicitly taken into consideration. In this article we present a linked data based model for representing meaning change in lexico-semantic resources called lemonDia and describe its use in modelling a lexicon of Old English terms for shame and embarrassment},
KEYWORDS = {linked data, diachrony, emotion},
PAGES = {59-79},
URL = {https://iris.cnr.it/handle/20.500.14243/345622},
ISBN = {978-1-5275-0803-3},
BOOKTITLE = {Formal Representation and the Digital Humanities},
}
@INCOLLECTION{MARZI_2018_INCOLLECTION_M_377275,
AUTHOR = {Marzi, C.},
TITLE = {Morpho-phonotactic typicality and second language acquisition and processing},
YEAR = {2018},
ABSTRACT = {According to many accounts of word processing and access, an input word concurrently activates non-target lexical neighbours that become available for further processing stages. Psycholinguistic evidence shows how prediction and competition based on word similarity and lexical redundancy affect speakers' anticipation of incoming stimuli, so as to speed input recognition and improve lexical decision (Luce/Pisoni 1998; Bailey/Hahn 2001; Hahn/Bailey 2005, among others). As observed by Bailey and Hahn (2001), wordlikeness affects both language acquisition and processing. Wordlikeness can be defined in terms of phonotactic/orthotactic likelihood and lexical density. Both neighbourhood size and frequency distribution of neighbours are known to play a role in word prediction and competition. In this perspective, monitoring this competing behaviour can shed some light on the relationship between phonotactic/orthotactic likelihood and lexical density, and their connection with issues of word recognition and production. My goal in this chapter is to provide a computational model of bilingual lexical self-organisation, with language-independent architectural and functional requirements of the lexical store, together with language-specific phonotactic constraints, appearing to control aspects of interaction of first and second language (hereafter L1-L2) and define the propensity to acquire novel words, showing how acquisitional strategies are affected by past knowledge of language and entrenched expectations on incoming stimuli. On the one hand, a strong expectation based on L1 affects the way L2 inputs are perceived. On the other hand, language-independent architectural and functional requirements of the lexical store, such as its highly integrated organisation and language-non-selective access (Dijkstra/van Heuven 2002), appear to control aspects of L1-L2 interaction. 
Simulations in the neuro-computational framework of Temporal Self-Organising Maps (TSOMs, Ferro et al. 2011; Marzi et al. 2012, 2014a, 2016; Pirrelli et al. 2014, 2015), where word processing and lexical acquisition are implemented as recoding and storage strategies for time-series of symbolic units, will highlight how partially overlapping phonological representations may cause competition in incremental learning, and how weaker connections and recycled memory resources make L2 representations underspecified due to the lack of strong lexical expectations and selective specialisation typical of the L1 representations},
KEYWORDS = {L1-L2 acquisition, bilingual lexical self-organisation, phonotactic typicality, discriminative recurrent network},
PAGES = {219-232},
URL = {https://www.francoangeli.it/Ricerca/Scheda_Libro.aspx?ID=25216\&Tipo=Libro\&strRicercaTesto=25216\&lingua=it\&titolo=tipologia,+acquisizione,+grammaticalizzazione.+typology,++acquisition,+grammaticalization+studies},
PUBLISHER = {Franco Angeli (Milano, ITA)},
ISBN = {978-88-917-7847-5},
CONFERENCE_PLACE = {Milano},
BOOKTITLE = {Tipologia, Acquisizione, Grammaticalizzazione-Typology, Acquisition, Grammaticalization studies},
EDITOR = {Chini, M. and Cuzzolin, P.},
}
@INCOLLECTION{MONACHINI_2018_INCOLLECTION_MNS_371929,
AUTHOR = {Monachini, M. and Nicolosi, A. and Stefanini, A.},
TITLE = {Digital Classics and CLARIN-IT: What Italian Scholars of Ancient Greek Expect from Digital Resources and Technology},
YEAR = {2018},
ABSTRACT = {This paper presents and discusses the findings of a survey carried out to assess the use of digital resources and digital technologies with respect to work in ancient Greek scholarship, with the aim to identify the factors that are likely to constrain its use as well as to elicit needs and requirements of ancient Greek scholars in Italy. The survey is in line with the principles behind the user engagement strategy developed by CLARIN-ERIC and constitutes one of the national efforts undertaken by CLARIN-IT to contribute to the wider impact of CLARIN on Digital Classicists. The survey, as well as other surveys carried out in the sector in the last decade, points out that most of the available resources do not respond to users' requirements. This motivated us to develop a mock-up of a digital editor of Archilochus, which, mostly grounded on previous studies by Nicolosi, draws on the outcomes of the survey. The experiment includes a sample prototype to submit for evaluation by end-users. The final aim is to identify good practices and new models to enable new approaches to the study of classical texts and profile a new workbench for scholarly digital edition},
KEYWORDS = {Digital Classics, User Involvement, User requirements, CLARIN ERIC, CLARIN Infrastructure},
PAGES = {61-74},
URL = {https://ep.liu.se/ecp/147/006/ecp17147006.pdf},
ISBN = {978-91-7685-273-6},
BOOKTITLE = {Selected papers from the CLARIN Annual Conference 2017, Budapest, 18-20 September 2017},
}
@INCOLLECTION{NICOLAS_2018_INCOLLECTION_NKMDCAEBQV_371916,
AUTHOR = {Nicolas, L. and König, A. and Monachini, M. and Del Gratta, R. and Calamai, S. and Abel, A. and Enea, A. and Biliotti, F. and Quochi, V. and Stella, F. V.},
TITLE = {CLARIN-IT: State of Affairs, Challenges and Opportunities},
YEAR = {2018},
ABSTRACT = {This paper gives an overview on the Italian national CLARIN consortium as it currently stands two years after its creation at the end of 2015. It thus discusses the current state of affairs of the consortium on several aspects, especially with regards to members. It also discusses the events and initiatives that have been undertaken, as well as the ones that are planned in the close future. It finally outlines the conclusions of a user survey performed to understand the expectations of a targeted user population and provides indications regarding the next steps planned},
KEYWORDS = {CLARIN-IT Consortium Pisa Bolzano Siena},
PAGES = {1-14},
URL = {http://www.ep.liu.se/ecp/contents.asp?issue=147},
ISBN = {978-91-7685-273-6},
BOOKTITLE = {Selected papers from the CLARIN Annual Conference 2017, Budapest, 18-20 September 2017},
}
@INCOLLECTION{PIRRELLI_2018_INCOLLECTION_PV_358750,
AUTHOR = {Pirrelli, V.},
TITLE = {Morphological Theory And Computational Linguistics},
YEAR = {2018},
ABSTRACT = {For decades, processing issues have taken centre stage in the debate on the theoretical foundations of linguistic morphology. The present chapter provides a computer-based, algorithmic view on these issues, ranging from the encoding of input data to the structure of output representations, going through the basic operations of word splitting, storage, access, retrieval, and assembly of intermediate representations},
KEYWORDS = {word processing, word storage, computational morphology, lexical modelling, machine language learning, finite state technology, artificial neural networks},
PAGES = {573-593},
URL = {http://www.oxfordhandbooks.com/view/10.1093/oxfordhb/9780199668984.001.0001/oxfordhb-9780199668984-e-32?rskey=qZuY8Z\&result=9},
DOI = {10.1093/oxfordhb/9780199668984.013.32},
PUBLISHER = {Oxford University Press (Oxford, GBR)},
ISBN = {978-0-19-966898-4},
CONFERENCE_PLACE = {Oxford},
BOOKTITLE = {The Oxford Handbook of Morphological Theory},
EDITOR = {Audring, J. and Masini, F.},
}
@INCOLLECTION{PROIETTI_2018_INCOLLECTION_P_411323,
AUTHOR = {Proietti, C.},
TITLE = {Temps de la logique et temps de la physique},
YEAR = {2018},
ABSTRACT = {L'histoire du raisonnement sur le temps est pleine de paradoxes et d'énigmes, et la physique contemporaine ne fait pas exception. Les logiques en général, et plus en particulier les logiques temporelles, représentent un outil formel rigoureux pour résoudre ou clarifier des problèmes de ce genre. Dans ce qui suit, nous allons d'abord expliquer, du point de vue de la logique philosophique, qu'est-ce que c'est un paradoxe et ce qui compte comme sa solution. Ensuite, nous allons illustrer la formalisation d'Arthur Norman Prior du paradoxe des futurs contingents. Ensuite, nous nous concentrerons sur deux paradoxes modernes-le paradoxe des jumeaux et le paradoxe du voyage dans le temps-et montrerons comment une logique temporelle adéquate peut aider leur encadrement et leur compréhension},
KEYWORDS = {logique, relativité, paradoxes},
PAGES = {149-168},
URL = {https://www.cnrseditions.fr/catalogue/philosophie-et-histoire-des-idees/temps-de-la-nature-nature-du-temps/},
PUBLISHER = {CNRS Editions (Paris, FRA)},
ISBN = {9782271090836},
CONFERENCE_PLACE = {Paris},
EDITOR = {Bouton, C. and Huneman, P.},
}
@INCOLLECTION{PROIETTI_2018_INCOLLECTION_PSR_411305,
AUTHOR = {Proietti, C. and Sandu, G. and Rivenc, F.},
TITLE = {Bivalence and Future contingency},
YEAR = {2018},
ABSTRACT = {This work presents an overview of four different approaches to the problem of future contingency and determinism in temporal logics. All of them are bivalent, viz. they share the assumption that propositions concerning future contingent facts have a determinate truth-value (true or false). We introduce Ockhamism, Peirceanism, Actualism and T x W semantics, the four most relevant bivalent alternatives in this area, and compare them from the point of view of their expressiveness and their underlying metaphysics of time},
KEYWORDS = {Future contingents, bivalence, temporal logic, Arthur Prior},
PAGES = {333-350},
URL = {https://iris.cnr.it/handle/20.500.14243/411305},
PUBLISHER = {Springer (Cham, Heidelberg, New York, Dordrecht, London, CHE)},
ISBN = {978-3-319-77434-3},
CONFERENCE_PLACE = {Cham, Heidelberg, New York, Dordrecht, London},
BOOKTITLE = {Introduction to Formal Philosophy},
EDITOR = {Hansson, S. O. and Hendricks, V.},
}
@EDITORIAL{CALZOLARICONFERENCECHAIR_2018_EDITORIAL_CCCDGHIMMMMOPT_391721,
AUTHOR = {Calzolari, N. and Choukri, K. and Cieri, C. and Declerck, T. and Goggi, S. and Hasida, K. and Isahara, H. and Maegaard, B. and Mariani, J. and Mazo, H. and Moreno, A. and Odijk, J. and Piperidis, S. and Tokunaga, T.},
TITLE = {Proceedings of the Eleventh International Conference on Language Resources and Evaluation (LREC-2018)},
YEAR = {2018},
ABSTRACT = {It is the LREC 20th Anniversary and LREC has become one of the most successful conferences of the field. Data are pervasive in Natural Language Processing and Language Technology: we call our data Language Resources (LR). But when LREC was started by ELRA, in 1998 in Granada, from an idea of Antonio Zampolli and Joseph Mariani, it was really a new adventure and a challenge. There were well established big conferences but he thought that the new emerging field of Language Resources deserved its own dedicated forum. In the keynote talk I gave at LREC1998 I could say: "the infrastructural role of Language Resources as the necessary common platform on which new technologies and applications can be based is nowadays widely recognised." This could not have been said only few years before. I had the pleasure and the honour of being involved in LREC from the beginning, first as member of the Program Committee and since 2004 as Conference Chair},
KEYWORDS = {Language Resources, Language Technology},
PAGES = {1-4628},
URL = {https://www.aclweb.org/anthology/L18-1},
PUBLISHER = {European Language Resources Association ELRA (Paris, FRA)},
ISBN = {979-10-95546-00-9},
CONFERENCE_PLACE = {Paris},
}
@EDITORIAL{SORIA_2018_EDITORIAL_SBP_371920,
AUTHOR = {Soria, C. and Besacier, L. and Pretorius, L.},
TITLE = {Proceedings of CCURL 2018-Sustaining knowledge diversity in the digital age},
YEAR = {2018},
ABSTRACT = {Proceedings of the CCURL 2018 workshop},
KEYWORDS = {knowledge diversity, digital age, language resources, language technologies},
PAGES = {I-75},
URL = {http://lrec-conf.org/workshops/lrec2018/W26/pdf/book_of_proceedings.pdf},
PUBLISHER = {European Language Resources Association ELRA (Paris, FRA)},
ISBN = {979-10-95546-22-1},
CONFERENCE_PLACE = {Paris},
}
@EDITORIAL{BERNHARD_2018_EDITORIAL_BS_428732,
AUTHOR = {Bernhard, D. and Soria, C.},
TITLE = {Automatic processing of under-resourced languages|Traitement automatique des langues peu dotées},
YEAR = {2018},
KEYWORDS = {less-resourced languages, NLP},
PAGES = {7-14},
URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-85063404297\&origin=inward},
VOLUME = {59 (3)},
ISSN = {1248-9433},
}
@INPROCEEDINGS{_2018_INPROCEEDINGS_GMDCB_345332,
AUTHOR = {Gomez Chavez, A. and Mueller, C. A. and Doernbach, T. and Chiarella, D. and Birk, A.},
TITLE = {Robust Gesture-Based Communication for Underwater Human-Robot Interaction in the context of Search and Rescue Diver Missions},
YEAR = {2018},
ABSTRACT = {We propose a robust gesture-based communication pipeline for divers to instruct an Autonomous Underwater Vehicle (AUV) to assist them in performing high-risk tasks and helping in case of emergency. A gesture communication language (CADDIAN) is developed, based on consolidated and standardized diver gestures, including an alphabet, syntax and semantics, ensuring a logical consistency. A hierarchical classification approach is introduced for hand gesture recognition based on stereo imagery and multi-descriptor aggregation to specifically cope with underwater image artifacts, e.g. light backscatter or color attenuation. Once the classification task is finished, a syntax check is performed to filter out invalid command sequences sent by the diver or generated by errors in the classifier. Throughout this process, the diver receives constant feedback from an underwater tablet to acknowledge or abort the mission at any time. The objective is to prevent the AUV from executing unnecessary, infeasible or potentially harmful motions. Experimental results under different environmental conditions in archaeological exploration and bridge inspection applications show that the system performs well in the field},
KEYWORDS = {Underwater Robotics, gesture-based communication, underwater human-robot interaction},
PAGES = {4},
URL = {https://arxiv.org/pdf/1810.07122.pdf},
CONFERENCE_NAME = {2018 IEEE/RSJ International Conference on Intelligent Robots and Systems},
}
@INPROCEEDINGS{ADORNI_2018_INPROCEEDINGS_ADKTV_374898,
AUTHOR = {Adorni, G. and Dell'Orletta, F. and Koceva, F. and Torre, I. and Venturi, G.},
TITLE = {Extracting dependency relations from digital learning content},
YEAR = {2018},
ABSTRACT = {Digital Libraries present tremendous potential for developing e-learning applications, such as text comprehension and question-answering tools. A way to build this kind of tools is structuring the digital content into relevant concepts and dependency relations among them. While the literature offers several approaches for the former, the identification of dependencies, and specifically of prerequisite relations, is still an open issue. We present an approach to manage this task},
KEYWORDS = {Prerequisite relationship, Concept extraction, Graph mining},
PAGES = {114-119},
URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-85041860435\&origin=inward},
VOLUME = {806},
DOI = {10.1007/978-3-319-73165-0_11},
CONFERENCE_NAME = {14th Italian Research Conference on Digital Libraries (IRCDL 2018)},
}
@INPROCEEDINGS{ALZETTA_2018_INPROCEEDINGS_AACKT_493654,
AUTHOR = {Alzetta, C. and Adorni, G. and Celik, I. and Koceva, F. and Torre, I.},
TITLE = {Toward a user-adapted question/answering educational approach},
YEAR = {2018},
ABSTRACT = {This paper addresses the design of a model for Question/Answering in an interactive and mobile learning environment. The learner's question can be made through vocal interaction or typed text and the answer is the generation of a personalized learning path. This takes into account the focus and type of the question and some personal features of the learner extracted both from the question and prosodic features, in case of vocal questions. The response is a learning path that preserves the precedence of the prerequisite relations and contains all the relevant concepts for answering the user's question. The main contribution of the paper is to investigate the possibility to exploit educational concept maps in a Q/A interactive learning system},
KEYWORDS = {Education, Educational concept map, MOOC, Personalized Learning Path, Q/A},
PAGES = {173-177},
URL = {https://iris.cnr.it/handle/20.500.14243/493654},
DOI = {10.1145/3213586.3226214},
PUBLISHER = {Association for Computing Machinery, Inc},
ISBN = {9781450357845},
CONFERENCE_NAME = {26th ACM International Conference on User Modeling, Adaptation and Personalization, UMAP 2018},
BOOKTITLE = {UMAP 2018-Adjunct Publication of the 26th Conference on User Modeling, Adaptation and Personalization},
}
@INPROCEEDINGS{ALZETTA_2018_INPROCEEDINGS_ADMSV_371344,
AUTHOR = {Alzetta, C. and Dell'Orletta, F. and Montemagni, S. and Simi, M. and Venturi, G.},
TITLE = {Assessing the Impact of Iterative Error Detection and Correction. A Case Study on the Italian Universal Dependency Treebank},
YEAR = {2018},
ABSTRACT = {Detection and correction of errors and inconsistencies in "gold treebanks" are becoming more and more central topics of corpus annotation. The paper illustrates a new incremental method for enhancing treebanks, with particular emphasis on the extension of error patterns across different textual genres and registers. Impact and role of corrections have been assessed in a dependency parsing experiment carried out with four different parsers, whose results are promising. For both evaluation datasets, the performance of parsers increases, in terms of the standard LAS and UAS measures and of a more focused measure taking into account only relations involved in error patterns, and at the level of individual dependencies},
KEYWORDS = {Error Detection, Universal Dependency Treebanks, Syntactic parsing},
PAGES = {1-7},
URL = {http://universaldependencies.org/udw18/PDFs/39_Paper.pdf},
ISBN = {978-1-948087-84-1},
CONFERENCE_NAME = {Universal Dependencies Workshop 2018 (UDW 2018)},
}
% NOTE(review): appears to describe the same paper as ALZETTA_2018_INPROCEEDINGS_ADMSV_371344 (same authors, abstract and pages) -- confirm and merge.
@INPROCEEDINGS{ALZETTA_2018_INPROCEEDINGS_ADMSV_493647,
AUTHOR = {Alzetta, C. and Dell'Orletta, F. and Montemagni, S. and Simi, M. and Venturi, G.},
TITLE = {Assessing the Impact of Incremental Error Detection and Correction. A Case Study on the Italian Universal Dependency Treebank},
YEAR = {2018},
ABSTRACT = {Detection and correction of errors and inconsistencies in “gold treebanks” are becoming more and more central topics of corpus annotation. The paper illustrates a new incremental method for enhancing treebanks, with particular emphasis on the extension of error patterns across different textual genres and registers. Impact and role of corrections have been assessed in a dependency parsing experiment carried out with four different parsers, whose results are promising. For both evaluation datasets, the performance of parsers increases, in terms of the standard LAS and UAS measures and of a more focused measure taking into account only relations involved in error patterns, and at the level of individual dependencies},
KEYWORDS = {Treebank, annotation, annotation error},
PAGES = {1--7},
URL = {https://iris.cnr.it/handle/20.500.14243/493647},
PUBLISHER = {Association for Computational Linguistics (ACL)},
ISBN = {9781948087780},
CONFERENCE_NAME = {2nd Workshop on Universal Dependencies, UDW 2018, held in conjunction with EMNLP 2018},
BOOKTITLE = {EMNLP 2018-2nd Workshop on Universal Dependencies, UDW 2018-Proceedings of the Workshop},
}
@INPROCEEDINGS{ALZETTA_2018_INPROCEEDINGS_ADMV_334766,
AUTHOR = {Alzetta, C. and Dell'Orletta, F. and Montemagni, S. and Venturi, G.},
TITLE = {Dangerous Relations in Dependency Treebanks},
YEAR = {2018},
ABSTRACT = {The paper illustrates an effective and innovative method for detecting erroneously annotated arcs in gold dependency treebanks based on an algorithm originally developed to measure the reliability of automatically produced dependency relations. The method permits to significantly restrict the error search space and, more importantly, to reliably identify patterns of systematic recurrent errors which represent dangerous evidence to a parser which tendentially will replicate them. Achieved results demonstrate effectiveness and reliability of the method},
KEYWORDS = {Dependency treebanks, Error Detection, Linguistic Annotation},
PAGES = {201--210},
URL = {http://aclweb.org/anthology/W/W17/W17-7624.pdf},
ISBN = {978-80-88132-04-2},
CONFERENCE_NAME = {16th International Workshop on Treebanks and Linguistic Theories},
BOOKTITLE = {Proceedings of the 16th International Workshop on Treebanks and Linguistic Theories},
}
@INPROCEEDINGS{ALZETTA_2018_INPROCEEDINGS_ADMV_374901,
AUTHOR = {Alzetta, C. and Dell'Orletta, F. and Montemagni, S. and Venturi, G.},
TITLE = {Universal Dependencies and Quantitative Typological Trends. A Case Study on Word Order},
YEAR = {2018},
ABSTRACT = {The paper presents a new methodology aimed at acquiring typological evidence from “gold” treebanks for different languages. In particular, it investigates whether and to what extent algorithms developed for assessing the plausibility of automatically produced syntactic annotations could contribute to shed light on key issues of the linguistic typological literature. It reports the first and promising results of a case study focusing on word order patterns carried out on three different languages (English, Italian and Spanish)},
KEYWORDS = {Linguistic Knowledge Extraction, Dependency Treebanks, Linguistic Typology},
PAGES = {4540--4549},
URL = {http://www.lrec-conf.org/proceedings/lrec2018/pdf/1109.pdf},
PUBLISHER = {European Language Resources Association ELRA (Paris, FRA)},
ISBN = {979-10-95546-00-9},
CONFERENCE_NAME = {Proceedings of the 11th Edition of the Language Resources and Evaluation Conference (LREC 2018)},
CONFERENCE_PLACE = {Paris},
}
@INPROCEEDINGS{ALZETTA_2018_INPROCEEDINGS_AKPTA_493653,
AUTHOR = {Alzetta, C. and Koceva, F. and Passalacqua, S. and Torre, I. and Adorni, G.},
TITLE = {PRET: Prerequisite-enriched terminology. A case study on educational texts},
YEAR = {2018},
ABSTRACT = {In this paper we present PRET, a gold dataset annotated for prerequisite relations between educational concepts extracted from a computer science textbook, and we describe the language and domain independent approach for the creation of the resource. Additionally, we have created an annotation tool to support, validate and analyze the annotation},
KEYWORDS = {prerequisite relations, resource},
PAGES = {14--20},
URL = {https://iris.cnr.it/handle/20.500.14243/493653},
VOLUME = {2253},
DOI = {10.4000/books.aaccademia.3028},
PUBLISHER = {CEUR-WS},
ISBN = {9788831978682},
CONFERENCE_NAME = {5th Italian Conference on Computational Linguistics, CLiC-it 2018},
BOOKTITLE = {CEUR Workshop Proceedings of the 5th Italian Conference on Computational Linguistics, CLiC-it 2018},
}
@INPROCEEDINGS{BAMBACI_2018_INPROCEEDINGS_BBD_403990,
  AUTHOR   = {Bambaci, L. and Boschetti, F. and Del Gratta, R.},
  TITLE    = {Qohelet Euporia: a Domain Specific Language to Annotate Multilingual Variant Readings},
  YEAR     = {2018},
  DOI      = {10.1109/CIST.2018.8596332},
  ISBN     = {978-1-5386-4385-3},
  URL      = {https://iris.cnr.it/handle/20.500.14243/403990},
  ABSTRACT = {Encoding multilingual variant readings is time-consuming and error-prone. The guidelines provided by the Text Encoding Initiative (TEI) ensure data interchange, but the TEIXML verbosity risks to distract annotators with a traditional background in philological studies from their critical activity. We illustrate how a Domain Specific Language (DSL) facilitates both the manual annotation of the critical apparatus and the data interchange. Our case study is based on the multilingual tradition of the biblical book of Qohelet, which has been annotated through the annotation tool based on DSLs named Euporia},
}
@INPROCEEDINGS{BARTOLINI_2018_INPROCEEDINGS_BGMP_376199,
AUTHOR = {Bartolini, R. and Goggi, S. and Monachini, M. and Pardelli, G.},
TITLE = {The LREC Workshops Map},
YEAR = {2018},
ABSTRACT = {The aim of this work is to present an overview of the research presented at the LREC workshops over the years 1998-2016 with the aim to shed light on the community represented by workshop participants in terms of country of origin, type of affiliation, gender. There has been also an effort towards the identification of the major topics dealt with as well as of the terminological variations noticed in this time span. Data has been retrieved from the portal of the European Language Resources Association (ELRA) which organizes the conference and the resulting corpus made up of workshops titles and of the related presentations has then been processed using a term extraction tool developed at ILC-CNR},
KEYWORDS = {corpus creation, terminology, LREC},
PAGES = {557--562},
URL = {http://www.lrec-conf.org/proceedings/lrec2018/summaries/639.html},
PUBLISHER = {European Language Resources Association ELRA (Paris, FRA)},
ISBN = {979-10-95546-00-9},
CONFERENCE_NAME = {Eleventh International Conference on Language Resources and Evaluation (LREC 2018)},
CONFERENCE_PLACE = {Paris},
BOOKTITLE = {Proceedings of the Eleventh International Conference on Language Resources and Evaluation (LREC 2018)},
EDITOR = {Calzolari, N. and Choukri, K. and Cieri, C. and Declerck, T. and Goggi, S. and Hasida, K. and Isahara, H. and Maegaard, B. and Mariani, J. and Mazo, H. and Moreno, A. and Odijk, J. and Piperidis, S. and Tokunaga, T.},
}
% NOTE(review): appears to describe the same paper as BIBULI_2018_INPROCEEDINGS_BBCCCFGORSZ_513738 (same authors, title and abstract) -- confirm and merge.
@INPROCEEDINGS{BIBULI_2018_INPROCEEDINGS_BBCCCFGORSZ_351746,
AUTHOR = {Bibuli, M. and Bruzzone, G. and Caccia, M. and Camporeale, G. and Chiarella, D. and Ferretti, R. and Giacopelli, M. and Odetti, A. and Ranieri, A. and Spirandelli, E. and Zereik, E.},
TITLE = {An Advanced Guidance \& Control System for an Unmanned Vessel with Azimuthal Thrusters},
YEAR = {2018},
ABSTRACT = {The proposed paper presents the design and development of the combined guidance \& control strategies for the autonomous navigation of an unmanned vessel characterized by azimuth-based thrust architecture. Autonomous Marine Vehicles (AMVs) are consolidates technological tools commonly employed for different tasks such as exploration, sampling and intervention. With the final aim of autonomous shipping, the capabilities of AMVs have to be migrated and adapted towards the reliable and safe control of commercial-like unmanned vessel, that are taking place thanks to a number of technological research projects. The employment of new concept hulls and thrust configurations, as for instance Small Waterplane Area Twin Hull (SWATH) combined with Azimuthal propulsion (common propeller-based thruster with the capability of 360° rotation around the vertical axis), requires robust guidance techniques to provide precise and reliable motion control during navigation. The paper proposes a dual-loop guidance \& control scheme able to provide advanced navigation capabilities. In particular, the inner control loop, devoted to the actuation of the azimuthal thrusters, allows the tracking of reference course angle (namely the autopilot). Such a control loop is characterized by a modified PID regulation scheme, where a novel adaptive derivative component is inserted in order to improve the convergence curve towards the required course reference. The outer guidance loop, based on Lyapunov/virtual-target approach, allows the vessel to track generic desired paths, thus enhancing the autonomous navigation capabilities also in constrained environments. The paper will provide a deep design \& analysis approach for the developed techniques, as well as simulation results of the combined guidance \& control scheme, proving the reliability of the proposed approach in different operative conditions.
Experimental results will be provided, depending on the availability of the actual autonomous vessel (currently under final development/test phases and related to the specific project activities)},
KEYWORDS = {Autonomous Guidance, Azimuth Control, USV},
PAGES = {11},
URL = {https://iris.cnr.it/handle/20.500.14243/351746},
CONFERENCE_NAME = {International Ship Control System Symposium (iSCSS)},
BOOKTITLE = {International Ship Control System Symposium (iSCSS)},
}
% NOTE(review): appears to describe the same paper as BIBULI_2018_INPROCEEDINGS_BBCCCFGORSZ_351746 (same authors, title and abstract) -- confirm and merge.
@INPROCEEDINGS{BIBULI_2018_INPROCEEDINGS_BBCCCFGORSZ_513738,
AUTHOR = {Bibuli, M. and Bruzzone, G. and Caccia, M. and Camporeale, G. and Chiarella, D. and Ferretti, R. and Giacopelli, M. and Odetti, A. and Ranieri, A. and Spirandelli, E. and Zereik, E.},
TITLE = {An advanced guidance and control system for an unmanned vessel with azimuthal thrusters},
YEAR = {2018},
ABSTRACT = {The proposed paper presents the design and development of the combined guidance \& control strategies for the autonomous navigation of an unmanned vessel characterized by azimuth-based thrust architecture. Autonomous Marine Vehicles (AMVs) are consolidates technological tools commonly employed for different tasks such as exploration, sampling and intervention. With the final aim of autonomous shipping, the capabilities of AMVs have to be migrated and adapted towards the reliable and safe control of commercial-like unmanned vessel, that are taking place thanks to a number of technological research projects. The employment of new concept hulls and thrust configurations, as for instance Small Waterplane Area Twin Hull (SWATH) combined with Azimuthal propulsion (common propeller-based thruster with the capability of 360° rotation around the vertical axis), requires robust guidance techniques to provide precise and reliable motion control during navigation. The paper proposes a dual-loop guidance \& control scheme able to provide advanced navigation capabilities. In particular, the inner control loop, devoted to the actuation of the azimuthal thrusters, allows the tracking of reference course angle (namely the autopilot). Such a control loop is characterized by a modified PID regulation scheme, where a novel adaptive derivative component is inserted in order to improve the convergence curve towards the required course reference. The outer guidance loop, based on Lyapunov/virtual-target approach, allows the vessel to track generic desired paths, thus enhancing the autonomous navigation capabilities also in constrained environments. The paper will provide a deep design \& analysis approach for the developed techniques, as well as simulation results of the combined guidance \& control scheme, proving the reliability of the proposed approach in different operative conditions.
Experimental results will be provided, depending on the availability of the actual autonomous vessel (currently under final development/test phases and related to the specific project activities)},
KEYWORDS = {Autonomous Guidance, Azimuth Control, USV},
URL = {https://iris.cnr.it/handle/20.500.14243/513738},
VOLUME = {1},
DOI = {10.24868/issn.2631-8741.2018.004},
ISSN = {2631-8741},
BOOKTITLE = {Proceedings of the International Ship Control Systems Symposium (iSCSS)},
}
@INPROCEEDINGS{BOSCO_2018_INPROCEEDINGS_BSDPT_351854,
AUTHOR = {Bosco, C. and Sanguinetti, M. and Dell'Orletta, F. and Poletto, F. and Tesconi, M.},
TITLE = {Overview of the EVALITA 2018 hate speech detection task},
YEAR = {2018},
ABSTRACT = {The Hate Speech Detection (HaSpeeDe) task is a shared task on Italian social media (Facebook and Twitter) for the detection of hateful content, and it has been proposed for the first time at EVALITA 2018. Providing two datasets from two different online social platforms differently featured from the linguistic and communicative point of view, we organized the task in three tasks where systems must be trained and tested on the same resource or using one in training and the other in testing: HaSpeeDe-FB, HaSpeeDe-TW and Cross-HaSpeeDe (further subdivided into Cross-HaSpeeDe FB and Cross-HaSpeeDe TW sub-tasks). Overall, 9 teams participated in the task, and the best system achieved a macro F1-score of 0.8288 for HaSpeeDe-FB, 0.7993 for HaSpeeDe-TW, 0.6541 for Cross-HaSpeeDe FB and 0.6985 for Cross-HaSpeeDe TW. In this report, we describe the datasets released and the evaluation measures, and we discuss results},
KEYWORDS = {Hate Speech Detection, Social Media Analysis},
PAGES = {9},
URL = {http://www.scopus.com/inward/record.url?eid=2-s2.0-85058647605\&partnerID=q2rCbXpz},
VOLUME = {2263},
CONFERENCE_NAME = {EVALITA 2018-Sixth Evaluation Campaign of Natural Language Processing and Speech Tools for Italian},
}
@INPROCEEDINGS{BRUNATO_2018_INPROCEEDINGS_BDDIV_371346,
AUTHOR = {Brunato, D. and De Mattei, L. and Dell'Orletta, F. and Iavarone, B. and Venturi, G.},
TITLE = {Is this sentence difficult? Do you agree?},
YEAR = {2018},
ABSTRACT = {In this paper, we present a crowdsourcing-based approach to model the human perception of sentence complexity. We collect a large corpus of sentences rated with judgments of complexity for two typologically-different languages, Italian and English. We test our approach in two experimental scenarios aimed to investigate the contribution of a wide set of lexical, morpho-syntactic and syntactic phenomena in predicting i) the degree of agreement among annotators independently from the assigned judgment and ii) the perception of sentence complexity},
KEYWORDS = {Linguistic complexity, Crowdsourcing, Human perception},
PAGES = {1--10},
URL = {https://www.aclweb.org/anthology/D18-1289/},
DOI = {10.18653/v1/D18-1289},
PUBLISHER = {Association for Computational Linguistics (Stroudsburg, USA)},
ISBN = {978-1-948087-84-1},
CONFERENCE_NAME = {Conference on Empirical Methods in Natural Language Processing (EMNLP)},
CONFERENCE_PLACE = {Stroudsburg},
}
@INPROCEEDINGS{BRUNATO_2018_INPROCEEDINGS_BVD_392547,
AUTHOR = {Brunato, D. and Valeriani, M. and Dell'Orletta, F.},
TITLE = {DARC-IT: A DAtaset for reading comprehension in Italian},
YEAR = {2018},
ABSTRACT = {In this paper, we present DARC-IT, a new reading comprehension dataset for the Italian language aimed at identifying 'question-worthy' sentences, i.e. sentences in a text which contain information that is worth asking a question about. The purpose of the corpus is twofold: to investigate the linguistic profile of question-worthy sentences and to support the development of automatic question generation systems},
URL = {https://iris.cnr.it/handle/20.500.14243/392547},
DOI = {10.4000/books.aaccademia.3099},
}
@INPROCEEDINGS{CHIARELLO_2018_INPROCEEDINGS_CBFOCD_392588,
AUTHOR = {Chiarello, F. and Bonaccorsi, A. and Fantoni, G. and Ossola, G. and Cimino, A. and Dell'Orletta, F.},
TITLE = {Technical Sentiment Analysis: Measuring Advantages and Drawbacks of New Products Using Social Media},
YEAR = {2018},
ABSTRACT = {This work proposes a new social media based model to measure how users perceive new products from a technical point of view. This model relies on the analysis of advantages and drawbacks of products, which are both important aspects evaluated by consumers during the buying decision process. This model is based on a lexicon developed in a related work (Chiarello et al., 2017) to analyse patents and detect advantages and drawbacks connected to a certain technology},
URL = {https://iris.cnr.it/handle/20.500.14243/392588},
DOI = {10.4995/CARMA2018.2018.8336},
ISBN = {978-84-9048-689-4},
}
@INPROCEEDINGS{CHIRIATTI_2018_INPROCEEDINGS_CDDMPSV_403577,
AUTHOR = {Chiriatti, G. and Della Gala, V. and Dell'Orletta, F. and Montemagni, S. and Pettenati, M. C. and Sagri, M. T. and Venturi, G.},
TITLE = {A NLP-based analysis of reflective writings by Italian teachers},
YEAR = {2018},
ABSTRACT = {This paper reports first results of a wider study devoted to exploit the potentialities of a NLP-based approach to the analysis of a corpus of reflective writings on teaching activities. We investigate how a wide set of linguistic features allows reconstructing the linguistic profile of the texts written by the Italian teachers and predicting whether are reflective},
KEYWORDS = {Natural Language Processing, Reflective Writings, Linguistic Profiling, Document Classification},
PAGES = {1--7},
URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-85057733802\&origin=inward},
VOLUME = {2253},
CONFERENCE_NAME = {5th Italian Conference on Computational Linguistics (CLiC-it)},
}
@INPROCEEDINGS{CIMINO_2018_INPROCEEDINGS_CDD_392545,
  AUTHOR   = {Cimino, A. and De Mattei, L. and Dell'Orletta, F.},
  TITLE    = {Multi-task learning in deep neural networks at EVALITA 2018},
  YEAR     = {2018},
  URL      = {https://iris.cnr.it/handle/20.500.14243/392545},
  ABSTRACT = {In this paper we describe the system used for the participation to the ABSITA, GxG, HaSpeeDe and IronITA shared tasks of the EVALITA 2018 conference. We developed a classifier that can be configured to use Bidirectional Long Short Term Memories and linear Support Vector Machines as learning algorithms. When using Bi-LSTMs we tested a multitask learning approach which learns the optimized parameters of the network exploiting simultaneously all the annotated dataset labels and a multiclassifier voting approach based on a k-fold technique. In addition, we developed generic and specific word embedding lexicons to further improve classification performances. When evaluated on the official test sets, our system ranked 1st in almost all subtasks for each shared task, showing the effectiveness of our approach},
}
@INPROCEEDINGS{CIMINO_2018_INPROCEEDINGS_CDBV_403576,
AUTHOR = {Cimino, A. and Dell'Orletta, F. and Brunato, D. and Venturi, G.},
TITLE = {Sentences and documents in native language identification},
YEAR = {2018},
ABSTRACT = {Starting from a wide set of linguistic features, we present the first in depth feature analysis in two different Native Language Identification (NLI) scenarios. We compare the results obtained in a traditional NLI document classification task and in a newly introduced sentence classification task, investigating the different role played by the considered features. Finally, we study the impact of a set of selected features extracted from the sentence classifier in document classification},
KEYWORDS = {Natural Language Processing, Native Language Identification},
PAGES = {1--6},
URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-85057749754\&origin=inward},
VOLUME = {2253},
CONFERENCE_NAME = {5th Italian Conference on Computational Linguistics (CLiC-it)},
}
@INPROCEEDINGS{COCCIU_2018_INPROCEEDINGS_CBVD_403579,
AUTHOR = {Cocciu, E. and Brunato, D. and Venturi, G. and Dell'Orletta, F.},
TITLE = {Gender and Genre Linguistic profiling: A case study on female and male journalistic and diary prose},
YEAR = {2018},
ABSTRACT = {This paper intends to investigate the linguistic profile of male- and female-authored texts belonging to two very different textual genres: newspaper articles and diary prose. By using a wide set of linguistic features automatically extracted from text and spanning across different levels of linguistic description, from lexicon to syntax, our analysis highlights the peculiarities of the two examined genres and how the genre dimension is influenced by variation depending on author's gender (and vice versa)},
KEYWORDS = {Natural Language Processing, Genre Classification, Linguistic Profiling},
PAGES = {1--6},
URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-85057759773\&origin=inward},
VOLUME = {2253},
CONFERENCE_NAME = {5th Italian Conference on Computational Linguistics (CLiC-it)},
}
@INPROCEEDINGS{CRESCI_2018_INPROCEEDINGS_CCATD_392594,
  AUTHOR   = {Cresci, S. and Cimino, A. and Avvenuti, M. and Tesconi, M. and Dell'Orletta, F.},
  TITLE    = {Real-world witness detection in social media via hybrid crowdsensing},
  YEAR     = {2018},
  URL      = {https://iris.cnr.it/handle/20.500.14243/392594},
  ABSTRACT = {The task of witness detection in social media is crucial for many practical applications, including rumor debunking, emergency management, and public opinion mining. Yet to date, it has been approached in an approximated way. We propose a method for addressing witness detection in a strict and realistic fashion. By employing hybrid crowdsensing over Twitter, we contact real-life witnesses and use their reactions to build a strong ground-truth, thus avoiding a manual, subjective annotation of the dataset. Using this dataset, we develop a witness detection system based on a machine learning classifier using a wide set of linguistic features and metadata associated with the tweets},
}
@INPROCEEDINGS{CUTUGNO_2018_INPROCEEDINGS_CDPSS_358247,
  AUTHOR          = {Cutugno, F. and Dell'Orletta, F. and Poggi, I. and Savy, R. and Sorgente, A.},
  TITLE           = {The CHROME Manifesto: Integrating multimodal data into Cultural Heritage Resources},
  YEAR            = {2018},
  VOLUME          = {2253},
  CONFERENCE_NAME = {CLiC-it 2018 Italian Conference on Computational Linguistics},
  URL             = {http://www.scopus.com/record/display.url?eid=2-s2.0-85057736501\&origin=inward},
  KEYWORDS        = {cultural heritage, multimodal interaction},
  ABSTRACT        = {The CHROME Project aims at collecting a wide portfolio of digital resources oriented to technological application in Cultural Heritage (henceforth CH). The contributions for the realisation of such objective come from the efforts of computer scientists, psychologists, architects, and computational linguists, who constitute an interdisciplinary equipe. We are collecting and analyzing texts, spoken materials, architectural surveys, and human motion videos, attempting the integration of these data in a multidimensional platform based on multilevel annotation systems, game engines importing, and virtualization techniques. As case of study we choose to work on the magic travel along three Charterhouses located in Campania region: S. Martino in Naples, S. Lorenzo in Padula (Salerno) and S. Giacomo, in Capri},
}
@INPROCEEDINGS{DEFELICE_2018_INPROCEEDINGS_DDVLM_403578,
AUTHOR = {De Felice, I. and Dell'Orletta, F. and Venturi, G. and Lenci, A. and Montemagni, S.},
TITLE = {Italian in the Trenches: Linguistic annotation and analysis of texts of the great war},
YEAR = {2018},
ABSTRACT = {The paper illustrates the design and development of a textual corpus representative of the historical variants of Italian during the Great War, which was enriched with linguistic (lemmatization and pos-tagging) and meta-linguistic annotation. The corpus, after a manual revision of the linguistic annotation, was used for specializing existing NLP tools to process historical texts with promising results},
KEYWORDS = {Natural Language Processing, Automatic Linguistic Annotation},
PAGES = {1--5},
URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-85057734451\&origin=inward},
VOLUME = {2253},
CONFERENCE_NAME = {5th Italian Conference on Computational Linguistics (CLiC-it)},
}
@INPROCEEDINGS{DEMATTEI_2018_INPROCEEDINGS_DCD_392584,
  AUTHOR   = {De Mattei, L. and Cimino, A. and Dell'Orletta, F.},
  TITLE    = {Multi-task learning in deep neural network for sentiment polarity and irony classification},
  YEAR     = {2018},
  URL      = {https://iris.cnr.it/handle/20.500.14243/392584},
  ABSTRACT = {We study the impact of a new multi-task learning approach in deep neural network for polarity and irony detection in Italian Twitter posts. We compare this approach with traditional single-task learning models. The different behavior of the two approaches shows the effectiveness of the proposed method that is able to combine the information from the two tasks improving the accuracy in both tasks. This is particularly true on edge cases in which knowledge about the two tasks is needed to classify a tweet, this is the case, for example, when the literal polarity of a tweet is inverted by irony},
}
@INPROCEEDINGS{DELGRATTA_2018_INPROCEEDINGS_DGPC_376195,
AUTHOR = {Del Gratta, R. and Goggi, S. and Pardelli, G. and Calzolari, N.},
TITLE = {LREMap, a Song of Resources and Evaluation},
YEAR = {2018},
ABSTRACT = {After 8 years we revisit the LRE Map of Language Resources, introduced at LREC 2010, to try to get a picture of the field and its evolution as reflected by the creation and use of Language Resources. The purpose of the Map was in fact “to shed light on the vast amount of resources that represent the background of the research presented at LREC”. It also aimed at a “change of culture in the field, actively engaging each researcher in the documentation task about resources”. The data analysed here have been provided by the authors of several conferences during the phase of submission of papers, and contain information about ca. 7500 resources. We analysed the LRE Map data from many different viewpoints and the paper reports on the global picture, on different trends emerging from the diachronic perspective and finally on some comparisons between the 2 major conferences present in the Map: LREC and COLING},
KEYWORDS = {LR Infrastructure, Metadata, LR Documentation},
PAGES = {1275--1281},
URL = {http://www.lrec-conf.org/proceedings/lrec2018/summaries/300.html},
PUBLISHER = {European Language Resources Association ELRA (Paris, FRA)},
ISBN = {979-10-95546-00-9},
CONFERENCE_NAME = {Eleventh International Conference on Language Resources and Evaluation (LREC 2018)},
CONFERENCE_PLACE = {Paris},
BOOKTITLE = {Proceedings of the Eleventh International Conference on Language Resources and Evaluation (LREC 2018)},
EDITOR = {Calzolari, N. and Choukri, K. and Cieri, C. and Declerck, T. and Goggi, S. and Hasida, K. and Isahara, H. and Maegaard, B. and Mariani, J. and Mazo, H. and Moreno, A. and Odijk, J. and Piperidis, S. and Tokunaga, T.},
}
@INPROCEEDINGS{DELGROSSO_2018_INPROCEEDINGS_DBGMN_348283,
AUTHOR = {Del Grosso, A. M. and Bellandi, A. and Giovannetti, E. and Marchi, S. and Nahli, O.},
TITLE = {Scanning is Just the Beginning: Exploiting Text and Language Technologies to Enhance the Value of Historical Manuscripts},
YEAR = {2018},
ABSTRACT = {In this paper we present a digital process for the explicitation of the textual, linguistic and semantic content of historical manuscripts. The proposed workflow is composed of a sequence of incremental steps, each of which is described both on a methodological and practical perspective. The steps are: 1) visualization and structuring of metadata, 2) transcription, 3) structural encoding, 4) annotation, 5) lexical and conceptual structuring},
KEYWORDS = {Computational Lexica, Digital Scholarly Editing, Digital Humanities, al-Qamus al-Muhit},
PAGES = {214--219},
URL = {https://iris.cnr.it/handle/20.500.14243/348283},
DOI = {10.1109/CIST.2018.8596373},
PUBLISHER = {IEEE (New York, USA)},
ISBN = {978-1-5386-4385-3},
CONFERENCE_NAME = {CIST 2018 WH-MNLP},
CONFERENCE_PLACE = {New York},
BOOKTITLE = {Colloquium in Information Science and Technology, CIST},
EDITOR = {Al Achhab, M. and El Mohajir, M. and Jellouli, I. and El Mohajir, B. E.},
}
@INPROCEEDINGS{DELLOGLIO_2018_INPROCEEDINGS_DBD_392583,
  AUTHOR   = {Dell'Oglio, P. and Brunato, D. and Dell'Orletta, F.},
  TITLE    = {Lexicon and Syntax: Complexity across genres and language varieties},
  YEAR     = {2018},
  DOI      = {10.4000/books.aaccademia.3282},
  ISBN     = {9788831978415},
  URL      = {https://iris.cnr.it/handle/20.500.14243/392583},
  ABSTRACT = {This paper presents first results of an ongoing work to investigate the interplay between lexical complexity and syntactic complexity with respect to nominal lexicon and how it is affected by textual genre and level of linguistic complexity within genre. A cross-genre analysis is carried out for the Italian language using multi-leveled linguistic features automatically extracted from dependency parsed corpora},
}
@INPROCEEDINGS{DELLORLETTA_2018_INPROCEEDINGS_DN_392544,
AUTHOR = {Dell'Orletta, F. and Nissim, M.},
TITLE = {Overview of the Evalita 2018 cross-genre gender prediction (GXG) task},
YEAR = {2018},
ABSTRACT = {The Gender Cross-Genre (GxG) task is a shared task on author profiling (in terms of gender) on Italian texts, with a specific focus on cross-genre performance. This task has been proposed for the first time at EVALITA 2018, providing different datasets from different textual genres: Twitter, YouTube, Children writing, Journalism, Personal diaries. Results from a total of 50 different runs show that the task is difficult to learn in itself: while almost all runs beat a 50\% baseline, no model reaches an accuracy above 70\%. We also observe that cross-genre modelling yields a drop in performance, but not as substantial as one would expect},
URL = {https://iris.cnr.it/handle/20.500.14243/392544},
DOI = {10.4000/books.aaccademia.4478},
ISBN = {9788831978422},
}
@INPROCEEDINGS{FAHADKHAN_2018_INPROCEEDINGS_FB_345620,
AUTHOR = {Fahad Khan, A. and Boschetti, F.},
TITLE = {Towards a Representation of Citations in Linked Data Lexical Resources},
YEAR = {2018},
ABSTRACT = {In this article we look at the modelling of citations in lexical resources in linked data. We start by discussing the treatment of citations in linked data and in TEI; we also look at the idea of different conceptual levels as posited by models such as TEI and FRBR. We argue that in representing citations in lexical resources it is important not to confuse different levels of information, and that at least in the case of attestations it is important to model the purpose of a citation, or the claim that is being made by that citation, separately. We develop this point with two separate examples before presenting lemonBib, our extension of the lemon model based around the idea of a lexical attestation. We also give a treatment of part of one of the examples described previously in the article},
URL = {https://iris.cnr.it/handle/20.500.14243/345620},
DOI = {10.4312/9789610600961},
ISBN = {978-961-06-0096-1},
}
@INPROCEEDINGS{FERRETTI_2018_INPROCEEDINGS_FMV_388353,
  AUTHOR   = {Ferretti, M. and Morgavi, G. and Veruggio, G.},
  TITLE    = {How should a robot caregiver for elderly people be?},
  YEAR     = {2018},
  URL      = {https://iris.cnr.it/handle/20.500.14243/388353},
  ABSTRACT = {During the last few years, due to the aging of the population, many scientists have developed ICT tools to offer elderly people an independent life at home as long as possible. Most of these researchers focused their efforts on problem solving without adequate care to the agreeability and/or the acceptability of these ICT objects for their users. These resulting artifacts will hardly be used in real life by the users for which they have been developed. In this paper, we will present an experiment done on 202 elderly people over 65 on the acceptability and the likeness features a caregiver robot must have. Starting from a classification of 25 different real robot pictures and the associated questionnaire on the quality of seventeen adjectives describing the first and the last robot selected, our work tried to better understand the hidden and implicit motivations that lead to the acceptance or the rejection of a robot and found some interesting results for appealing or unpleasant features for caregiver robot design},
}
@INPROCEEDINGS{FERRETTI_2018_INPROCEEDINGS_FMV_347643,
AUTHOR = {Ferretti, M. and Morgavi, G. and Veruggio, G.},
TITLE = {The Acceptability of Caregiver Robots in Elderly People},
YEAR = {2018},
ABSTRACT = {During the last few years, due to the aging of the population, many scientists have developed ICT tools to offer elderly people an independent life at home as long as possible. Most of these researchers focused their efforts on problem solving without adequate care to the agreeability and/or the acceptability of these ICT objects for their users. These resulting artifacts will hardly be used in real life by the users for which they have been developed. In this paper, we will present an experiment done on 202 over 65 elderly people on the acceptability and the likeness features a caregiver robot must have. From the classification and analysis of the emotions elicited by the physical/appearance characteristics of 25 different real robot pictures we found some interesting results for appealing or unpleasant features for caregiver robot design},
KEYWORDS = {Caregiver Robots, Robots for Elderly People, Robot Acceptability},
PAGES = {111--118},
URL = {http://www.scitepress.org/PublicationsDetail.aspx?ID=pYhdl1lVkzI=\&t=1},
DOI = {10.5220/0006674301110118},
ISBN = {978-989-758-299-8},
CONFERENCE_NAME = {4th International Conference on Information and Communication Technologies for Ageing Well and e-Health},
BOOKTITLE = {Proceedings of the 4th International Conference on Information and Communication Technologies for Ageing Well and e-Health},
}
@INPROCEEDINGS{FERRO_2018_INPROCEEDINGS_FCGMNCP_350556,
AUTHOR = {Ferro, M. and Cappa, C. and Giulivi, S. and Marzi, C. and Nahli, O. and Cardillo, F. A. and Pirrelli, V.},
TITLE = {ReadLet: Reading for Understanding},
YEAR = {2018},
ABSTRACT = {This paper focuses on motivation, objectives, design issues and preliminary results of ReadLet, an ICT platform for assessing reading efficiency in primary school children. Test data are discussed on a sample of 200 early graders, reading French, Italian and Standard Modern Arabic (SMA)},
KEYWORDS = {Reading, text comprehension, Specific Learning Disorders, multimodal signal processing, cloud computing, portable assistive technology},
PAGES = {404--409},
URL = {https://publications.cnr.it/doc/390504},
PUBLISHER = {IEEE (New York, USA)},
ISBN = {978-1-5386-4385-3},
CONFERENCE_NAME = {IEEE-CIST2018 LED-ICT},
CONFERENCE_PLACE = {New York},
BOOKTITLE = {2018 IEEE 5th International Congress on Information Science and Technology (CiSt)},
}
@INPROCEEDINGS{GIOVANNETTI_2018_INPROCEEDINGS_GABMP_500052,
AUTHOR = {Giovannetti, E. and Albanesi, D. and Bellandi, A. and Marchi, S. and Pecchioli, A.},
TITLE = {Constructing an annotated resource for part-of-speech tagging of mishnaic Hebrew},
YEAR = {2018},
ABSTRACT = {This paper introduces the research in Part-Of-Speech tagging of mishnaic Hebrew carried out within the Babylonian Talmud Translation Project. Since no tagged resource was available to train a stochastic POS tagger, a portion of the Mishna of the Babylonian Talmud has been morphologically annotated using an ad hoc developed tool connected with the DB containing the talmudic text being translated. The final aim of this research is to add a linguistic support to the Translation Memory System of Traduco, the Computer-Assisted Translation tool developed and used within the Project},
KEYWORDS = {pos tagging, mishnaic hebrew, babylonian talmud},
PAGES = {219--223},
URL = {https://iris.cnr.it/handle/20.500.14243/500052},
VOLUME = {2253},
DOI = {10.4000/books.aaccademia.3394},
PUBLISHER = {Accademia University Press},
ISBN = {9788831978682},
CONFERENCE_NAME = {CLiC-It 2018. Fifth Italian Conference on Computational Linguistics},
BOOKTITLE = {Proceedings of the Fifth Italian Conference on Computational Linguistics CLiC-It 2018},
}
@INPROCEEDINGS{GOGGI_2018_INPROCEEDINGS_GPRBM_348935,
AUTHOR = {Goggi, S. and Pardelli, G. and Russo, I. and Bartolini, R. and Monachini, M.},
TITLE = {Providing Access to Grey Literature: The CLARIN Infrastructure},
YEAR = {2018},
ABSTRACT = {This work will provide a map of the documentation archived in the CLARIN infrastructure, whose purpose is to share language resources produced and managed in the various European countries but finally merged into the CLARIN data centers for allowing access, interoperability, reuse and preservation of scientific documentation as well as Grey Literature},
KEYWORDS = {CLARIN Infrastructure, Language Resources, Grey Literature},
PAGES = {93--99},
URL = {http://greyguide.isti.cnr.it/wp-content/uploads/2018/03/GL19_Conference_Proceedings.pdf},
PUBLISHER = {TextRelease (Amsterdam, NLD)},
ISSN = {1386-2316},
ISBN = {978-90-77484-31-9},
CONFERENCE_NAME = {Nineteenth International Conference on Grey Literature, GL19},
CONFERENCE_PLACE = {Amsterdam},
BOOKTITLE = {THE GL-CONFERENCE SERIES. CONFERENCE PROCEEDINGS},
EDITOR = {Farace, D. and Frantzen, J.},
}
@INPROCEEDINGS{KHAN_2018_INPROCEEDINGS_KBFM_376218,
AUTHOR = {Khan, F. and Bellandi, A. and Frontini, F. and Monachini, M.},
TITLE = {One Language to rule them all: modelling Morphological Patterns in a Large Scale Italian Lexicon with SWRL},
YEAR = {2018},
ABSTRACT = {We present an application of Semantic Web Technologies to computational lexicography. More precisely we describe the publication of the morphological layer of the Italian Parole Simple Clips lexicon (PSC-M) as linked open data. The novelty of our work is in the use of the Semantic Web Rule Language (SWRL) to encode morphological patterns, thereby allowing the automatic derivation of the inflectional variants of the entries in the lexicon. By doing so we make these patterns available in a form that is human readable and that therefore gives a comprehensive morphological description of a large number of Italian words},
KEYWORDS = {Morphology, Linked Open Data, Italian Lexicon, SWRL, SQWRL},
PAGES = {4385--4389},
URL = {http://www.lrec-conf.org/proceedings/lrec2018/pdf/844.pdf},
PUBLISHER = {European Language Resources Association ELRA (Paris, FRA)},
ISBN = {979-10-95546-00-9},
CONFERENCE_NAME = {Eleventh International Conference on Language Resources and Evaluation (LREC 2018)},
CONFERENCE_PLACE = {Paris},
BOOKTITLE = {Proceedings of the Eleventh International Conference on Language Resources and Evaluation (LREC 2018)},
EDITOR = {Calzolari, N. and Choukri, K. and Cieri, C. and Declerck, T. and Goggi, S. and Hasida, K. and Isahara, H. and Maegaard, B. and Mariani, J. and Mazo, H. and Moreno, A. and Odijk, J. and Piperidis, S. and Tokunaga, T.},
}
@INPROCEEDINGS{MARZI_2018_INPROCEEDINGS_MFNBBP_349950,
AUTHOR = {Marzi, C. and Ferro, M. and Nahli, O. and Belik, P. and Bompolas, S. and Pirrelli, V.},
TITLE = {Evaluating Inflectional Complexity Crosslinguistically: a Processing Perspective},
YEAR = {2018},
ABSTRACT = {The paper provides a cognitively motivated method for evaluating the inflectional complexity of a language, based on a sample of "raw" inflected word forms processed and learned by a recurrent self-organising neural network with fixed parameter setting. Training items contain no information about either morphological content or structure. This makes the proposed method independent of both meta-linguistic issues (e.g. format and expressive power of descriptive rules, manual or automated segmentation of input forms, number of inflectional classes etc.) and language-specific typological aspects (e.g. word-based, stem-based or template-based morphology). Results are illustrated by contrasting Arabic, English, German, Greek, Italian and Spanish},
KEYWORDS = {paradigm-based morphology, inflectional complexity, prediction-based processing, recurrent self-organising networks, Statistical And Machine Learning Methods, Language Modelling},
PAGES = {3860--3866},
URL = {http://www.lrec-conf.org/proceedings/lrec2018/summaries/745.html},
PUBLISHER = {European Language Resources Association ELRA (Paris, FRA)},
ISBN = {979-10-95546-00-9},
CONFERENCE_NAME = {Eleventh International Conference on Language Resources and Evaluation (LREC 2018)},
CONFERENCE_PLACE = {Paris},
BOOKTITLE = {Proceedings of the Eleventh International Conference on Language Resources and Evaluation (LREC 2018)},
EDITOR = {Calzolari, N. and Choukri, K. and Cieri, C. and Declerck, T. and Goggi, S. and Hasida, K. and Isahara, H. and Maegaard, B. and Mariani, J. and Mazo, H. and Moreno, A. and Odijk, J. and Piperidis, S. and Tokunaga, T.},
}
@INPROCEEDINGS{MONACHINI_2018_INPROCEEDINGS_MF_369676,
AUTHOR = {Monachini, M. and Khan, A. F.},
TITLE = {Towards the Construction of a Lexical Data and Technology Ecosystem: The Experience of ILC-CNR},
YEAR = {2018},
ABSTRACT = {This paper describes the activities and projects being carried on at the "A. Zampolli" Institute for Computational Linguistics (ILC) at the crossroads between computational lexicography and e-lexicography and that are intended to assist in the creation of a queryable and interconnected ecosystem of standardised lexicographic datasets and technologies},
KEYWORDS = {e-lexicography, computational lexicography, lexical resources, standards, LOD},
PAGES = {52--54},
URL = {https://globalex.link/globalex2018/wp-content/uploads/2018/03/Globalex-2018_proceedings.pdf},
PUBLISHER = {European Language Resources Association ELRA (Paris, FRA)},
ISBN = {979-10-95546-28-3},
CONFERENCE_NAME = {LREC 2018 Workshop "Globalex 2018-Lexicography \& WordNets"},
CONFERENCE_PLACE = {Paris},
BOOKTITLE = {Proceedings of the LREC 2018 Workshop "Globalex 2018-Lexicography \& WordNets"},
EDITOR = {Kernerman, I. and Krek, S.},
}
@INPROCEEDINGS{NAHLI_2018_INPROCEEDINGS_N_350457,
AUTHOR = {Nahli, O.},
TITLE = {Arabic Language Alignment with English Ontologies—Some Ontological Reflections},
YEAR = {2018},
ABSTRACT = {There have been several attempts to build lexico-conceptual resources by extension of the English WordNet, i.e. by means of translation of English synsets. However, the extension approach is arguable because it assumes that the target resource is isomorphic to English WordNet. Yet, some languages, such as English and Arabic, can be very different. The problem would be to know, first, whether they conceptualize reality in the same way; and if not, to identify different concepts types. The mapping of a lexical resource of a different language onto Princeton WordNet of English (PWN) answers these questions. The experiment, in this article, describes results obtained from mapping the Arabic dictionary, al=qāmūs al=muḥīṭ, onto English WordNet and SUMO (Standard Upper Merged Ontology), also developed for the English language},
KEYWORDS = {Ontology, concept, Arabic, PWN, SUMO, al=qamus al=muHiyT},
PAGES = {7},
URL = {https://iris.cnr.it/handle/20.500.14243/350457},
PUBLISHER = {IEEE (New York, USA)},
ISBN = {978-1-5386-4385-3},
CONFERENCE_NAME = {CIST 2018 WH-MNLP},
CONFERENCE_PLACE = {New York},
BOOKTITLE = {2018 IEEE 5th International Congress on Information Science and Technology (CiSt)},
}
@INPROCEEDINGS{PETROLITO_2018_INPROCEEDINGS_PD_392548,
AUTHOR = {Petrolito, R. and Dell'Orletta, F.},
TITLE = {Word embeddings in sentiment analysis},
YEAR = {2018},
ABSTRACT = {In the late years sentiment analysis and its applications have reached growing popularity. Concerning this field of research, in the very late years machine learning and word representation learning derived from distributional semantics field (i.e. word embeddings) have proven to be very successful in performing sentiment analysis tasks. In this paper we describe a set of experiments, with the aim of evaluating the impact of word embedding-based features in sentiment analysis tasks},
URL = {https://iris.cnr.it/handle/20.500.14243/392548},
DOI = {10.4000/books.aaccademia.3589},
PUBLISHER = {Accademia University Press},
BOOKTITLE = {Proceedings of the Fifth Italian Conference on Computational Linguistics CLiC-It 2018},
}
@INPROCEEDINGS{PICCINI_2018_INPROCEEDINGS_PCG_340691,
AUTHOR = {Piccini, S. and Corsi, E. and Giovannetti, E.},
TITLE = {Une ressource termino-ontologique bilingue chinois-italien: le cas de la traduction de la Mappemonde de Matteo Ricci par Pasquale D'Elia},
YEAR = {2018},
ABSTRACT = {Cet article a pour but d'illustrer les premiers résultats obtenus dans le cadre du projet intitulé 'Todo el mundo es nuestra casa'. 'The World is Our Home.' A Virtual Journey Around the World Atlas by Matteo Ricci, SJ (1602). Le projet comporte deux objectifs: en premier lieu permettre aux internautes un voyage virtuel à travers la Mappemonde réalisée par Matteo Ricci en 1602 et sa traduction en italien accomplie par le jésuite sinologue Pasquale D'Elia; en second lieu fournir les instruments pour l'étude linguistique et conceptuelle des cartouches contenus dans la Mappemonde. Dans le contexte de ce deuxième objectif une ressource termino-ontologique bilingue chinois-italien est en cours de développement. Dans cette ressource le niveau lexical a été modélisé suivant le modèle lemon, étendu pour représenter des caractéristiques spécifiques de la langue chinoise classique. Par contre, la partie conceptuelle a reçu une formalisation ontologique en OWL},
KEYWORDS = {Matteo Ricci, Pasquale d'Elia, risorsa termino-ontologica, cinese classico, terminologia computazionale, ontologie},
PAGES = {33--49},
URL = {http://ontologia.fr/TOTh/Conference/TOTh2017/TOTh_2017.pdf},
ISBN = {2919732803},
CONFERENCE_NAME = {Conference TOTh 2017 Terminology \& Ontology},
BOOKTITLE = {Actes de la conférence TOTh 2017, Terminologie \& Ontologie: Théories et Applications},
EDITOR = {Roche, C.},
}
@INPROCEEDINGS{SBAIMOHAMED_2018_INPROCEEDINGS_SEEN_456910,
AUTHOR = {Sbai Mohamed, A. and El Biadil, M. and El Mohajir, M. and Nahli, O.},
TITLE = {The Use of ICT in Dealing with Learning Disabilities: A Literature Review with a focus on Reading Arabic Texts},
YEAR = {2018},
ABSTRACT = {The present paper aims at giving an overview of the different learning disabilities. It also attempts to correct the idea that learning disabilities (henceforth, LDs) are a handicap that we can do nothing about. Furthermore, the paper will shed light on the various studies done on LDs with reference to Arabic texts. It provides a detailed description of the specificities of the Arabic language in an attempt to explain the problems most learners of Arabic face when learning Arabic and how they can contribute to the hindrance of their progress. Finally, the paper brings to the fore the use of ICT along with other teaching practices which can lead to higher self-esteem and confidence among students with learning difficulties},
URL = {https://iris.cnr.it/handle/20.500.14243/456910},
DOI = {10.1109/CIST.2018.8596661},
PUBLISHER = {IEEE (New York, USA)},
ISBN = {978-1-5386-4385-3},
BOOKTITLE = {2018 IEEE 5th International Congress on Information Science and Technology (CiSt)},
}
@INPROCEEDINGS{SORIA_2018_INPROCEEDINGS_SQR_371917,
AUTHOR = {Soria, C. and Quochi, V. and Russo, I.},
TITLE = {The DLDP Survey on Digital Use and Usability of EU Regional and Minority Languages},
YEAR = {2018},
ABSTRACT = {This paper reports about the design, the results and the key findings of a survey launched by the Digital Language Diversity Project about the digital use and usability of regional and minority languages. The aim of the survey—the first of this kind—was to investigate the real needs and expectations of European minority language speakers regarding digital opportunities. The focus on four languages (Basque, Breton, Karelian and Sardinian) at different stages of digital development offers a starting point to develop strategies for assessing digital vitality of these languages and overcoming specific difficulties},
KEYWORDS = {minority languages, digital survival, electronic communication},
PAGES = {4155--4160},
URL = {http://www.lrec-conf.org/proceedings/lrec2018/pdf/684.pdf},
PUBLISHER = {European Language Resources Association ELRA (Paris, FRA)},
ISBN = {979-10-95546-00-9},
CONFERENCE_NAME = {Eleventh International Conference on Language Resources and Evaluation (LREC 2018)},
CONFERENCE_PLACE = {Paris},
BOOKTITLE = {Proceedings of the Eleventh International Conference on Language Resources and Evaluation (LREC 2018)},
EDITOR = {Calzolari, N. and Choukri, K. and Cieri, C. and Declerck, T. and Goggi, S. and Hasida, K. and Isahara, H. and Maegaard, B. and Mariani, J. and Mazo, H. and Moreno, A. and Odijk, J. and Piperidis, S. and Tokunaga, T.},
}
@INPROCEEDINGS{BELLANDI_2018_INPROCEEDINGS_BFKM_345621,
AUTHOR = {Bellandi, A. and Frontini, F. and Khan, F. and Monachini, M.},
TITLE = {SWRL your lexicon: adding inflectional rules to a LOD dataset},
YEAR = {2018},
ABSTRACT = {Over the past few years the publication of lexical resources as Linked Data (LD) has taken on ever greater significance within the field of computational lexicography. So far the efforts of the community have been largely directed towards the definition of standards and the conversion of single resources (see McCrae et al. 2012, Khan et al. 2016), but with less of a focus on the technical possibilities afforded by this new mode of publishing lexical data. However, the fact is that the Semantic Web gives us access to a whole ecosystem of standards, languages, and technologies. In this paper we will look at one of these languages, the Semantic Web Rule Language (SWRL) and explore whether it might potentially play a useful role in the publication of lexical resources},
URL = {https://iris.cnr.it/handle/20.500.14243/345621},
}
@INPROCEEDINGS{BELLANDI_2018_INPROCEEDINGS_BGP_346698,
AUTHOR = {Bellandi, A. and Giovannetti, E. and Piccini, S.},
TITLE = {Collaborative Editing of Lexical and Termino-ontological Resources: a Quick Introduction to LexO},
YEAR = {2018},
ABSTRACT = {We here present LexO, a web collaborative editor of lexical and termino-ontological resources. As the underlying lexical model we adopted lemon, which appeared to be perfect for our purposes, in particular regarding the separation between the conceptual and linguistic dimensions},
KEYWORDS = {lemon model, lexo, collaborative editor, termino-ontological resource},
PAGES = {23--27},
URL = {http://euralex2018.cjvt.si/wp-content/uploads/sites/6/2018/12/Euralex2018_book_of_abstracts_FINAL.pdf},
CONFERENCE_NAME = {XVIII EURALEX International Congress},
BOOKTITLE = {The XVIII EURALEX International Congress: Lexicography in Global Contexts-Book of Abstracts},
EDITOR = {Čibej, J. and Gorjanc, V. and Kosem, I. and Krek, S.},
}
@INPROCEEDINGS{CAPPA_2018_INPROCEEDINGS_CFGMNCP_351301,
AUTHOR = {Cappa, C. and Ferro, M. and Giulivi, S. and Marzi, C. and Nahli, O. and Cardillo, F. and Pirrelli, V.},
TITLE = {ReadLet: piattaforma ICT per valutare l'efficienza di lettura},
YEAR = {2018},
ABSTRACT = {ReadLet è una piattaforma ICT pensata per valutare accuratamente l'efficienza di lettura nei bambini della scuola primaria. Combina tecnologia ICT portatile e cloud-computing con una serie di moduli software, specifici per modalità di somministrazione. Questi, implementati come servizi web, includono: i) valutazione dell'elaborazione del testo e della leggibilità; ii) valutazione della velocità di lettura (ad alta voce e silente) e delle sue fluttuazioni; iii) valutazione della correttezza della decodifica ad alta voce; iv) valutazione della comprensione del testo (in lettura silente e da ascolto). Un prototipo della tecnologia ReadLet è stato sperimentato su circa 200 alunni (8-11 anni), che variano per stato socio-economico, lingua (italiana, francese, araba) e area geografica (Italia, Svizzera, Marocco). L'utilizzo del tablet per la lettura è stato percepito dai bambini come un'esperienza coinvolgente e piacevole. Gli insegnanti hanno trovato lo strumento facile da utilizzare e in grado di fornire maggiori informazioni rispetto agli strumenti tradizionali},
KEYWORDS = {leggere per capire, disturbi del linguaggio, screening},
URL = {https://www.airipa.it/congresso/pluginfile.php/2781/mod_resource/content/1/ProgrammaCongressoAIRIPA_Arezzo_dettagliato-3.pdf},
CONFERENCE_NAME = {XXVII Congresso Nazionale AIRIPA},
BOOKTITLE = {I disturbi dell'Apprendimento-Abstract book XXVII Congresso Nazionale AIRIPA},
}
@INPROCEEDINGS{CORSI_2018_INPROCEEDINGS_CMP_401692,
AUTHOR = {Corsi, E. and Marchetti, A. and Piccini, S.},
TITLE = {Totus Mundus: A Virtual Journey Around Matteo Ricci's World Atlas Kunyu wanguo quantu 坤輿萬國全圖},
YEAR = {2018},
ABSTRACT = {TOTUS MUNDUS Project (www.totusmundus.it) was supported under the Sapienza Awards Scheme, 2015 Exercise, its main scope being the digitalization of the annotated edition by P. D'Elia of the World Atlas, Kunyu quantu (1602), by Matteo Ricci, SI. The main feature of the project portal is the computational lexicon containing geographical lexemes, astronomical and other scientific lexemes, and their corresponding Chinese graphs. The lexicon is continuously being enriched with new lexemes and new findings. Three dimensions will be accounted for during the presentation: 1. Design and development of the web portal. The application has been structured in a specific way that allows users to initially obtain an overview of the contents, which can then be filtered and examined in depth. Specific interactive views have been included in the application in order to host high-resolution digital images, manage aligned texts in different languages and present specific linguistic resources. 2. Modelling and creation of a bilingual computational lexicon which structures the Chinese terms extracted from Ricci's map cartouches and their translation into Italian by Pasquale d'Elia. The lexicon, based on the lemon model, was created by means of LexO, a collaborative web editor for lemon lexical resources developed by ILC. 3. Text enrichment: transcription of the Chinese text, its alignment with the Italian translation of Pasquale D'Elia and the analysis of each graph in terms of transliterations and definitions},
URL = {https://iris.cnr.it/handle/20.500.14243/401692},
}
@INPROCEEDINGS{DELGROSSO_2018_INPROCEEDINGS_DCCCDD_377315,
AUTHOR = {Del Grosso, A. M. and Cacioli, G. and Cavallero, C. and Cioffi, R. and Di Pietro, C. and Del Turco, R. R.},
TITLE = {Encoding and publishing the Life of San Teobaldo using EVT: challenges and rewards},
YEAR = {2018},
ABSTRACT = {This contribution aims at illustrating both the scholarly work and the development outcomes that have been achieved while working towards a digital edition of the Life of San Teobaldo (an hagiography of the patron saint of the city of Alba, Italy). The text, physically embodied in an ancient palimpsest scroll, has been encoded using the TEI-XML standard and published by means of the Edition Visualization Technology tool. EVT has been appropriately customized and extended with new features concerning image visualization, diplomatic edition display and textual search. A working progress demo is available at <http://licodemo.ilc.cnr.it/evt-rotulo>},
KEYWORDS = {digital philology, evt, computational philology, Rotulo vita San Teobaldo},
URL = {https://drive.google.com/file/d/19SQqvy4vwG_-irpelu7ro3Q1QdZjcsZJ/view?usp=sharing},
CONFERENCE_NAME = {EADH 2018: "Data in Digital Humanities"},
}
@INPROCEEDINGS{DELGROSSO_2018_INPROCEEDINGS_DCDGMSS_346825,
AUTHOR = {Del Grosso, A. M. and Cristofaro, S. and De Luca, R. M. and Giovannetti, E. and Marchi, S. and Seminara, G. and Spampinato, D.},
TITLE = {Le lettere di Bellini: dalla Carta al Web},
YEAR = {2018},
ABSTRACT = {Nel contesto del progetto "Museo virtuale della Musica BellinInRete" sarà reso fruibile, attraverso un processo di acquisizione, codifica e pubblicazione digitale, un corpus di lettere di Vincenzo Bellini, compositore catanese del XIX secolo. L'edizione digitale delle lettere belliniane sarà consultabile in rete e, inoltre, sarà integrata in un percorso museale interattivo in allestimento presso il Museo Civico Belliniano di Catania},
KEYWORDS = {Digital Edition, Digital Scholarly Platform},
PAGES = {60--64},
URL = {http://www.aiucd2018.uniba.it/content/AIUCD2018-BoA.pdf},
DOI = {10.6092/unibo/amsacta/5997},
ISBN = {9788894253528},
CONFERENCE_NAME = {AIUCD 2018 Conference},
BOOKTITLE = {AIUCD 2018-Book of abstracts},
EDITOR = {Spampinato, D.},
}
@INPROCEEDINGS{FERRO_2018_INPROCEEDINGS_FCGMCP_351299,
AUTHOR = {Ferro, M. and Cappa, C. and Giulivi, S. and Marzi, C. and Cardillo, F. and Pirrelli, V.},
TITLE = {ReadLet: an ICT platform for the assessment of reading efficiency in early graders},
YEAR = {2018},
ABSTRACT = {Reading is not just word decoding, but the joint product of decoding and deep linguistic comprehension [1, 2]. Effective linguistic comprehension relies on language skills such as semantic and syntactic awareness. Both decoding and linguistic comprehension are necessary for reading comprehension, and neither is by itself sufficient [2]. However, current protocols for reading assessment measure decoding (reading accuracy and speed) and reading comprehension separately [3, 4, 5]. This does not allow evaluation of reading efficiency [6], defined as the ability to fully understand connected texts by minimising reading time, a cognitive ability that lies at the roots of students' academic achievement [8, 7]. ReadLet is an ICT platform specifically designed to provide accurate, evidence-based assessment of reading efficiency in early grade children, by offering an ecological, non-invasive protocol for extensive data elicitation, storage and analysis. With ReadLet, early graders at school can read a one or two page text displayed on a tablet touchscreen, either silently or aloud. Children are asked to slide their finger across the words as they read, to guide directional tracking. After reading, the child is prompted with a few multiple-answer questions on text content presented one at a time, while the text remains displayed on the screen for the child to be able to retrieve relevant information. In the process, the tablet keeps track of time-aligned multimodal data: voice recording, finger sliding time, time of reading, time of question answering, and number of correct answers. Data are recorded, stored locally, sent to the ReadLet server through an internet connection, and processed remotely by a battery of cloud-based services, analysing data automatically to produce a detailed quantitative signature of each reading session. A server-based database aggregates anonymised data to make them available for specialists. Also individual's longitudinal profiles are stored, for them be queried and inspected upon authorised access. The platform combines portable ICT technology and cloud computing with a number of modality-specific software modules, implemented as web services including: i) a text processing and readability assessment service, consisting in a battery of tools for automated linguistic annotation of written texts and a machine-learning component assigning a readability score to annotated texts [9]; ii) a finger touch processing service aligning the child's finger sliding with the written text and measuring speed fluctuations; iii) a speech processing and decoding assessment service, aligning the acoustic record of child's reading with the written text and assessing correctness of recoding [10]. At the time of writing, the platform includes the first two modules only. Preliminary testing of a prototype version of ReadLet technology with a population of about 200 pupils aged 8 to 11, both male and female, varying for socio-economic status, language (Italian, French and Arabic) and geographical area (Italy and Morocco), showed that children are extremely responsive to using a tablet for reading, and very easy to engage in what they perceive as an enjoyable experience. We expect online databases of automatically classified cross-sectional and longitudinal data, accurate statistical modelling and developmental trends of reading literacy to help education professionals and clinical specialists assess the level of reading skills reached by the child, and decide which intervention programmes and measures are most appropriate. While information technology cannot and should not supplant the role and professional judgement of teachers and therapists, the project intends to provide portable tools, models and data for timely screening and daily management of reading difficulties and disorders},
KEYWORDS = {reading efficiency, decoding, comprehension, language specific disorders},
PAGES = {61},
URL = {https://mentallexicon2018.ca/},
CONFERENCE_NAME = {11th International Conference on the Mental Lexicon},
BOOKTITLE = {Book of Abstract of the 11th International Conference on the Mental Lexicon},
}
@INPROCEEDINGS{GIOVANNETTI_2018_INPROCEEDINGS_GABDDPP_346702,
AUTHOR = {Giovannetti, E. and Albanesi, D. and Bellandi, A. and Dattilo, D. and Dollinar, M. and Pecchioli, A. and Piperno, C.},
TITLE = {Il Progetto Traduzione del Talmud Babilonese: il Ruolo della Tecnologia e della Linguistica Computazionale},
YEAR = {2018},
ABSTRACT = {L'obiettivo principale del Progetto Traduzione del Talmud Babilonese è produrre la traduzione del Talmud in italiano. La traduzione, affidata ad un team di circa 80 studiosi, è condotta con l'aiuto di Traduco, un software preposto ad agevolare tutte le fasi di lavoro previste dal progetto, dall'attribuzione degli utenti alle sezioni da tradurre, fino al supporto all'impaginazione finale. La presenza di una piattaforma collaborativa digitale che già, di per sé, costituisce una innovazione nell'ambito dei grandi progetti di traduzione, è arricchita da algoritmi per il trattamento automatico del testo e della lingua, in costante evoluzione, attraverso i quali il traduttore, il revisore o lo studioso possono contare su funzionalità sempre più avanzate},
KEYWORDS = {Linguistica Computazionale, Traduzione di Testi Religiosi, Traduzione Assistita dal Calcolatore, Traduzione Collaborativa},
PAGES = {144--146},
URL = {http://amsacta.unibo.it/5997/},
DOI = {10.6092/unibo/amsacta/5997},
ISBN = {9788894253528},
CONFERENCE_NAME = {AIUCD 2018 Conference},
BOOKTITLE = {AIUCD 2018-Book of abstracts},
EDITOR = {Spampinato, D.},
}
@INPROCEEDINGS{GOGGI_2018_INPROCEEDINGS_GPBMBC_345413,
AUTHOR = {Goggi, S. and Pardelli, G. and Bartolini, R. and Monachini, M. and Biagioni, S. and Carlesi, C.},
TITLE = {Semantic query analysis from the global science gateway},
YEAR = {2018},
ABSTRACT = {We focused on building a corpus constituted by the query logs registered by the GreyGuide: Repository and Portal to Good Practices and Resources in Grey Literature and received by the WorldWideScience.org (The Global Science Gateway) portal: the aim is to retrieve information related to social media which as of today represent a considerable source of data more and more widely used for research ends. This project includes eight months of query logs registered between July 2017 and February 2018 for a total of 445,827 queries. The analysis mainly concentrates on the semantics of the queries received from the portal clients: it is a process of information retrieval from a rich digital catalogue whose language is dynamic, is evolving and follows—as well as reflects—the cultural changes of our modern society},
KEYWORDS = {Global Science Gateway, Semantic Query Analysis, Terminology},
PAGES = {93--95},
URL = {http://greyguide.isti.cnr.it/wp-content/uploads/2018/12/GL20_ProgramBook.pdf},
ISBN = {978-90-77484-34-0},
CONFERENCE_NAME = {Twentieth International Conference on Grey Literature "Research Data Fuels and Sustains Grey Literature"},
BOOKTITLE = {Research Data Fuels and Sustains Grey Literature},
EDITOR = {Farace, D. and Frantzen, J.},
}
% NOTE(review): this inproceedings record carries no BOOKTITLE, venue or abstract; only the IRIS handle is recorded. Confirm the venue before citing.
@INPROCEEDINGS{KHAN_2018_INPROCEEDINGS_KMBFB_345619,
AUTHOR = {Khan, A. F. A. and Mugelli, G. and Boschetti, F. and Frontini, F. and Bellandi, A.},
YEAR = {2018},
TITLE = {Using Formal Ontologies for the Annotation and Study of Literary Texts},
URL = {https://iris.cnr.it/handle/20.500.14243/345619},
}
@INPROCEEDINGS{LEONI_2018_INPROCEEDINGS_LMCFG_351300,
AUTHOR = {Leoni, F. and Muzio, C. and Cappa, C. and Ferro, M. and Giulivi, S.},
TITLE = {Il progetto AEREST: primi risultati in Italia e in Canton Ticino},
YEAR = {2018},
ABSTRACT = {Il progetto AEREST, per una valutazione ecologica dell'efficienza di lettura, è attualmente in corso presso alcune classi di scuola primaria di istituti italiani e ticinesi. Si presentano qui i risultati ottenuti a seguito della prima sessione di raccolta dati, che si è svolta nell'A.A. 2017-18 su circa 160 bambini italofoni di età compresa tra 8 e 11 anni. Lo scopo di questa prima fase sperimentale è stato duplice: 1. ottenere indicazioni sull'efficacia, ai fini della valutazione dell'efficienza di lettura, dei testi utilizzati nelle prove di cui si compone il test AEREST; 2. ottenere indicazioni sulla fattibilità dell'implementazione dello screening su tablet, in termini di facilità di somministrazione e di gradimento da parte dei soggetti; 3. esplorare e confrontare le performance di lettura nel campione italiano e ticinese, al fine di individuare strategie didattiche volte a potenziare le eventuali abilità carenti},
URL = {https://iris.cnr.it/handle/20.500.14243/351300},
}
@INPROCEEDINGS{MARZI_2018_INPROCEEDINGS_MFP_355611,
AUTHOR = {Marzi, C. and Ferro, M. and Pirrelli, V.},
TITLE = {Is inflectional irregularity dysfunctional to human processing?},
YEAR = {2018},
ABSTRACT = {Regularly inflected verb forms are classically associated with the formal transparency and predictability of their internal constituents [ 1, 2, 3 ]. Transparency ensures that full forms can be segmented uniquely into their internal constituents: as in walk-s/walk-ed. Predictability allows for a speaker to fill in an empty paradigm cell, using information from other known forms of the same lexical paradigm and its inflection macro-class. From this perspective, irregulars appear to be dysfunctional to the human processing system, as they make it hard to infer—say—bought from buy, or segment bought appropriately into its constituent parts. Likewise, an influential psycholinguistic tradition relegates irregulars to the lexical store, whereas regulars are segmented by rules into their simpler constituents [ 4, 5 ]. Here, we offer a few reasons for questioning this view. First, transparency and predictability are not dichotomous notions. Secondly, their influence on processing is not unidirectional. Unpredictable stems in irregularly inflected forms of complex inflectional systems provide a lot of processing information, by dynamically constraining the number of possible alternative endings during serial processing. Thirdly, acquisition of word inflection does not consist in associating co-occurring cues and outcomes, but in discriminating between multiple cues that are constantly in competition for their predictive value for a given outcome. We present the results of a few computer simulations with Self-organising Recurrent Neural Networks (TSOMs, [ 8, 9 ]) that learn how to inflect high-frequency verb paradigms in 6 languages: English, German, Italian, Modern Greek, Modern Standard Arabic and Spanish. After training, each TSOM was tested on a word recognition (serial recoding) and a word production (serial recall) task, and results were analysed with generalised regression models.
Processing uncertainty is differently apportioned on regulars and irregulars, depending on the nature of the processing task. While irregulars are harder to produce when they are unknown because they typically have fewer neighbours than regulars have, they are readily accessed once they are acquired, for exactly the same reason. Our data are in line with psycholinguistic evidence [ 10, 11 ] that lexical processing is paced by two types of uniqueness point: Marslen-Wilson's Uniqueness Point (UP), distinguishing unrelated onset-overlapping words [ 12 ], and the Complex Uniqueness Point (CUP), distinguishing paradigmatically-related words [ 11 ]. Late UPs are inhibitory and elicit prolonged reaction times in acoustic word recognition, explaining an early delay in word recognition of irregular stems. Similarly, late CUPs are inhibitory, and this accounts for a slowdown in the processing advantage of regulars, compared to irregulars, after UP. These structural factors interact in a variety of ways and concurrently affect human processing, to show that irregularly-inflected forms may in fact reflect communicative and processing constraints of the word processor. They provide strong evidence against a processing architecture that assumes compartmentalized, independent processing routes for some specific combinations of these factors (e.g. a rule-based route for a combination of transparency and predictability, and a memory-based route for all other combinations). In addition, they seem incompatible with Bayesian approaches to auditory word comprehension ignoring a word's internal structure [ 13 ]. We suggest that a different design of the human language processor, based on a computational architecture integrating memory and processing as two different dynamics of the same underlying mechanism, can shed light on the complexity of inflection, and vindicate the role of irregular inflection in the system},
KEYWORDS = {inflectional processing, temporal self organizing maps, letter prediction, morpheme boundary},
PAGES = {60},
URL = {https://mentallexicon2018.ca/},
CONFERENCE_NAME = {11th International Conference on the Mental Lexicon},
BOOKTITLE = {Book of Abstract of the 11th International Conference on the Mental Lexicon},
}
@INPROCEEDINGS{PICCINI_2018_INPROCEEDINGS_P_404499,
AUTHOR = {Piccini, S.},
TITLE = {Una dipendenza insospettata: dall'accentuazione lituana di Saussure all'accentuazione greca di Bally},
YEAR = {2018},
ABSTRACT = {Negli studi e nelle pubblicazioni di Charles Bally centrale è l'interesse per la lingua greca, come dimostrano la tesi di dottorato, il viaggio in Grecia, le comunicazioni alla Société de linguistique de Paris, gli articoli pubblicati nei Mémoires tra il 1900 ed il 1904 ed i corsi tenuti all'Università di Ginevra. Alla lingua greca Bally torna al termine della sua vita e della sua carriera scientifica con un testo dedicato all'accentuazione, intitolato Manuel d'accentuation grecque, apparso nel 1945. Per utilizzare una felice espressione di Maurice Leroy, questo piccolo testo di appena 130 pagine costituisce il "testamento scientifico" del linguista ginevrino. Al centro vi è un tema verso il quale Bally nutriva un interesse antico: egli aveva infatti partecipato alla revisione delle bozze del Traité d'accentuation grecque di Vendryes (1904), testo che aveva aperto la strada ad una serie di riflessioni al centro di uno scambio epistolare con l'amico e collega Max Niedermann. Il Manuel d'accentuation grecque costituisce un'opera molto interessante dal punto di vista terminologico, nella quale si evidenziano due tendenze, l'una verso la conservazione della terminologia tradizionale — anche quando errata — e l'altra verso l'innovazione. Entrambe queste tendenze sono dettate dall'intento primo di scrivere un manuale pratico e chiaro per gli studenti che debbono cimentarsi con l'accentuazione di un testo greco. Così ad esempio viene perpetuato un errore radicato nella tradizione per cui anche Bally non distingue tra tono e accento: « On désigne souvent l'accent musical par le terme de ton (cf. syllabe tonique etc.) Pour des raisons pratiques, nous conservons le mot usuel, qui, ici, ne porte à aucune équivoque. » (Bally, 1945: 12). Tuttavia, Bally non rinuncia ad introdurre neologismi che ritiene funzionali al suo scopo didattico.
Proprio lo studio dell'innovazione terminologica — e concettuale — del Manuel d'accentuation grecque costituisce il tema fondamentale del presente contributo. Nella fattispecie, si vuole mostrare la profonda influenza che ebbe sulla redazione del Manuel il corso di lituano tenuto da Ferdinand de Saussure e seguito da Bally nell'anno accademico 1901-1902 all'Università di Ginevra. Di queste lezioni restano gli appunti di Bally oggi conservati presso la BGE (Ms. fr. 5133). Sin da una prima lettura, emerge come nel corso dedicato alla lingua lituana, Saussure si concentri principalmente sulle problematiche connesse all'accentuazione, confidando le sue teorie rivoluzionarie ad una terminologia altrettanto innovativa. Parte di questa terminologia viene ripresa quaranta anni più tardi da Bally ed adattata al sistema accentuale del greco. Nel mio contributo mostrerò che il debito verso il maestro non è soltanto terminologico, ma anche e soprattutto teorico e metodologico: Bally cerca di condurre per l'accento greco quello stesso studio che Saussure aveva condotto per l'accento lituano, adottando la stessa prospettiva sincronica del maestro},
URL = {https://iris.cnr.it/handle/20.500.14243/404499},
}
@INPROCEEDINGS{PICCINI_2018_INPROCEEDINGS_PBG_346696,
AUTHOR = {Piccini, S. and Bellandi, A. and Giovannetti, E.},
TITLE = {A Semantic Web Approach to Modelling and Building a Bilingual Chinese-Italian Termino-ontological Resource},
YEAR = {2018},
ABSTRACT = {This paper introduces a bilingual Chinese-Italian onto-terminological resource, devoted to modelling the Chinese terminology of Matteo Ricci's World Map (1602), together with the Italian translation by Pasquale D'Elia (1835) [3]. The Map was created in collaboration with the Chinese mathematician and astronomer Li Zizhao, and is entitled 坤輿萬國全圖 Kunyu Wanguo Quantu (literally "Map of the Ten Thousand Countries of the Earth"). Its publication in China was significant as it was the first map to show the Americas, and to represent the world as a sphere. Its large number of cartouches provide information about the geography, history and customs of the world at that time as well as cosmological and cosmographic data. The map had a revolutionary impact from a linguistic standpoint as well: a large number of neologisms were introduced by Ricci, many of which have survived until today},
KEYWORDS = {termino-ontological resource, classical chinese, lemon model},
PAGES = {87--90},
URL = {http://euralex2018.cjvt.si/wp-content/uploads/sites/6/2018/12/Euralex2018_book_of_abstracts_FINAL.pdf},
CONFERENCE_NAME = {XVIII EURALEX International Congress},
BOOKTITLE = {The XVIII EURALEX International Congress: Lexicography in Global Contexts-Book of Abstracts},
EDITOR = {Čibej, J. and Gorjanc, V. and Kosem, I. and Krek, S.},
}
@INPROCEEDINGS{PIRRELLI_2018_INPROCEEDINGS_PFMGSM_355608,
AUTHOR = {Pirrelli, V. and Ferro, M. and Marzi, C. and Gagné, C. and Spalding, T. and Marelli, M.},
TITLE = {Processing compounds: what frequency (alone) cannot explain},
YEAR = {2018},
ABSTRACT = {Observed elevation in typing latency for the initial letter of the second constituent of an English compound, compared with the typing time of the final letter of the first constituent (Gagné \& Spalding 2016), suggests that both compounds (snowball) and pseudo-compounds (carpet) are decomposed but also that full form representations are available in the lexical store. To gain further insight into the lexical representations underlying typing, we used computational modelling. In particular, we used superpositional models of word memory, based on Self-Organising Recurrent Maps (TSOMs) (Ferro et al. 2016; Marzi et al. 2016), where both simple and compound words are processed (and stored) using the same pool of processing (and memory) resources, to model the elevation in typing time at the constituent boundary and the rate of typing. In addition, we also considered models based in the Compositional Distributional Semantics framework (CAOSS, Marelli et al. 2017), to simulate independent effects of semantic transparency on compound typing (Gagné \& Spalding 2016). Due to co-activation and competition between compounds and their constituent words in TSOMs, levels of activation of processing nodes per letter positions appear to reflect degrees of context-sensitive predictability: the higher the level, the more expected the letter in that position. In English compounds, activation levels appeared to exhibit a characteristically U-shaped pattern, with min values centred on the constituent boundary. A similar pattern was found for pseudo-compounds, which nonetheless present a less pronounced U-shaped pattern and a higher activation value at the morpheme boundary than compounds do. The difference is in line with the higher speed-up rate in typing pseudo-compounds than compounds reported in Gagné and Spalding (2016).
TSOMs were trained on letter-based representations, so computer experiments could simulate peripheral effects of serial processing of compound structure before lexical access. To investigate post-lexical issues, we also tested computational models of generation of the meanings of novel compounds based on CAOSS, which proved to be able to account for well-established relational effects in compound processing (Gagné 2001; Gagné \& Shoben 1997) with an unsupervised data-driven framework (Marelli et al. 2017). We ran a mixed-effects regression analysis of the data in Gagné and Spalding (2016) using vector-semantics estimates and TSOM activation levels to predict typing time for the initial letter of the second constituent. There was a negative effect of TSOM letter activation levels: i.e. the more active a letter node is, the faster a subject is at typing the letter (t = -2.7, p = .007). Also, there was a positive effect of CAOSS-based compositionality estimates: i.e. the more easily a compound's lexicalized meaning can be obtained through compositional operations on single constituent vectors, the slower participants were at typing the first letter of the second constituent (t = 2.4, p = .017). These results have interesting implications for an integrative computational architecture accounting for the whole range of experimental evidence reported by Gagné and Spalding (2016). In particular we will focus on evidence of a stronger competition (and longer typing time) in Transparent-Transparent and Transparent-Opaque compounds, vs. Opaque-Transparent compounds, which gives an indication of a non-trivial interaction between semantic compositionality and serial processing effects},
KEYWORDS = {compound processing, Temporal Self-organizing Map, letter production latency, constituent boundary},
PAGES = {60},
URL = {https://mentallexicon2018.ca/},
CONFERENCE_NAME = {11th International Conference on the Mental Lexicon},
BOOKTITLE = {Book of Abstract of the 11th International Conference on the Mental Lexicon},
}
@INPROCEEDINGS{STEFANINI_2018_INPROCEEDINGS_SNM_348948,
AUTHOR = {Stefanini, A. and Nicolosi, A. and Monachini, M.},
TITLE = {An experiment on the development of a digital edition for ancient Greek fragmentary poetry: A case study on Archilochus of Paros},
YEAR = {2018},
ABSTRACT = {This paper overviews ongoing experiments on a digital edition of Archilochus which is based on the readings, translations and comments by Nicolosi [1] and also integrates feedback and requirements from the Digital Classics community. The experiment encompasses a few fragments of the poet of Paros, so as to provide a mock-up of the prototype for evaluation by its intended end-users, in view of developing a fully fledged digital edition. The mock-up provides the philologist with a set of resources and tools that ease a critical appraisal of the text},
KEYWORDS = {Digital methods in the humanities, Interfaces and user-friendly data presentation},
PAGES = {86--89},
URL = {http://amsacta.unibo.it/5997/1/AIUCD-2018-BoA-rev.pdf},
DOI = {10.6092/unibo/amsacta/5997},
ISBN = {9788894253528},
CONFERENCE_NAME = {Settimo Convegno Annuale AIUCD 2018},
BOOKTITLE = {Settimo Convegno Annuale AIUCD 2018. Patrimoni culturali nell'era digitale. Memorie, culture umanistiche e tecnologia. Book of Abstracts},
EDITOR = {Spampinato, D.},
}
@TECHREPORT{ALBANESI_2018_TECHREPORT_ABGM_350504,
AUTHOR = {Albanesi, D. and Bellandi, A. and Giovannetti, E. and Marchi, S.},
TITLE = {Applicazione Web Linguistico-Computazionale per il Progetto di Traduzione del Talmud Babilonese-Rapporto tecnico 13},
YEAR = {2018},
ABSTRACT = {La presente relazione tecnico-scientifica descrive l'attività svolta da ILC-CNR nel contesto del Progetto Traduzione Talmud Babilonese nel periodo novembre 2017-giugno 2018. Le due principali attività tecniche svolte su sistema Traduco sono la risoluzione di bug e l'implementazione di nuove funzionalità. Queste due attività sono fisiologicamente interrelate: di fatto, l'introduzione di nuove funzionalità implica inevitabilmente la possibilità di introdurre nuovi bug all'interno del sistema. Le attività di ricerca, come descritto nella sezione 4, sono state incentrate sulla rappresentazione della conoscenza talmudica},
URL = {https://iris.cnr.it/handle/20.500.14243/350504},
}
@TECHREPORT{ALBANESI_2018_TECHREPORT_ABGM_345453,
AUTHOR = {Albanesi, D. and Bellandi, A. and Giovannetti, E. and Marchi, S.},
TITLE = {Traduco: l'Applicazione Web Linguistico-Computazionale per il Progetto di Traduzione del Talmud Babilonese-Rapporto tecnico 14},
YEAR = {2018},
ABSTRACT = {La presente relazione tecnico-scientifica descrive l'attività svolta da ILC-CNR nel contesto del Progetto Traduzione Talmud Babilonese nel periodo luglio 2018-novembre 2018. Le due principali attività tecniche svolte sul sistema Traduco sono la risoluzione di bug e l'implementazione di nuove funzionalità. Queste due attività sono strettamente correlate: di fatto, l'introduzione di nuove funzionalità può implicare l'introduzione di nuovi bug all'interno del sistema. Le attività di ricerca sono state condotte, in continuità a quelle descritte nel rapporto precedente, nella rappresentazione del lessico e della conoscenza talmudica},
KEYWORDS = {Linguistica Computazionale, Traduzione di Testi Religiosi, Traduzione Assistita dal Calcolatore, Traduzione Collaborativa, Lessici elettronici, rappresentazione della conoscenza},
URL = {https://iris.cnr.it/handle/20.500.14243/345453},
}
@TECHREPORT{BARONI_2018_TECHREPORT_BQRSCGHKSS_462551,
AUTHOR = {Baroni, P. and Quochi, V. and Russo, I. and Soria, C. and Ceberio Berger, K. and Gurrutxaga Hernaiz, A. and Hicks, D. and Kruse, E. and Salonen, T. and Sarhimaa, A.},
TITLE = {Kit per la sopravvivenza digitale della lingua sarda-Le raccomandazioni del progetto DLDP per migliorare la vitalità digitale della lingua sarda},
YEAR = {2018},
ABSTRACT = {Le raccomandazioni del progetto DLDP per migliorare la vitalità digitale della lingua sarda (versione italiana)},
KEYWORDS = {digital vitality, digital diversity, digital language survival, recommendations, Sardinian},
PAGES = {12},
URL = {http://www.dldp.eu/sites/default/files/documents/DLDP_Digital-Language-Survival-Kit-for-Sardinian_IT.pdf},
}
@TECHREPORT{CARLINO_2018_TECHREPORT_C_459251,
AUTHOR = {Carlino, M.},
TITLE = {Rapporto annuale 2017 del CNR-ILC},
YEAR = {2018},
ABSTRACT = {CNR-ILC Activity Report 2017},
KEYWORDS = {Annual Report, Activity report, CNR-ILC, Rapporto Annuale},
PAGES = {1--64},
URL = {https://iris.cnr.it/handle/20.500.14243/459251},
}
@TECHREPORT{CEBERIOBERGER_2018_TECHREPORT_CGBHKQRSSS_428733,
AUTHOR = {Ceberio Berger, K. and Gurrutxaga Hernaiz, A. and Baroni, P. and Hicks, D. and Kruse, E. and Quochi, V. and Russo, I. and Salonen, T. and Sarhimaa, A. and Soria, C.},
TITLE = {The DLDP Digital Language Survival Kit},
YEAR = {2018},
ABSTRACT = {Le raccomandazioni del progetto DLDP per la sopravvivenza digitale delle lingue (versione inglese integrale)},
KEYWORDS = {sopravvivenza digitale, lingue minoritarie, less-resourced languages},
PAGES = {38},
URL = {http://www.dldp.eu/sites/default/files/documents/DLDP_Digital-Language-Survival-Kit.pdf},
}
@TECHREPORT{CEBERIOBERGER_2018_TECHREPORT_CGBHKQRSSS_428764,
AUTHOR = {Ceberio Berger, K. and Gurrutxaga Hernaiz, A. and Baroni, P. and Hicks, D. and Kruse, E. and Quochi, V. and Russo, I. and Salonen, T. and Sarhimaa, A. and Soria, C.},
TITLE = {Kit de Supervivencia Lingüística Digital del Euskera-Recomendaciones del DLDP para mejorar la Vitalidad Digital del euskera},
YEAR = {2018},
ABSTRACT = {Le raccomandazioni del progetto DLDP per la sopravvivenza digitale del basco (versione spagnola)},
KEYWORDS = {digital diversity, digital vitality, recommendations, Basque, digital survival},
PAGES = {28},
URL = {http://www.dldp.eu/sites/default/files/documents/DLDP_Digital-Language-Survival-Kit-for-Basque_ES.pdf},
}
@TECHREPORT{CEBERIOBERGER_2018_TECHREPORT_CGBHKQRSSS_428763,
AUTHOR = {Ceberio Berger, K. and Gurrutxaga Hernaiz, A. and Baroni, P. and Hicks, D. and Kruse, E. and Quochi, V. and Russo, I. and Salonen, T. and Sarhimaa, A. and Soria, C.},
TITLE = {Euskarak Mundu Digitalean Bizirauteko Kita-DLDPren gomendioak, euskararen bizitasun digitala hobetu dadin},
YEAR = {2018},
ABSTRACT = {Le raccomandazioni del progetto DLDP per la sopravvivenza digitale della lingua basca (versione basca)},
KEYWORDS = {digital vitality, digital diversity, digital language survival, recommendations, Basque},
PAGES = {27},
URL = {http://www.dldp.eu/sites/default/files/documents/DLDP_Digital-Language-Survival-Kit-for-Basque_EU.pdf},
}
@TECHREPORT{CININI_2018_TECHREPORT_C_345602,
AUTHOR = {Cinini, A.},
TITLE = {LigurArch900: Itinerari di architettura contemporanea in Liguria},
YEAR = {2018},
ABSTRACT = {The APP was conceived as a tool to display search results for a more widespread knowledge of the Patrimony of Contemporary Architecture in Liguria. This APP allows the user to create personal touring itineraries in the city of Genoa, selecting the buildings in which he/she is more interested, according to several query filters (author, period, location, type.). The APP will display the search results of the buildings on geo-referenced maps, associating them to essential information, images, related pertinent bibliographies, with reference to detailed archives},
KEYWORDS = {Android, Mobile, Term extraction},
PAGES = {1--9},
URL = {http://dbtvm1.ilc.cnr.it/Download/app-release_20170318.zip},
}
@TECHREPORT{GINGOLD_2018_TECHREPORT_GDGGMMSSW_381980,
AUTHOR = {Gingold, A. and Di Donato, F. and Gendre, P. and Giglia, E. and Maryl, M. and Mowlam, T. and Sillaume, G. and Staines, H. and Wennström, S.},
TITLE = {OPERAS Tools Research and Development White Paper},
YEAR = {2018},
ABSTRACT = {This white paper has been elaborated by the Tools (R\&D) Working Group, one of the 7 Working Groups launched by the OPERAS research infrastructure. The Working Group goal was to set up a list of tools and development which need to be done, to improve their usability for the OPERAS partners. The approach in OPERAS emphasizes the importance of building the open science scholarly communication infrastructure in Social Sciences and Humanities on community driven tools. In this perspective, the development of Open Source tools and the setup of a toolbox appear to be appropriate answers to the existing needs and evolutions in scholarly publishing. Following a first discussion in the Working Group, participants discussed the partners' practices and needs to help focus the Working Group objectives on three functions: (1) Peer review: interest in emerging practices such as open peer review, peer review tracking; (2) Authoring: interest in simple and all-in-one services, especially online and collaborative authoring; (3) Publishing: in particular, simple tools needed by small academic journals. The main results of the Working Group are: (1) Notes on observed trends; (2) A common approach and criteria for choosing tools; (3) A list of relevant tools, detailing features and functionalities; (4) An analysis of the current needs of the partners. For Peer Review, the reviewing workflow is implemented in most Open Source software like Open Journal System (OJS) but developments are still needed to match the commercial software services. Similarly, the review tracking data available via services such as Publons is currently not open. The emerging trend for Open Peer Review represents an innovative area, both in terms of usage and tools. For Authoring, we see a bloom of new online and collaborative tools. Promising Open Source software for editing structured scholarly content are being developed and are near to production, alongside commercial tools such as Authorea or Overleaf.
One of the main challenges, in this case, is to obtain a continuous production environment through interoperability. For Publishing, several Open Source software solutions are already used in production, but, as the level of service expected from a publication service is rising and includes a growing number of third-party services, the community is considering ways of working together to combine their effort to be comparable with the state of the art of the commercial solutions. The OPERAS partners are willing to go beyond this working group and consider engaging in follow-up projects, notably to help create a resource centre dedicated to providing the community with current information and support on scholarly communication software and tools, and to contribute to the effort in developing Open Source tools},
URL = {https://iris.cnr.it/handle/20.500.14243/381980},
}
@TECHREPORT{HEINEMANN_2018_TECHREPORT_HBDEGJKMS_381982,
AUTHOR = {Heinemann, E. and Bertino, A. and Di Donato, F. and Ekanger, A. and Giglia, E. and Jdraszko, B. and Kaiser, M. and Matthias, L. and Smaniotto, A.},
TITLE = {OPERAS Advocacy White Paper},
YEAR = {2018},
ABSTRACT = {This White Paper has been prepared by the OPERAS (Open Access in the European Research Area through Scholarly Communication) Working Group on Advocacy for Open Access Publishing in the Social Sciences and Humanities. OPERAS is a European research infrastructure for the development of open scholarly communication, particularly in the social sciences and humanities (SSH). The consortium comprises 36 organisations from 13 European countries and is coordinated by a core group of nine members. OPERAS' members come from diverse backgrounds and include publishers and publication platforms, infrastructure providers, libraries, universities, and research organisations. The paper addresses the importance of Open Science for the SSH, highlighting the role of a distributed research infrastructure like OPERAS in advocating for Open Access publishing models. Furthermore, the paper discusses the importance of the SSH in Open Science, showing how Open Science itself benefits from considering and accommodating the needs of researchers from different disciplinary backgrounds. While OPERAS does not endorse a specific Open Access publishing model, the infrastructure partners advocate for publication processes that can meet the present demand for Open Access, transparency, and open source tools in scholarly communication. This document is intended for all stakeholders actively involved in Open Access in the SSH. This includes publishers and publication platforms as well as libraries and infrastructure providers. However, the White Paper ultimately focuses on advocacy targeting researchers at different career stages. In order to support stakeholders in advocating for Open Access, the White Paper presents the benefits of Open Access publishing for scholars, while also addressing common concerns in the SSH research community. 
These include, but are not limited to, reputation, research evaluation, financial issues, a general lack of information, intellectual property rights and other legal concerns, and the availability of Open Access publishing models. This White Paper draws on experiences from OPERAS partners to illustrate researchers' concerns and to develop a guide with FAQs and solutions to address these issues. The White Paper concludes with advocacy suggestion sheets tailored to different stakeholders involved in Open Access in the SSH},
URL = {https://iris.cnr.it/handle/20.500.14243/381982},
}
@TECHREPORT{HICKS_2018_TECHREPORT_HBCGKQRSSS_460811,
AUTHOR = {Hicks, D. and Baroni, P. and Ceberio Berger, K. and Gurrutxaga Hernaiz, A. and Kruse, E. and Quochi, V. and Russo, I. and Salonen, T. and Sarhimaa, A. and Soria, C.},
TITLE = {DLDP etenemissuunnitelma-Toimenpidesuunnitelmat ja aikajana},
YEAR = {2018},
ABSTRACT = {Le raccomandazioni del progetto DLDP rivolte ai decisori politici (versione finlandese sintetica)},
KEYWORDS = {digital vitality, digital diversity, recommendations},
PAGES = {6},
URL = {http://www.dldp.eu/sites/default/files/documents/DLDP-Roadmap_Short-Version_FI.pdf},
}
@TECHREPORT{HICKS_2018_TECHREPORT_HBCGKQRSSS_428760,
AUTHOR = {Hicks, D. and Baroni, P. and Ceberio Berger, K. and Gurrutxaga Hernaiz, A. and Kruse, E. and Quochi, V. and Russo, I. and Salonen, T. and Sarhimaa, A. and Soria, C.},
TITLE = {The DLDP Roadmap},
YEAR = {2018},
ABSTRACT = {Le raccomandazioni del progetto DLDP rivolte ai decisori politici (versione inglese integrale)},
KEYWORDS = {digital vitality, digital diversity, recommendations},
PAGES = {19},
URL = {http://www.dldp.eu/sites/default/files/documents/DLDP_Roadmap.pdf},
}
@TECHREPORT{HICKS_2018_TECHREPORT_HBCGKQRSSS_462989,
AUTHOR = {Hicks, D. and Baroni, P. and Ceberio Berger, K. and Gurrutxaga Hernaiz, A. and Kruse, E. and Quochi, V. and Russo, I. and Salonen, T. and Sarhimaa, A. and Soria, C.},
TITLE = {La Roadmap DLDP-Recommandations de politique et calendrier},
YEAR = {2018},
ABSTRACT = {Le raccomandazioni del progetto DLDP rivolte ai decisori politici (versione francese sintetica)},
KEYWORDS = {digital vitality, digital diversity, recommendations},
PAGES = {6},
URL = {http://www.dldp.eu/sites/default/files/documents/DLDP-Roadmap_Short-Version_FR.pdf},
}
@TECHREPORT{HICKS_2018_TECHREPORT_HBCGKQRSSS_460815,
AUTHOR = {Hicks, D. and Baroni, P. and Ceberio Berger, K. and Gurrutxaga Hernaiz, A. and Kruse, E. and Quochi, V. and Russo, I. and Salonen, T. and Sarhimaa, A. and Soria, C.},
TITLE = {Diversità Linguistica Digitale: la Roadmap-Raccomandazioni strategiche \& Sequenza},
YEAR = {2018},
ABSTRACT = {Le raccomandazioni del progetto DLDP rivolte ai decisori politici (versione italiana sintetica)},
KEYWORDS = {digital vitality, digital diversity, recommendations},
PAGES = {6},
URL = {http://www.dldp.eu/sites/default/files/documents/DLDP-Roadmap_Short-Version_IT.pdf},
}
@TECHREPORT{HICKS_2018_TECHREPORT_HBCGKQRSSS_460814,
AUTHOR = {Hicks, D. and Baroni, P. and Ceberio Berger, K. and Gurrutxaga Hernaiz, A. and Kruse, E. and Quochi, V. and Russo, I. and Salonen, T. and Sarhimaa, A. and Soria, C.},
TITLE = {La DLDP Hoja de Ruta-Políticas recomendadas \& Cronograma},
YEAR = {2018},
ABSTRACT = {Le raccomandazioni del progetto DLDP rivolte ai decisori politici (versione spagnola sintetica)},
KEYWORDS = {digital vitality, digital diversity, recommendations},
PAGES = {6},
URL = {http://www.dldp.eu/sites/default/files/documents/DLDP-Roadmap_Short-Version_ES.pdf},
}
@TECHREPORT{HICKS_2018_TECHREPORT_HBCGKQRSSS_460807,
AUTHOR = {Hicks, D. and Baroni, P. and Ceberio Berger, K. and Gurrutxaga Hernaiz, A. and Kruse, E. and Quochi, V. and Russo, I. and Salonen, T. and Sarhimaa, A. and Soria, C.},
TITLE = {The DLDP Roadmap-Policy Recommendations \& Timeline},
YEAR = {2018},
ABSTRACT = {Le raccomandazioni del progetto DLDP rivolte ai decisori politici (versione inglese sintetica)},
KEYWORDS = {digital vitality, digital diversity, recommendations},
PAGES = {6},
URL = {http://www.dldp.eu/sites/default/files/documents/DLDP-Roadmap_Short-Version_EN.pdf},
}
@TECHREPORT{HICKS_2018_TECHREPORT_HBCGKQRSSS_460816,
AUTHOR = {Hicks, D. and Baroni, P. and Ceberio Berger, K. and Gurrutxaga Hernaiz, A. and Kruse, E. and Quochi, V. and Russo, I. and Salonen, T. and Sarhimaa, A. and Soria, C.},
TITLE = {DLDP Bide Orria-Gomendatutako politikak \& Kronograma},
YEAR = {2018},
ABSTRACT = {Le raccomandazioni del progetto DLDP rivolte ai decisori politici (versione basca sintetica)},
KEYWORDS = {digital vitality, digital diversity, recommendations},
PAGES = {6},
URL = {http://www.dldp.eu/sites/default/files/documents/DLDP-Roadmap_Short-Version_EU.pdf},
}
@TECHREPORT{HICKS_2018_TECHREPORT_HBCGKQRSSS_462988,
AUTHOR = {Hicks, D. and Baroni, P. and Ceberio Berger, K. and Gurrutxaga Hernaiz, A. and Kruse, E. and Quochi, V. and Russo, I. and Salonen, T. and Sarhimaa, A. and Soria, C.},
TITLE = {Die DLDP Roadmap-Strategieempfehlungen \& Zeitplan},
YEAR = {2018},
ABSTRACT = {Le raccomandazioni del progetto DLDP rivolte ai decisori politici (versione tedesca sintetica)},
KEYWORDS = {digital vitality, digital diversity, recommendations},
PAGES = {6},
URL = {http://www.dldp.eu/sites/default/files/documents/DLDP-Roadmap_Short-Version_DE.pdf},
}
@TECHREPORT{HICKS_2018_TECHREPORT_HSBCGKQRSS_421382,
AUTHOR = {Hicks, D. and Soria, C. and Baroni, P. and Ceberio Berger, K. and Gurrutxaga Hernaiz, A. and Kruse, E. and Quochi, V. and Russo, I. and Salonen, T. and Sarhimaa, A.},
TITLE = {Pak treuzveviñ ar Brezhoneg niverel-Erbedoù an DLDP evit gwellaat buhezegezh niverel ar brezhoneg},
YEAR = {2018},
ABSTRACT = {Le raccomandazioni del progetto DLDP per la sopravvivenza digitale del bretone (versione bretone)},
KEYWORDS = {digital vitality, digital diversity, recommendations},
URL = {http://www.dldp.eu/sites/default/files/documents/DLDP_Digital-Language-Survival-Kit-for-Breton_BR.pdf},
}
@TECHREPORT{HICKS_2018_TECHREPORT_HSBCGKQRSS_421387,
AUTHOR = {Hicks, D. and Soria, C. and Baroni, P. and Ceberio Berger, K. and Gurrutxaga Hernaiz, A. and Kruse, E. and Quochi, V. and Russo, I. and Salonen, T. and Sarhimaa, A.},
TITLE = {Kit de survie numerique pour la langue bretonne-Les recommandations du DLDP pour améliorer la vitalité numérique du Breton},
YEAR = {2018},
ABSTRACT = {Le raccomandazioni del progetto DLDP per la sopravvivenza digitale del bretone (versione francese)},
KEYWORDS = {digital vitality, digital diversity, recommendations},
URL = {http://www.dldp.eu/sites/default/files/documents/DLDP_Digital-Language-Survival-Kit-for-Breton_FR.pdf},
}
@TECHREPORT{PELOSI_2018_TECHREPORT_PRRVCBCCSP_388335,
AUTHOR = {Pelosi, G. and Rocchiccioli, S. and Rial, M. and Vozzi, F. and Caselli, C. and Benvenuti, C. and Carpita, D. and Campolo, J. and Sbrana, S. and Parodi, O.},
TITLE = {SMARTool: Interim Progress Report (M19-M30)},
YEAR = {2018},
ABSTRACT = {The period between M19 and M30 has been dedicated to complete and report activities required in order to achieve the objectives of WP1 and WP2 and achieve MS7 as well as MS1 according to the new deadline set in the deviations to the DoA following implementation of the R1 mitigation plan},
URL = {https://iris.cnr.it/handle/20.500.14243/388335},
}
@TECHREPORT{SALONEN_2018_TECHREPORT_SBCGHKQRSS_462987,
AUTHOR = {Salonen, T. and Baroni, P. and Ceberio Berger, K. and Gurrutxaga Hernaiz, A. and Hicks, D. and Kruse, E. and Quochi, V. and Russo, I. and Sarhimaa, A. and Soria, C.},
TITLE = {Karjalan digitualine hengihjiämispakkavus-DLDP-rekomendatsiet karjalan kielen digitualizen elinvoimazuon kohendamizeh},
YEAR = {2018},
ABSTRACT = {Le raccomandazioni del progetto DLDP per migliorare la vitalità digitale della lingua careliana (versione careliana)},
KEYWORDS = {digital vitality, digital diversity, digital language survival, recommendations, Karelian},
PAGES = {12},
URL = {http://www.dldp.eu/sites/default/files/documents/DLDP_Digital-Language-Survival-Kit-for-Karelian_KRL.pdf},
}
@TECHREPORT{SALONEN_2018_TECHREPORT_SBCGHKQRSS_421393,
AUTHOR = {Salonen, T. and Baroni, P. and Ceberio Berger, K. and Gurrutxaga Hernaiz, A. and Hicks, D. and Kruse, E. and Quochi, V. and Russo, I. and Sarhimaa, A. and Soria, C.},
TITLE = {Karjalan digitaalinen kielenselviytymispakkaus-DLDP-suositukset karjalan kielen digitaalisen elinvoimaisuuden parantamiseksi},
YEAR = {2018},
ABSTRACT = {Le raccomandazioni del progetto DLDP per la sopravvivenza digitale della lingua careliana (versione finlandese)},
KEYWORDS = {digital vitality, digital diversity, digital language survival, recommendations, Karelian},
URL = {http://www.dldp.eu/sites/default/files/documents/DLDP_Digital-Language-Survival-Kit-for-Karelian_FI.pdf},
}
@MISC{BELLANDI_2018_MISC_B_350505,
AUTHOR = {Bellandi, A.},
TITLE = {LexO},
YEAR = {2018},
ABSTRACT = {LexO is a web collaborative editor of lexical and termino-ontological resources. LexO is meant to be used mainly by humanists and, thus, hide all the technical complexities related to the adopted formal languages. Being a web application, LexO makes collaborative editing possible: a team of users, each one with his/her own role (lexicographers, domain experts, scholars, etc.), can work on the same resource collaboratively. As a result, resources quickly increase in size and are constantly updated. LexO adheres to international standards for representing lexica and ontologies in the Semantic Web (such as lemon and OWL), so that lexical resources can be shared easily or specific entities can be linked to existing datasets. LexO intends to provide features to link each entity of the resource (being it a form, a term, a concept, etc.) to a text or to a very specific portion of a text, via citational references mechanisms. Conceived to handle historical and ancient lexica and terminologies as well, LexO is flexible and extensible enough to formalize peculiar features of such linguistic resources. The development of LexO has been partially funded by the DFG in the context of the cooperation agreement between prof. Guido Mensching, director of the DiTMAO project at the Seminar für Romanische Philologie of the Georg-August-Universität Göttingen and the Istituto di Linguistica Computazionale "A. Zampolli" of the Italian National Research Council (August 29th, 2016)},
URL = {https://iris.cnr.it/handle/20.500.14243/350505},
}
@MISC{BELLANDI_2018_MISC_BFKM_350511,
AUTHOR = {Bellandi, A. and Frontini, F. and Khan, F. and Monachini, M.},
TITLE = {Parole-Simple-Clip/Morphological Layer in RDF},
YEAR = {2018},
ABSTRACT = {A version in RDF of the morphological layer of the wide coverage multi-level Italian lexicon Parole-Simple-Clips, containing the parts of speech Noun, Verb, Adjective. The dataset is encoded using the ontolex-lemon vocabulary. Information pertaining to inflectional morphology contained in the original resource is converted into Semantic Web Rule Language (SWRL) rules},
URL = {https://iris.cnr.it/handle/20.500.14243/350511},
}
@MISC{BELLANDI_2018_MISC_BM_370097,
AUTHOR = {Bellandi, A. and Marchi, S.},
TITLE = {TALMUD Interfaccia di accesso ontologia Rabbini},
YEAR = {2018},
ABSTRACT = {Interfaccia di accesso e sparql endpoint per l'accesso e la visualizzazione grafica dell'ontologia dei nomi dei rabbini},
URL = {https://iris.cnr.it/handle/20.500.14243/370097},
}
@MISC{CEBERIO_2018_MISC_CGSRQ_420185,
AUTHOR = {Ceberio, K. and Gurrutxaga, A. and Soria, C. and Russo, I. and Quochi, V.},
TITLE = {How to Use the Digital Language Vitality Scale},
YEAR = {2018},
ABSTRACT = {The Digital Language Vitality Scale is an instrument developed within the framework of the Digital Language Diversity Project (www.dldp.eu) for estimating the degree of digital vitality of any given language. It aims to be an instrument for self-assessment of the digital vitality of any language, although it is aimed in particular at identifying current gaps, needs and requirements regarding the extent to which a language community is active/vital on digital media and devices so that adequate digital language planning can be done. This document instructs prospective adopters on how to best use it},
KEYWORDS = {Diversità Linguistica, BLARK, Sopravvivenza linguistica digitale},
PAGES = {18},
URL = {http://www.dldp.eu/sites/default/files/documents/DLDP_Digital-Language-Vitality-Scale.pdf},
}
@MISC{CRISTOFARO_2018_MISC_CDS_426857,
AUTHOR = {Cristofaro, S. and Del Grosso, A. M. and Spampinato, D.},
TITLE = {Chiosco Voci di Pietra},
YEAR = {2018},
ABSTRACT = {Il chiosco multimediale Voci di Pietra è stato installato come postazione in locale all'interno del percorso museale in occasione della omonima mostra. Il totem touch screen permette la navigazione tra le informazioni raccolte nelle schede, nei video e nelle immagini digitalizzate, sia in italiano che in inglese, per favorire l'approfondimento della visita},
KEYWORDS = {Museum, Epigraphy, EpiDoc, TEI},
URL = {https://iris.cnr.it/handle/20.500.14243/426857},
}
@MISC{CRISTOFARO_2018_MISC_CDS_522848,
AUTHOR = {Cristofaro, S. and Del Grosso, A. M. and Spampinato, D.},
TITLE = {Chiosco Multimediale "Voci di pietra"},
YEAR = {2018},
ABSTRACT = {Il chiosco multimediale costituisce la versione web della postazione touch che correda la mostra “Voci di Pietra”, allestita lungo il lato est del museo civico Castello Ursino di Catania. La presenza di un chiosco multimediale all’interno della mostra permette la navigazione tra le informazioni riguardanti il materiale epigrafico e favorisce l’approfondimento della visita. La versione web del chiosco, presente all’interno del museo digitale EpiCUM, segue le stesse direttive pur differenziandosi leggermente dalla postazione in mostra. Fruibile sia in lingua italiana che inglese, infatti, permette di visitare virtualmente i contenuti della mostra "Voci di pietra" muovendosi nel percorso espositivo delle sale. È possibile, inoltre, soffermarsi su ciascuna scheda epigrafica, esaminare attentamente le immagini ad alta risoluzione, apprezzandone i dettagli, leggere commenti e informazioni, confrontare il testo delle iscrizioni in lingua antica con le traduzioni in italiano e in inglese},
KEYWORDS = {Epigrafi, Patrimonio Culturale, Musei, Edizioni Digitali, Chiosco Multimediale},
URL = {https://iris.cnr.it/handle/20.500.14243/522848},
}
@MISC{DELGROSSO_2018_MISC_D_348292,
AUTHOR = {Del Grosso, A. M.},
TITLE = {Verso la definizione e l'implementazione di un processo per la gestione dell'informazione in ambito bibliografico e archivistico},
YEAR = {2018},
ABSTRACT = {L'intervento ripercorre alcune iniziative svolte negli anni passati in collaborazione con il liceo classico Medi-Livatino. Si introduce un processo di digitalizzazione e di analisi di documenti testuali volto alla gestione e allo studio dell'informazione testuale in ambito filologico. In particolare si sottolineano gli aspetti che accomunano il lavoro ingegneristico-tecnologico con quelli maggiormente bibliografici e archivistici relativi alla conservazione e alla fruizione di risorse testuali. Si evidenziano gli sviluppi di attività dedicate alla cultura digitale e all'applicazione di strumenti computazionali per l'analisi e lo studio di testi storici nell'ambito della didattica. In perfetta sintonia quindi con le linee guida del Piano Nazionale Scuola Digitale},
KEYWORDS = {PNSD, liceo classico, biblioteche innovative, archivi digitali},
URL = {https://iris.cnr.it/handle/20.500.14243/348292},
CONFERENCE_NAME = {Cultura Digitale: a scuola di innovazione},
}
@MISC{DELGROSSO_2018_MISC_DM_458609,
AUTHOR = {Del Grosso, A. M. and Marchi, S.},
TITLE = {Bellininrete Web Application},
YEAR = {2018},
ABSTRACT = {Applicazione web sviluppata in seno al progetto Bellininrete per lo studio e la consultazione della corrispondenza del maestro catanese Vincenzo Bellini},
KEYWORDS = {Digital Edition, Digital Scholarly Platform, web application},
URL = {http://bellinicorrespondence.cnr.it/evt},
}
@MISC{DELGROSSO_2018_MISC_DM_458607,
AUTHOR = {Del Grosso, A. M. and Marchi, S.},
TITLE = {Edizione digitale del Rotulo di San Teobaldo},
YEAR = {2018},
ABSTRACT = {Applicazione web per la consultazione dell'edizione digitale del Rotulo di San Teobaldo proprietà della Diocesi di Alba},
KEYWORDS = {digital philology, web application, evt, enhanced visualization},
URL = {https://www.visitmudi.it/rotulo-di-san-teobaldo/},
}
@MISC{DELGROSSO_2018_MISC_DMA_350041,
AUTHOR = {Del Grosso, A. M. and Marchi, S. and Albanesi, D.},
TITLE = {Omega Project: Omega: Piattaforma Multi-modulare per lo studio scientifico del testo},
YEAR = {2018},
ABSTRACT = {Piattaforma per lo studio del testo con prospettiva scientifico-filologica},
KEYWORDS = {digital humanities, computational philology, software engineering},
URL = {https://github.com/literarycomputinglab/OmegaProject},
}
@MISC{DIDONATO_2018_MISC_D_408456,
AUTHOR = {Di Donato, F.},
TITLE = {Dalla parte dell'utente. L'esperienza di Galassia Ariosto e alcune sfide aperte},
YEAR = {2018},
ABSTRACT = {Presentazione del portale Galassia Ariosto alla conferenza Historias Fingidas},
URL = {https://iris.cnr.it/handle/20.500.14243/408456},
}
@MISC{FEDERICO_2018_MISC_FD_344190,
AUTHOR = {Boschetti, F. and Del Grosso, A. M.},
TITLE = {Euporia: Piattaforma digitale per l'annotazione tramite Domain Specific Languages di testi multilingui disposti in parallelo},
YEAR = {2018},
ABSTRACT = {Piattaforma digitale per l'annotazione tramite Domain Specific Languages di testi multilingui disposti in parallelo},
KEYWORDS = {digital humanities, computational philology, digital philology},
URL = {https://github.com/CoPhi/euporia},
}
@MISC{GIOVANNETTI_2018_MISC_GBM_370147,
AUTHOR = {Giovannetti, E. and Bellandi, A. and Marchi, S.},
TITLE = {Ontology of Rabbis of the Babylonian Talmud-RDF version},
YEAR = {2018},
ABSTRACT = {The purpose of this research in progress is to build an ontology of the rabbis appearing in the Babylonian Talmud. The ontology, the construction of which is still in progress, will be shared as a Linked Open Data and linked to existing vocabularies (among which: Wikidata, DBpedia and VIAF). This work is being developed in the context of the Babylonian Talmud Translation Project, where more than 80 talmudists are working together at the translation of the Talmud in Italian, which will include notes and glossaries, and provide the biographies of the Talmudic Masters this ontology is being constructed from. The ontology will constitute the first portion of a more comprehensive Talmudic Knowledge Base where the text itself, the terminology, the entities and the concepts constituting the Babylonian Talmud will be formalized and linked to each other},
URL = {https://iris.cnr.it/handle/20.500.14243/370147},
}
@MISC{PICCINI_2018_MISC_P_404938,
AUTHOR = {Piccini, S.},
TITLE = {Approcci computazionali alla lessicografia e alla terminologia: il caso del lessico di Ferdinand de Saussure},
YEAR = {2018},
ABSTRACT = {L'intervento è volto ad illustrare i principali approcci computazionali adottati oggi nell'ambito della lessicografia e della terminologia computazionali. Si illustra quindi l'applicazione del modello SIMPLE ai fini della creazione di un lessico di dominio, dedicato alla terminologia di Ferdinand de Saussure},
URL = {https://iris.cnr.it/handle/20.500.14243/404938},
}
@MISC{PICCINI_2018_MISC_PB_370152,
AUTHOR = {Piccini, S. and Bellandi, A.},
TITLE = {Totus Mundus-Ancient Chinese Lexicon},
YEAR = {2018},
ABSTRACT = {Totus Mundus-Ancient Chinese Lexicon},
URL = {https://iris.cnr.it/handle/20.500.14243/370152},
}
@MISC{PIRRELLI_2018_MISC_PV_351898,
AUTHOR = {Pirrelli, V.},
TITLE = {NLP-based assessment of reading efficiency in early grade children},
YEAR = {2018},
ABSTRACT = {Assessing reading skills is a laborious and time-consuming task, which requires monitoring a variety of interlocked abilities, ranging from accurate word rendering, reading fluency and lexical access, to linguistic comprehension, and interpretation, management and inference of complex events in working memory. No existing software, to our knowledge, is able to cover and integrate reading performance monitoring, instant feedback, personalised potentiation and intelligent decision support to teachers and speech therapists, assessment of response to intervention. NLP and ICT technologies can make such an ambitious platform an achievable target},
KEYWORDS = {NLP-based methods, reading efficiency, early graders},
PAGES = {5-6},
URL = {http://dcl.bas.bg/clib/wp-content/uploads/2018/07/CLIB_2018_Proceedings_v2_final.pdf},
CONFERENCE_NAME = {Computational Linguistics in Bulgaria},
}
@MISC{PROIETTI_2018_MISC_P_404515,
AUTHOR = {Proietti, C.},
TITLE = {« Paradoxe », version académique},
YEAR = {2018},
ABSTRACT = {Dès l'âge classique et pendant toutes les époques suivantes la philosophie et la pensée scientifique ont été confrontées à un grand nombre de paradoxes. Ceux-ci ont souvent joué le rôle de curiosités, ou bien de casse-tête et exercices de pensée (comme les insolubilia de la scolastique médiévale). Toutefois, dans beaucoup de cas les paradoxes ont servi de véritable stimulus et moyen de révision des théories scientifiques. Dans cet article, nous allons d'abord présenter deux étapes fondamentales de l'histoire des paradoxes, les paradoxes de Zénon et ceux de la théorie des ensembles d'entre la fin du XIXe et le début du XXe siècle. Les sections qui suivent se concentrent sur les dilemmes moraux, les paradoxes de la connaissance, et les paradoxes de la vérité. Le but est d'introduire le lecteur à certains des problèmes centraux dans les domaines de la philosophie morale, de l'épistémologie et de la philosophie théorétique. Cela est fait à travers l'analyse structurelle de certains des paradoxes les plus débattus dans ces domaines, l'exposition des approches majeures pour leur solution ainsi que de leur motivation théorique},
KEYWORDS = {Paradoxe},
URL = {http://encyclo-philo.fr/paradoxe-a/},
EDITOR = {Kristanek, M.},
}
@MISC{PROIETTI_2018_MISC_P_404093,
AUTHOR = {Proietti, C.},
TITLE = {« Paradoxe », version Grand Public},
YEAR = {2018},
ABSTRACT = {Dans son usage courant, le mot paradoxe indique une opinion absurde, extravagante, ou en tout état de cause inacceptable par rapport à ce qui est considéré comme connaissance commune. Cette acception est aussi manifeste dans son étymologie grecque pará dóxa, littéralement « opinion contre ». Toutefois, afin que l'on puisse proprement parler d'un paradoxe, une telle opinion doit être supportée par un argument. On peut en fait définir un paradoxe comme un argument dont la conclusion est inacceptable tout en étant dérivée à partir de prémisses en apparence acceptables, et au moyen d'un raisonnement apparemment correct (Sainsbury 2009). Dans une telle définition, certains termes sont plutôt vagues ou ambigus, comme par exemple « prémisse acceptable » ou bien encore « raisonnement apparemment correct ». Une définition plus précise risque cependant de contraindre de manière excessive l'usage du mot, ainsi que d'exclure bon nombre de propriétés caractéristiques du concept. Il est utile ici de clarifier la notion de paradoxe par ses instances plus ou moins typiques, afin d'une part de mieux comprendre son extension, et d'autre part de montrer que caractériser un argument comme paradoxal est chose relative},
KEYWORDS = {Paradoxe},
URL = {http://encyclo-philo.fr/paradoxe-gp/},
EDITOR = {Kristanek, M.},
}
@MISC{SASSI_2018_MISC_S_372952,
AUTHOR = {Sassi, M. L. G.},
TITLE = {Léxico del Tratado del esphera y del arte de marear con el regimiento de las alturas, con algunas reglas nuevamente escritas muy necessarias de Francisco de Falero},
YEAR = {2018},
ABSTRACT = {El léxico del Tratado del esphera y del Arte del marear de Francisco Faleiro, forma parte del conjunto lexicográfico del Diccionario de la navegación del Siglo de Oro. Para la realización de este diccionario, se ha contado con dos proyectos de investigación: HUM2006, financiado por el Ministerio de Educación y Ciencia de España, y FFI2012-36768, del Ministerio de Economía y Competitividad y cuatro ayudas de movilidad: dos concedidas por el Consiglio Nazionale della Ricerca italiano, CNR [Istituto di Linguistica Computazionale de Italia (2006 y 2007)] y dos por el Ministerio de Ciencia e Innovación de España [Programa de Estancias de Profesores de Universidad e Investigadores del CSIC en Centros de Investigación Extranjeros (2005 y 2010)]. Este volumen contiene la concordancia lematizada, los índices de frecuencia de lemas y formas, los índices de los nombres propios y el diccionario inverso del Tratado},
URL = {https://iris.cnr.it/handle/20.500.14243/372952},
ISBN = {978-84-362-7383-0},
}
@MISC{SORIA_2018_MISC_S_375532,
AUTHOR = {Soria, C.},
TITLE = {Minority languages in the digital world. Empowering language communities to increase digital language diversity},
YEAR = {2018},
ABSTRACT = {The rich cultural tapestry of European linguistic diversity is severely underrepresented on digital media and almost completely excluded from the digital services which are usually available in EU official languages. In the digital domain speakers of EU regional and minority languages have fewer opportunities to use their language compared to speakers of major languages. As the world becomes increasingly digitized, those speakers are facing a 'digital timebomb', as their languages are unable to match the pace of digital development for dominant languages. Unless the rate of digital development and provision is improved for regional and minority languages, and in a language domain where it's vital to attract young people to the language, speakers of these RMLs will become increasingly marginalized and excluded. In this talk, I will present the concept, mission and outcomes of the Digital Language Diversity Project, the aim of which is to provide tools and materials for empowering language communities and strengthening the digital presence and use of their language},
URL = {https://iris.cnr.it/handle/20.500.14243/375532},
}
@ARTICLE{BARTOLINI_2017_ARTICLE_BPGGB_332319,
AUTHOR = {Bartolini, R. and Pardelli, G. and Goggi, S. and Giannini, S. and Biagioni, S.},
TITLE = {A terminological "journey" in the Grey Literature domain},
YEAR = {2017},
ABSTRACT = {"It is by means of terms that the expert usually transfer their knowledge and again through terms scientific communication reaches the highest effectiveness. Therefore we can assert that terminology-in the sense of a set of representative and domain-specific units-is necessary for representing and connecting specialized fields as well as any attempt to represent and/or transfer scientific knowledge requires, more or less extensively, the use of terminology." (Cabré, 2000). "When we read the articles or papers of a particular domain, we can recognize some lexical items in the texts as technical terms. In a domain where new knowledge is generated, new terms are constantly created to fulfill the needs of the domain, while others become obsolete. In addition, existing terms may undergo changes of meaning." (Kageura K., 1998/1999). Specialized lexicons are made up of the terms which are specific to each field of knowledge, «a subset which is distinct but not separated from the common language» (Cassese, 1992): it is usually difficult to extract the relevant domain-specific terminology, meaning to discern terms which belong to a specialized glossary from those belonging to the common dictionary. The interest in the study of terminology and the "truth" contained in the above definitions has led us to make a "journey" in the Grey Literature (GL) domain in order to offer an overall vision on the terms used and the links between them. Within this scenario, the work analyzes a corpus constituted of the entire amount of full research papers published in the GL conference series over a time-span of more than one decade (2003-2014) with the aim of creating a terminological map of relevant words in the various GL research topics. "... corpora used to extract terminological units can be further investigated to find semantic and conceptual information on terms or to represent conceptual relationships between terms." (Bourigault D. et al., 2001).
Another interesting inquiry is the terminology used in the GL conferences for describing the types of documents which can be detected (Pejšová P. et al., 2012)},
KEYWORDS = {Grey Literature, Information Extraction IE, Terminology},
PAGES = {41-53},
URL = {http://www.greynet.org/thegreyjournal/currentissue.html},
VOLUME = {13 (1)},
ISSN = {1574-1796},
JOURNAL = {THE GREY JOURNAL},
}
@ARTICLE{BIZZONI_2017_ARTICLE_BRD_341647,
AUTHOR = {Bizzoni, Y. and Reboul, M. and Del Grosso, A. M.},
TITLE = {Diachronic trends in Homeric translations},
YEAR = {2017},
ABSTRACT = {This field of study is part of the more general "Classical Receptions" studies that try to analyse the influence and adaptation of classical texts in modern and contemporary literature, theatre, cinema, and many other artistic fields. While Greek texts have been analysed by scholars for more than two thousand years, research about classical translations is not yet a most renown subject. In recent years this theme has raised a growing interest in the academic community},
KEYWORDS = {Digital Humanities, Diachronic translations, Software design and engineering, Natural Language Processing},
PAGES = {26},
URL = {http://www.digitalhumanities.org/dhq/vol/11/2/000297/000297.html},
VOLUME = {11 (2)},
ISSN = {1938-4122},
JOURNAL = {DIGITAL HUMANITIES QUARTERLY},
}
@ARTICLE{BOMPOLAS_2017_ARTICLE_BFMCP_336890,
AUTHOR = {Bompolas, S. and Ferro, M. and Marzi, C. and Cardillo, F. A. and Pirrelli, V.},
TITLE = {For a performance-oriented notion of regularity in inflection: the case of Modern Greek conjugation},
YEAR = {2017},
ABSTRACT = {Paradigm-based approaches to word processing/learning assume that word forms are not acquired in isolation, but through associative relations linking members of the same word family (e.g. a paradigm, or a set of forms filling the same paradigm cell). Principles of correlative learning offer a set of equations that are key to modelling this complex dynamic at a considerable level of detail. We use these equations to simulate acquisition of Modern Greek conjugation, and we compare the results with evidence from German and Italian. Simulations show that different Greek verb classes are processed and acquired differentially, as a function of their degrees of formal transparency and predictability. We relate these results to psycholinguistic evidence of Modern Greek word processing, and interpret our findings as supporting a view of the mental lexicon as an emergent integrative system},
KEYWORDS = {paradigm-based morphology, gradient (ir)regularity, recurrent self-organising networks},
PAGES = {77-92},
URL = {http://www.ai-lc.it/IJCoL/v3n1/IJCOL_3_1_5_bompolas_et_al.pdf?v=2a47ad90f2ae},
VOLUME = {3 (1)},
ISSN = {2499-4553},
JOURNAL = {IJCOL},
}
@ARTICLE{BOSCHETTI_2017_ARTICLE_B_338981,
AUTHOR = {Boschetti, F.},
TITLE = {Estrarre parole dalle immagini nell'era digitale: alcune osservazioni sull'OCR storico},
YEAR = {2017},
ABSTRACT = {This article discusses techniques and practices aimed at the extraction of textual content from images related to printed editions. Optical Character Recognition (Ocr) applied to scholarly editions of classical texts or applied to early printed editions is a challenging task, due to material issues, such as the bad quality of papers damaged by time, or due to linguistic issues, such as the lack of linguistic models suitable to a specific linguistic variety. This article illustrates some common strategies aimed at improving historic Ocr accuracy, such as the alignment of the textual sequences generated by different Ocr engines and the incremental enrichment of suitable linguistic models. Finally, some practices of collaborative Ocr proof-reading are described and discussed},
URL = {https://iris.cnr.it/handle/20.500.14243/338981},
ISSN = {1826-901X},
JOURNAL = {LA RIVISTA DI ENGRAMMA},
}
@ARTICLE{BURGASSI_2017_ARTICLE_B_341297,
AUTHOR = {Burgassi, C.},
TITLE = {Le traduzioni dei classici attribuite a Boccaccio alla luce del Dizionario dei Volgarizzamenti (DiVo)},
YEAR = {2017},
ABSTRACT = {Le traduzioni medievali di Tito Livio suscitano particolare interesse in ragione della loro discussa paternità. Pur in assenza di sicure firme d'autore, queste ponderose trasposizioni in volgare, in tutto o in parte, sono state più volte e con vari criteri ricondotte alla penna prestigiosa di Giovanni Boccaccio. Anche a questa annosa ipotesi attributiva, come ad altre questioni di altro ordine e rilievo, si propone di fornire un contributo apprezzabile il progetto di ricerca intitolato "DiVo-Dizionario dei Volgarizzamenti". Il corpus testuale promosso dal DiVo, che contiene il testo integrale dei volgarizzamenti di Livio associati, paragrafo per paragrafo, al latino, rende possibile verificare sistematicamente le diverse strategie delle traduzione, con speciale riferimento alle opzioni lessicali e stilistiche. I risultati così ottenuti da una parte illuminano le molteplici possibilità della traslazione dal sistema linguistico del latino a quello del volgare, dall'altra gettano luce anche in ottica più ampia sul rapporto fra lingua del volgarizzatore(-i) e lingua in uso presso gli autori del medioevo. Nello specifico sono presi in considerazione alcuni (supposti) segnali di continuità fra l'inventario lessicale e stilistico proprio di Boccaccio e quello del traduttore antico di Livio, con particolare riferimento alla resa in volgare della famiglia di PRAECIPITARE},
KEYWORDS = {Boccaccio, volgarizzamenti, lessico antico},
PAGES = {161-179},
URL = {http://www.heliotropia.org/14/burgassi.pdf},
VOLUME = {14},
ISSN = {1542-3352},
JOURNAL = {HELIOTROPIA},
}
@ARTICLE{BURGASSI_2017_ARTICLE_B_341302,
AUTHOR = {Burgassi, C.},
TITLE = {Il "cerchio tetro" di Dante e il "cammin" di Boccaccio},
YEAR = {2017},
ABSTRACT = {This paper offers a semantic survey of the word form tetro in Boccaccio's vernacular works. The adjective tetro, first employed by Dante in his Commedia with the meaning 'dark, gloomy', proves to be an extremely unusual word in the Italian language of the Middle Ages and therefore possibly difficult to understand. Starting off the analysis with Boccaccio's Esposizioni sopra la Comedia di Dante, it is firstly pointed out that the word form tetro occurring in Dante's Inferno («cerchio tetro», 7.31) is not connected by Boccaccio to the meaning 'dark, gloomy'. According to Boccaccio, tetro rather means 'worn out by use'. After a brief review of the use of the adjective taeter in Boccaccio's Latin works, it is then observed that the meaning of the word form tetro occurring in Teseida and Rime seems to closely correspond with the semantic interpretation of tetro in the Esposizioni ('worn out by use'). A possible explanation of such an interpretation by Boccaccio is finally presented},
KEYWORDS = {Boccaccio, Dante, Lessico antico},
PAGES = {29-46},
URL = {https://iris.cnr.it/handle/20.500.14243/341302},
VOLUME = {45},
ISSN = {0585-4997},
JOURNAL = {STUDI SUL BOCCACCIO},
}
@ARTICLE{CONNOR_2017_ARTICLE_CCVR_313924,
AUTHOR = {Connor, R. and Cardillo, F. A. and Vadicamo, L. and Rabitti, F.},
TITLE = {Hilbert exclusion: improved metric search through finite isometric embeddings},
YEAR = {2017},
ABSTRACT = {Most research into similarity search in metric spaces relies on the triangle inequality property. This property allows the space to be arranged according to relative distances to avoid searching some subspaces. We show that many common metric spaces, notably including those using Euclidean and Jensen-Shannon distances, also have a stronger property, sometimes called the four-point property: In essence, these spaces allow an isometric embedding of any four points in three-dimensional Euclidean space, as well as any three points in two-dimensional Euclidean space. In fact, we show that any space that is isometrically embeddable in Hilbert space has the stronger property. This property gives stronger geometric guarantees, and one in particular, which we name the Hilbert Exclusion property, allows any indexing mechanism which uses hyperplane partitioning to perform better. One outcome of this observation is that a number of state-of-the-art indexing mechanisms over high-dimensional spaces can be easily refined to give a significant increase in performance; furthermore, the improvement given is greater in higher dimensions. This therefore leads to a significant improvement in the cost of metric search in these spaces},
KEYWORDS = {Similarity search, Metric space, Metric indexing, Four-point property, Hilbert embedding, H. Information systems. Data structures, H. Information systems. Multidimensional range search, H. Information systems. Proximity search, H. Information systems. Database query processing, H. Information systems. Retrieval models and ranking, Information systems. Retrieval efficiency, H. Information systems. Multimedia information systems, F. Theory of computation. Random projections and metric embeddings},
PAGES = {17-27},
URL = {http://doi.acm.org/10.1145/3001583},
VOLUME = {35 (3)},
DOI = {10.1145/3001583},
ISSN = {1046-8188},
JOURNAL = {ACM TRANSACTIONS ON INFORMATION SYSTEMS},
}
@article{FERRARI_2017_ARTICLE_FDEGG_341661,
  author   = {Ferrari, A. and Dell'Orletta, F. and Esuli, A. and Gervasi, V. and Gnesi, S.},
  title    = {Natural language requirements processing: a 4D vision},
  journal  = {IEEE SOFTWARE},
  year     = {2017},
  volume   = {34 (6)},
  pages    = {28-35},
  issn     = {0740-7459},
  doi      = {10.1109/MS.2017.4121207},
  url      = {http://ieeexplore.ieee.org/abstract/document/8106888/},
  keywords = {Natural Language Processing, Requirement Processing},
  abstract = {Natural language processing (NLP) and requirements engineering (RE) have had a long relationship, yet their combined use isn't well established in industrial practice. This situation should soon change. The future evolution of the application of NLP technologies in RE can be viewed from four dimensions: discipline, dynamism, domain knowledge, and datasets},
}
@article{GIANNINI_2017_ARTICLE_GBGP_332320,
  author   = {Giannini, S. and Biagioni, S. and Goggi, S. and Pardelli, G.},
  title    = {Grey Literature Citations in the age of Digital Repositories and Open Access},
  journal  = {THE GREY JOURNAL},
  year     = {2017},
  volume   = {13 (1)},
  pages    = {23-31},
  issn     = {1574-1796},
  url      = {http://www.greynet.org/thegreyjournal/currentissue.html},
  keywords = {Grey Literature, Citations},
  abstract = {The work measures grey citations in the years 2012, 2013 and 2014 and then describes the features of GL documents cited in different areas of knowledge: Computational Linguistics, Computer Science and Engineering. With the aim of surveying a wide and varied range of resources, we selected a sample data based on the bibliographical references of articles contained in four journals-all indexed by Scopus Citation Database and ISI Web of Science, with an Impact Factor (IF) over the last three years-and two proceedings of international conferences held in 2012 and 2014},
}
@article{GIOVANNETTI_2017_ARTICLE_GABB_354702,
  author   = {Giovannetti, E. and Albanesi, D. and Bellandi, A. and Benotto, G.},
  title    = {Traduco: A collaborative web-based CAT environment for the interpretation and translation of texts},
  journal  = {DIGITAL SCHOLARSHIP IN THE HUMANITIES},
  year     = {2017},
  volume   = {32 (1)},
  pages    = {47-62},
  issn     = {2055-7671},
  doi      = {10.1093/llc/fqw054},
  url      = {http://dsh.oxfordjournals.org/content/early/2016/10/26/llc.fqw054},
  keywords = {computer-assisted translation, talmud, progetto traduzione del talmud babilonese},
  abstract = {Traduco is a web-based collaborative tool aimed at supporting the translation of texts that pose particular challenging interpretative issues. Nowadays, Computer-Assisted Translation (CAT) tools are mainly applied to the translation of technical manuals or legislative texts and are aimed at speeding up the translation process. Traduco extends most of the standard components of a traditional CAT tool with specific features necessary to support the interpretation and translation of complex texts (like the Babylonian Talmud, that we here present as a case study), which pose particular comprehension issues. Traduco goes beyond the translation and its printing: it includes features for the addition of notes and annotations and the creation of glossaries. Translators, editors, supervisors, and end-users accessing Traduco are able to use components that can ease the translation process through the use of CAT technologies, the supervision and managing of the whole process of translation and publishing, the exporting of translations and notes in standard formats for desktop publishing software and TEI format, and, soon, the possibility to perform automatic linguistic analysis of the text. Moreover, Traduco allows the users to insert notes, comments, annotations, and bibliographical references. The design and development of Traduco required the adoption of a multidisciplinary approach, leveraging on advances in software engineering, computational linguistics, knowledge engineering, and publishing},
}
@article{GUADAGNINI_2017_ARTICLE_G_348585,
  author   = {Guadagnini, E.},
  title    = {La lexicographie de l'Italien médiéval et les corpora de l'OVI: un bilan provisoire et quelques nouvelles perspectives},
  journal  = {DIACHRONIQUES},
  year     = {2017},
  volume   = {7},
  pages    = {101-120},
  issn     = {2118-2698},
  url      = {https://iris.cnr.it/handle/20.500.14243/348585},
  keywords = {OVI, TLIO, Lessicografia, Linguistica italiana},
  abstract = {Breve storia e presentazione del TLIO e dei corpora dell'OVI},
}
@article{MANCINI_2017_ARTICLE_MP_446684,
  author   = {Mancini, L. and Pedretti, I.},
  title    = {Un caso di integrazione tra Public History, Cultural Heritage e Digital Humanities: l'Archivio storico della Pontificia Università Gregoriana e il progetto Clavius@School},
  journal  = {UMANISTICA DIGITALE},
  year     = {2017},
  volume   = {1},
  pages    = {19-27},
  issn     = {2532-8816},
  doi      = {10.6092/issn.2532-8816/7194},
  url      = {https://iris.cnr.it/handle/20.500.14243/446684},
  keywords = {Clavius on the web, Cristoforo Clavio, Cultural Heritage, Digital Humanities, Public History},
  abstract = {The Historical Archive of the Pontifical Gregorian University (APUG) has started a research project on one of its most important collections, the Christophorus Clavius's (1538-1612) correspondence. The Clavius on the web project has been enriched by the involvement of teachers and students from three Rome high schools: the Liceo Ennio Quirino Visconti, the Liceo Virgilio and the Liceo Aristofane. The name of this experience is Clavius@school. After a brief presentation about APUG, its activities and Clavius, this paper describes the work done with schools, starting from a philosophical perspective that analyzes technology according to its broader meaning},
}
@article{MARZI_2017_ARTICLE_MFN_317449,
  author   = {Marzi, C. and Ferro, M. and Nahli, O.},
  title    = {Arabic word processing and morphology induction through adaptive memory self-organisation strategies},
  journal  = {JOURNAL OF KING SAUD UNIVERSITY. COMPUTER AND INFORMATION SCIENCES},
  year     = {2017},
  volume   = {29 (2)},
  pages    = {179-188},
  issn     = {2213-1248},
  doi      = {10.1016/j.jksuci.2016.11.006},
  url      = {http://www.sciencedirect.com/science/article/pii/S1319157816301148},
  keywords = {Non-concatenative morphological structure, Lexical storage and access, Topological alignment, Synchronisation, Self-Organising Maps},
  abstract = {Aim of the present study is to model the human mental lexicon, by focussing on storage and processing dynamics, as lexical organisation relies on the process of input recoding and adaptive strategies for long-term memory organisation. A fundamental issue in word processing is represented by the emergence of the morphological organisation level in the lexicon, based on paradigmatic relations between fully-stored word forms. Morphology induction can be defined as the task of perceiving and identifying morphological formatives within morphologically complex word forms, as a function of the dynamic interaction between lexical representations and distribution and degrees of regularity in lexical data. In the computational framework we propose here (TSOMs), based on Self-Organising Maps with Hebbian connections defined over a temporal layer, the identification/perception of surface morphological relations involves the alignment of recoded representations of morphologically-related input words. Facing a non-concatenative morphology such as the Arabic inflectional system prompts a reappraisal of morphology induction through adaptive organisation strategies, which affect both lexical representations and long-term storage. We will show how a strongly adaptive self-organisation during training is conducive to emergent relations between word forms, which are concurrently, redundantly and competitively stored in human mental lexicon, and to generalising knowledge of stored words to unknown forms},
}
@ARTICLE{SALVATORI_2017_ARTICLE_SRADMM_493650,
AUTHOR = {Salvatori, E. and Rosselli Del Turco, R. and Alzetta, C. and Di Pietro, C. and Mannari, C. and Miaschi, A.},
TITLE = {The Codice Pelavicino between digital edition and Public History},
YEAR = {2017},
ABSTRACT = {The Codice Pelavicino Digitale Project aims to publish an online digital edition of the relevant manuscript of the XIII century. In this paper features of the edition and related issues are addressed. Secondly we explain motivations for choosing a digital edition as a medium: we address the background, and common concerns in the context of Academy and clerical and historical archives. Finally we give insights on the international standard adopted to markup the text, i. e. XML-TEI, and EVT, a tool adopted to generate the final website and display texts and images},
KEYWORDS = {Diplomatica, Filologia digitale, Latino medievale, Storia pubblica, TEI XML},
PAGES = {105-117},
URL = {https://iris.cnr.it/handle/20.500.14243/493650},
VOLUME = {1},
DOI = {10.6092/issn.2532-8816/7232},
ISSN = {2532-8816},
JOURNAL = {UMANISTICA DIGITALE},
}
@article{VENTURI_2017_ARTICLE_VDMFB_342151,
  author   = {Venturi, G. and Dell'Orletta, F. and Montemagni, S. and Flore, E. and Bellandi, T.},
  title    = {La qualità dei consensi informati. Un'analisi linguistico-computazionale della leggibilità dei testi},
  journal  = {SALUTE E TERRITORIO},
  year     = {2017},
  volume   = {212},
  pages    = {35-39},
  issn     = {0392-4505},
  url      = {http://www.formas.toscana.it/rivistadellasalute/fileadmin/files/fascicoli/2017/212/SeT_fascicolo_212.pdf},
  keywords = {Consenso informato, valutazione automatica della leggibilità, Trattamento Automatico del Linguaggio},
  abstract = {La leggibilità dei testi delle informative di consenso per le procedure diagnostico-terapeutiche è un requisito fondamentale, per offrire alle persone assistite l'accesso alle informazioni necessarie a una scelta consapevole delle opzioni disponibili per curare i diversi problemi di salute. La disponibilità di un testo leggibile è inoltre un aiuto per i medici responsabili della comunicazione e della raccolta del consenso, che possono impiegarlo come un ausilio alle informazioni presentate in forma verbale durante il colloquio, in modo tale da poter condividere una base di conoscenze minime da condividere con il paziente e i suoi familiari. Seppure le evidenze siano limitate in merito alla relazione tra la qualità del consenso e l'attitudine al contenzioso da parte dei pazienti in caso di trattamenti che esitano in un danno attribuibile alle cure (Durand et al., 2015), si tratta di un ambito di ricerca di crescente interesse nella letteratura sulla sicurezza (Wu et al., 2005; Manta et al., 2017). Nella casistica regionale della Toscana sulle richieste di risarcimento, solo l'1% dei sinistri include problemi di consenso informato (dati Centro GRC), probabilmente anche a causa di una sottovalutazione del diritto all'informazione da parte dei cittadini che si sottopongono a interventi programmati, connessa con una limitata consapevolezza del potere di scegliere le proprie cure che ogni persona dovrebbe poter esercitare posta di fronte alle opzioni terapeutiche disponibili per i propri problemi di salute},
}
@book{BURGASSI_2017_BOOK_BG_351415,
  author   = {Burgassi, C. and Guadagnini, E.},
  title    = {La tradizione delle parole. Sondaggi di lessicologia storica},
  year     = {2017},
  isbn     = {9782372760164},
  url      = {https://iris.cnr.it/handle/20.500.14243/351415},
  abstract = {Se la tradizione è trasmissione nel tempo e insieme l'eredità di ogni tempo, descrivere la tradizione delle parole significa valutare come queste cambino nella storia e in che misura il loro uso risponda alle istanze particolari di ogni epoca. Lo studio del lessico, in quest'ottica, coinvolge la dialettica tra i documenti e il quadro culturale complessivo, tra l'uno e il molteplice, tra attestazioni e lingua. I sondaggi di lessicologia storica, qui presentati, illustrano il 'comportamento' di alcune parole che appartengono oggi al vocabolario di base italiano e che hanno visto mutare nei secoli, dal Medioevo all'Età contemporanea, il loro statuto, intenso come la 'posizione' (nucleare / periferica) occupata nel lessico. La stima della posizione lessicale in una fase storica della lingua poggia su un metodo di analisi che considera vari parametri, proposti nella prima parte del volume e applicati, nella seconda parte, allo studio di casi. Le implicazioni con i problemi classici della storia della lingua e con il dibattito sul cambiamento lessicale sono tracciate nella terza parte del libro, che mira a profilare, da angolature diverse e complementari, l'insieme delle questioni pertinenti alla tradizione delle parole},
}
@incollection{AMATO_2017_INCOLLECTION_ACF_339526,
  author           = {Amato, G. and Cardillo, F. A. and Falchi, F.},
  title            = {Technologies for visual localization and augmented reality in smart cities},
  booktitle        = {Sensing the Past: From artifact to historical site},
  editor           = {Masini, N. and Soldovieri, F.},
  year             = {2017},
  pages            = {429-434},
  publisher        = {Springer International Publishing (Switzerland, CHE)},
  conference_place = {Switzerland},
  isbn             = {978-3-319-50518-3},
  doi              = {10.1007/978-3-319-50518-3_20},
  url              = {https://link.springer.com/chapter/10.1007%2F978-3-319-50518-3_20},
  keywords         = {Localization, Augmented reality, Deep learning, Smart cities, Landmark recognition},
  abstract         = {The widespread diffusion of smart devices, such as smartphones and tablets, and the new emerging trend of wearable devices, such as smart glasses and smart watches, has pushed forward the development of applications where the user can interact relying on his or her position and field of view. In this way, users can also receive additional information in augmented reality, that is, seeing the information through the smart device, overlaid on top of the real scene. The GPS or the compass can be used to localize the user when augmented reality has to be provided with scenes of large size, for instance, squares or large buildings. However, when augmented reality has to be offered for enriching the view of small objects or small details of larger objects, for instance, statues, paintings, or epigraphs, a more precise positioning is needed. Visual object recognition and tracking technologies offer very detailed and fine-grained positioning capabilities. This chapter discusses the techniques enabling a precise positioning of the user and the subsequent experience in augmented reality, focusing on algorithms for image matching and homography estimation between the images seen by smart devices and images representing objects of interest},
}
@INCOLLECTION{BOSCHETTI_2017_INCOLLECTION_B_381122,
AUTHOR = {Boschetti, F.},
TITLE = {Alcune note di ecdotica digitale nella prospettiva della filologia collaborativa e cooperativa},
YEAR = {2017},
ABSTRACT = {In the digital age, classical philology is becoming more and more collaborative and cooperative. Even if these terms are apparently synonyms, the distinction adopted by pedagogues in the last decades is useful to describe different ways to organise collective works. Collaboration aims at the realisation of a final product, which is the result of negotiations among the involved parts. Cooperation aims at the creation of independent subproducts, which will be coordinated to achieve the agreed final result, but which can also be assembled in unpredictable new ways by third parties. In order to integrate these approaches in the domain of classical philology, first of all it is necessary to clarify the needs of a typical philologist, not just the requirements of the user of a specific project. For this reason, the last part of the article is devoted to a case study that takes into account the exploration of the secondary literature, often neglected by digital philologists but crucial to the ecdotic best practices},
URL = {https://iris.cnr.it/handle/20.500.14243/381122},
DOI = {10.14277/978-88-6969-182-9/ANT_14},
PUBLISHER = {Edizioni Ca' Foscari (Venezia, ITA)},
ISBN = {9788869691836},
BOOKTITLE = {Strumenti digitali e collaborativi per le Scienze dell'antichità},
EDITOR = {Mastandrea, P.},
}
@incollection{BOSCHETTI_2017_INCOLLECTION_BDD_336800,
  author   = {Boschetti, F. and Del Gratta, R. and Del Grosso, A. M.},
  title    = {The role of digital scholarly editors in the design of components for cooperative philology},
  year     = {2017},
  isbn     = {978-90-8890-484-4},
  url      = {https://iris.cnr.it/handle/20.500.14243/336800},
  abstract = {This contribution is focused on the role of the digital scholarly editor in the continuous process of analysis, development and evaluation of libraries of components for cooperative philology},
}
@INCOLLECTION{BURGASSI_2017_INCOLLECTION_BG_341306,
AUTHOR = {Burgassi, C. and Guadagnini, E.},
TITLE = {L'integrazione lessicale di "facile" nel vocabolario italiano},
YEAR = {2017},
ABSTRACT = {Il contributo è dedicato a precisare lo statuto lessicale di "facile" e dei suoi concorrenti onomasiologici (come "agevole") in italiano antico, in dialogo con quanto è documentato per le altre lingue neolatine, nel solco degli studi relativi alla (s)fortuna romanza della base lat. FACILIS},
KEYWORDS = {Lessico antico, lingue romanze, onomasiologia},
PAGES = {157-177},
URL = {https://iris.cnr.it/handle/20.500.14243/341306},
PUBLISHER = {Edizioni dell'Orso (Alessandria, ITA)},
ISBN = {978-88-6274-783-7},
CONFERENCE_PLACE = {Alessandria},
BOOKTITLE = {"Rem tene, verba sequentur". Latinità e medioevo romanzo: testi e lingue in contatto},
EDITOR = {Guadagnini, E. and Vaccaro, G.},
}
@INCOLLECTION{COPPOLA_2017_INCOLLECTION_CMRT_330654,
AUTHOR = {Coppola, D. and Moretti, R. and Russo, I. and Tranchida, F.},
TITLE = {In quante lingue mangi? Tecniche glottodidattiche e language testing in classi plurilingui e ad abilità differenziata},
YEAR = {2017},
ABSTRACT = {La diversità linguistica e culturale costituisce oggi una caratteristica strutturale delle nostre scuole. La necessità, caldeggiata dai principali documenti nazionali ed europei sull'educazione, di considerare le lingue "immigrate", assieme a tutte le altre presenti in classe, come un'importante risorsa linguistica e culturale per gli alunni, impone la ricerca di metodologie d'insegnamento idonee a valorizzare l'intero repertorio linguistico dei ragazzi e di prove di verifica atte a testare in modo più adeguato le loro competenze linguistico-comunicative, senza trascurare gli importanti aspetti culturali veicolati dalle diverse lingue. Il presente contributo riporta i primi dati di un'indagine che si colloca nell'ambito di una più ampia sperimentazione, avviata nel gennaio 2015, in alcune classi del quinto anno della scuola primaria e del primo anno della secondaria di primo grado della provincia di Firenze, con l'obiettivo di implementare tecniche glottodidattiche cooperative supportate dalla tecnologia in classi plurilingui e ad abilità differenziata},
KEYWORDS = {language testing, glottodidattica, plurilinguismo},
PAGES = {199-231},
URL = {https://iris.cnr.it/handle/20.500.14243/330654},
PUBLISHER = {Pisa University Press (Pisa, ITA)},
ISBN = {978-88-6741-789-6},
CONFERENCE_PLACE = {Pisa},
BOOKTITLE = {Strutture linguistiche e dati empirici in diacronia e sincronia},
EDITOR = {Marotta, G. and Strik Lievers, F.},
}
@incollection{DELGRATTA_2017_INCOLLECTION_D_463742,
  author           = {Del Gratta, R.},
  title            = {WordNets per lingue classiche},
  booktitle        = {Strumenti digitali e collaborativi per le Scienze dell'antichità},
  editor           = {Mastandrea, P.},
  year             = {2017},
  pages            = {117-122},
  publisher        = {Edizioni Ca' Foscari (Venezia, ITA)},
  conference_place = {Venezia},
  isbn             = {978-88-6969-183-6},
  doi              = {10.14277/6969-182-9/ANT-14-9},
  url              = {https://iris.cnr.it/handle/20.500.14243/463742},
  keywords         = {WordNet, Perseus project, Ancient Greek Wordnet, oNLP, Classical Languages},
  abstract         = {The Wordnet for Ancient Greek (AGWN) is presented and illustrated both as a stand-alone semantic net and as a participant in a more complex net of wordnets for historical and modern languages. Two applications of AGWN carried out within the Memorata Poetis project are described: in the first application, the AGWN is used to investigate multilingual synonyms; in the second one, AGWN is used to extract Greek synonyms in order to classify epigrams in terms of similar content},
}
@incollection{KHAN_2017_INCOLLECTION_KBFM_339934,
  author           = {Khan, F. and Bellandi, A. and Frontini, F. and Monachini, M.},
  title            = {Using SWRL rules to model noun behaviour in Italian},
  booktitle        = {LANGUAGE, DATA, AND KNOWLEDGE, LDK},
  editor           = {Gracia, J. and Bond, F. and McCrae, J. and Buitelaar, P. and Chiarcos, C. and Hellmann, S.},
  year             = {2017},
  pages            = {134-142},
  publisher        = {Springer (Berlin, DEU)},
  conference_place = {Berlin},
  doi              = {10.1007/978-3-319-59888-8_11},
  url              = {http://www.scopus.com/record/display.url?eid=2-s2.0-85021186095\&origin=inward},
  keywords         = {Linked Open Data, Logic Programming, Italian Morphology},
  abstract         = {In this article we describe our ongoing attempts to use the Semantic Web Rule Language (SWRL) to model the morphological layer of a wide-coverage Italian lexical resource, Parole-Simple-Clips (PSC); in this case that subset of PSC dealing with Italian noun morphology. After giving a brief introduction to SWRL and to Italian noun morphology we go onto describe the actual transformation itself. Finally we describe an experiment on our dataset using SWRL rules and queries written in the Semantic Query-Enhanced Rule Web Language (SQWRL)},
}
@INCOLLECTION{MARCONI_2017_INCOLLECTION_MRC_393029,
AUTHOR = {Marconi, L. and Ruiz Miyares, L. and Cutugno, P.},
TITLE = {Características distributivas del español de Cuba a partir del análisis de dos estudios lingüísticos},
YEAR = {2017},
ABSTRACT = {El objetivo de este artículo es realizar un estudio sobre las características distributivas de un subconjunto del español de Cuba; se refiere a la información recogida en el Diccionario Ortográfico del Español-con la exclusión de las lexías complejas y de las locuciones -, o sea de los 7927 lemas que han sido generados a partir de las 93759 palabras flexionadas con sus categorías gramaticales; también se analizarán los datos del Léxico Activo-Funcional del Escolar Cubano para hacer un mapeo de las palabras utilizadas por los escolares. El artículo contiene también una serie de comparaciones de algunas propiedades distributivas derivadas del tratamiento de los datos del DOE con los resultados obtenidos mediante el análisis del Léxico Activo-Funcional del Escolar Cubano. Cuando se habla de propiedades distributivas de una lengua, estas pueden ser consideradas en relación con los lemas, con las diversas palabras flexionadas o con el número de apariciones en un corpus específico. En este artículo nos referiremos a una muestra de lemas y flexiones derivada del Diccionario Ortográfico del Español y solamente a las flexiones del Léxico Activo-Funcional del Escolar Cubano},
KEYWORDS = {Léxico, escolares, Cuba, propiedades distributivas},
PAGES = {87-111},
URL = {https://iris.cnr.it/handle/20.500.14243/393029},
PUBLISHER = {Centro de Lingüística Aplicada, Ministerio de Ciencia, Tecnología y Medio Ambiente (Santiago de Cuba, CUB)},
ISBN = {978-959-7174-34-9},
CONFERENCE_PLACE = {Santiago de Cuba},
BOOKTITLE = {Estudios de Lexicología y Lexicografía Homenaje a Eloína Miyares Bermúdez},
EDITOR = {Ruiz Miyares, L.},
}
@INCOLLECTION{MONTEMAGNI_2017_INCOLLECTION_MW_353806,
AUTHOR = {Montemagni, S. and Wieling, M.},
TITLE = {Exploring the role of extra-linguistic factors in defining dialectal variation patterns through cluster comparison},
YEAR = {2017},
ABSTRACT = {This paper contributes to two open issues in the dialectometric literature, i. e. i) whether and how patterns of linguistic variation are influenced by extra-linguistic features such as the geomorphology of the area, or cultural, administrative and political boundaries, and ii) whether and how the influence of extra-linguistic factors remains stable across linguistically-grounded partitions of data. To investigate these issues, a case study focusing on lexical variation has been carried out on a regional lexical atlas of Tuscan dialects. A variety of extra-linguistic features was taken into account, whose impact and role has been evaluated with respect to both the whole dialectal dataset and across different semantic fields},
KEYWORDS = {dialectometric literature, dialectology, linguistic variation, dialect, Tuscan, lexical atlas},
PAGES = {241-251},
URL = {http://www.let.rug.nl/festschriftnerbonne/25.%20Montemagni%20\&%20Wieling.pdf},
BOOKTITLE = {From Semantics to Dialectometry. Festschrift in honor of John Nerbonne},
EDITOR = {Wieling, M. and Kroon, M. and Van Noord, G.},
}
@INCOLLECTION{PROIETTI_2017_INCOLLECTION_P_404008,
AUTHOR = {Proietti, C.},
TITLE = {Time of Logics, time of Physics},
YEAR = {2017},
ABSTRACT = {The history of reasoning about time is disseminated with paradoxes and conundra and contemporary physics does not make an exception. Logics in general, and more in particular temporal logics, represent a rigorous formal tool in order to solve or clarify problems of this kind. In what follows we will first explain, from the point of view of philosophical logic, what is a paradox and what should count as a solution for it. After that we will illustrate A. N. Prior's formalization of the traditional paradox of future contingency and determinism. Then we will focus on two modern paradoxes-the twin paradox and the time travel paradox-and show how an adequate temporal logic can help their framing and understanding},
KEYWORDS = {Time travel, relativity, paradoxes},
PAGES = {39-53},
URL = {https://iris.cnr.it/handle/20.500.14243/404008},
DOI = {10.1007/978-3-319-53725-2},
PUBLISHER = {Springer (Cham, Heidelberg, New York, Dordrecht, London, CHE)},
ISBN = {978-3-319-53723-8},
CONFERENCE_PLACE = {Cham, Heidelberg, New York, Dordrecht, London},
BOOKTITLE = {Time of Nature and the Nature of Time},
EDITOR = {Bouton, C. and Huneman, P.},
}
@INCOLLECTION{RMANZELLA_2017_INCOLLECTION_RBBDDFMMMNS_333614,
AUTHOR = {Manzella, G. M. R. and Bartolini, R. and Bustaffa, F. and D'Angelo, P. and De Mattei, M. and Frontini, F. and Maltese, M. and Medone, D. and Monachini, M. and Novellino, A. and Spada, A.},
TITLE = {Semantic Search Engine for Data Management and Sustainable Development: Marine Planning Service Platform},
YEAR = {2017},
ABSTRACT = {This chapter presents a computer platform supporting a Marine Information and Knowledge System based on a repository that gathers, classify and structures marine scientific literature and data, guaranteeing their accessibility by means of standard protocols. This requires the access to quality controlled data and to information that is provided in grey literature and/or in relevant scientific literature. There exist efforts to develop search engines to find author's contributions to scientific literature or publications. This implies the use of persistent identifiers. However very few efforts are dedicated to link publications to data that was used, or cited in them or that can be of importance for the published studies. Full-text technologies are often unsuccessful since they assume the presence of specific keywords in the text; to fix this problem, it is suggested to use different semantic technologies for retrieving the text and data and thus getting much more complying results},
KEYWORDS = {Marine Information and Knowledge System},
PAGES = {127-154},
URL = {http://www.igi-global.com/chapter/semantic-search-engine-for-data-management-and-sustainable-development/166839#},
DOI = {10.4018/978-1-5225-0700-0.ch006},
PUBLISHER = {IGI Global (Hershey, USA)},
ISBN = {978-1-5225-0700-0},
CONFERENCE_PLACE = {Hershey},
BOOKTITLE = {Oceanographic and Marine Cross-Domain Data Management for Sustainable Development},
EDITOR = {Diviacco, P. and Leadbetter, A. and Glaves, H.},
}
@INCOLLECTION{SASSI_2017_INCOLLECTION_S_341692,
AUTHOR = {Sassi, M.},
TITLE = {Cuestiones pertinentes e impertinentes de los Diccionarios Temáticos},
YEAR = {2017},
ABSTRACT = {Los diccionarios en general, y en particular los temáticos, han representado el hilo conductor de mi carrera en el Istituto di Linguistica Computazionale de Pisa desde y anteriormente a sus orígenes (en los años 1965-1978 se denominaba Divisione Linguistica del CNUCE y después ILC-CNR). En los 60-70 se trabajó en el DMI (Diccionario Maquina del Italiano) bajo los auspicios del Parlamento Italiano. En los 80 empezaron los primeros estudios de diccionarios organizados en Campos Léxicos, a partir de las intuiciones de Julio Casares y se aplicaron los mismos principios al italiano. A partir de estas lejanas esperiencias, a lo largo de 50 años, se han desarrollados diferentes estudios, aplicaciones, corpora y bancos de datos con relacion a varias disciplinas: Literatura, Filologia, Derecho, Justicia, Administración, Turismo, Medicina. Se han reunido compilaciones de varios Autores en idioma espanol: Bolivar, Carpentier, Cervantes, Encina, Machado, Marquez, Neruda, Salinas, Teresa de Avila, Unamuno, Vallejo, que se describerán en esta presentacion, con ejemplos de busqueda on-line mediante la interfaz DBT-Web. Se discute tambien de preservar estos datos para el futuro a traves del mantenimiento para su consulta en la red},
KEYWORDS = {Computational Linguistics, Thematic Dictionaries, Corpora, Preservation and Reuse of data, Historical overview of Text Processing},
PAGES = {37-49},
URL = {https://iris.cnr.it/handle/20.500.14243/341692},
ISBN = {978-84-617-4512-8},
BOOKTITLE = {El diccionario en la encrucijada: de la sintaxis y la cultura al desafío digital},
EDITOR = {Sariego López, I. and Gutiérrez Cuadrado, J. and Garriga Escribano, C.},
}
@INCOLLECTION{SORIA_2017_INCOLLECTION_S_337284,
AUTHOR = {Soria, C.},
TITLE = {What is Digital Language Diversity and why should we care?},
YEAR = {2017},
ABSTRACT = {The relationship between language and the Internet is a growing area of policy interest and academic study, see for instance (MAAYA 2012), (Paolillo et al. 2005), (Pimienta 2001), (Kornai 2013), (Pimienta et al. 2009), (Rehm and Uszkoreit 2012). The emerging picture is one where language profoundly affects a person's experience of the Internet. It determines how much-if any-information you can access on Wikipedia. It orients a person's choices and decisions by shaping the results of a search engine, depending on the language used. It determines the range of services that can be available over the Internet, and therefore the amount of everyday tasks (such as buying a ticket, reviewing opinions about hotel and restaurants, purchasing books or other goods, etc.) that can be carried out virtually. Far from infinite, the Internet, it seems, is only as big as one's language. Should this hold true, it would be at odds with the original spirit of the Internet, which-according to the words of Tim Berners-Lee-would be a place "to cross barriers and connect cultures". But it is safe to argue that the extent to which a language can be used over the Internet not only affects a person's experience and choice of opportunities; it also affect the language itself. If a language is poorly or not supported to be used over digital devices, for instance if the keyboard of the PC is not equipped with the characters and diacritics necessary to write in the language, or if there is no spell checker for a language, then its usability becomes severely affected, and it might will never be used online. The language could become "digitally endangered", and its value and profile could be lessened, especially in the eyes of the new generations. These considerations call for closer examination of a number of related issues. First, the "digital language diversity", i. e. the linguistic diversity of the Internet. Second, it is important to reflect on the conditions that make it possible for a language to be used over digital devices, and about what can be done in order to grant this possibility to languages other than so-called "major" ones},
KEYWORDS = {digital language diversity},
PAGES = {13-28},
URL = {http://www.linguapax.org/wp-content/uploads/2015/03/LinguapaxReview2016web.pdf},
}
@EDITORIAL{BOSCHETTI_2017_EDITORIAL_B_336810,
AUTHOR = {Boschetti, F.},
TITLE = {AIUCD2016-Book of Abstracts},
YEAR = {2017},
ABSTRACT = {Raccolta di abstracts / saggi brevi presentati al quinto convegno annuale dell'Associazione per l'Informatica Umanistica e la Cultura Digitale (AIUCD2016)},
URL = {https://iris.cnr.it/handle/20.500.14243/336810},
DOI = {10.6092/unibo/amsacta/5559},
ISBN = {978-88-942535-0-4},
}
@EDITORIAL{GUADAGNINI_2017_EDITORIAL_GV_351414,
AUTHOR = {Guadagnini, E. and Vaccaro, G.},
TITLE = {Rem tene, verba sequentur. Latinità e medioevo romanzo: testi e lingue in contatto, Atti del Convegno conclusivo del progetto FIRB-Futuro in ricerca 2010 «DiVo-Dizionario dei Volgarizzamenti. Il lessico di traduzione dal latino nell'italiano delle Origini» (Firenze, Villa Medicea di Castello, 17-18 febbraio 2016)},
YEAR = {2017},
ABSTRACT = {Contributi di linguistica storica e filologia romanza},
KEYWORDS = {Filologia romanza, Linguistica romanza, Linguistica italiana, Filologia italiana, Volgarizzamenti},
URL = {https://iris.cnr.it/handle/20.500.14243/351414},
PUBLISHER = {Edizioni dell'Orso (Alessandria, ITA)},
ISBN = {9788862747837},
CONFERENCE_PLACE = {Firenze},
}
@EDITORIAL{MONTEMAGNI_2017_EDITORIAL_MN_344003,
AUTHOR = {Montemagni, S. and Nivre, J.},
TITLE = {Proceedings of the Fourth International Conference on Dependency Linguistics (Depling 2017), September 18-20, 2017, Università di Pisa, Italy},
YEAR = {2017},
ABSTRACT = {Proceedings of the Fourth International Conference on Dependency Linguistics (Depling 2017), September 18-20, 2017, Università di Pisa, Italy},
URL = {https://iris.cnr.it/handle/20.500.14243/344003},
ISBN = {978-91-7685-467-9},
}
@EDITORIAL{PRETORIUS_2017_EDITORIAL_PS_334733,
AUTHOR = {Pretorius, L. and Soria, C.},
TITLE = {Language Resources and Evaluation. Special Issue: Collaboration and Computing for Under-resourced Languages},
YEAR = {2017},
ABSTRACT = {Special issue of the journal "Language Resources and Evaluation", dedicated to under-resourced languages},
KEYWORDS = {under-resourced languages, language resources, minority languages, endangered languages, small languages},
PAGES = {891-1084},
URL = {https://link.springer.com/journal/10579/51/4/page/1},
DOI = {10.1007/s10579-017-9405-8},
PUBLISHER = {Springer (Berlin, DEU)},
ISSN = {1574-020X},
CONFERENCE_PLACE = {Berlin},
}
@EDITORIAL{BASILI_2017_EDITORIAL_BM_344022,
AUTHOR = {Basili, R. and Montemagni, S.},
TITLE = {Nota Editoriale},
YEAR = {2017},
URL = {https://iris.cnr.it/handle/20.500.14243/344022},
ISSN = {2499-4553},
}
@EDITORIAL{PIRRELLI_2017_EDITORIAL_PZ_327066,
AUTHOR = {Pirrelli, V. and Zarghili, A.},
TITLE = {Arabic Natural Language Processing: Models, systems and applications},
YEAR = {2017},
KEYWORDS = {Natural Language Processing, Standard Modern Arabic},
PAGES = {A1-A3},
URL = {https://www.sciencedirect.com/science/article/pii/S1319157817301155},
VOLUME = {29},
DOI = {10.1016/j.jksuci.2017.04.004},
ISSN = {2213-1248},
}
@EDITORIAL{PRETORIUS_2017_EDITORIAL_PS_337242,
AUTHOR = {Pretorius, L. and Soria, C.},
TITLE = {Introduction to the Special Issue},
YEAR = {2017},
KEYWORDS = {language resources, under-resourced languages, minority languages},
PAGES = {891-895},
URL = {https://link.springer.com/article/10.1007%2Fs10579-017-9405-8},
VOLUME = {51},
NUMBER = {4},
DOI = {10.1007/s10579-017-9405-8},
ISSN = {1574-020X},
}
@INPROCEEDINGS{BARTOLINI_2017_INPROCEEDINGS_BPGGB_327780,
AUTHOR = {Bartolini, R. and Pardelli, G. and Goggi, S. and Giannini, S. and Biagioni, S.},
TITLE = {A terminological "journey" in the Grey Literature domain},
YEAR = {2017},
ABSTRACT = {The work analyzes a corpus constituted of the entire amount of full research papers published in the GL conference series over a time-span of more than one decade (2003-2014) with the aim of creating a terminological map of relevant words in the various GL research topics. "... corpora used to extract terminological units can be further investigated to find semantic and conceptual information on terms or to represent conceptual relationships between terms" (Bourigault D. et al., 2001). Another interesting inquiry is the terminology used in the GL conferences for describing the types of documents which can be detected (Pejšová P. et al., 2012)},
KEYWORDS = {Grey Literature, Information Extraction IE, Terminology},
PAGES = {117-130},
URL = {https://iris.cnr.it/handle/20.500.14243/327780},
PUBLISHER = {TextRelease (Amsterdam, NLD)},
ISSN = {1386-2316},
ISBN = {978-90-77484-30-2},
CONFERENCE_NAME = {Eighteenth International Conference on Grey Literature (GL18): Leveraging Diversity in Grey Literature},
CONFERENCE_PLACE = {Amsterdam},
BOOKTITLE = {THE GL-CONFERENCE SERIES. CONFERENCE PROCEEDINGS},
EDITOR = {Farace, D. and Frantzen, J.},
}
@INPROCEEDINGS{BELLANDI_2017_INPROCEEDINGS_BGPW_340692,
AUTHOR = {Bellandi, A. and Giovannetti, E. and Piccini, S. and Weingart, A.},
TITLE = {Developing LexO: a Collaborative Editor of Multilingual Lexica and Termino-ontological Resources in the Humanities},
YEAR = {2017},
ABSTRACT = {In this paper we present a first version of LexO, a collaborative editor of multilingual lexica and termino-ontological resources. It is based on the lemon model, and aims at supporting lexicographers and terminologists in their work. Although the development of LexO is still ongoing, the editor is already being used within two research projects in the field of Computational Linguistics applied to Humanities: DiTMAO and Totus Mundus. This allowed to test the functionalities of LexO, and prove its high degree of flexibility according to the different extensions of the lemon model needed to fulfill the needs of the involved scholars},
KEYWORDS = {lexo, multi-lingual termino-ontological resources, DiTMAO, Totus Mundus},
URL = {http://www.aclweb.org/anthology/W17-7000},
CONFERENCE_NAME = {Workshop on Language, Ontology, Terminology and Knowledge Structures-LOTKS 2017},
BOOKTITLE = {Proceedings of Language, Ontology, Terminology and Knowledge Structures Workshop (LOTKS 2017)},
}
@INPROCEEDINGS{BIBULI_2017_INPROCEEDINGS_BBCCFORZ_330476,
AUTHOR = {Bibuli, M. and Bruzzone, G. and Caccia, M. and Chiarella, D. and Ferretti, R. and Odetti, A. and Ranieri, A. and Zereik, E.},
TITLE = {Cutting-edge underwater robotics-CADDY project challenges, results and future steps},
YEAR = {2017},
ABSTRACT = {This paper describes results from the EU research project CADDY on cognitive autonomous robotics to support divers. The robot communicates with the diver by understanding gestures and acknowledges by light signals and task execution. Validation trials showed feasibility of the approach. In order to successfully achieve these beyond-the-state-of-the-art objectives, a number of specific features and functionalities have been designed and developed from scratch, integrated in the overall CADDY architecture and finally tested for validation. This paper focuses on the development on some of the game-changing techniques needed to face the scientific challenges of the projects},
URL = {https://iris.cnr.it/handle/20.500.14243/330476},
ISBN = {978-3-89220-701-6},
}
@INPROCEEDINGS{BIBULI_2017_INPROCEEDINGS_BBCCFORZ_330495,
AUTHOR = {Bibuli, M. and Bruzzone, G. and Caccia, M. and Chiarella, D. and Ferretti, R. and Odetti, A. and Ranieri, A. and Zereik, E.},
TITLE = {CADDY project-how robots get close to divers},
YEAR = {2017},
ABSTRACT = {Divers operate in harsh and poorly monitored environments in which the slightest unexpected disturbance, technical malfunction, or lack of attention can have catastrophic consequences. They manoeuvre in complex 3D environments and carry cumbersome equipment, while performing their mission. The CADDY project aims to overcome such problems, by establishing an innovative paradigm, i.e. introducing in the field a robotic diver companion. This last can accompany the diver during his/her mission, being a useful companion in a twofold manner: i) helping the diver to accomplish his/her mission; and ii) monitoring the diver actions and physical state, in order to provide help (e.g. signaling problems to the surface ground station) in case of emergency. The CADDY project replaces a human buddy diver with an autonomous underwater vehicle and adds a new autonomous surface vehicle to improve monitoring, assistance, and safety of the diver's mission. The resulting system plays a threefold role similar to those that a human buddy diver should have: i) the buddy "observer" that continuously monitors the diver; ii) the buddy "slave" that is the diver's "extended hand" during underwater operations performing tasks such as "do a mosaic of that area", "take a photo of that" or "illuminate that"; and iii) the buddy "guide" that leads the diver through the underwater environment. In such a way to be effective once employed in such a context, the robotic buddy must exhibit cognitive behaviour through learning, interpreting, and adapting to the diver's behaviour, physical state, and actions. Moreover, in order to be "accepted" by the human divers, the robotic buddy should also interact with them in a way that result natural to the humans. For this reason, the robotic buddy has been endowed with the capability to understand diver sign language. 
To this regards, since this sign language is composed by few gestures and since there is the need to issue more complex commands, a completely new language, called CADDIAN, has been created, using the diver common gestures plus some more symbols. The companion robot is thus able to understand complex commands (or even entire sentences containing more than one command), validate them using the CADDIAN syntax rules and promptly responding to them by executing the requested actions. In the paper, the CADDY concept will be presented in details, and the robotic system will be described. The CADDIAN language and some hints about the related gesture recognition process will be introduced as well},
URL = {https://iris.cnr.it/handle/20.500.14243/330495},
}
@INPROCEEDINGS{BRUNATO_2017_INPROCEEDINGS_BD_339434,
AUTHOR = {Brunato, D. and Dell'Orletta, F.},
TITLE = {On the order of words in Italian: a study on genre vs complexity},
YEAR = {2017},
ABSTRACT = {In this paper we present a cross-genre study on word order variation in Italian based on automatically dependency-parsed corpora. A comparative analysis focused on dependency direction and dependency distance for major constituents in the sentence is carried out in order to assess the influence of both textual genre and linguistic complexity on the distribution of phenomena of syntactic markedness},
KEYWORDS = {word order, syntactic analysis, linguistic complexity, natural language processing},
PAGES = {25-31},
URL = {https://iris.cnr.it/handle/20.500.14243/339434},
CONFERENCE_NAME = {International Conference on Dependency Linguistics (Depling 2017)},
}
@INPROCEEDINGS{BURGASSI_2017_INPROCEEDINGS_BG_351409,
AUTHOR = {Burgassi, C. and Guadagnini, E.},
TITLE = {L'integrazione lessicale di "facile" nel vocabolario italiano},
YEAR = {2017},
ABSTRACT = {Studio lessicologico del lessema "facile" in italiano (e nelle lingue romanze)},
KEYWORDS = {Lessicologia storica, Latinismi, Storia della lingua},
PAGES = {157-177},
URL = {https://iris.cnr.it/handle/20.500.14243/351409},
CONFERENCE_NAME = {Rem tene, verba sequentur. Latinità e medioevo romanzo: testi e lingue in contatto},
BOOKTITLE = {Rem tene, verba sequentur. Latinità e medioevo romanzo: testi e lingue in contatto, Atti del Convegno conclusivo del progetto FIRB-Futuro in ricerca 2010 «DiVo-Dizionario dei Volgarizzamenti. Il lessico di traduzione dal latino nell'italiano delle Origini» (Firenze, Villa Medicea di Castello, 17-18 febbraio 2016)},
EDITOR = {Guadagnini, E. and Vaccaro, G.},
}
@INPROCEEDINGS{CARDILLO_2017_INPROCEEDINGS_CFMP_326587,
AUTHOR = {Cardillo, F. A. and Ferro, M. and Marzi, C. and Pirrelli, V.},
TITLE = {How "deep" is learning word inflection?},
YEAR = {2017},
ABSTRACT = {Machine learning offers two basic strategies for morphology induction: lexical segmentation and surface word relation. The first one assumes that words can be segmented into morphemes. Inducing a novel inflected form requires identification of morphemic constituents and a strategy for their recombination. The second approach dispenses with segmentation: lexical representations form part of a network of associatively related inflected forms. Production of a novel form consists in filling in one empty node in the network. Here, we present the results of a recurrent LSTM network that learns to fill in paradigm cells of incomplete verb paradigms. Although the process is not based on morpheme segmentation, the model shows sensitivity to stem selection and stem-ending boundaries},
KEYWORDS = {LSTM, Morphology induction, Cognitive modelling},
PAGES = {77-82},
URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-85037368972\&origin=inward},
VOLUME = {2006},
DOI = {10.4000/books.aaccademia.2314},
PUBLISHER = {Accademia University Press (Torino, ITA)},
ISBN = {978-88-99982-76-8},
CONFERENCE_NAME = {Fourth Italian Conference on Computational Linguistics},
CONFERENCE_PLACE = {Torino},
BOOKTITLE = {Proceedings of the Fourth Italian Conference on Computational Linguistics (CLiC-it 2017)},
EDITOR = {Basili, R. and Nissim, M. and Satta, G.},
}
@INPROCEEDINGS{CARDILLO_2017_INPROCEEDINGS_CMR_339525,
AUTHOR = {Cardillo, F. A. and Masulli, F. and Rovetta, S.},
TITLE = {Automatic Approaches for CE-MRI Examination of the Breast: A Survey},
YEAR = {2017},
ABSTRACT = {Breast cancer is the most frequently diagnosed non-skin cancer in women, the second leading cause of death among women. Early detection of a breast cancer is fundamental for ensuring high survival rate. Imaging techniques are used to identify suspicious modifications of breast tissue. Among these, contrast-enhanced magnetic resonance imaging (CE-MRI) is particularly interesting for its lack of exposure to radiation and its ability to highlight differences in vascularisation, typical of cancer lesions. Automatic or semi-automatic methods are especially useful with this technique, due to the high quantity of data, in the form of 4D images (3D space + time), to be analysed in each test. This survey describes approaches to fully automatic computer-aided detection/diagnosis of breast lesions with CE-MRI, with particular emphasis on computational intelligence techniques},
URL = {https://iris.cnr.it/handle/20.500.14243/339525},
}
@INPROCEEDINGS{CIMINO_2017_INPROCEEDINGS_CD_341662,
AUTHOR = {Cimino, A. and Dell'Orletta, F.},
TITLE = {Stacked Sentence-Document Classifier Approach for Improving Native Language Identification},
YEAR = {2017},
ABSTRACT = {In this paper, we describe the approach of the ItaliaNLP Lab team to native language identification and discuss the results we submitted as participants to the essay track of NLI Shared Task 2017. We introduce for the first time a 2-stacked sentence-document architecture for native language identification that is able to exploit both local sentence information and a wide set of general-purpose features qualifying the lexical and grammatical structure of the whole document. When evaluated on the official test set, our sentence-document stacked architecture obtained the best result among all the participants of the essay track with an F1 score of 0.8818},
KEYWORDS = {Native Language Identification},
PAGES = {430-437},
URL = {https://iris.cnr.it/handle/20.500.14243/341662},
CONFERENCE_NAME = {Workshop on Innovative Use of NLP for Building Educational Applications},
}
@INPROCEEDINGS{CIMINO_2017_INPROCEEDINGS_CWDMV_342154,
AUTHOR = {Cimino, A. and Wieling, M. and Dell'Orletta, F. and Montemagni, S. and Venturi, G.},
TITLE = {Identifying predictive features for textual genre classification: The key role of syntax},
YEAR = {2017},
ABSTRACT = {The paper investigates impact and role of different feature types for the specific task of Automatic Genre Classification with the final aim of identifying the most predictive ones. The goal was pursued by carrying out incremental feature selection through Grafting using different sets of linguistic features. Achieved results for discriminating among four traditional textual genres show the key role played by syntactic features, whose impact turned out to vary across genres},
KEYWORDS = {Textual Genre Classification, Feature Selection, Syntactic Features},
PAGES = {1-6},
URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-85037370866\&origin=inward},
VOLUME = {2006},
CONFERENCE_NAME = {Italian Conference on Computational Linguistics (CLiC-it)},
}
@INPROCEEDINGS{CUTUGNO_2017_INPROCEEDINGS_CCLMM_328766,
AUTHOR = {Cutugno, P. and Chiarella, D. and Lucentini, R. and Marconi, L. and Morgavi, G.},
TITLE = {CoLFIS: análisis de las categorias morfosintácticas},
YEAR = {2017},
ABSTRACT = {CoLFIS es una base de datos de la lengua italiana escrita de 3.798.275 palabras, formada de textos escritos de varios géneros analizados oportunamente y seleccionados en tres sectores distintos: diarios, periódicos y libros. El corpus realizado representa el italiano comúnmente leído, y no tanto la lengua italiana escrita en su totalidad. Esta elección se justifica en cuanto se deseaba construir un corpus, y en consecuencia un léxico de frecuencia, que se acercara lo más posible al léxico mental de un hablante de cultura media y no a un diccionario de la lengua italiana. El corpus CoLFIS ha sido sometido a una lematización completa y además se han desarrollado paquetes de software de análisis estadístico para producir los léxicos de frecuencia relativos al corpus total y a los distintos sectores. Este artículo analiza los componentes gramaticales de los diferentes textos del corpus lematizado CoLFIS; los objetivos son identificar las posibles diferencias de las partes del discurso en los textos de los diferentes sectores y subsectores que componen el corpus CoLFIS y, al mismo tiempo, tratar de establecer, para los diversos tipos de textos, dentro de qué gama de valores se coloca la relación entre sustantivos y verbos},
URL = {https://iris.cnr.it/handle/20.500.14243/328766},
ISBN = {9789597174325},
}
@INPROCEEDINGS{CUTUGNO_2017_INPROCEEDINGS_CMMCF_338751,
AUTHOR = {Cutugno, P. and Marconi, L. and Morgavi, G. and Chiarella, D. and Ferretti, M.},
TITLE = {ESTUDIOS MORFOSINTÁCTICOS Y SEMÁNTICOS EN ANTOLOGÍAS NARRATIVAS SOBRE EL TEMA Y LA EXPERIENCIA DEL VIAJE},
YEAR = {2017},
ABSTRACT = {En este trabajo queremos analizar, desde la perspectiva lingüística y estadística, los aportes de algunos jóvenes italianos entre las edades de dieciocho hasta treinta cinco años sobre el tema y la experiencia del viaje. En particular se investigó sobre las contribuciones de escritos de algunos volúmenes titulados " Partire. Antologia. "; estos volúmenes, contienen textos de jóvenes escritores, son una antología ilustrada hecha por el CTS, Centro de Turismo y Juventud Estudiantil. Se analizaron los textos, y se investigó en los lemas mas frecuentes sobretodo dentro las categorías gramaticales de los sustantivos, de los verbos y de los adjetivos; nuestra intención era extraer, por los lemas más frecuentes, las informaciones semánticas, sintácticas o textuales y mapear las palabras más representativas de las emociones del viaje. En este artículo se han analizado los componentes gramaticales de las contribuciones escritas y los objetivos han sido identificar las posibles diferencias de las partes del discurso en los textos que componen los distintos volumen y, al mismo tiempo, tratar de establecer, para los diversos textos, dentro de qué gama de valores se coloca la relación entre sustantivos y verbos. El análisis cualitativo y cuantitativo de las palabras más frecuentes nos permitió de monitorear cómo, algunos de los relatos de viaje, se conviertan en reflexiones introspectivas cambiando el enfoque de los que escriben del viaje en el mundo a en el viaje de la vida y viceversa. El viaje, en las contribuciones, también se concibe como una vuelta en su propia ciudad, en el lugar donde uno vive, y en las descripciones se encuentran detalles únicos y exclusivos, conocidos sólo por aquellos que tienen un profundo conocimiento de un determinado lugar},
URL = {https://iris.cnr.it/handle/20.500.14243/338751},
ISBN = {9789597152378},
}
@INPROCEEDINGS{DELGROSSO_2017_INPROCEEDINGS_DGM_335873,
AUTHOR = {Del Grosso, A. M. and Giovannetti, E. and Marchi, S.},
TITLE = {The Importance of Being... Object-Oriented: Old Means for New Perspectives in Digital Textual Scholarship},
YEAR = {2017},
ABSTRACT = {In this contribution we propose an Object-Oriented (OO) approach to the design and development of reusable tools for the domain of scholarly editing. It regards some software engineering considerations about the importance of being object-oriented in implementing software applications for digital textual scholarship. This work fits into an ongoing discussion about textual modelling (Pierazzo 2015) where the need for extensible, reusable and modular applications is constantly increasing (Driscoll and Pierazzo 2016). Although the digital turn of textual scholarship is nowadays a reality and many advancements have been made in encoding and visualizing textual resources, flexible and shared models in the construction of tools for scholarly editing are still missing (Almas and Beaulieu 2013; Shillingsburg 2015; Robinson and Bordalejo 2016). This lack typically leads to the development of ad hoc-i. e. not reusable-software (Ciotti 2014; Schmidt 2014). Exploiting our experience in projects we worked on (e. g. Giovannetti et al. 2016; Abrate et al. 2014; Bozzi 2013; Del Grosso et al. 2013), we have conceived a general OO model that will be introduced in the following section (Del Grosso et al. 2016; Boschetti and Del Grosso 2015)},
KEYWORDS = {Digital Scholarly Editing, Web Application, Abstract Data Type},
PAGES = {269-274},
URL = {https://iris.cnr.it/handle/20.500.14243/335873},
VOLUME = {1},
ISBN = {9789088904837},
CONFERENCE_NAME = {Digital Scholarly Editing: Theory, Practice, Methods},
BOOKTITLE = {Advances in Digital Scholarly Editing},
}
@INPROCEEDINGS{DELVIGNA_2017_INPROCEEDINGS_DCDPT_355348,
AUTHOR = {Del Vigna, F. and Cimino, A. and Dell'Orletta, F. and Petrocchi, M. and Tesconi, M.},
TITLE = {Hate me, hate me not: Hate speech detection on Facebook},
YEAR = {2017},
ABSTRACT = {While favouring communications and easing information sharing, Social Network Sites are also used to launch harmful campaigns against specific groups and individuals. Cyberbullism, incitement to self-harm practices, sexual predation are just some of the severe effects of massive online offensives. Moreover, attacks can be carried out against groups of victims and can degenerate in physical violence. In this work, we aim at containing and preventing the alarming diffusion of such hate campaigns. Using Facebook as a benchmark, we consider the textual content of comments appeared on a set of public Italian pages. We first propose a variety of hate categories to distinguish the kind of hate. Crawled comments are then annotated by up to five distinct human annotators, according to the defined taxonomy. Leveraging morpho-syntactical features, sentiment polarity and word embedding lexicons, we design and implement two classifiers for the Italian language, based on different learning algorithms: the first based on Support Vector Machines (SVM) and the second on a particular Recurrent Neural Network named Long Short Term Memory (LSTM). We test these two learning algorithms in order to verify their classification performances on the task of hate speech recognition. The results show the effectiveness of the two classification approaches tested over the first manually annotated Italian Hate Speech Corpus of social media text},
KEYWORDS = {Hate speech, NLP, Social Networks},
PAGES = {86-95},
URL = {http://www.scopus.com/inward/record.url?eid=2-s2.0-85017337270\&partnerID=q2rCbXpz},
VOLUME = {1816},
CONFERENCE_NAME = {ITA-SEC 17},
}
@INPROCEEDINGS{FERRETTI_2017_INPROCEEDINGS_FBCCORZB_337741,
AUTHOR = {Ferretti, R. and Bibuli, M. and Caccia, M. and Chiarella, D. and Odetti, A. and Ranieri, A. and Zereik, E. and Bruzzone, G.},
TITLE = {Towards Posidonia Meadows Detection, Mapping and Automatic recognition using Unmanned Marine Vehicles},
YEAR = {2017},
ABSTRACT = {This paper reports the development of a new methodology for automatic detection and mapping of underwater vegetation by means of highly autonomous marine robotic platforms. In particular, the work describes the exploitation of a Remotely Operated Vehicle (ROV), equipped with a multi-parametric sensors package, for the exploration and characterization of sea-bottoms interested by the presence of the Posidonia oceanica seagrass, which represents a valuable indicator of the environmental health. The proposed methodology relies on the systematic exploration of the sea-bottom by means of the ROV acquiring acoustic data and video imagery of the seabed, in order to reconstruct a 2.5D model of the environment (i.e. an elevation map of the sea-bottom). The data collection is achieved by the employment of a single beam echosounder for seabed range measurements and a down-looking underwater camera. Furthermore, an acoustic data procedural analysis is developed to automatically detect the Posidonia presence, so that in future works it will be possible to operate also in low-visibility conditions. Data acquisition was carried out over different seafloor types in coastal area near Biograd Na Moru (Croatia) and the results are reported in the paper},
KEYWORDS = {Posidonia detection, seabed mapping, Unmanned Marine Vehicles},
PAGES = {12386-12391},
URL = {https://doi.org/10.1016/j.ifacol.2017.08.2504},
VOLUME = {50},
NUMBER = {1},
DOI = {10.1016/j.ifacol.2017.08.2504},
CONFERENCE_NAME = {The 20th World Congress of the International Federation of Automatic Control, IFAC 2017},
}
@INPROCEEDINGS{FERRETTI_2017_INPROCEEDINGS_FBCCORZB_337733,
AUTHOR = {Ferretti, R. and Bibuli, M. and Caccia, M. and Chiarella, D. and Odetti, A. and Ranieri, A. and Zereik, E. and Bruzzone, G.},
TITLE = {Machine learning methods for acoustic-based automatic Posidonia meadows detection by means of unmanned marine vehicles},
YEAR = {2017},
ABSTRACT = {This work describes the exploitation of a Remotely Operated Vehicle (ROV), equipped with a multi-parametric sensors package (acoustic and video), for the exploration and characterisation of sea-bottoms covered with Posidonia oceanica seagrass, which represents a valuable indicator of the environmental health. The data collection is achieved by the employment of a single beam echosounder and a down-looking underwater camera. An acoustic data procedural analysis based on machine learning methods was developed to automatically detect the Posidonia presence, so that in future works it will be possible to operate also in low-visibility conditions, using only the acoustic sensors. Data acquisition was carried out over different seafloor types in coastal area near Biograd Na Moru (Croatia) and the preliminary results are reported in the paper},
KEYWORDS = {Machine Learning, Posidonia Detection, unmanned marine vehicles},
PAGES = {1-6},
URL = {https://ieeexplore.ieee.org/document/8084721},
DOI = {10.1109/OCEANSE.2017.8084721},
PUBLISHER = {IEEE (New York, USA)},
ISBN = {978-1-5090-5278-3},
CONFERENCE_NAME = {OCEANS 2017-Aberdeen},
CONFERENCE_PLACE = {Aberdeen},
}
@INPROCEEDINGS{GIOVANNETTI_2017_INPROCEEDINGS_GABDD_340694,
AUTHOR = {Giovannetti, E. and Albanesi, D. and Bellandi, A. and Dattilo, D. and Dell'Orletta, F.},
TITLE = {Stylometry in Computer-Assisted Translation: Experiments on the Babylonian Talmud},
YEAR = {2017},
ABSTRACT = {The purpose of this research is to experiment the application of stylometric techniques in the area of Computer-Assisted Translation to reduce the revision effort in the context of a collaborative, large scale translation project. The obtained results show a correlation between the editing extent and the compliance to some specific linguistic features, proving that supporting translators in writing translations following a desired style can actually reduce the number of following necessary interventions (and, consequently, save time) by revisors, editors and curators},
KEYWORDS = {traduco, babylonian talmud, computer-assisted translation, stylometry, readability},
PAGES = {177-182},
URL = {https://iris.cnr.it/handle/20.500.14243/340694},
PUBLISHER = {Accademia University Press (Torino, ITA)},
ISBN = {9788899982942},
CONFERENCE_NAME = {Fourth Italian Conference on Computational Linguistics (CLiC-it)},
CONFERENCE_PLACE = {Torino},
BOOKTITLE = {Proceedings of 4th Italian Conference on Computational Linguistics (CLiC-it)},
EDITOR = {Basili, R. and Nissim, M. and Satta, G.},
}
@INPROCEEDINGS{KHAN_2017_INPROCEEDINGS_KBBM_339933,
AUTHOR = {Khan, F. and Bellandi, A. and Boschetti, F. and Monachini, M.},
TITLE = {The Challenges of Converting Legacy Lexical Resources to Linked Open Data using Ontolex-Lemon: The Case of the Intermediate Liddell-Scott Lexicon},
YEAR = {2017},
ABSTRACT = {In this article we discuss the conversion of a legacy lexical resource, an abridged version of the ancient Greek-English lexicon, the Liddell-Scott-Jones lexicon, into RDF using the lemon model discussing some of the challenges we confronted during this conversion. We will also introduce the polyLemon vocabulary which we introduced to describe the structuring of the senses in a lexical entry in a dictionary},
URL = {https://iris.cnr.it/handle/20.500.14243/339933},
}
@INPROCEEDINGS{KHAN_2017_INPROCEEDINGS_KBF_342012,
AUTHOR = {Khan, F. and Bowers, J. and Frontini, F.},
TITLE = {Situating Word Senses in their Historical Context with Linked Data},
YEAR = {2017},
ABSTRACT = {In this article we present a Semantic Web-based model for creating lexical resources in which the diachronic and, more broadly, contextual dimensions of word meaning can be explicitly represented as part of a graph-based data structure. We start by discussing why Linked Data is the right publishing approach for such diachronic datasets. We then describe our model, lemonEty, which utilizes the ontology engineering technique of perdurants in order to model lexical entries as dynamic processes. Next we go on to explain how to represent etymologies using our model, and in particular how to associate temporal information with word senses, taking examples from two different lexicographic resources. In addition, we will show how our model deals with cognates and attestations},
URL = {https://iris.cnr.it/handle/20.500.14243/342012},
}
@INPROCEEDINGS{LUCENTINI_2017_INPROCEEDINGS_LCCMM_330471,
AUTHOR = {Lucentini, R. and Chiarella, D. and Cutugno, P. and Marconi, L. and Morgavi, G.},
TITLE = {ILCatalogo: a digital archive for theatre cultural heritage},
YEAR = {2017},
ABSTRACT = {In this article the final results of the research project "Digital archive of the artistic heritage of Emanuele Luzzati: the theatre" will be presented. The project, lasting two years, was funded under the Convention between the Region of Liguria and ILC-CNR for "Higher education projects Operational Programme (OP) Regional Competitiveness and Employment (CRO) European Social Fund (ESF) 2007-2013 Liguria Region axis IV Human Capital Specific Objective I / 6" and it ended on April 30th, 2015. The main theme of the research was on the structuring, integration, accessibility and maintenance of archives and the scope of intervention is related to cultural heritage},
URL = {https://iris.cnr.it/handle/20.500.14243/330471},
}
@INPROCEEDINGS{MARCONI_2017_INPROCEEDINGS_MCM_338744,
AUTHOR = {Marconi, L. and Cutugno, P. and Morgavi, G.},
TITLE = {INMIGRACIÓN: ANÁLISIS LINGÜÍSTICO DIACRÓNICO EN COMPOSICIONES DE ALUMNOS DE LA ESCUELA SECUNDARIA},
YEAR = {2017},
ABSTRACT = {ILC-CNR colaboró en "Storia di una Giovinezza diversa", un proyecto de la Onlus Comunità di Sant'Egidio, a través una actividad específica de tipo lingüístico; en esta actividad participaron cuatro escuelas de Génova: dos escuelas secundarias de tipo científico (Cassini y Fermi), una escuela secundaria clásica (Doria) y una escuela secundaria profesional (Bergese). El objetivo general del proyecto de la Onlus fue sensibilizar los estudiantes hacia la cuestión de la inmigración. ILC ha propuesto la creación de un corpus de composiciones de los alumnos llevadas a cabo en dos fases diferentes. En particular, se pidió a los estudiantes de escribir de forma voluntaria una composición sobre el tema de la inmigración. A continuación siguieron encuentros en las escuelas entre los refugiados y los estudiantes participantes al proyecto y, finalmente, se le pidió a los alumnos de volver a escribir otra vez una composición teniendo en cuenta la experiencia hecha. Se recogió un corpus de composiciones (mas de 250.000 palabras); el corpus ha sido completamente lematizado y se llevaron a cabo análisis para la detección de frecuencias en algunas categorías gramaticales. En el estudio hemos querido investigar si y cómo las palabras usadas de los estudiantes en las composiciones había cambiado después de la experiencia hecha. En este artículo vamos a describir algunas análisis lingüísticas y en particular se centrará la atención en los componentes gramaticales de las composiciones escritas con el objetivo de identificar las posibles diferencias de las partes del discurso; además el enfoque será exponer una lista de palabras extraídas de las composiciones entre las más frecuentes que caracterizan el tema de la inmigración con el objetivo de identificar las conexiones semánticas tanto para la primera que para la segunda composición en algunas clases},
URL = {https://iris.cnr.it/handle/20.500.14243/338744},
ISBN = {9789597152378},
}
@INPROCEEDINGS{MORGAVI_2017_INPROCEEDINGS_MMFMCLC_330469,
AUTHOR = {Morgavi, G. and Morando, M. and Ferretti, M. and Marconi, L. and Cutugno, P. and Lucentini, R. and Chiarella, D.},
TITLE = {Active aging: a user centred approach for designing a virtual village network architecture},
YEAR = {2017},
ABSTRACT = {Currently many solutions for domotic housing have been created to provide a better autonomous life for older people and to reduce health and caregiving costs. Unfortunately, assistive technology is often not accepted by old users. This may be due to the technology-oriented approach adopted in designing such systems, which does not consider enough the users' needs. This paper proposes a procedure to design an AAL (Ambient Assisted Living) system to support active aging based on the User-Centred Design approach. A virtual network architecture integrating different solutions have been designed involving final users from the very beginning of the planning stage. The result is a high usable and flexible platform that allows creating user-friendly products as well as services and realizing also high-level functions by integrating data from completely different contexts},
KEYWORDS = {Virtual Village Network, Active aging, Ambient Assisted Living, User-Centred Design Approach},
PAGES = {5},
URL = {https://iris.cnr.it/handle/20.500.14243/330469},
PUBLISHER = {Centro de Lingüística Aplicada, Ministerio de Ciencia, Tecnología y Medio Ambiente (Santiago de Cuba, CUB)},
ISBN = {9789597174325},
CONFERENCE_NAME = {XV° Simposio Internacional de Comunicación Social, Eloína Miyares in memoriam},
CONFERENCE_PLACE = {Santiago de Cuba},
}
@INPROCEEDINGS{MUGELLI_2017_INPROCEEDINGS_MFBB_342010,
AUTHOR = {Mugelli, G. and Fahad Khan, A. and Bellandi, A. and Boschetti, F.},
TITLE = {Designing an Ontology for the Study of Ritual in Ancient Greek Tragedy},
YEAR = {2017},
ABSTRACT = {We examine the use of an ontology within the context of a system for the annotation and querying of ancient Greek tragic texts. This ontology in question results from the reorganisation of a tagset that was originally used in the annotation of a corpus of tragic texts for salient information regarding ritual and religion and its representation in Greek tragedy. In the article we discuss the original tagset as well as providing examples of the annotation. We also describe the structure of the ontology itself as well as its use within a system for querying the annotated corpus},
URL = {https://iris.cnr.it/handle/20.500.14243/342010},
}
@INPROCEEDINGS{PARDELLI_2017_INPROCEEDINGS_PGBRM_353286,
AUTHOR = {Pardelli, G. and Goggi, S. and Bartolini, R. and Russo, I. and Monachini, M.},
TITLE = {A Geographical Visualization of GL Communities: A Snapshot},
YEAR = {2017},
ABSTRACT = {This quotation stresses the important role of the several international organizations in producing and disseminating knowledge in the field of Grey Literature (GL): the paper aims to provide a first snapshot of the geographical distribution of GL organizations and their participation to the annual International Conference on Grey Literature over the time (in the period from 2003 to 2015. See List of Conferences on Table 2). Nowadays a visual representation of data is often associated with the traditional statistical graphs, in particular for representing complex phenomena by means of maps and diagrams, which allow a deeper and more focused analysis of the data. In our case the geographical representation of stakeholders in government, academics, business and industry aims at visualizing the GL community across the globe: it concerns 674 organizations which over the years have contributed to the development of a common vision on the most pressing issues of the field by using new paradigms such as Open Access and the social networks},
KEYWORDS = {Geographical Visualization, Grey Literature Communities},
PAGES = {109-113},
URL = {http://greyguide.isti.cnr.it/wp-content/uploads/2017/04/GL18_Conference_Proceedings.pdf},
PUBLISHER = {TextRelease (Amsterdam, NLD)},
ISSN = {1386-2316},
ISBN = {978-90-77484-30-2},
CONFERENCE_NAME = {Eighteenth International Conference on Grey Literature: Leveraging Diversity in Grey Literature},
CONFERENCE_PLACE = {Amsterdam},
BOOKTITLE = {THE GL-CONFERENCE SERIES. CONFERENCE PROCEEDINGS},
EDITOR = {Farace, D. and Frantzen, J.},
}
@INPROCEEDINGS{PIRRELLI_2017_INPROCEEDINGS_P_358748,
AUTHOR = {Pirrelli, V.},
TITLE = {Co-activation and competition effects in lexical storage and processing},
YEAR = {2017},
ABSTRACT = {According to traditional wisdom in Linguistics, morphologically simple words reside in the mental lexicon, a kind of brain dictionary that contains unpredictable mappings between lexical features. Here I illustrate some of the defining features of an alternative view of the language architecture, where computation and storage are just the short-term and long-term dynamics of the same underlying process. Empirical results of a computational model of this view are reported and general implications for a theory of the lexicon are discussed},
KEYWORDS = {Mental Lexicon, Morphology, Human Language Processing, artificial neural networks, lexical self-organization},
PAGES = {1-21},
URL = {https://picgl4.files.wordpress.com/2015/11/4-paper_1_pirrelli.pdf},
CONFERENCE_NAME = {4th Patras International Conference of Graduate Students in Linguistics},
}
@INPROCEEDINGS{PROIETTI_2017_INPROCEEDINGS_P_411311,
AUTHOR = {Proietti, C.},
TITLE = {Polarization and Bipolar Probabilistic Argumentation Frameworks},
YEAR = {2017},
ABSTRACT = {Discussion among individuals about a given issue often induces polarization and bipolarization effects, i.e. individuals radicalize their initial opinion towards either the same or opposite directions. Experimental psychologists have put forward Persuasive Arguments Theory (PAT) as a clue for explaining polarization. PAT claims that adding novel and persuasive arguments pro or contra the debated issue is the major cause for polarization. Recent developments in abstract argumentation provide the tools for capturing these intuitions on a formal basis. Here Bipolar Argumentation Frameworks (BAF) are employed as a tool for encoding the information of agents in a debate relative to a given issue a. A probabilistic extension of BAF allows to encode the likelihood of the opinions pro or contra a before and after information exchange. It is shown, by a straightforward example, how these measures provide the basis to capture the intuitions of PAT},
KEYWORDS = {bipolar argumentation frameworks, group polarization},
PAGES = {22-27},
URL = {http://ceur-ws.org/},
VOLUME = {2012},
PUBLISHER = {CEUR-WS.org (Aachen, DEU)},
CONFERENCE_NAME = {AI*IA 2017},
CONFERENCE_PLACE = {Aachen},
}
@INPROCEEDINGS{PROIETTI_2017_INPROCEEDINGS_P_411308,
AUTHOR = {Proietti, C.},
TITLE = {The Dynamics of Group Polarization},
YEAR = {2017},
ABSTRACT = {Exchange of arguments in a discussion often makes individuals more radical about their initial opinion. This phenomenon is known as Group-induced Attitude Polarization. A byproduct of it are bipolarization effects, where the distance between the attitudes of two groups of individuals increases after the discussion. This paper is a first attempt to analyse the building blocks of information exchange and information update that induce polarization. I use Argumentation Frameworks as a tool for encoding the information of agents in a debate relative to a given issue a. I then adapt a specific measure of the degree of acceptability of an opinion (Matt and Toni 2008). Changes in the degree of acceptability of a, prior and posterior to information exchange, serve here as an indicator of polarization. I finally show that the way agents transmit and update information has a decisive impact on polarization and bipolarization},
KEYWORDS = {group polarization, argumentation frameworks, abstract argumentation},
PAGES = {195-208},
URL = {https://link.springer.com/book/10.1007/978-3-662-55665-8},
VOLUME = {10445},
DOI = {10.1007/978-3-662-55665-8_14},
PUBLISHER = {Springer (Cham, Heidelberg, New York, Dordrecht, London, CHE)},
ISBN = {9783662556658},
CONFERENCE_NAME = {Logic, Rationality and Interaction 2017 (LORI 2017)},
CONFERENCE_PLACE = {Cham, Heidelberg, New York, Dordrecht, London},
}
@INPROCEEDINGS{PROIETTI_2017_INPROCEEDINGS_PC_459222,
AUTHOR = {Proietti, C.},
TITLE = {The Dynamics of Group Polarization},
YEAR = {2017},
ABSTRACT = {Exchange of arguments in a discussion often makes individuals more radical about their initial opinion. This phenomenon is known as Group-induced Attitude Polarization. A byproduct of it are bipolarization effects, where the distance between the attitudes of two groups of individuals increases after the discussion. This paper is a first attempt to analyse the building blocks of information exchange and information update that induce polarization. I use Argumentation Frameworks as a tool for encoding the information of agents in a debate relative to a given issue a. I then adapt a specific measure of the degree of acceptability of an opinion (Matt and Toni 2008). Changes in the degree of acceptability of a, prior and posterior to information exchange, serve here as an indicator of polarization. I finally show that the way agents transmit and update information has a decisive impact on polarization and bipolarization},
URL = {https://iris.cnr.it/handle/20.500.14243/459222},
DOI = {10.1007/978-3-662-55665-8_14},
ISBN = {978-3-662-55664-1},
}
@INPROCEEDINGS{SASSOLINI_2017_INPROCEEDINGS_SCC_335238,
AUTHOR = {Sassolini, E. and Cucurullo, S. and Cinini, A.},
TITLE = {I corpora digitali: dall'obsolescenza tecnologica, alla salvaguardia e alla condivisione},
YEAR = {2017},
ABSTRACT = {Studio e implementazione di un protocollo di recupero, conservazione e valorizzazione di testi e corpora digitali interessati da problemi di obsolescenza tecnologica. Le strategie di salvaguardia adottate si spingono oltre il salvataggio dei testi e la conservazione in un formato di rappresentazione in linea con gli standard internazionali (XML TEI), si pongono come obiettivo la valorizzazione di questo patrimonio attraverso nuove modalità di fruizione dei contenuti. Lo scopo è affiancare le funzionalità classiche di analisi testuale, che da sempre caratterizzano le nostre attività di ricerca, a nuove modalità grafiche e visuali di fruizione dei dati e, in alcuni casi, migrare verso dispositivi mobili e tecnologie App. In questo articolo, oltre al protocollo di recupero, presentiamo due sperimentazioni di valorizzazione di contenuti testuali. Nel primo caso proponiamo tecniche di visual analytics applicate ad un corpus testuale semi strutturato riguardante corrispondenza redatta in lingua italiana del 1600. Nel secondo caso abbiamo realizzato un'applicazione per sistema Android finalizzata all'interrogazione di dati testuali relativi ad un progetto di censimento di architetture moderne della regione Liguria},
KEYWORDS = {Testi digitali, Analisi testuale, Preservazione dei dati, Diffusione dei risultati},
PAGES = {31-35},
URL = {https://www.garr.it/it/documenti/3529-conferenza-2016-selected-papers-sassolini-et-al/file},
DOI = {10.26314/GARR-Conf16-proceeedings-06},
PUBLISHER = {Consortium GARR (Roma, ITA)},
ISBN = {978-88-905077-6-2},
CONFERENCE_NAME = {Conferenza GARR 2016-The CreActive Network},
CONFERENCE_PLACE = {Roma},
}
@INPROCEEDINGS{VADICAMO_2017_INPROCEEDINGS_VCFCDCT_340636,
AUTHOR = {Vadicamo, L. and Carrara, F. and Falchi, F. and Cimino, A. and Dell'Orletta, F. and Cresci, S. and Tesconi, M.},
TITLE = {Cross-media learning for image sentiment analysis in the wild},
YEAR = {2017},
ABSTRACT = {Much progress has been made in the field of sentiment analysis in the past years. Researchers relied on textual data for this task, while only recently they have started investigating approaches to predict sentiments from multimedia content. With the increasing amount of data shared on social media, there is also a rapidly growing interest in approaches that work "in the wild", i.e. that are able to deal with uncontrolled conditions. In this work, we faced the challenge of training a visual sentiment classifier starting from a large set of user-generated and unlabeled contents. In particular, we collected more than 3 million tweets containing both text and images, and we leveraged on the sentiment polarity of the textual contents to train a visual sentiment classifier. To the best of our knowledge, this is the first time that a cross-media learning approach is proposed and tested in this context. We assessed the validity of our model by conducting comparative studies and evaluations on a benchmark for visual sentiment analysis. Our empirical study shows that although the text associated to each image is often noisy and weakly correlated with the image content, it can be profitably exploited to train a deep Convolutional Neural Network that effectively predicts the sentiment polarity of previously unseen images},
KEYWORDS = {Big data, Data Mining, Sentiment Analysis, Social Media Analysis},
PAGES = {10},
URL = {https://ieeexplore.ieee.org/document/8265255},
DOI = {10.1109/ICCVW.2017.45},
ISBN = {978-1-5386-1034-3},
CONFERENCE_NAME = {ICCV 2017 IEEE International Conference on Computer Vision Workshops},
}
@INPROCEEDINGS{BARTOLINI_2017_INPROCEEDINGS_BGPRF_334111,
AUTHOR = {Bartolini, R. and Goggi, S. and Pardelli, G. and Russo, I. and Farace, D. and Frantzen, J.},
TITLE = {Data Visualization of a Grey Literature Community: A Cooperative Project},
YEAR = {2017},
ABSTRACT = {The expected outcome of this project will not only produce a revised and updated publication of International Directory of Organizations in Grey Literature, IDGL, but will also provide a visual overview of GreyNet as an international organization serving diverse communities with shared interests in grey literature. It would be a demonstration of GreyNet's commitment to research, publication, open access, education, and public awareness in this field of library and information science},
KEYWORDS = {International Directory of Organizations in Grey Literature, Data Visualization},
PAGES = {63-63},
URL = {https://iris.cnr.it/handle/20.500.14243/334111},
ISBN = {978-90-77484-32-6},
CONFERENCE_NAME = {Nineteenth International Conference on Grey Literature, GL19},
BOOKTITLE = {Nineteenth International Conference on Grey Literature Public Awareness and Access to Grey Literature. Program Book},
EDITOR = {Farace, D. and Frantzen, J.},
}
@INPROCEEDINGS{BELLANDI_2017_INPROCEEDINGS_BBFDM_331756,
AUTHOR = {Bellandi, A. and Boschetti, F. and Fahad Khan, A. and Del Grosso, A. M. and Monachini, M.},
TITLE = {Provando e riprovando modelli di dizionario storico digitale: collegare voci, citazioni, interpretazioni},
YEAR = {2017},
ABSTRACT = {Il dizionario storico è il luogo d'incontro privilegiato di linguistica e lessicografia e filologia e critica letteraria. Nella prima parte prendiamo in considerazione un caso di studio piuttosto noto, relativo all'espressione "provando e riprovando", per mostrare come perfino i luoghi citati nei dizionari, che sono introdotti con lo scopo di disambiguare i termini in contesto, non siano privi di controversie interpretative. Nella seconda parte, molto più dettagliata e più tecnica, tentiamo di aggiungere ai modelli lessicali e citazionali già esistenti ed aperti soluzioni minime che ci permettano di collegare voci, citazioni e interpretazioni all'interno dell'universo dei Linked Open Data},
KEYWORDS = {Linked Open Data LOD},
PAGES = {119-125},
URL = {http://aiucd2017.aiucd.it/wp-content/uploads/2017/01/book-of-abstract-AIUCD-2017.pdf},
CONFERENCE_NAME = {AIUCD 2017 Conference \& 3rd EADH Day},
BOOKTITLE = {AIUCD 2017 Conference},
}
@INPROCEEDINGS{BOMPOLAS_2017_INPROCEEDINGS_BMFCPR_327030,
AUTHOR = {Bompolas, S. and Marzi, C. and Ferro, M. and Cardillo, F. A. and Pirrelli, V. and Ralli, A.},
TITLE = {Transparency and predictability in Modern Greek conjugation: Implications for models of word processing},
YEAR = {2017},
ABSTRACT = {We argue that the Greek evidence calls for a substantial revision of the clear-cut interaction between transparency/predictability and regularity, to make room for a more process-oriented notion of regularity. According to this view, regularity is no longer an epiphenomenon of the design of the human language faculty and the purported dualism between rule-based and memory-based routes, but the graded result of the varying interaction of several structural factors concurrently affecting the human word processor},
KEYWORDS = {Inflectional regularity, Word Processing, Modern Greek Conjugation},
PAGES = {17-19},
URL = {http://www.lilec.it/mmm/wp/wp-content/uploads/2017/02/Book-of-abstracts_MMM11_Final.pdf},
CONFERENCE_NAME = {MMM 11: 11th Mediterranean Morphology Meeting},
BOOKTITLE = {Proceedings of the 11th Mediterranean Morphology Meeting},
}
@INPROCEEDINGS{DELGROSSO_2017_INPROCEEDINGS_DGM_339001,
AUTHOR = {Del Grosso, A. M. and Giovannetti, E. and Marchi, S.},
TITLE = {Il modello a microkernel di Omega nello sviluppo di strumenti per lo studio dei testi: dagli ADT alle API},
YEAR = {2017},
KEYWORDS = {microkernel, studio del testo, Omega, ADT, API},
PAGES = {199-205},
URL = {https://iris.cnr.it/handle/20.500.14243/339001},
ISBN = {978-88-942535-1-1},
CONFERENCE_NAME = {AIUCD 2017 Conference},
}
@INPROCEEDINGS{GOGGI_2017_INPROCEEDINGS_GPRBM_334108,
AUTHOR = {Goggi, S. and Pardelli, G. and Russo, I. and Bartolini, R. and Monachini, M.},
TITLE = {Providing Access to Grey Literature: The CLARIN Infrastructure},
YEAR = {2017},
ABSTRACT = {This work will provide a map of the documentation archived in the CLARIN infrastructure, whose purpose is to share language resources produced and managed in the various European countries but finally merged into the CLARIN data centers for allowing access, interoperability, reuse and preservation of scientific documentation as well as Grey Literature},
KEYWORDS = {CLARIN ERIC, Terminological Resources, Grey Literature},
PAGES = {60-62},
URL = {https://iris.cnr.it/handle/20.500.14243/334108},
ISBN = {978-90-77484-32-6},
CONFERENCE_NAME = {Nineteenth International Conference on Grey Literature, GL19},
BOOKTITLE = {Nineteenth International Conference on Grey Literature Public Awareness and Access to Grey Literature. Program Book},
EDITOR = {Farace, D. and Frantzen, J.},
}
@INPROCEEDINGS{MONACHINI_2017_INPROCEEDINGS_MNS_330360,
AUTHOR = {Monachini, M. and Nicolosi, A. and Stefanini, A.},
TITLE = {Digital Classics: A Survey of the Needs of Ancient Greek Scholars in Italy},
YEAR = {2017},
ABSTRACT = {This paper presents and discusses the findings of a survey carried out in order to assess the use of digital resources and digital technologies with respect to work in Ancient Greek scholarship, as well as to identify the factors that are likely to constrain its use and to elicit needs and requirements of Ancient Greek scholars in Italy. The survey is in line with the principles behind the recent user engagement strategy developed by CLARIN-ERIC and constitutes one of the national efforts undertaken by CLARIN-IT to contribute to the wider impact of CLARIN on Digital Classicists},
KEYWORDS = {CLARIN-ERIC, CLARIN-IT, CLARIN on Digital Classicists},
PAGES = {5},
URL = {https://www.clarin.eu/event/2017/clarin-annual-conference-2017-budapest-hungary},
CONFERENCE_NAME = {CLARIN Annual Conference 2017},
}
@INPROCEEDINGS{NICOLAS_2017_INPROCEEDINGS_NKMDCAEBQ_330362,
AUTHOR = {Nicolas, L. and Konig, A. and Monachini, M. and Del Gratta, R. and Calamai, S. and Abel, A. and Enea, A. and Biliotti, F. and Quochi, V.},
TITLE = {CLARIN-IT: State of Affairs, Challenges and Opportunities},
YEAR = {2017},
ABSTRACT = {This paper provides an overview on the Italian national CLARIN consortium and the status of CLARIN-IT in general. It thus discusses the current state of affairs of the consortium and provides information on the members, especially with regards to what they offer to CLARIN in terms of resources, services and expertise, and what CLARIN offers them to further their own research},
KEYWORDS = {Italian CLARIN consortium, CLARIN-IT},
PAGES = {4},
URL = {https://www.clarin.eu/event/2017/clarin-annual-conference-2017-budapest-hungary},
CONFERENCE_NAME = {CLARIN Annual Conference 2017},
}
@INPROCEEDINGS{PARDELLI_2017_INPROCEEDINGS_PGBD_331741,
AUTHOR = {Pardelli, G. and Giannini, S. and Boschetti, F. and Del Gratta, R.},
TITLE = {AIUCD e CLiC-it: citazioni bibliografiche a confronto},
YEAR = {2017},
ABSTRACT = {Il lavoro propone l'analisi e il confronto dei riferimenti bibliografici delle cinque edizioni annuali della Conferenza dell'Associazione per l'Informatica Umanistica e la Cultura Digitale (AIUCD) e del primo biennio (2014-2015) della Conferenza Italiana di Linguistica Computazionale (CLiC-it) per misurare la direzione in cui si muove il trend citazionale. L'analisi muove dal principio di rilevanza della citazione nella trasmissione della conoscenza in un periodo di grandi cambiamenti socioculturali e di importanti evoluzioni nelle modalità di produzione e diffusione dei risultati della ricerca scientifica. Lo scopo dello studio è quello di misurare la gamma delle risorse citate in questa area del sapere mediante l'uso di indicatori volti a comprendere la loro ampiezza, l'estensione temporale, la varietà, le relazioni con il mondo editoriale e i modelli di riferimento. L'osservazione dei risultati consente di classificare i documenti citati, di descriverne le caratteristiche e di valutare eventuali trasformazioni rispetto alle modalità di citazione tradizionali.-The paper suggests the analysis of the bibliographic references-enclosed in the proceedings of the Italian Conference on Computational Linguistics-CLICit in 2014-2015 biennium and of five AIUCD Conference editions 2012-2016. The analysis moves from the principle of relevance of citation in the transmission of knowledge in a period of great socio-cultural changes and important developments in the production and dissemination of the results in the scientific research. The purpose of the study is to measure the range of resources cited in this area of knowledge by the use of indicators aimed in understanding their wideness, the time extension, the variety, the relations with the publishing world and the reference models. The observation of the results allows to classify the cited document, to describe its characteristics and to assess any changes compared to the traditional citation mode},
KEYWORDS = {Corpus bibliografico, Analisi di metadati},
PAGES = {38-50},
URL = {http://aiucd2017.aiucd.it/wp-content/uploads/2017/01/book-of-abstract-AIUCD-2017.pdf},
CONFERENCE_NAME = {AIUCD 2017 Conference \& 3rd EADH Day},
BOOKTITLE = {AIUCD 2017 Conference},
}
@INPROCEEDINGS{PIRRELLI_2017_INPROCEEDINGS_PMFC_327022,
AUTHOR = {Pirrelli, V. and Marzi, C. and Ferro, M. and Cardillo, F. A.},
TITLE = {Paradigm Relative Entropy and Discriminative Learning},
YEAR = {2017},
ABSTRACT = {In the present contribution, we show that principles of discriminative learning of symbolic time series go a long way in accounting for these effects, thus making an important contribution to our understanding of the human lexical processor and its sensitivity to word distributions both within and across paradigms},
KEYWORDS = {Paradigm Entropy, Discriminative Learning, Mental Lexicon, Verb Inflection},
PAGES = {5},
URL = {http://w3.erss.univ-tlse2.fr/ParadigMo2017/program.html},
CONFERENCE_NAME = {ParadigMo 2017: First Workshop on Paradigmatic Word Formation Modeling},
BOOKTITLE = {Book of Abstract of the ParadigMo Workshop},
}
@INPROCEEDINGS{PIRRELLI_2017_INPROCEEDINGS_PV_327041,
AUTHOR = {Pirrelli, V.},
TITLE = {Storage vs. Processing in Models of Word Inflection. A Neuro-computational Hebbian Perspective},
YEAR = {2017},
ABSTRACT = {The advent of connectionism in the 80's popularised the idea that the lexical processor consists of a network of parallel processing units selectively firing in response to sensory stimuli. In the light of these assumptions, the most important contribution of connectionism to the theoretical debate on lexical modelling at the time was the utter rejection of the widely accepted idea that word recognition and production require a dichotomous choice between storage and processing. However, in spite of the prima facie psycho-computational allure of this view of the lexicon, early connectionist models also embraced a number of unsatisfactory assumptions about word learning and processing. More recently, a growing number of approaches to inflection in both Psycholinguistics and Theoretical Linguistics developed the view that surface word relations represent a fundamental domain of morphological competence. Learning the morphology of a language amounts to acquiring relations between fully stored lexical forms, which are concurrently available in the speaker's mental lexicon and jointly facilitate processing of morphologically related forms through patterns of emergent self-organisation. This novel view presupposes an integrative language architecture, where storage and processing, far from being conceived of as insulated and poorly interacting modules, are the short-term and the long-term dynamics of the same underlying process of adaptive specialisation of synaptic connections. This view, upheld by recent evidence of the neuro-anatomical bases of short-term and long-term memory processes, crucially hinges on Hebbian principles of synaptic plasticity, which are, in turn, in keeping with mathematical models of discriminative learning. 
I contend that integrative computer models of Hebbian language learning represent an exciting way forward in current neuro-computational research on word processing, and a persistently fertile legacy of the connectionist revolution},
KEYWORDS = {Hebbian Learning, Recurrent Neural Networks, Word Inflection},
PAGES = {19-19},
URL = {https://indico.sissa.it/event/12/abstract-book.pdf},
CONFERENCE_NAME = {International Morphological Processing Conference (MoProc)},
}
@INPROCEEDINGS{RUSSO_2017_INPROCEEDINGS_RS_337274,
AUTHOR = {Russo, I. and Soria, C.},
TITLE = {Digital Language Diversity on New Media: the DLDP Survey about European Minority Languages Speakers},
YEAR = {2017},
ABSTRACT = {How does the linguistic diversity of Europe reflect in the New Media? Do regional and minority languages contribute to EU digital language diversity? In this paper we will present the results of the first survey about actual needs of European minority languages speakers regarding digital opportunities. The survey is part of the work carried out by the Digital Language Diversity Project (DLDP), a three-year Erasmus project started in September 2015. The goal of DLDP is helping minority languages speakers in the acquisition of intellectual and practical skills to create, share, and reuse online digital content, at the same time defining general guidelines and best practices for the promotion of minority languages with poor digital representation, a fact that further prevents their usability on digital media and devices. The focus of the project is on four European minority languages at different stages of digital developments (Basque, Breton, Karelian and Sardinian), and this will enable a comparison about the role of the availability of digital content for promotion of digital usage of these languages and development of language-based digital applications. With the aim of understanding the specific needs and the peculiar behaviours of speakers of these languages, during Spring 2016 we conducted a survey focused on gathering information about their personal digital use of the language and about any known digital resource and services that make use of the language. We received feedback from almost 2000 speakers and we are now in the position of analysing results for future actions. In particular, taking into account media user typology elaborated by Brandtzæg (2010) (e.g. entertainment, instrumental and advanced users) we aim to profile speakers' answers according to these different classes, in order to better understand how to make speakers aware of the opportunities new media offer for preservation and revitalisation of minority languages},
KEYWORDS = {minority languages, regional languages, new media, digital language diversity, digital language development},
URL = {https://minoritylanguagesnewmedia2017.files.wordpress.com/2017/03/final_abstracts-baal-cup-seminar-on-minority-languages-in-new-media.pdf},
CONFERENCE_NAME = {BAAL-Cambridge University Press Seminar on Minority Languages in New Media},
}
@INPROCEEDINGS{SASSOLINI_2017_INPROCEEDINGS_SC_335262,
AUTHOR = {Sassolini, E. and Cinini, A.},
TITLE = {Approcci grafici all'analisi di corpora testuali},
YEAR = {2017},
ABSTRACT = {sperimentazioni finalizzate a combinare tecniche di "distant reading" e funzionalità classiche di Information Retrieval (IR) su dati testuali. Incrementare con sintesi grafiche e visuali l'offerta di strumenti di studio e di analisi dei dati testuali rappresenta una nuova frontiera del nostro ambito di ricerca consueto},
KEYWORDS = {analisi testuale, distant reading, visual analytics},
PAGES = {83-86},
URL = {http://aiucd2017.aiucd.it/wp-content/uploads/2017/01/book-of-abstract-AIUCD-2017.pdf},
CONFERENCE_NAME = {AIUCD 2017 Conference},
}
@INPROCEEDINGS{SORIA_2017_INPROCEEDINGS_S_337251,
AUTHOR = {Soria, C.},
TITLE = {The digital language vitality scale: a model for assessing digital vitality of languages},
YEAR = {2017},
ABSTRACT = {In this paper, we present the Digital Language Vitality Scale, a tool for measuring the degree of digital vitality of languages. Digital vitality can be defined as the extent to which a language is present, used and usable over the Internet through digital devices. The scale is inspired to ethnolinguistic vitality assessment (such as GIDS, Fishman 2001), updated by (Lewis and Simons 2010) as EGIDS, and the UNESCO "nine factors" (UNESCO 2003), and is based on previous work in this area such as (Kornai 2013) and (Gibson 2015). Seven levels of digital vitality are identified, from "pre-digital" to "digitally thriving", and a set of associated indicators. The indicators associated with the scale are proxies representing both digital representation (presence) of a language and digital use. They are clustered into three groups: a first group of indicators refers to digital usability of a language, for instance, the existence of Internet connection or the availability of standardised fonts for writing the language. A second group of indicators is related to the quality and amount of digital use of a language: if and how much a language is used for texting and emailing, on websites, blogs, if there are e-books, Wikipedias, if the language is used on social media. The last group of indicators correlates with the digital prestige of a language; they are a sign of a language that not only is used on digital media and devices, but it is so in a full-fledged way, enjoying the widest possible ranges of uses and applications (e.g. localised digital services, machine translation, edu-tainment products and services). The scale is currently being used in the context of the DLDP project (http://www.dldp.eu) as an assessing instrument for digital language planning, with particular reference to regional and minority languages},
KEYWORDS = {digital vitality, language vitality, digital language diversity},
PAGES = {100-100},
URL = {https://icriml.indiana.edu/conference-program/Abstractbook.pdf},
CONFERENCE_NAME = {First International Conference on Revitalization of Indigenous and Minoritized Languages},
}
@TECHREPORT{ALBANESI_2017_TECHREPORT_ABGP_350499,
AUTHOR = {Albanesi, D. and Bellandi, A. and Giovannetti, E. and Pecchioli, A.},
TITLE = {Applicazione Web Linguistico-Computazionale per il Progetto di Traduzione del Talmud Babilonese-Rapporto tecnico 11},
YEAR = {2017},
ABSTRACT = {Il presente documento descrive lo stato di avanzamento del lavoro condotto dall'Istituto di Linguistica Computazionale "A. Zampolli" del CNR (ILC-CNR) nel contesto del Progetto Traduzione Talmud Babilonese in italiano nei mesi di novembre, dicembre 2016 e gennaio, febbraio 2017. Quanto qui descritto costituisce un "Rapporto sullo Stato di Avanzamento dei Lavori (SAL) dell'applicazione Web" unicamente da parte dell'ILC-CNR e si configura come l'undicesimo dei fascicoli previsti a cadenza quadrimestrale},
URL = {https://iris.cnr.it/handle/20.500.14243/350499},
}
@TECHREPORT{ALBANESI_2017_TECHREPORT_ABGPM_350502,
AUTHOR = {Albanesi, D. and Bellandi, A. and Giovannetti, E. and Pecchioli, A. and Marchi, S.},
TITLE = {Applicazione Web Linguistico-Computazionale per il Progetto di Traduzione del Talmud Babilonese-Rapporto tecnico 12},
YEAR = {2017},
ABSTRACT = {Il presente documento descrive lo stato di avanzamento del lavoro condotto dall'Istituto di Linguistica Computazionale "A. Zampolli" del CNR (ILC-CNR) nel contesto del Progetto Traduzione Talmud Babilonese in italiano nei mesi di marzo, aprile, maggio e giugno 2017. Quanto qui descritto costituisce un "Rapporto sullo Stato di Avanzamento dei Lavori (SAL) dell'applicazione Web" unicamente da parte dell'ILC-CNR e si configura come il dodicesimo dei fascicoli previsti a cadenza quadrimestrale},
URL = {https://iris.cnr.it/handle/20.500.14243/350502},
}
@TECHREPORT{CARLINO_2017_TECHREPORT_C_459249,
AUTHOR = {Carlino, M.},
TITLE = {Rapporto annuale 2016 del CNR-ILC},
YEAR = {2017},
ABSTRACT = {CNR-ILC Activity Report 2016},
KEYWORDS = {Activity report, Annual Report, Istituto di Linguistica Computazionale, CNR-ILC, Rapporto Annuale},
PAGES = {1-54},
URL = {https://iris.cnr.it/handle/20.500.14243/459249},
}
@TECHREPORT{CININI_2017_TECHREPORT_CCS_373360,
AUTHOR = {Cinini, A. and Cucurullo, S. and Sassolini, E.},
TITLE = {Rapporto Tecnico: Standardizzazione del corpus testuale del PRIN Crusca},
YEAR = {2017},
ABSTRACT = {Attività previste nella convenzione operativa tra ILC-CNR e Accademia della Crusca che riguardano la progettazione e lo sviluppo di una piattaforma Web modulare per l'archiviazione, la gestione e l'interrogazione di corpora testuali in lingua italiana, con funzionalità derivate dal DBT (Data Base Testuale) nelle sue diverse implementazioni. Il lavoro preliminare svolto riguarda anche la normalizzazione dei testi e la conversione nello standard di rappresentazione XML TEI},
KEYWORDS = {Codifica dei testi, Analisi testuale, formato XML TEI},
PAGES = {1-21},
URL = {https://iris.cnr.it/handle/20.500.14243/373360},
}
@TECHREPORT{FERRETTI_2017_TECHREPORT_FM_332833,
AUTHOR = {Ferretti, M. and Morgavi, G.},
TITLE = {Analisi delle caratteristiche accettabili per un robot di supporto agli anziani},
YEAR = {2017},
ABSTRACT = {Il lavoro analizza i dati raccolti, nell'ambito di tirocinio post laurea magistrale, attraverso la somministrazione di 25 schede ad un campione di 153 persone over sessantacinque anni. Le schede, contenenti ciascuna due o tre fotografie di uno stesso robot, sono state realizzate scegliendo immagini a colori, in cui possibilmente fossero presenti elementi (persone o oggetti di dimensione nota) che permettessero all'osservatore di arguire informazioni sulle dimensioni e le funzioni possibili del robot. Obiettivo dell'indagine era quello di valutare le caratteristiche che rendono un robot di servizio per l'anziano accettabile ed utilizzabile, al fine di comprendere le peculiarità che dovrebbe avere un tale dispositivo per essere realmente utilizzato in un contesto domestico con una persona anziana},
KEYWORDS = {Active Aging, ICT for elderly, Intervista strutturata},
PAGES = {1-39},
URL = {https://iris.cnr.it/handle/20.500.14243/332833},
}
@TECHREPORT{ROMARY_2017_TECHREPORT_RV_342709,
AUTHOR = {Romary, L. and {Van Nispen} and Ogrodniczuk, M. and Papadakis, N. and Pastore, G. and Pernes, S. and Puren, M. and Riondet, C. and Sanz, M. and Sanesi, M. and Siozos, P. and De Valk, R. and others},
TITLE = {Report on Standardization (draft)},
YEAR = {2017},
ABSTRACT = {The present report reflects the second stage of the definition of the Standardisation Survival Kit (SSK) within Work Package 4 of the PARTHENOS project. On the basis of the various user scenarios presented in Deliverable 4.1, where each stage of the research process has been annotated according to the actual standards that are actually needed in order to fulfil the research task, we present here a systematic review of the activities that have to be carried out to provide support to researchers in using, but also contributing to, these standards},
URL = {https://iris.cnr.it/handle/20.500.14243/342709},
}
@TECHREPORT{RUSSO_2017_TECHREPORT_RS_334736,
AUTHOR = {Russo, I. and Soria, C.},
TITLE = {Sardinian-a digital language?},
YEAR = {2017},
ABSTRACT = {In this report we present the results of the first survey about the actual needs of Sardinian speakers in terms of digital opportunities},
KEYWORDS = {digital use, digital language diversity, Sardinian},
URL = {http://www.dldp.eu/sites/default/files/documents/DLDP_Sardinian-Report.pdf},
}
@TECHREPORT{SASSOLINI_2017_TECHREPORT_SC_371867,
AUTHOR = {Sassolini, E. and Cinini, A.},
TITLE = {DIGESTO: NUOVE FUNZIONALITÀ E SITO WEB},
YEAR = {2017},
ABSTRACT = {Realizzazione di un nuovo sito web per la consultazione dei testi bilingui, con sviluppo di nuove funzionalità di ricerca, non più solo per parola ma anche per Titolo, Frammento o Paragrafo. Realizzazione di una versione PDF scaricabile di parti ragionate dell'intero corpus},
KEYWORDS = {testi paralleli, sito web, analisi testuale, visual analytics},
PAGES = {1-12},
URL = {https://iris.cnr.it/handle/20.500.14243/371867},
}
@MISC{ALBANESI_2017_MISC_ABBCDGCP_404165,
AUTHOR = {Albanesi, D. and Bellandi, A. and Bulleri, F. and Carniani, E. and Dattilo, D. and Giovannetti, E. and Colombo, M. and Papini, M.},
TITLE = {Traduco},
YEAR = {2017},
ABSTRACT = {il Progetto Traduzione del Talmud Babilonese ha permesso di allestire una "officina digitale" specializzata nella traduzione di testi di particolare complessità interpretativa, quali, appunto, il Talmud Babilonese. Per la realizzazione della complessa opera di traduzione è stata costituita una équipe multidisciplinare che ha coinvolto traduttori, revisori di contenuto, redattori, curatori e grafici che, attraverso la piattaforma digitale Traduco hanno potuto lavorare congiuntamente sul testo da diversi luoghi del mondo. Traduco è uno strumento web collaborativo per la traduzione assistita di testi, per lo sviluppo del quale sono state condotte ricerche specifiche, sia nell'ambito dell'Ingegneria del Software che in quello della Linguistica Computazionale. Attraverso il lavoro di ricerca, è stato possibile mettere a punto un ambiente "intelligente" di supporto alla traduzione con caratteristiche innovative. Traduco ha consentito, come side effect positivo del processo vero e proprio di traduzione, di produrre innovazione tecnologica e scientifica},
KEYWORDS = {traduzione collaborativa, traduzione assistita dal calcolatore, linguistica computazionale, traduco, talmud babilonese},
URL = {https://iris.cnr.it/handle/20.500.14243/404165},
}
@MISC{BELLANDI_2017_MISC_B_350510,
AUTHOR = {Bellandi, A.},
TITLE = {Lexique de la Terminologie Saussurienne: Interface d'Interrogation},
YEAR = {2017},
ABSTRACT = {One of the aims of the project was the creation of an electronic thesaurus-lexicon of Saussure's linguistic terminology. Such a lexicon, based on a multidimensional structuring of the domain specific concepts and that offers a highly structured, rich and explicit semantic representation, allows a scholar to browse and query the lexical data-be it a semantic relation, a semantic feature, a lexical unit, or any combination. The different typologies of queries enable to acquire a deeper understanding of the componential and relational nature of meaning},
URL = {https://iris.cnr.it/handle/20.500.14243/350510},
}
@MISC{BELLANDI_2017_MISC_BKB_350512,
AUTHOR = {Bellandi, A. and Khan, F. and Boschetti, F.},
TITLE = {Linked Data Version of the Intermediate Greek English Lexicon},
YEAR = {2017},
ABSTRACT = {A linked data version of the intermediate greek english lexicon by Liddell-Scott-Jones encoded using the ontolex-lemon vocabulary},
URL = {https://iris.cnr.it/handle/20.500.14243/350512},
}
@MISC{CARRARA_2017_MISC_CCCDFVT_411838,
AUTHOR = {Carrara, F. and Cimino, A. and Cresci, S. and Dell'Orletta, F. and Falchi, F. and Vadicamo, L. and Tesconi, M.},
TITLE = {T4SA: Twitter for Sentiment Analysis},
YEAR = {2017},
ABSTRACT = {T4SA is intended for training and testing image sentiment analysis approaches. It contains little less than a million tweets, corresponding to about 1.5M images. We initially collected about 3.4M tweets corresponding to about 4M images. We classified the sentiment polarity of the texts (as described in Section 4) and we selected the tweets having the most confident textual sentiment predictions to build our Twitter for Sentiment Analysis (T4SA) dataset. The dataset is publicly available at: http://www.t4sa.it/},
KEYWORDS = {social media, sentiment analysis, image analysis, image sentiment analysis, deep learning, multimedia sentiment analysis, dataset, tweets},
URL = {http://www.t4sa.it/},
}
@MISC{DELGRATTA_2017_MISC_D_336808,
AUTHOR = {Del Gratta, R.},
TITLE = {(Re)Using OpeNER and PANACEA Web Services in the CLARIN Research Infrastructure},
YEAR = {2017},
ABSTRACT = {We describe the implications of (re)using the OpeNer and PANACEA Web Services into the CLARIN Research Infrastructure. The analyzed tools are of great interest for specific communities such as academic and small business focused on sentiment/opinion analysis and on Machine Translation along with related technologies, but their outcomes may be of great importance for the CLARIN audience as well. In fact, the Virtual Language Observatory shows a lot of lexical resources for sentiment but a few tool, while a lot of lexical resources and tools are available for Machine Translation. This means that the latter community is already in CLARIN, while the former should be poked. If community-related challenges are on the political side, issues related to interoperability are definitely on the technical one. The initiative is carried out at the ILC4CLARIN center in Pisa, the leading one of the CLARIN-IT national Consortium. The least common multiple between those two projects is neither limited to tools and Web Services nor to the creation of annotated corpora and lexicons; neither to the focus they have on specific communities. They also are based on (and strongly pursue and suggest) the concept of interoperability. This is clear from the use of the Kyoto Annotation Format in OpeNer, of Graph Annotation Format in PANACEA and of the Lexical Markup Framework in both. Data and tools interoperability is also a key asset in both CLARIN (https://www.clarin.eu/event/2017/clarin-workshop-towards-interoperability-lexico-semantic-resources) and EUDAT (https://eudat.eu/communities/an-eudat-based-fair-data-approach-for-data-interoperability). Within CLARIN, initiatives such as the Language Resource Switchboard and openly go towards methodologies and "systems" to address the interoperability issues. From a technical point of view the main issues are briefly reported below: 1. Many tools in OpeNer and PANACEA are command line ones; 2. 
OpeNer offers both POST and GET API; 3. PANACEA built its Web Services using Soaplab and offers SOAP Web Services; 4. KAF, LMF and GrAF guarantee the interoperability among data and services; 5. Simple pipelines are available in OpeNer, while a workflow engine has been used in PANACEA. Tools are already wrapped, but to fully meet the requirements of both LRS and WebLicht we have to build a new shell around the command line tools so that REST APIs can accept both POST and GET requests and accept/produce different formats. Indeed if Language Resource Switchboard accepts tools with their output format but requires to read data from URL in plain text, WebLicht accepts tools which read and write the TCF format. While OpeNer requires that the core (the command line) be wrapped into a REST shell, Web Services in PANACEA need REST APIs around a SOAP core. In the final paper, we will finalize the technical aspects and describe how the User Involvement group can play an important role in poking the sentiment/opinion community in CLARIN},
KEYWORDS = {Web Services, Clarin, Research Infrastructures},
URL = {https://office.clarin.eu/v/CE-2019-1512_CLARIN2019_ConferenceProceedings.pdf},
CONFERENCE_NAME = {Digital Infrastructures for Research 2017},
}
@MISC{DELGROSSO_2017_MISC_D_370140,
AUTHOR = {Del Grosso, A. M.},
TITLE = {Modelli Concettuali e Architetture orientate agli oggetti per la Progettazione e lo Sviluppo di una Digital Scholarly Platform},
YEAR = {2017},
ABSTRACT = {L'intervento affronta temi legati alla progettazione concettuale e alla definizione di architetture software object-oriented per lo sviluppo di una Digital Scholarly Platform},
KEYWORDS = {digital philology, computational philology, software engineering},
URL = {https://iris.cnr.it/handle/20.500.14243/370140},
}
@MISC{DELGROSSO_2017_MISC_D_370141,
AUTHOR = {Del Grosso, A. M.},
TITLE = {Tools for Digital Textual Scholarship},
YEAR = {2017},
ABSTRACT = {la presentazione illustra le architetture software per la realizzazione di biblioteche digitali e archivi digitali, con particolare riguardo agli aspetti di studio filologico del testo},
KEYWORDS = {computational philology, digital philology, digital humanities},
URL = {https://iris.cnr.it/handle/20.500.14243/370141},
}
@MISC{DELGROSSO_2017_MISC_D_348280,
AUTHOR = {Del Grosso, A. M.},
TITLE = {Digital Textual Scholarship Tools: From Digitizing Historical Archives To Digital Scholarly Editing Models},
YEAR = {2017},
ABSTRACT = {The contribution illustrates fundamental aspects concerning the digitization of a historical archive for scholarly studies. During the first part of the talk I briefly introduce the standard reference model for digital archives, thereafter, I will show some features and technologies about the production of digital facsimiles from original primary sources. Beside this topic the metadata issues will be pointed out. Afterwards, digital transcription tools and text recognition tasks will be highlighted. Highlights on digital textual scholarship will introduce the text encoding and the annotation topics. This talk ends with an overview of tools for visualizing, indexing and searching textual content},
KEYWORDS = {historical archive, digital textual scholarship, digital humanities, digital libraries, computational philology, software engineering},
URL = {https://iris.cnr.it/handle/20.500.14243/348280},
CONFERENCE_NAME = {International Workshop on Machine Learning and Natural Language Processing},
}
@MISC{DELGROSSO_2017_MISC_D_346827,
AUTHOR = {Del Grosso, A. M.},
TITLE = {Domain Driven Design and Domain Specific Modelling for Digital Textual Scholarship},
YEAR = {2017},
ABSTRACT = {Over the last years, the digital turn and the world wide web have led historical studies towards an automatic processing of their own data and consequently towards new forms of scholarly editing and publications. In this framework, scholars have adopted digital models, electronic elements and computational features in their work, but these new instruments are generally derived from other disciplines. For example, they exploit optical character recognition from image processing, corpora annotation and natural language processing from computational linguistics, text alignment from bioinformatics, text meaning from knowledge engineering, text presentation from data visualization. However, these latter research areas do not cover entirely the specificity of the fundamental requirements of the scholarly domain (for instance, treebank data models do not provide the adequate abstractions to manage multiple variant readings and multiple text interpretations). To exceed these issues, it is essential to adopt correct design approaches devoted to analyze the problem space of the historical source editing field. This rigorous and formal analysis will shape suitable architectures, design patterns, data abstractions and procedural abstractions for the constitutive features of the digital scholarly editions. Moreover, this modelling process will produce generic, flexible, maintainable and reusable digital models and modular textual scholarly environments. This contribution aims at discussing software engineering approaches, within an object-oriented paradigm, towards the definition of domain specific abstractions (DS-ADTs). In this way, it will be possible to accommodate domain needs by formally defining core "unities of concerns" which actually adhere to both the traditional and the digital editorial domain},
KEYWORDS = {Domain Driven Design, Digital Scholarly Editing, Computational Philology, Digital Philology},
URL = {http://atlasfontium.pl/edition2.0/Home-and-News.php},
CONFERENCE_NAME = {Historical Source Edition 2.0},
}
@MISC{DELGROSSO_2017_MISC_D_461377,
AUTHOR = {Del Grosso, A. M.},
TITLE = {Introduzione alle tecnologie digitali per la redazione e la pubblicazione di contenuti Web},
YEAR = {2017},
ABSTRACT = {Introduzione alle tecnologie digitali per la redazione e la pubblicazione di contenuti Web},
KEYWORDS = {tecnologie web, html, css},
URL = {https://iris.cnr.it/handle/20.500.14243/461377},
}
@MISC{DELGROSSO_2017_MISC_D_348343,
AUTHOR = {Del Grosso, A. M.},
TITLE = {Annotazioni collaborative di testi storici},
YEAR = {2017},
ABSTRACT = {Con l'avvento delle tecnologie e degli strumenti digitali, l'annotazione di testi (storici) è divenuta ancora più importante ed essenziale nel lavoro di strutturazione, di analisi e di comprensione dei fenomeni testuali. Inoltre, considerando gli aspetti più filologici, la realizzazione di una edizione digitale semanticamente connotata determina il bisogno di arricchire il testo con informazioni di varia granularità, di varia natura e di vario tipo. Questo intervento presenterà un approccio all'annotazione che tragga vantaggio dal Web semantico e dalle sue tecnologie. Le risorse testuali verranno caratterizzate da una forte interconnessione con risorse esterne favorendo di fatto la costruzione e l'interrogazione di un'unica banca dati globale, condivisa e formalmente descritta. In concreto, verrà presentato come scrivere annotazioni in RDF, utilizzando strumenti di annotazione disponibili sul web: a) il Text Encoder and Annotator (TEA); b) Annotarium. Il primo orientato alla trascrizione e all'annotazione delle risorse testuali, il secondo orientato alla gestione e alla interrogazione full-text e concettuale delle risorse annotate},
KEYWORDS = {Digital Humanities, tools, software engineering, semantic web, digital edition},
URL = {https://digitaltools.labcd.unipi.it/past-editions/resources2017/#DelGrosso},
}
@MISC{DELGROSSO_2017_MISC_D_370142,
AUTHOR = {Del Grosso, A. M.},
TITLE = {Strumenti software per lo studio e l'analisi di risorse testuali},
YEAR = {2017},
ABSTRACT = {Il contributo introduce i principali strumenti digitali per l'analisi dei testi letterari. Inoltre saranno illustrati gli strumenti sviluppati dal gruppo di Literary Computing dell'Istituto},
KEYWORDS = {digital humanities, digital philology, software, software engineering},
URL = {https://iris.cnr.it/handle/20.500.14243/370142},
}
@MISC{DELGROSSO_2017_MISC_DGM_340684,
AUTHOR = {Del Grosso, A. M. and Giovannetti, E. and Marchi, S.},
TITLE = {Thinking like the "Modern Operating Systems": The Omega architecture and the Clavius on the Web project},
YEAR = {2017},
ABSTRACT = {The current digital turn in studying and analyzing historical documents results in both having machine actionable cultural data and providing software able to process them. However, these data and services often lack in integration strategies among them in order to be reused in other contexts different from the original ones. As pointed out by Franz Fischer in a worthy of note article: "There is no out-of-the-box software available for creating truly critical and truly digital editions at the same time" [1]. Likewise, Monica Berti stated that is now important to "build a model for representing quotations and text reuses of lost works in a digital environment" [2]. In this vision Bridget Almas is in charge of developing an integrated platform for collaboratively transcribing, editing, and translating historical documents and texts. She claimed that through this platform, called Perseids, students and scholars are able to create open source digital scholarly editions [3]. A number of interesting projects are currently under development to realize general models, digital services, and online tools that can be adopted as part of a long-term infrastructure for managing digital editions. Among Perseids and others, we cite as reference systems (a) the Textual Community project led by P. Robinson and B. Bordalejo, (b) the AustESE project led by the Australian eResearch group, (c) the Tagore Online Variorum "Bichitra" project led by Sukanta Chaudhuri, (d) Homer Multitext led by Neel Smith and Christopher Blackwell, (e) Sharing Ancient Wisdoms founded by the HERA network},
KEYWORDS = {Omega, object-oriented design, digital scholarly editing, clavius on the web},
URL = {https://iris.cnr.it/handle/20.500.14243/340684},
CONFERENCE_NAME = {Global Philology Open Conference},
}
@MISC{DELGROSSO_2017_MISC_DM_348347,
AUTHOR = {Del Grosso, A. M. and Marchi, S.},
TITLE = {Clavius on The Web search framework},
YEAR = {2017},
ABSTRACT = {Search engine and restful API developed within the Clavius On the Web project},
KEYWORDS = {digital humanities, computational philology, software engineering, search engine},
URL = {https://github.com/literarycomputinglab/ClaviusSearch},
}
@MISC{DIDONATO_2017_MISC_D_408451,
AUTHOR = {Di Donato, F.},
TITLE = {How to deal with a DH project. Methodologies and workflows},
YEAR = {2017},
ABSTRACT = {Presentazione di alcune esperienze di progetti in Digital Humanities a Net7},
URL = {https://iris.cnr.it/handle/20.500.14243/408451},
}
@MISC{DIDONATO_2017_MISC_D_408448,
AUTHOR = {Di Donato, F.},
TITLE = {Pundit},
YEAR = {2017},
ABSTRACT = {presentation of pundit and the GO-FAIR initiative},
URL = {https://iris.cnr.it/handle/20.500.14243/408448},
}
@MISC{GIOVANNETTI_2017_MISC_GD_350043,
AUTHOR = {Giovannetti, E. and Del Grosso, A. M.},
TITLE = {LicoLab@LabexObvil},
YEAR = {2017},
ABSTRACT = {This talk illustrates some aspects of our research activities, specifically some outcomes carried out during designing and developing a digital environment for textual scholarship},
KEYWORDS = {digital humanities, computational philology, software engineering},
URL = {https://iris.cnr.it/handle/20.500.14243/350043},
}
@MISC{MARTONE_2017_MISC_MADFU_381984,
AUTHOR = {Martone, M. and Andreini, G. and Di Donato, F. and Fowler, P. and Udell, J.},
TITLE = {Annotating all Knowledge: Adventures in Interoperability},
YEAR = {2017},
ABSTRACT = {The Annotating All Knowledge Coalition was founded as a forum for accelerating the development of a pervasive interoperable annotation layer across all scholarly works. Figuring out what, exactly, an interoperable annotation layer means was one of the first goals of the coalition. We took the first steps towards defining what an interoperable layer looks like and how it should operate at our Face to Face meetings at FORCE2016 and I Annotate. So what are the next steps? Participants in both events felt strongly that the best way to move forward was to "Just do it", that is, identify a use case where you have a need to share annotations across: tools, content, platforms, workflows. Interoperability can be realized at many different levels, so the goal is to explore some of the practical issues that will have to be addressed by trying to implement even basic functionality. With these practical examples in hand, we can start to focus on critical aspects of interoperability in year 2. In that spirit, folks at Pundit and Hypothesis, two open web-based annotation tools, got together to conduct a little interoperability exploration using our respective tools},
URL = {https://iris.cnr.it/handle/20.500.14243/381984},
}
@MISC{MONACHINI_2017_MISC_M_341670,
AUTHOR = {Monachini, M.},
TITLE = {Discipline umanistiche: vantaggi, opportunità e benefici dell'Infrastruttura di Ricerca CLARIN e del nodo nazionale CLARIN-IT per la comunità italiana},
YEAR = {2017},
ABSTRACT = {L'interesse da parte delle scienze umane e sociali per le tecnologie del linguaggio non è mai stato così attuale come in questo momento storico. Le principali conferenze di Digital Humanities vedono sempre più la partecipazione di linguisti computazionali, mentre nelle conferenze di Trattamento Automatico del Linguaggio (TAL), l'applicazione di soluzioni TAL alle scienze umane e sociali costituisce una tematica che si affianca a quella delle ricadute industriali. Il bisogno di rispondere alle esigenze di una platea di utenti diversa apre nuove prospettive e offre una sfida rilevante per il settore delle tecnologie del linguaggio. I testi da trattare in ambito umanistico possono essere spesso eterogenei per genere, per periodo storico, per tipologia e nuovi tipi di analisi testuale acquistano particolare rilevanza. I software di analisi devono permettere una elaborazione automatica affidabile di tipologie di dati diversi da quelli che comunemente vengono usati nel TAL. La qualità delle risorse, in particolare la qualità dei vari livelli di annotazione acquista maggiore importanza quando queste devono essere usate per fare ricerca. Diventa cruciale sviluppare strumenti facilmente usabili e adattabili a diverse tipologie di contenuto e fornire soluzioni volte facilitare il reperimento e la condivisione di risorse e di tecnologie. E' proprio per rispondere a queste esigenze e per far incontrare chi produce e sviluppa risorse e tecnologie linguistiche con chi le usa, che è stata creata CLARIN (Common Language Resources Infrastructure for Social Sciences and Humanities), l'infrastruttura di ricerca europea per le risorse linguistiche al servizio delle scienze umane e sociali. CLARIN favorisce lo sviluppo di soluzioni tecnologiche volte a rendere le risorse e le tecnologie linguistiche visibili e disponibili per studiosi, ricercatori, studenti e cittadini, attraverso una modalità unificata e standardizzata di accesso. 
Tale innovazione consente di adottare nuovi e diversi approcci alla disciplina tradizionale determinando, in prospettiva, nuove consuetudini di studio che, sulla base delle buone pratiche lasciate in eredità dalla tradizione precedente, permettono lo sviluppo di una diversa e più attuale metodologia di ricerca e di prassi didattica},
KEYWORDS = {Digital Humanities, CLARIN-IT},
URL = {https://apps.unive.it/server/eventi/13818/master%202017-2018%2011-2017-1.pdf},
ISSN = {2011-2017},
CONFERENCE_NAME = {Università Ca' Foscari. Cerimonia conclusiva Master Digital Humanities},
}
@MISC{MONACHINI_2017_MISC_M_341683,
AUTHOR = {Monachini, M.},
TITLE = {Infrastrutture di Ricerca e Studi Classici. CLARIN-IT: opportunità e prospettive},
YEAR = {2017},
ABSTRACT = {L'interesse da parte delle scienze umane e sociali per le tecnologie del linguaggio non è mai stato così attuale come in questo momento storico. Le principali conferenze di Digital Humanities vedono sempre più la partecipazione di linguisti computazionali, mentre nelle conferenze di Trattamento Automatico del Linguaggio (TAL), l'applicazione di soluzioni TAL alle scienze umane e sociali costituisce una tematica che si affianca a quella delle ricadute industriali. Il bisogno di rispondere alle esigenze di una platea di utenti diversa apre nuove prospettive e offre una sfida rilevante per il settore delle tecnologie del linguaggio. I testi da trattare in ambito umanistico possono essere spesso eterogenei per genere, per periodo storico, per tipologia e nuovi tipi di analisi testuale acquistano particolare rilevanza. I software di analisi devono permettere una elaborazione automatica affidabile di tipologie di dati diversi da quelli che comunemente vengono usati nel TAL. La qualità delle risorse, in particolare la qualità dei vari livelli di annotazione acquista maggiore importanza quando queste devono essere usate per fare ricerca. Diventa cruciale sviluppare strumenti facilmente usabili e adattabili a diverse tipologie di contenuto e fornire soluzioni volte facilitare il reperimento e la condivisione di risorse e di tecnologie. E' proprio per rispondere a queste esigenze e per far incontrare chi produce e sviluppa risorse e tecnologie linguistiche con chi le usa, che è stata creata CLARIN (Common Language Resources Infrastructure for Social Sciences and Humanities), l'infrastruttura di ricerca europea per le risorse linguistiche al servizio delle scienze umane e sociali. CLARIN favorisce lo sviluppo di soluzioni tecnologiche volte a rendere le risorse e le tecnologie linguistiche visibili e disponibili per studiosi, ricercatori, studenti e cittadini, attraverso una modalità unificata e standardizzata di accesso. 
Tale innovazione consente di adottare nuovi e diversi approcci alla disciplina tradizionale determinando, in prospettiva, nuove consuetudini di studio che, sulla base delle buone pratiche lasciate in eredità dalla tradizione precedente, permettono lo sviluppo di una diversa e più attuale metodologia di ricerca e di prassi didattica},
KEYWORDS = {Digital Humanities, CLARIN-IT},
URL = {http://www.clarin-it.it/sites/default/files/documents/UniParma_Workshop_2017_Locandina.pdf},
CONFERENCE_NAME = {DIGITAL HUMANITIES E FILOLOGIA GRECA: risorse e infrastrutture di ricerca applicate allo studio del greco antico},
}
@MISC{MONACHINI_2017_MISC_M_341686,
AUTHOR = {Monachini, M.},
TITLE = {Nuove tecnologie e nuovi sviluppi di indagine: CLARIN-IT e alcuni esempi di applicazione allo studio del greco antico},
YEAR = {2017},
ABSTRACT = {Il lavoro tradizionale del filologo necessita oggi di una disponibilità sempre più ampia di dati e di testi (letteratura secondaria, bibliografia specifica, fonti primarie), il lavoro del singolo studioso sembra oramai accompagnarsi alla necessità di un team di ricerca che collabori su progetti di ampia scala, quali le edizioni dei testi. Molte delle informazioni indispensabili per il filologo sono oggi (o potrebbero essere) disponibili e maggiormente accessibili grazie all'utilizzo di strumenti informatici, ma spesso si tratta di materiali dispersi e poco connessi tra loro; talora la loro esistenza è persino ignota agli studiosi tradizionali. Il trend dei dati che si registra nella disciplina, grazie alla diffusione del web, con la circolazione di risorse utili per l'analisi e la ricostruzione del testo, fa ripensare al rapporto tra filologia-in ogni suo aspetto-e nuove tecnologie e lascia ampio spazio alle riflessioni metodologiche sui procedimenti d'indagine. Si tratta di far dialogare questi dati e implementarli. Il primo passo riguarda l'individuazione delle opportunità offerte dal settore delle DH in relazione a ogni singola disciplina nella sua specificità e, d'altro lato definire quali siano le esigenze di ciascun singolo settore. Nel fare questo è necessario mantenere alto lo standard sia dello strumento sia del tipo di dati inseriti. Come tratta il testo lo studioso affiancato dall'ausilio delle nuove tecnologie? Cosa trova online? Che bisogni emergono nelle pratiche di uso odierne? Si tenterà di dare una risposta a queste domande con esempi pratici di metodo applicato allo studio-ad esempio-di un autore specifico. Nel contesto verranno inoltre presentate le attività sino ad ora svolte dal gruppo di ricerca. 1) Tramite Survey si sono identificati la pratica d'uso oggi, e i punti di forza e mancanze degli strumenti esistenti. 2) Si sono così definite le esigenze di una comunità specifica e le relative richieste e aspettative. 
3) Si è definito un prototipo di strumento che risponda alle esigenze individuate, ora in fase di valutazione. 4) realizzazione, in prospettiva, di uno strumento che possa offrire una piattaforma collaborativa che metta a disposizione i dati (testo, apparato, commento, analisi a diversi livelli, etc.), variamente fruibili, assieme alla possibilità di accedere facilmente a tutti i dati relativi disponibili in rete},
KEYWORDS = {Digital Humanities, Computational Philology},
URL = {http://www.clarin-it.it/sites/default/files/documents/UniParma_Workshop_2017_Locandina.pdf},
CONFERENCE_NAME = {2° Workshop di Studio Insegnamenti di Storia della Lingua Greca (LT) e Filologia Greca (LM)},
}
@MISC{MONACHINI_2017_MISC_M_405401,
AUTHOR = {Monachini, M.},
TITLE = {Digital Humanities and Research Infrastructures: CLARIN and CLARIN-IT},
YEAR = {2017},
ABSTRACT = {La lezione al Corso "Digital Humanities: Web Resources, Tools and Infrastructures" Venice International University (a. a. 2017-2018) ha lo scopo di dimostrare i vantaggi, i benefici e le opportunità offerte da una infrastruttura di ricerca come CLARIN-ERIC per rispondere ai quesiti di ricerca e le sfide nel settore delle Digital Humanities},
KEYWORDS = {digital humanities, research infrastructures, data deluge},
URL = {https://iris.cnr.it/handle/20.500.14243/405401},
CONFERENCE_NAME = {Course "Digital Humanities: Web Resources, Tools and Infrastructures" Venice International University},
}
@MISC{PECCHIOLI_2017_MISC_PABMG_340687,
AUTHOR = {Pecchioli, A. and Albanesi, D. and Bellandi, A. and Marchi, S. and Giovannetti, E.},
TITLE = {Elaborazione del linguaggio naturale (NLP) in Ebraico: il caso dell'analisi linguistica automatica applicata all'ebraico mishnaico del Talmud},
YEAR = {2017},
ABSTRACT = {The paper briefly introduces the field of Digital Humanities (i. e. the intersection of digital technologies and disciplines of humanities) and provides some examples of digital applications in the area of jewish studies. The Progetto Traduzione Talmud Babilonese (PTTB) project, aimed at producing the first complete Italian translation of the Babylonian Talmud, then will be presented. The translation is being carried out with the help of "Traduco", an innovative, collaborative, computer-assisted translation (CAT) tool developed at the Istituto di Linguistica Computazionale of Consiglio Nazionale delle Ricerche (ILC-CNR) in Pisa. In particular, the paper will focus on what is automatic linguistic analysis, why it's being integrated in one of the components of "Traduco" and its application to the mishnaic language. Even if we are at the very beginning of the construction of the tool, this research activity have exposed all the peculiarities of the mishnaic language and the problems arising from the lacking of resources and tools for the processing of this language. Finally, we will show the two main use cases leveraging on the obtained analysis, namely the improvement of the automatic suggestions component and the linguistic based querying of the annotated talmudic corpus},
KEYWORDS = {traduco, nlp, Mishnaic Hebrew, talmud},
URL = {http://aisg.cise.unipi.it/Materia-giudaica-2018/018-Pecchioli%20pp%20281-292B.pdf},
CONFERENCE_NAME = {Nuovi studi sull'Ebraismo-XXXI Convegno AISG 2017},
}
@MISC{PICCINI_2017_MISC_P_401699,
AUTHOR = {Piccini, S.},
TITLE = {Il mappamondo di Ricci e la traduzione di Pasquale d'Elia a confronto: un viaggio semantico attraverso la geografia e la cosmografia dalla Cina del XVI secolo all'Italia del XIX secolo},
YEAR = {2017},
ABSTRACT = {Il contributo è volto a presentare la risorsa termino-ontologica bilingue italiano-cinese, dedicata alla terminologia astronomica e geografica del Mappamondo di Ricci (坤輿萬國全圖 Kunyu Wanguo Quantu, 1602) e della sua traduzione in italiano ad opera di Pasquale d'Elia. Il livello lessicale è stato strutturato secondo il modello Ontolex-lemon, opportunamente esteso per rappresentare le caratteristiche specifiche della lingua cinese. La parte concettuale ha ricevuto una formalizzazione in OWL-DL},
URL = {https://iris.cnr.it/handle/20.500.14243/401699},
}
@MISC{PICCINI_2017_MISC_PMG_330935,
AUTHOR = {Piccini, S. and Marchi, S. and Giovannetti, E.},
TITLE = {Étudier le structuralisme par le structuralisme: expériences de sémantique distributionnelle dans la construction d'un lexique électronique de la terminologie saussurienne},
YEAR = {2017},
ABSTRACT = {En 2010-2011, le premier lexique électronique dédié à la terminologie linguistique saussurienne a été créé [1] dans le cadre d'un projet de recherche intitulé « Pour une édition numérique des manuscrits de Ferdinand de Saussure », projet coordonné par le Professeur Gambarara. La première étape de construction de la ressource lexicale a consisté en l'identification manuelle dans les textes des termes clés du vocabulaire saussurien et de leurs propriétés sémantiques. L'informatique n'est intervenue que dans la phase de formalisation des données extraites. C'est pourquoi nous nous proposons d'illustrer ici la possibilité de recourir à des techniques automatiques et, en particulier, à des algorithmes de sémantique distributionnelle [2] pour identifier les relations que les termes entretiennent entre eux dans le texte. La méthodologie sous-jacente est basée sur l'hypothèse distributionnelle selon laquelle plus deux mots sont sémantiquement proches, plus ils ont tendance à se produire dans des contextes similaires. Le lexique d'un texte est considéré comme un espace métrique où chaque mot peut être représenté comme un vecteur à n dimensions, chacune d'elles enregistrant le nombre de fois que ce mot apparaît dans un contexte donné. La proximité spatiale entre deux vecteurs indique la similarité sémantique entre deux mots. Elle est calculée par le cosinus de l'angle compris entre les deux vecteurs: plus la valeur du cosinus est grande, plus les termes sont, en principe, sémantiquement similaires. Les techniques computationnelles ont été appliquées aux mêmes textes à partir desquels le lexique électronique a été construit: le Cours de linguistique générale [3], les Écrits de linguistique générale [4] et le Recueil des publications scientifiques [5]. Bien qu'au stade préliminaire, l'expérience a permis d'obtenir des résultats intéressants. 
À titre d'exemple, nous présentons ci-dessous (Tableau) les valeurs de similitude obtenues par l'algorithme entre le terme signe et d'autres mots dans les textes. Si l'on compare les résultats avec l'entrée du lexique signe, on peut remarquer que l'algorithme est en mesure de détecter un grand nombre de liens explicités dans la ressource et de suggérer, en outre, des relations possibles avec d'autres termes comme valeur, rapport, idée. L'application de ces techniques computationnelles au corpus saussurien peut donc constituer une aide précieuse non seulement pour les lexicographes mais également pour les experts du domaine en faisant émerger des connections qui n'apparaissent pas immédiatement de manière explicite et en suggérant ainsi des parcours alternatifs d'analyse de la pensée de l'auteur},
KEYWORDS = {structuralisme, sémantique distributionnelle, terminologie saussurienne, lexique électronique},
URL = {https://iris.cnr.it/handle/20.500.14243/330935},
CONFERENCE_NAME = {Atelier "Les manuscrits de Saussure, parmi d'autres. Problèmes, stratégies et solutions d'édition pour les archives numériques"},
}
@MISC{SORIA_2017_MISC_S_337263,
AUTHOR = {Soria, C.},
TITLE = {Inquiring current digital use and usability of regional and minority languages: the DLDP survey},
YEAR = {2017},
ABSTRACT = {The Digital Language Diversity Project is a three-year project funded under the Erasmus programme that addresses the problem of low digital representation and use of EU regional and minority languages, a cause for their endangerment according to some scholars. One of the first actions of the project is to assess the current use and usability of four EU regional/minority languages, representing very different degrees of digital language representation and use: these languages are Sardinian, Karelian, Basque and Breton. From June to September 2016, the DLDP project has been spreading a survey, that was localized and translated into these languages. The survey is developed on the basis of previous work carried out in the area of ethnolinguistic vitality, such as the ELDIA Barometer, and other inquiries addressing specifically digital use of languages and availability and usability of digital resources and media. The DLDP survey consists of a general part collecting basic information on the informant (age, sex, proficiency level in the language, frequency of use, etc.). The second part is focused on gathering information about his/her personal digital use of the language and about any known digital resource and services that make use of the language. The survey is the first ever study of the digital needs of minority language speakers. It will give stakeholders and academia a detailed view into what actual language speakers are thinking about in terms of how they want to develop provision for their languages in the digital sphere. Therefore, we strongly encourage wide adoption and dissemination of the survey to regional and minority languages beyond the four investigated. The workshop intends to illustrate and discuss the model survey, to share it with researchers interested in adopting it for other languages, and to discuss collaboration paths},
KEYWORDS = {digital language use, regional languages, minority languages, digital language vitality},
PAGES = {44-44},
URL = {https://icriml.indiana.edu/conference-program/Abstractbook.pdf},
CONFERENCE_NAME = {First International Conference on Revitalization of Indigenous and Minoritized Languages},
}
@MISC{SORIA_2017_MISC_S_337266,
AUTHOR = {Soria, C.},
TITLE = {Alliances for digital linguistic diversity},
YEAR = {2017},
ABSTRACT = {Linguapax proposes a complementary pair of Roundtable discussions in the Conference's thematic line 1: The value of linguistic diversity, from an operational perspective. This "diptych" will present different types of alliances that create contexts for the preservation and continuation of linguistic diversity (RT 1), and will show how a plural perspective on linguistic diversity can emerge, drawing on Linguapax's experience as an international network (RT 2). In the first Roundtable discussion we will tackle the generation of different contexts of interaction (networks and alliances) to enhance the presence and vitality of linguistic diversity-those contexts emerging from linguistic, cultural and digital networks (although should be-in theory-mostly overlapping, an overview of their specific potentialities is useful and needed): 1. "Linguistic cooperation": International networks of projects/exchange of experiences in language revitalisation. Andoni Barreña (Garabide Elkartea, Basque Country); 2. Alliances for digital linguistic diversity. Claudia Soria. Consiglio Nazionale delle Ricerche. Pisa. 3. International cultural cooperation. Although "cultural cooperation" should be the common umbrella, it is usually driven by a specific logic in which linguistic diversity rarely comes consistently into play. On this occasion for dialogue, the Round Table will expose linguists/activists to a potentially useful vocabulary and world of networks and platforms. Jordi Pascual, expert on international cultural relations. This Roundtable aims to harness the relational potential of the Conference: On one hand, putting into dialogue two contributions already planning individual participation (1, 2), and on the other, inviting an external perspective to crossfertilise the debate and increase the scope for networking. 
Given the operational approach of this Roundtable, active interaction with the audience will be a key element for achieving the desired multiplier effect. Moderator: Alícia Fuentes-Calle. Linguapax (Barcelona). Departament de Lingüística. Universitat de Barcelona},
KEYWORDS = {linguistic diversity, digital language diversity},
URL = {https://iris.cnr.it/handle/20.500.14243/337266},
CONFERENCE_NAME = {ROUNDTABLE DISCUSSION-Linguapax-I. Generating contexts for linguistic diversity to thrive: networks of linguistic, cultural and digital cooperation. First International Conference on Revitalization of Indigenous and Minoritized Languages},
}
@MISC{SORIA_2017_MISC_S_337255,
AUTHOR = {Soria, C.},
TITLE = {The digital language vitality scale: a model for assessing digital vitality of languages},
YEAR = {2017},
ABSTRACT = {In this paper, we present the Digital Language Vitality Scale, a tool for measuring the degree of digital vitality of languages. Digital vitality can be defined as the extent to which a language is present, used and usable over the Internet through digital devices. The scale is inspired by ethnolinguistic vitality assessment (such as GIDS, Fishman 2001), updated by (Lewis and Simons 2010) as EGIDS, and the UNESCO "nine factors" (UNESCO 2003), and is based on previous work in this area such as (Kornai 2013) and (Gibson 2015). Seven levels of digital vitality are identified, from "pre-digital" to "digitally thriving", and a set of associated indicators. The indicators associated with the scale are proxies representing both digital representation (presence) of a language and digital use. They are clustered into three groups: a first group of indicators refers to digital usability of a language, for instance, the existence of Internet connection or the availability of standardised fonts for writing the language. A second group of indicators is related to the quality and amount of digital use of a language: if and how much a language is used for texting and emailing, on websites, blogs, if there are e-books, Wikipedias, if the language is used on social media. The last group of indicators correlates with the digital prestige of a language; they are a sign of a language that not only is used on digital media and devices, but it is so in a full-fledged way, enjoying the widest possible ranges of uses and applications (e. g. localised digital services, machine translation, edu-tainment products and services). The scale is currently being used in the context of the DLDP project (http://www.dldp.eu) as an assessing instrument for digital language planning, with particular reference to regional and minority languages},
KEYWORDS = {digital vitality, language vitality, digital language diversity},
URL = {https://iris.cnr.it/handle/20.500.14243/337255},
CONFERENCE_NAME = {First International Conference on Revitalization of Indigenous and Minoritized Languages},
}
@MISC{SORIA_2017_MISC_S_337261,
AUTHOR = {Soria, C.},
TITLE = {Language policies and speakers' attitudes: evaluating the impact of official recognition on some of Italy's regional languages},
YEAR = {2017},
ABSTRACT = {The panel focuses on the minority (some of them highly endangered) languages of Italy, with a special attention to those which are not recognized (nor supported) by the Italian Government. Key points will be a. the official language policy of Italy, b. language discrimination, c. language ideology and d. the ambiguous role of academic institutions vis-à-vis languages and dialects, e. the effects (and results) of official support for recognized minority languages, as well as f. grassroots approaches to the standardization and development of unrecognized languages and new developments on the net},
KEYWORDS = {minority languages, multilingualism, language policy},
PAGES = {42-42},
URL = {https://icriml.indiana.edu/conference-program/Abstractbook.pdf},
CONFERENCE_NAME = {First International Conference on Revitalization of Indigenous and Minoritized Languages},
}
@MISC{SORIA_2017_MISC_SRQ_334735,
AUTHOR = {Soria, C. and Russo, I. and Quochi, V.},
TITLE = {Reports on Digital Language Diversity in Europe},
YEAR = {2017},
ABSTRACT = {In these reports we present the results of the first survey about the actual needs of European minority languages speakers in terms of digital opportunities},
KEYWORDS = {regional languages, minority languages, digital vitality, digital use},
URL = {http://www.dldp.eu/content/reports-digital-language-diversity-europe},
}
@MISC{STAINES_2017_MISC_SDLM_408450,
AUTHOR = {Staines, H. and Di Donato, F. and Lin, J. and Martone, M.},
TITLE = {(GO)FAIR-Annotations as Research Objects: Ensuring Findable, Indexable, Accessible and Reusable},
YEAR = {2017},
ABSTRACT = {Presentation of the Go FAIR initiative},
URL = {https://iris.cnr.it/handle/20.500.14243/408450},
}
@MISC{WEINGART_2017_MISC_WBG_340685,
AUTHOR = {Weingart, A. and Bellandi, A. and Giovannetti, E.},
TITLE = {Representing Multilingualism and Multiwords in a Lemon Old Occitan Medico-Botanical Lexicon},
YEAR = {2017},
ABSTRACT = {This article illustrates the progresses made in representing a multilingual and multi-alphabetical Old Occitan medico-botanical lexicon in the context of project DiTMAO. The chosen lexical model of reference is lemon, that has been extended accordingly to some specific linguistic and lexical features of the lexicon. In particular, issues and solutions about the modelling of multilingual and multiword phenomena are discussed, as the way they will be managed through LexO, a web editor developed in the context of the project},
KEYWORDS = {lemon model, RDF, multilingualism, multiwords, multialphabet, historical lexicon, medico-botanical terminology, Old Occitan, Hebrew, Arabic, LexO Web editor},
URL = {https://iris.cnr.it/handle/20.500.14243/340685},
CONFERENCE_NAME = {Third International Workshop on Semantic Web for Scientific Heritage (SW4SH 2017)},
}
@MISC{WEINGART_2017_MISC_WG_338563,
AUTHOR = {Weingart, A. and Giovannetti, E.},
TITLE = {From canabo to Cannabis sativa L.: Modelling Diachronic Termino-ontological Resources in the Context of DiTMAO},
YEAR = {2017},
ABSTRACT = {The paper aims at contributing to the understanding of the Medieval Brain from a knowledge engineering perspective. As the brain is conceived as locus of cognition and knowledge in medieval medicine, we want to focus on the representation of medieval medico-botanical knowledge by means of a three-level text-termino-ontological resource. The resource is based on lemon (a model for the representation of lexica as RDF) and a set of ontologies represented in OWL and consists of (i) a medieval termino-ontological resource, (ii) a modern termino-ontological resource and (iii) a documentation corpus. It is developed and implemented within the DFG-funded project "Dictionnaire de Termes Médico-botaniques de l'Ancien Occitan" (DiTMAO). In an introductory part we will briefly introduce the aims of the project and the particularities of the corpus. The corpus consists of medical monographs in Latin script but also of so-called synonym lists in Hebrew script. These lists can be described as ancient multilingual dictionaries, in our case of Old Occitan, (Judaeo-)Arabic, Hebrew, Latin or other Romance languages and sometimes Greek and Aramaic, and they are of particular importance because the equivalent terms in other ancient languages help to determine the meaning of otherwise opaque Old Occitan terms. After introducing the three components of the resource, given some examples from our corpus, we elaborate, in the main part of paper, a solution to the problem of representing the relation between medieval medical terms or concepts and their ancient and modern correspondences. The problem concerns in particular the process of determining the terms´ meaning through the documentation of each term in corpus-external dictionaries and editions, and how this process can be represented in a comprehensive and transparent way. We propose to relate the terms of the medieval termino-ontological resource at a lexical level using relations such as synonymy or sublemma. 
The connections between modern and medieval terms, like a translation into modern English, will be mediated by the documentation corpus. As for modern scientific terms, we opt for an ontological connection. These types of connections will be exemplified with (mainly) plant names from our corpus. For example, a medieval term has a referent in the medieval ontology, structuring the botanic world as conceived by a "medieval brain" by giving the medieval classifications e. g. the primary qualities. This ontological entity is related to a referent of a modern scientific name, given that the documentation of the medieval term provides such information. We will argue that a clear separation of datasets (medieval and modern) allows for the diachronic study of the evolution of terminology and, more importantly for this context, paves the way for the analysis of the changes in the cognitive representation of what those terms actually refer to},
KEYWORDS = {lexica, multi-language lexica, termino-ontological resource, ancient occitan},
URL = {https://themedievalbrain.wordpress.com/},
CONFERENCE_NAME = {The Medieval Brain Conference},
}
@MISC{ZAMORANI_2017_MISC_Z_373615,
AUTHOR = {Zamorani, N.},
TITLE = {Featured Linguist: Nicoletta Calzolari},
YEAR = {2017},
ABSTRACT = {The LINGUIST List Official LINGUIST List Blog: Featured Linguist: Nicoletta Calzolari Posted on April 7, 2017 by Clare Harshey We are proud to share with our readers the next featured linguist of our 2017 Fund Drive: Nicoletta Calzolari. We hope that you enjoy reading Dr. Calzolari's thoughts on her long and varied career as a computational linguist},
KEYWORDS = {Computational Linguistics, Nicoletta Calzolari},
PAGES = {11},
URL = {https://blog.linguistlist.org/fund-drive/featured-linguist-nicoletta-calzolari/},
}
@ARTICLE{APREDA_2016_ARTICLE_ABDF_392597,
AUTHOR = {Apreda, R. and Bonaccorsi, A. and Dell'Orletta, F. and Fantoni, G.},
TITLE = {Functional technology foresight. A novel methodology to identify emerging technologies},
YEAR = {2016},
ABSTRACT = {The speed and complexity of the technology evolution faced by modern societies need new approaches to the analysis and understanding of the world. Indeed, an exclusive focus on technological goals can miss to recognize all the stakeholders of a technology and address real user needs; moreover, on the one hand low signals are becoming more and more important in fast evolving markets, on the other hand the excess of hype, fashions, or vested interests sometimes deeply alter indicators. However, the so called Big Data promise to be a huge low cost set of valuable information, available and affordable to all (SMEs included). But, analyzing them is not trivial especially if we deal with academic papers and patents. To tackle these issues, the present paper proposes to apply a powerful methodological tool called Functional Analysis to the Technology Foresight process. Actually the rigorous study of the functions, that an artefact should perform to satisfy the user needs, provides a universal and thus unifying point of view, which is able to correlate the user perspective on the product with its technical features. Functional reasoning has been applied to (i) detect possible patterns of development, spotting missing elements and highlighting strengths as well as potential sources of failure; (ii) to enhance traditional bibliometric tools such as the analysis of S-curves and (iii), integrated with a natural language processing analysis toolchain, tailored for patent documents, to identify emerging technologies. The paper describes the functional approach to technology foresight activity, presents how to integrate it with text mining algorithms and experts' domain knowledge, and finally discusses its benefits in the context of Technology Foresight also from an economic point of view, showing that foresight is affordable also for Small and Medium Enterprises},
URL = {https://iris.cnr.it/handle/20.500.14243/392597},
DOI = {10.1007/s40309-016-0093-1},
ISSN = {2195-2248},
JOURNAL = {EUROPEAN JOURNAL OF FUTURES RESEARCH},
}
@ARTICLE{BELLANDI_2016_ARTICLE_BABG_354700,
AUTHOR = {Bellandi, A. and Albanesi, D. and Benotto, G. and Giovannetti, E.},
TITLE = {Il Sistema Traduco nel Progetto Traduzione del Talmud Babilonese},
YEAR = {2016},
ABSTRACT = {Nell'ambito del Progetto Traduzione del Talmud Babilonese, l'Istituto di Linguistica Computazionale del CNR ha sviluppato Traduco, uno strumento web collaborativo con alcune caratteristiche che lo rendono particolarmente adatto alla traduzione di testi che pongono problemi interpretativi. Ad oggi, gli strumenti per la traduzione assistita (in inglese, Computer-Assisted Translation, o CAT) sono utilizzati tipicamente per la traduzione di manuali tecnici, testi legislativi o siti Web e hanno principalmente lo scopo di accelerare il processo di traduzione. Traduco riprende la maggior parte dei componenti standard di uno strumento di traduzione assistita tradizionale, ma li estende con caratteristiche specifiche necessarie per supportare l'interpretazione e la traduzione di testi complessi che pongono particolari problemi di comprensione. In questo articolo presenteremo un caso di studio specifico, relativo a un testo con queste caratteristiche: il Talmud Babilonese. Traduco include funzionalità per l'aggiunta di note, riferimenti bibliografici, annotazioni semantiche e creazione di glossari. Traduttori, revisori, redattori, supervisori e utenti finali che accedono al Sistema sono supportati nell'intero processo di traduzione, che va dall'interpretazione del testo originario alla fase editoriale per la stampa delle traduzioni, attraverso l'uso di tecnologie di traduzione assistita, l'annotazione semantica del testo, l'arricchimento delle traduzioni con informazioni esplicative, l'esportazione delle traduzioni in XML e in TEI e l'integrazione di tecniche per il trattamento automatico della lingua. La progettazione e lo sviluppo di Traduco ha richiesto l'adozione di un approccio multidisciplinare che combina aspetti di ingegneria del software, linguistica computazionale, ingegneria della conoscenza ed editoria digitale},
KEYWORDS = {traduco, traduzione-assistita, talmud},
PAGES = {109-126},
URL = {https://journals.openedition.org/ijcol/404},
VOLUME = {2 (2)},
ISSN = {2499-4553},
JOURNAL = {IJCOL},
}
@ARTICLE{BOSCHETTI_2016_ARTICLE_BB_336804,
AUTHOR = {Boschetti, F. and Buzzoni, M.},
TITLE = {Cronache-Edizioni digitali: Rappresentazione, Interoperabilità, Analisi del testo e Infrastrutture (Venezia, 7-9 settembre 2016)},
YEAR = {2016},
ABSTRACT = {Cronaca del quinto convegno annuale dell'Associazione di Informatica Umanistica e Cultura Digitale (AIUCD), che si è svolto dal 7 al 9 settembre 2016 presso l'Aula Magna di Ca' Dolfin dell'Università Ca' Foscari di Venezia e ha avuto per tema: "Edizioni digitali: rappresentazione, interoperabilità, analisi del testo e infrastrutture"},
KEYWORDS = {convegno AIUCD},
PAGES = {269-274},
URL = {http://bit.ly/2CW0BOV},
VOLUME = {13},
ISSN = {1825-5361},
JOURNAL = {ECDOTICA},
}
@ARTICLE{BRUNATO_2016_ARTICLE_BD_325818,
AUTHOR = {Brunato, D. and Dell'Orletta, F.},
TITLE = {ISACCO: a corpus for investigating spoken and written language development in Italian school-age children},
YEAR = {2016},
ABSTRACT = {In this paper we present ISACCO (Italian School-Age Children COrpus), a corpus of oral and written retellings of Italian-speaking children attending primary school. All texts were digitalized and automatically enriched with multi-level linguistic annotation. Preliminary explorations of both the form and the content of children's productions were carried out based on a set of features automatically extracted by NLP tools. Written retellings were manually annotated with a typology of errors belonging to three different linguistic levels. The resource, which has been made publicly available, is conceived to support research and computational modeling of "later language acquisition", with an emphasis on comparative assessment of the evolution of oral and written language competencies in early school grades},
KEYWORDS = {Child language acquisition, Oral and Written language, multi-level linguistic analysis},
PAGES = {63-76},
URL = {http://www.italianlp.it/wp-content/uploads/2016/09/04_brunato_dell-orletta.pdf},
VOLUME = {2 (1)},
ISSN = {2499-4553},
JOURNAL = {IJCOL},
}
@ARTICLE{BRUNATO_2016_ARTICLE_BDMV_372675,
AUTHOR = {Brunato, D. and Dell'Orletta, F. and Montemagni, S. and Venturi, G.},
TITLE = {Monitoraggio linguistico di Scritture Brevi: aspetti metodologici e primi risultati},
YEAR = {2016},
ABSTRACT = {Se da un lato le tecnologie del linguaggio svolgono un ruolo ormai indiscusso per l'accesso al contenuto testuale, ciò non appare scontato quando si va a considerare il loro ruolo nella valutazione delle strutture linguistiche sottostanti al testo. Questo contributo si focalizza sulla definizione di una metodologia innovativa di monitoraggio linguistico della lingua italiana che a partire dall'output di strumenti di annotazione linguistica automatica permette di ricostruire un profilo linguistico di una collezione di testi rappresentativa di una specifica varietà d'uso della lingua. Tale metodologia è stata applicata a un corpus di tweet allo scopo di far luce su interrogativi aperti quali la possibilità di rintracciare tendenze lessicali, morfo-sintattiche e sintattiche peculiari all'interno di questa tipologia testuale; di studiare come queste tendenze si rapportino ai tratti caratterizzanti della lingua scritta e parlata; di individuare possibili differenze nella forma linguistica in cui si twittano contenuti di natura diversa},
KEYWORDS = {Trattamento Automatico del Linguaggio, Monitoraggio Linguistico, Varietà d'Uso della Lingua, Lingua del Web},
PAGES = {149-176},
URL = {https://iris.cnr.it/handle/20.500.14243/372675},
VOLUME = {N. S. 5},
ISSN = {1825-2796},
JOURNAL = {QUADERNI DI AIŌN},
}
@ARTICLE{BURGASSI_2016_ARTICLE_B_357035,
AUTHOR = {Burgassi, C.},
TITLE = {«CHIEDERE A LINGUA»: BOCCACCIO E DINTORNI},
YEAR = {2016},
ABSTRACT = {L'analisi prende le mosse dalla descrizione di Guido Cavalcanti nel Decameron di Giovanni Boccaccio: «oltre a quello che egli fu un de' migliori loici che avesse il mondo e ottimo filosofo naturale [...], sì fu egli leggiadrissimo e parlante uom molto [...] e con questo era ricchissimo, e a chiedere a lingua sapeva onorare cui nell'animo gli capeva che il valesse» (VI 9, 8). Sulla scorta di questo celebre passo, la locuzione chiedere a lingua gode di una certa fortuna nella letteratura del Rinascimento maturo, in autori che riflettono l'espressività della tradizione linguistica fiorentina più schietta: Antonfrancesco Grazzini, Benedetto Varchi, Benvenuto Cellini, Annibal Caro, Bernardo Davanzati. Il contributo ripercorre la storia di questo modulo fraseologico, indagandone i contesti di ricorrenza e precisandone, di volta in volta, il significato nel quadro sintattico, alla luce in particolare delle traduzioni dei testi classici. Per la fase antica lo studio tiene conto dei numerosi commenti al Decamerone e offre nuovo materiale documentario, soprattutto con riferimento al volgarizzamento della Terza Decade di Tito Livio, rilevante per la comprensione della formula in esame},
KEYWORDS = {Boccaccio, lessico},
PAGES = {5-20},
URL = {https://iris.cnr.it/handle/20.500.14243/357035},
VOLUME = {33},
ISSN = {0392-5218},
JOURNAL = {STUDI DI LESSICOGRAFIA ITALIANA},
}
@ARTICLE{BURGASSI_2016_ARTICLE_B_357037,
AUTHOR = {Burgassi, C.},
TITLE = {«PROVENTI A LA LOR NATURA». UN'IPOTESI PER BONAGIUNTA},
YEAR = {2016},
ABSTRACT = {This paper examines the meaning of the expression «proventi a la lor natura» in the poem Fermamente intensa, vv. 30-31, allegedly attributable to Bonagiunta Orbicciani da Lucca. In the stanza involving «proventi a la lor natura» the poet makes a comparison between the behaviour of snakes and that of the noble and honourable men who rule the society. The interpretation of the stanza therefore entails the correct understanding of why noble men and snakes are connected. The analysis takes also into account linguistic features that may contribute to underpin the alleged authorship of Bonagiunta for the poem},
KEYWORDS = {Bonagiunta Orbicciani, lessico},
PAGES = {81-93},
URL = {https://iris.cnr.it/handle/20.500.14243/357037},
VOLUME = {62},
ISSN = {0585-4962},
JOURNAL = {STUDI MEDIOLATINI E VOLGARI},
}
@ARTICLE{CHRISTOFF_2016_ARTICLE_CHP_405492,
AUTHOR = {Christoff, Z. and Hansen, J. U. and Proietti, C.},
TITLE = {Reflecting on Social Influence in Networks},
YEAR = {2016},
ABSTRACT = {In many social contexts, social influence seems to be inescapable: the behavior of others influences us to modify ours, and vice-versa. However, social psychology is full of examples of phenomena where individuals experience a discrepancy between their public behavior and their private opinion. This raises two central questions. First, how does an individual reason about the behavior of others and their private opinions in situations of social influence? And second, what are the laws of the resulting information dynamics? In this paper, we address these questions by introducing a formal framework for representing reasoning about an individual's private opinions and public behavior under the dynamics of social influence in social networks. Moreover, we dig deeper into the involved information dynamics by modeling how individuals can learn about each other based on this reasoning. This compels us to introduce a new formal notion of reflective social influence. Finally, we initialize the work on proof theory and automated reasoning for our framework by introducing a sound and complete tableaux system for a fragment of our logic. Furthermore, this constitutes the first tableau system for the "Facebook logic" of J. Seligman, F. Liu, and P. Girard},
KEYWORDS = {Social networks, Modal logic, Hybrid logic, Opinion dynamics, Social influence, Tableau systems},
PAGES = {299-333},
URL = {https://iris.cnr.it/handle/20.500.14243/405492},
VOLUME = {25 (3-4)},
DOI = {10.1007/s10849-016-9242-y},
ISSN = {0925-8531},
JOURNAL = {JOURNAL OF LOGIC, LANGUAGE, AND INFORMATION},
}
@ARTICLE{DIDONATO_2016_ARTICLE_D_381985,
AUTHOR = {Di Donato, F.},
TITLE = {From the Past to the Future. Alcune riflessioni dopo DH2016},
YEAR = {2016},
ABSTRACT = {Riflessioni a margine del convegno DH2016},
URL = {https://iris.cnr.it/handle/20.500.14243/381985},
ISSN = {1591-4305},
JOURNAL = {BOLLETTINO TELEMATICO DI FILOSOFIA POLITICA},
}
@ARTICLE{GANASCIA_2016_ARTICLE_G_320494,
AUTHOR = {Brando, C. and Frontini, F. and Ganascia, J.-G.},
TITLE = {REDEN: Named Entity Linking in Digital Literary Editions Using Linked Data Sets},
YEAR = {2016},
ABSTRACT = {This paper proposes a graph-based Named Entity Linking (NEL) algorithm named REDEN for the disambiguation of authors' names in French literary criticism texts and scientific essays from the 19th and early 20th centuries. The algorithm is described and evaluated according to the two phases of NEL as reported in current state of the art, namely, candidate retrieval and candidate selection. REDEN leverages knowledge from different Linked Data sources in order to select candidates for each author mention, subsequently crawls data from other Linked Data sets using equivalence links (e.g., owl:sameAs), and, finally, fuses graphs of homologous individuals into a non-redundant graph well-suited for graph centrality calculation; the resulting graph is used for choosing the best referent. The REDEN algorithm is distributed in open-source and follows current standards in digital editions (TEI) and semantic Web (RDF). Its integration into an editorial workflow of digital editions in Digital humanities and cultural heritage projects is entirely plausible. Experiments are conducted along with the corresponding error analysis in order to test our approach and to help us to study the weaknesses and strengths of our algorithm, thereby to further improvements of REDEN},
URL = {https://iris.cnr.it/handle/20.500.14243/320494},
DOI = {10.7250/csimq.2016-7.04},
ISSN = {2255-9922},
JOURNAL = {COMPLEX SYSTEMS INFORMATICS AND MODELING QUARTERLY},
}
@ARTICLE{GOGGI_2016_ARTICLE_GPBFMMDB_320996,
AUTHOR = {Goggi, S. and Pardelli, G. and Bartolini, R. and Frontini, F. and Monachini, M. and Manzella, G. and De Mattei, M. and Bustaffa, F.},
TITLE = {A semantic engine for grey literature retrieval in the oceanography domain},
YEAR = {2016},
ABSTRACT = {Here we present the final results of the MAPS (Marine Planning and Service Platform) project, an environment designed for gathering, classifying, managing and accessing marine scientific literature and data, making it available for search to Operative Oceanography researchers of various institutions by means of standard protocols. The system takes as input non-textual data (measurements) and text—both published papers and documentation—and it provides an advanced search facility thanks to the rich set of metadata and, above all, to the possibility of a refined and domain targeted key-word indexing of texts using Natural Language Processing (NLP) techniques. The paper describes the system in its details providing also evidence of evaluation},
KEYWORDS = {Information Extraction, Search Engine, Operative Oceanography},
PAGES = {155-161},
URL = {http://www.greynet.org/thegreyjournal/currentissue.html},
VOLUME = {12 (3)},
ISSN = {1574-1796},
JOURNAL = {THE GREY JOURNAL},
}
@ARTICLE{GUADAGNINI_2016_ARTICLE_G_354823,
AUTHOR = {Guadagnini, E.},
TITLE = {Scelta di voci del Tesoro della Lingua Italiana delle Origini (diciannovesima serie)},
YEAR = {2016},
ABSTRACT = {Voci scena (1) s. f., scena (2) s. f., scenàcolo s. m., scènico agg./s. m.},
KEYWORDS = {lessicografia},
PAGES = {94-97},
URL = {https://iris.cnr.it/handle/20.500.14243/354823},
VOLUME = {21},
ISSN = {1591-8254},
JOURNAL = {BOLLETTINO-OPERA DEL VOCABOLARIO ITALIANO},
}
@ARTICLE{GUADAGNINI_2016_ARTICLE_G_354810,
AUTHOR = {Guadagnini, E.},
TITLE = {Lessicografia, filologia e «corpora» digitali: qualche considerazione dalla parte dell'OVI},
YEAR = {2016},
ABSTRACT = {This paper aims at showing how today's databases could change the traditional relationship existing between Philology and historical Lexicography, with specific reference to Old Italian lexicography and OVI dictionary (TLIO) and databases. Through the analysis of some Old Italian words meaning 'beginning' ((in)cominciamento, (in)comincianza, inizio), this paper presents a new philological method to manage the Corpus OVI extensive documentation: while traditional historical lexicography operates by identifying ancient occurrences of a particular word and, on this ground, by interpreting and defining their meaning, the "new" corpus-based (or, more likely, corpus-driven) historical lexicography can go further, placing that word inside the structure of ancient lexicon, that is, inferring from the documentation the distribution and the (possible) specificity of the lexeme. Relying on a study carried out by Cosimo Burgassi and by myself, this paper introduces some new interpretative categories targeting the study of words' (in the case in point, Romance words') history, such as "Rate of Connotation" ('quoziente connotativo') and "latent Latinism" ('latinismo latente')},
KEYWORDS = {lexicography, lexicology, corpus linguistics, Old Italian, latinism},
PAGES = {755-792},
URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-84987750318\&origin=inward},
VOLUME = {132},
DOI = {10.1515/zrp-2016-0050},
ISSN = {0049-8661},
JOURNAL = {ZEITSCHRIFT FÜR ROMANISCHE PHILOLOGIE},
}
@ARTICLE{GUADAGNINI_2016_ARTICLE_GV_354814,
AUTHOR = {Guadagnini, E. and Vaccaro, G.},
TITLE = {Il passato è una lingua straniera. Il Dizionario dei Volgarizzamenti tra filologia, linguistica e digital humanities},
YEAR = {2016},
ABSTRACT = {This paper describes the main results of the DiVo (Dizionario dei Volgarizzamenti) project, which was carried out at the OVI institute and at the Scuola Normale Superiore from March 8, 2012 to March 7, 2016 and its main tools: all are open and free access. The Corpus del Dizionario dei Volgarizzamenti (Corpus DiVo, online since October 10, 2010 at ) contains 168 vernacular translations (6,375,803 occurrences). The Corpus dei classici latini volgarizzati (Corpus CLaVo, online since October 30, 2012 at ) is a "mirror" and contains 89 texts for 42 Latin works: so lexical research starts from Latin. Finally, the Bibliografia filologica (online at ) the philological and bibliographical notes of the texts studied for the realization of the project},
KEYWORDS = {DiVo, lessicografia, italiano antico},
PAGES = {279-394},
URL = {https://iris.cnr.it/handle/20.500.14243/354814},
VOLUME = {21},
ISSN = {1591-8254},
JOURNAL = {BOLLETTINO-OPERA DEL VOCABOLARIO ITALIANO},
}
@ARTICLE{KHAN_2016_ARTICLE_KABF_322086,
AUTHOR = {Khan, F. and Arrigoni, S. and Boschetti, F. and Frontini, F.},
TITLE = {Restructuring a Taxonomy of Literary Themes and Motifs for More Efficient Querying},
YEAR = {2016},
ABSTRACT = {In this paper we describe ongoing work in the restructuring of a tagset originally organised as a taxonomy and used to annotate literary themes and motifs in a corpus of classical works of poetry from a number of different traditions. We show how such a tagset can be rendered more efficient and useful through the appropriation of ideas and techniques from lexical semantics and ontology design. The newly redesigned tagset is described with examples showing how the new design is much more expressive than the old taxonomy; furthermore, an example query is described in order to demonstrate how more refined semantic searches can be carried using the new version of the taxonomy. The final result is, we hope, a resource that will be useful not only for the specific project for which it was developed but one that is well-designed and well-documented enough to be of use for other similar semantic annotation tasks},
URL = {https://iris.cnr.it/handle/20.500.14243/322086},
DOI = {10.14195/2182-8830},
ISSN = {2182-8830},
JOURNAL = {MATLIT},
}
@ARTICLE{LENCI_2016_ARTICLE_LLMM_353736,
AUTHOR = {Lenci, A. and Labanca, N. and Marazzini, C. and Montemagni, S.},
TITLE = {Voci della Grande Guerra: An Annotated Corpus of Italian Texts on World War I},
YEAR = {2016},
ABSTRACT = {Voci della Grande Guerra (Voices of the Great War) is a scientific and cultural initiative with the aim of preserving and promoting the memory of Italy in World War I through the creation of a corpus of digital texts selected by historians and linguists in order to be representative of the different ways to experience and describe the Italian war by its protagonists. With the help of advanced techniques of computational linguistics, semantic web and information visualization, the digitized historical materials will be explored with an online interface to enable easy but effective and innovative search modalities. The project will allow experts as well as non-experts to become acquainted with "linguistic polyphony" of Italy during World War I},
KEYWORDS = {Great War, World War, digital texts, corpus, Italian, Voci della Grande Guerra, Voices of the Great War},
PAGES = {101-108},
URL = {http://www.ai-lc.it/IJCoL/v2n2/6-lenci_et_al.pdf},
VOLUME = {2 (2)},
ISSN = {2499-4553},
JOURNAL = {IJCOL},
}
@ARTICLE{MANCINI_2016_ARTICLE_MP_325857,
AUTHOR = {Mancini, L. and Pedretti, I.},
TITLE = {Il progetto Clavius On The Web entra nelle scuole},
YEAR = {2016},
ABSTRACT = {Clavius on the web is a Digital Humanities project dedicated to the manuscripts of Christophorus Clavius—an important Jesuit mathematician and one of the most influential scholars of his time—preserved by the Historical Archive of the Pontifical Gregorian University. This paper describes Clavius@School, an initiative within the same project in which students from three high schools participate. Clavius@School aims not only to spread knowledge about Clavius' works, but also to alert to a conscientious and aware use of digital technology, according to the perspective proposed by the French philosopher Bernard Stiegler},
KEYWORDS = {Christophorus Clavius, Digital Humanities, Bernard Stiegler, Technology, Education},
PAGES = {219-226},
URL = {https://iris.cnr.it/handle/20.500.14243/325857},
VOLUME = {4},
ISSN = {2283-7833},
JOURNAL = {LEXICON PHILOSOPHICUM. INTERNATIONAL JOURNAL FOR THE HISTORY OF TEXTS AND IDEAS},
}
@ARTICLE{MARZI_2016_ARTICLE_MFCP_319237,
AUTHOR = {Marzi, C. and Ferro, M. and Cardillo, F. A. and Pirrelli, V.},
TITLE = {Effects of frequency and regularity in an integrative model of word storage and processing},
YEAR = {2016},
ABSTRACT = {In spite of converging evidence in this direction, little efforts have been put so far into providing detailed, algorithmic models of the interaction between lexical token frequency, paradigm frequency, and paradigm regularity in word processing and acquisition. Here we propose a neuro-computational account of the frequency/regularity interaction, and discuss some of its theoretical implications by analysing experimental results in the computational framework of Temporal Self-Organising Maps. Detailed quantitative analysis shows that the model provides a unitary explanatory framework bringing together insights from neighbour family effects on word recognition and production, evidence from family size effects in serial lexical access and paradigm-based dynamics in lexical acquisition. Considerable evidence has accrued on the role of paradigms as both theoretical and cognitive structures regimenting the way words are processed and acquired. The evidence supports a view of the lexicon as an emergent integrative system, where word forms are concurrently and competitively stored as repeatedly successful processing patterns, and on-line processing crucially depends on the internal organisation of stored patterns},
KEYWORDS = {Lexical access, word recall, serial processing, parallel activation, inflectional paradigms, mental lexicon},
PAGES = {79-114},
URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-84986550295\&origin=inward},
VOLUME = {28 (1)},
ISSN = {2499-8117},
JOURNAL = {ITALIAN JOURNAL OF LINGUISTICS},
}
@ARTICLE{MONACHINI_2016_ARTICLE_MF_327645,
AUTHOR = {Monachini, M. and Frontini, F.},
TITLE = {CLARIN, l'infrastruttura europea delle risorse linguistiche per le scienze umane e sociali e il suo network italiano CLARIN-IT},
YEAR = {2016},
ABSTRACT = {Il 1° ottobre 2015 il MIUR firma l'adesione dell'Italia a CLARIN-ERIC, l'infrastruttura di ricerca che offre risorse e tecnologie linguistiche dedicate al settore delle scienze del linguaggio e delle scienze umane e sociali. Questo articolo intende fornire alla comunità italiana una ampia panoramica di CLARIN, la sua missione, i suoi pilastri, i servizi, la sua organizzazione tecnica ed amministrativa e la struttura di governance, sia a livello europeo che locale. Viene introdotto il network italiano, con il primo centro nazionale ILC4CLARIN, ospitato ed in via di sviluppo presso l'ILC-CNR, le funzionalità, le risorse ed i servizi offerti; viene presentato infine il primo nucleo del consorzio nazionale CLARIN-IT, illustrando i criteri di costituzione, le attività previste e le prospettive future},
KEYWORDS = {Infrastrutture di ricerca, Tecnologie linguistiche, Network italiano CLARIN-IT},
PAGES = {1-30},
URL = {http://www.ai-lc.it/IJCoL/v2n2/1-monachini_and_frontini.pdf},
VOLUME = {2 (2)},
ISSN = {2499-4553},
JOURNAL = {IJCOL},
}
@ARTICLE{MUGELLI_2016_ARTICLE_MBDDKT_354715,
AUTHOR = {Mugelli, G. and Boschetti, F. and Del Gratta, R. and Del Grosso, A. and Khan, F. and Taddei, A.},
TITLE = {A user-centred design to annotate ritual facts in ancient greek tragedies},
YEAR = {2016},
ABSTRACT = {Euporia is an annotation system developed with a user-centred approach for the study of ritual and religion in ancient Greek tragedy. Euporia adopts a domain specific language (DSL) and a lightweight web user interface in order to offer digital support to an anthropological study of ancient Greek tragedy that compares ritual as it is performed or described in Greek tragedy with ancient ritual as it can be reconstructed from literary, archaeological, and epigraphic sources. The case study discussed in this paper (Aesch. Ag 67-71) shows one of the main features of Euporia: the ability to annotate different readings and different interpretations of the text and their consequences in the reconstruction of ancient Greek ritual},
KEYWORDS = {Digital Philology, Digital Humanities, Digital Classicist, Computational philology, Computational Linguistics},
PAGES = {103-120},
URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-85007489227\&origin=inward},
VOLUME = {59},
DOI = {10.1111/j.2041-5370.2016.12041.x},
ISSN = {0076-0730},
JOURNAL = {BULLETIN OF THE INSTITUTE OF CLASSICAL STUDIES OF THE UNIVERSITY OF LONDON},
}
@ARTICLE{PROIETTI_2016_ARTICLE_PC_405494,
AUTHOR = {Proietti, C.},
TITLE = {The Fitch-Church Paradox and First Order Modal Logic},
YEAR = {2016},
ABSTRACT = {Reformulation strategies for solving Fitch's paradox of knowability date back to Edgington (Mind 94: 557-568, 1985). Their core assumption is that the formula $p \rightarrow \lozenge Kp$, from which the paradox originates, does not correctly express the intended meaning of the verification thesis (VT), which should concern possible knowledge of actual truths, and therefore the contradiction does not represent a logical refutation of verificationism. Supporters of these solutions claim that (VT) can be reformulated in a way that blocks the derivation of the paradox. Unfortunately, these reformulation proposals come with other problems, on both the logical and the philosophical side (see Percival in Aust J Philos 69: 82-97, 1991; Williamson in Knowledge and its limits, Oxford University Press, Oxford, 2000; Wright in Realism, meaning and truth, Blackwell, Oxford, 1987). We claim that in order to make the reformulation idea consistent and adequate one should analyze the paradox from the point of view of a quantified modal language. An approach in this line was proposed by, among others, Kvanvig (Nous 29: 481-499, 1995; The knowability paradox, Oxford University Press, Oxford, 2006) but was not fully developed in its technical details. Here we approach the paradox by means of a first order hybrid modal logic (FHL), a tool that strikes us as more adequate to express transworld reference and the rigidification needed to consistently express this idea. The outcome of our analysis is ambivalent. Given a first order formula we are able to express the fact that it is knowable in a way which is both consistent and adequate. However, one must give up the possibility of formulating (VT) as a substitution free schema of the kind $p \rightarrow \lozenge Kp$. We propose that one may instead formulate (VT) by means of a recursive translation of the initial formula, being aware that many alternative translations are possible},
KEYWORDS = {first order modal logic, knowability paradox},
PAGES = {87-104},
URL = {https://iris.cnr.it/handle/20.500.14243/405494},
VOLUME = {81 (1)},
DOI = {10.1007/s10670-015-9730-5},
ISSN = {0165-0106},
JOURNAL = {ERKENNTNIS},
}
@ARTICLE{REHM_2016_ARTICLE_RUABBBBBCDGGGVHHJKKKLMMMMMMOOPPPRRPSDTTTVVVZ_317422,
AUTHOR = {Rehm, G. and Uszkoreit, H. and Ananiadou, S. and Bel, N. and Bieleviciene, A. and Borin, L. and Branco, A. and Budin, G. and Calzolari, N. and Daelemans, W. and Garabik, R. and Grobelnik, M. and García-Mateo, C. and van Genabith, J. and Hajic, J. and Hernaez, I. and Judge, J. and Koeva, S. and Krek, S. and Krstev, C. and Linden, K. and Magnini, B. and Mariani, J. and McNaught, J. and Melero, M. and Monachini, M. and Moreno, A. and Odijk, J. and Ogrodniczuk, M. and Pezik, P. and Piperidis, S. and Przepiorkowski, A. and Rognvaldsson, E. and Rosner, M. and Pedersen, B. S. and Skadina, I. and De Smedt, K. and Tadic, M. and Thompson, P. and Tufis, D. and Varadi, T. and Vasiljevs, A. and Vider, K. and Zabarskaite, J.},
TITLE = {The strategic impact of META-NET on the regional, national and international level},
YEAR = {2016},
ABSTRACT = {This article provides an overview of the dissemination work carried out in META-NET from 2010 until 2015; we describe its impact on the regional, national and international level, mainly with regard to politics and the funding situation for LT topics. The article documents the initiative's work throughout Europe in order to boost progress and innovation in our field},
KEYWORDS = {Language technology, Multilingual technologies, Machine translation, Language resources, META-NET, META-SHARE},
PAGES = {351-374},
URL = {http://link.springer.com/article/10.1007/s10579-015-9333-4},
VOLUME = {50 (2)},
DOI = {10.1007/s10579-015-9333-4},
ISSN = {1574-020X},
JOURNAL = {LANGUAGE RESOURCES AND EVALUATION},
}
@ARTICLE{SASSOLINI_2016_ARTICLE_S_335259,
AUTHOR = {Sassolini, E.},
TITLE = {Corpora digitali: dalla salvaguardia alla condivisione},
YEAR = {2016},
ABSTRACT = {Studio e sviluppo di metodi e tecniche che vanno nella direzione di una standardizzazione sia del formato dei file, in cui sono stati memorizzati i testi e/o la loro elaborazione software, con procedure di annotazione e arricchimento del testo; sia del set dei caratteri utilizzati in fase di digitalizzazione. L'obiettivo è recuperare il testo conservando tutte le preziose annotazioni che erano state oggetto di progetti e iniziative di ricerca. Data la grande varietà dei progetti ai quali ILC ha partecipato e mancando in passato un modello condiviso di rappresentazione delle varie caratteristiche contenute nei testi, i formati dei file trovati sono molto diversi. Il lavoro di recupero è divenuto quindi estremamente complesso. Parallelamente al recupero sono state attivate iniziative e strategie per la valorizzazione di questo patrimonio con l'intenzione di restituirlo alla comunità},
URL = {https://iris.cnr.it/handle/20.500.14243/335259},
ISSN = {2039-8271},
JOURNAL = {GARR NEWS},
}
@INCOLLECTION{BRUNATO_2016_INCOLLECTION_BV_325822,
AUTHOR = {Brunato, D. and Venturi, G.},
TITLE = {Le tecnologie linguistico-computazionali per la leggibilità della comunicazione istituzionale},
YEAR = {2016},
ABSTRACT = {Il contributo illustra il ruolo delle tecnologie linguistico-computazionali per la valutazione automatica della leggibilità dei testi della comunicazione istituzionale e propone alcuni esempi di semplificazione semi-automatica di testi amministrativi e normativi},
KEYWORDS = {tecnologie linguistico-computazionali, valutazione automatica della leggibilità, comunicazione istituzionale},
PAGES = {119-157},
URL = {https://iris.cnr.it/handle/20.500.14243/325822},
PUBLISHER = {Pisa University Press (Pisa, ITA)},
ISBN = {978-88-6741-627-1},
CONFERENCE_PLACE = {Pisa},
}
@INCOLLECTION{DELGRATTA_2016_INCOLLECTION_DBDKM_312011,
AUTHOR = {Del Gratta, R. and Boschetti, F. and Del Grosso, A. and Khan, F. and Monachini, M.},
TITLE = {Cooperative philology on the way to web services: The case of the cophiwordnet platform},
YEAR = {2016},
ABSTRACT = {In this paper we present ongoing research carried out at the Institute for Computational Linguistics "A. Zampolli" (ILC) in Pisa. The institute has been active since many years in the field of Digital Humanities providing resources, tools and solutions to address issues of the to digital humanists. Starting from those previous initiatives, we show how to re-engineer them as Web Services in order to make connections between lexicons, semantic resources and a fine grained text management. Linked Open Data is chosen as the paradigm used to link the different resources as well as the modality of data presentation},
KEYWORDS = {Canonical text services, Cooperative philology, Linked open data, Web services},
PAGES = {173-187},
URL = {http://www.scopus.com/inward/record.url?eid=2-s2.0-84961744725\&partnerID=q2rCbXpz},
DOI = {10.1007/978-3-319-31468-6_13},
PUBLISHER = {Springer International Publishing (Switzerland, CHE)},
ISBN = {978-3-319-31468-6},
CONFERENCE_PLACE = {Switzerland},
BOOKTITLE = {Worldwide Language Service Infrastructure: Second International Workshop, WLSI 2015, Kyoto, Japan, January 22-23, 2015. Revised Selected Papers},
EDITOR = {Murakami, Y. and Li, D.},
}
@INCOLLECTION{FRONTINI_2016_INCOLLECTION_FDM_320992,
AUTHOR = {Frontini, F. and Del Gratta, R. and Monachini, M.},
TITLE = {GeoDomainWordNet: Linking the Geonames Ontology to WordNet},
YEAR = {2016},
ABSTRACT = {This paper illustrates the transformation of GeoNames' ontology concepts, with their English labels and glosses, into a GeoDomain WordNet-like resource in English, its translation into Italian, and its linking to the existing generic WordNets of both languages. The paper describes the criteria used for the linking of domain synsets to each other and to the generic ones and presents the published resource in RDF according to the w3c and lemon schema},
KEYWORDS = {GeoNames, WordNet, Language resources, Lexi, Linguistic linked data, lemon, RDF},
PAGES = {229-242},
URL = {http://link.springer.com/chapter/10.1007/978-3-319-43808-5_18},
DOI = {10.1007/978-3-319-43808-5_18},
ISBN = {978-3-319-43808-5},
BOOKTITLE = {Human Language Technology. Challenges for Computer Science and Linguistics},
}
@INCOLLECTION{MONTEMAGNI_2016_INCOLLECTION_MW_353727,
AUTHOR = {Montemagni, S. and Wieling, M.},
TITLE = {Tracking linguistic features underlying lexical variation patterns: A case study on Tuscan dialects},
YEAR = {2016},
ABSTRACT = {In this paper, we illustrate the application of hierarchical spectral partitioning of bipartite graphs in the study of lexical variation in Tuscany based on the data from a regional linguistic atlas. This method makes it possible not only to identify existing patterns of lexical variation in Tuscany, but also to uncover the underlying lexical features in terms of the most characteristic concept-lexicalization pairs. The results are promising, demonstrating the potential of the method for tracking the linguistic features underlying identified patterns of lexical variation and change across generations},
KEYWORDS = {tuscan, dialects, lexical variation, linguistic atlas},
PAGES = {117-135},
URL = {http://langsci-press.org/catalog/view/81/146/376-1},
DOI = {10.17169/langsci.b81.146},
PUBLISHER = {Language Science Press (Berlin, DEU)},
CONFERENCE_PLACE = {Berlin},
BOOKTITLE = {The Future of Dialects},
EDITOR = {Côté, M. H. and Knooihuizen, R. and Nerbonne, J.},
}
@INCOLLECTION{PROIETTI_2016_INCOLLECTION_PO_404027,
AUTHOR = {Proietti, C. and Olsson, E. J.},
TITLE = {Explicating Ignorance and Doubt: A Possible Worlds Approach},
YEAR = {2016},
ABSTRACT = {While the concepts of ignorance and doubt occupy central roles in epistemology as well as in philosophy generally, there have been surprisingly few attempts to give detailed analyses of these notions. We start out by identifying their main conceptual ingredients. We then propose a semi-formal account within the possible worlds framework of epistemic and doxastic logic. The upshot is that while ignorance can be construed as the absence of knowledge of any of the alternatives under scrutiny, doubt is a very special kind of ignorance. We develop two specific proposals for how to capture special features of doubt in our framework. One centers on the notion that doubt, as opposed to ignorance, requires maximum plausibility of opposing alternatives. The other is based on the assumption that, for an agent to doubt a proposition, she must entertain the question whether that proposition is true on her research agenda},
KEYWORDS = {Doubt, Ignorance, Modal Logic},
PAGES = {81-95},
URL = {https://iris.cnr.it/handle/20.500.14243/404027},
ISBN = {9780511820076},
BOOKTITLE = {The Epistemic Dimensions of Ignorance},
EDITOR = {Peels, R. and Blaauw, M.},
}
@INCOLLECTION{QUOCHI_2016_INCOLLECTION_Q_320606,
AUTHOR = {Quochi, V.},
TITLE = {Development and representation of Italian light-fare constructions},
YEAR = {2016},
ABSTRACT = {The essay describes the study of the development and use of light fare 'do' constructions in Child-directed Speech and in Child Language with the twofold goal of showing that a Construction Grammar approach is viable, and of providing support to usage-based, functional predictions on language acquisition. The analysis of naturalistic data derived from the CHILDES database lead to two main findings: first, a representation of fare Light Verb Constructions as a family of constructions organized like a radial category is not only possible but more explicative, second, there exists a 'fare' pivot schema that children generalize at an early stage because it serves the purpose of naming new events, activities or situations},
KEYWORDS = {Corpus linguistics, Language Acquisition, Construction Grammar, phraseology},
PAGES = {39-64},
URL = {https://benjamins.com/#catalog/books/cal.19.03quo/details},
DOI = {10.1075/cal.19.03quo},
PUBLISHER = {John Benjamins Publishing Company (Amsterdam/Philadelphia, USA)},
ISBN = {9789027204417},
CONFERENCE_PLACE = {Amsterdam/Philadelphia},
BOOKTITLE = {Corpus-based Approaches to Construction Grammar},
EDITOR = {Yoon, J. and Gries, S. Th.},
}
@INCOLLECTION{SORIA_2016_INCOLLECTION_S_374887,
AUTHOR = {Soria, C.},
TITLE = {Speakers' attitudes on Piedmontese: A case for Vitality Re-assessment},
YEAR = {2016},
ABSTRACT = {In this research I present the results of a survey carried out among speakers of Piedmontese, a regional language of Italy, to assess its vitality in terms of speaker numbers, domains of use, intergenerational transmission and speakers' attitudes. After illustrating the methodology adopted for the survey, I compare the survey results with the vitality assessment of Piedmontese currently available. I show how the discrepancies can be interpreted, and then argue for the need for a finer-grained instrument for vitality assessment, one that places proper emphasis on signs of revitalisation and less stress on intergenerational transmission},
URL = {https://iris.cnr.it/handle/20.500.14243/374887},
ISBN = {978-1-4438-9943-7},
}
@INCOLLECTION{WEINGART_2016_INCOLLECTION_WG_354705,
AUTHOR = {Weingart, A. and Giovannetti, E.},
TITLE = {Extending the Lemon Model for a Dictionary of Old Occitan Medico-Botanical Terminology},
YEAR = {2016},
ABSTRACT = {The article presents the adaptation of the lemon model (a model for lexica as RDF data) for a multilingual and multi-alphabetical lexicon of Old Occitan medico-botanical terminology. The lexicon is the core component of an ontology-based information system that will be constructed and implemented within the DFG-funded project "Dictionnaire des Termes Medico-botaniques de l'Ancien Occitan" (DiTMAO). The difficulties for the lemmatization raised by the particularities of the corpus (terms in Latin, Hebrew and Arabic script and corresponding terms in other ancient languages, mostly Hebrew and Arabic) can be perfectly solved by extending the basic properties of lemon and introducing domain specific vocabulary},
KEYWORDS = {Lemon model, RDF, Multilingual, Multi-alphabetical, Historical lexicon, Medico-Botanical terminology, Old occitan, Hebrew, Arabic},
PAGES = {408-421},
URL = {http://link.springer.com/chapter/10.1007/978-3-319-47602-5_53},
DOI = {10.1007/978-3-319-47602-5_53},
ISBN = {978-3-319-47601-8},
BOOKTITLE = {The Semantic Web},
EDITOR = {Sack, H. and Rizzo, G. and Steinmetz, N. and Mladenić, D. and Auer, S. and Lange, C.},
}
@INCOLLECTION{WIELING_2016_INCOLLECTION_WM_353731,
AUTHOR = {Wieling, M. and Montemagni, S.},
TITLE = {Infrequent forms: Noise or not?},
YEAR = {2016},
ABSTRACT = {In this study we ask the question whether simplifying the data in dialectometrical studies by removing infrequent forms is advantageous to uncovering the geographical structure in dialect data. By investigating lexical variation in a large corpus of Tuscan dialect data via hierarchical bipartite spectral graph partitioning, we are able to identify the main geographical areas together with their linguistic basis. In order to assess the influence of infrequent forms, we conduct two analyses: one which includes only lexical variants used by at least 0.5% of the informants, and another which includes all lexical variants in the data. Using this approach we show that using all data enables us to find a geographical characterization with a more adequate linguistic basis than by using the trimmed data},
KEYWORDS = {dialectometrical studies, dialectology, dialect data, lexical variation, Tuscan},
PAGES = {215-224},
URL = {http://langsci-press.org/catalog/view/81/78/367-1},
DOI = {10.17169/langsci.b81.78},
PUBLISHER = {Language Science Press (Berlin, DEU)},
ISBN = {978-3-946234-18-0},
CONFERENCE_PLACE = {Berlin},
BOOKTITLE = {The Future of Dialects},
EDITOR = {Côté, M. H. and Knooihuizen, R. and Nerbonne, J.},
}
@EDITORIAL{BRANCO_2016_EDITORIAL_BCC_328598,
AUTHOR = {Branco, A. and Calzolari, N. and Choukri, K.},
TITLE = {4REAL Workshop: Workshop on Research Results Reproducibility and Resources Citation in Science and Technology of Language},
YEAR = {2016},
ABSTRACT = {This workshop seeks to foster the discussion and the advancement on a topic that has been so far given insufficient attention in the research area of language processing tools and resources (Branco, 2013, Fokkens et al., 2013) and that has been an important topic emerging in other scientific areas. That is the topic of the reproducibility of research results and the citation of resources, and its impact on research integrity},
URL = {https://iris.cnr.it/handle/20.500.14243/328598},
ISBN = {978-2-9517408-9-1},
}
@EDITORIAL{BRUNATO_2016_EDITORIAL_BDVFB_351623,
AUTHOR = {Brunato, D. and Dell'Orletta, F. and Venturi, G. and François, T. and Blache, P.},
TITLE = {Proceedings of the Workshop on Computational Linguistics for Linguistic Complexity (CL4LC 2016)},
YEAR = {2016},
ABSTRACT = {Introduzione agli atti della prima edizione del workshop "Computational Linguistics for Linguistic Complexity" che raccoglie lavori che studiano da prospettive diverse il tema della complessità linguistica workshop allo scopo di promuovere una riflessione comune su approcci diversi all'indagine, al trattamento e alla valutazione di aspetti che rendono complessa la lingua},
KEYWORDS = {Linguistic Complexity, Computational Linguistics},
PAGES = {1-245},
URL = {https://aclweb.org/anthology/W/W16/W16-41.pdf},
ISBN = {978-4-87974-709-9},
}
@EDITORIAL{CHAIR_2016_EDITORIAL_CCDGGMMMMOP_317884,
AUTHOR = {Calzolari, N. and Choukri, K. and Declerck, T. and Goggi, S. and Grobelnik, M. and Maegaard, B. and Mariani, J. and Mazo, H. and Moreno, A. and Odijk, J. and Piperidis, S.},
TITLE = {Proceedings of the Tenth International Conference on Language Resources and Evaluation (LREC 2016)},
YEAR = {2016},
ABSTRACT = {Curatela dei 744 articoli presentati alla conferenza LREC2016},
KEYWORDS = {Language Resource, Evaluation},
PAGES = {1-4693},
URL = {http://www.lrec-conf.org/proceedings/lrec2016/index.html},
PUBLISHER = {European Language Resources Association ELRA (Paris, FRA)},
ISBN = {978-2-9517408-9-1},
CONFERENCE_PLACE = {Paris},
}
@EDITORIAL{KHAN_2016_EDITORIAL_KVAFFPGU_324185,
AUTHOR = {Khan, F. and Vintar, Š. and León Araúz, P. and Faber, P. and Frontini, F. and Parvizi, A. and Grčić Simeunović, L. and Unger, C.},
TITLE = {Language and Ontology (LangOnto2) \& Terminology and Knowledge Structures (TermiKS)},
YEAR = {2016},
ABSTRACT = {This joint workshop brings together two different but closely related strands of research. On the one hand it looks at the overlap between ontologies and computational linguistics and on the other it explores the relationship between knowledge modelling and terminologies. In particular the workshop aims to create a forum for discussion in which the different relationships and commonalities between these two areas can be explored in detail, as well as presenting cutting edge research in each of the two individual areas. A significant amount of human knowledge can be found in texts. It is not surprising that languages such as OWL, which allow us to formally represent this knowledge, have become more and more popular both in linguistics and in automated language processing. For instance ontologies are now of core interest to many NLP fields including Machine Translation, Question Answering, Text Summarization, Information Retrieval, and Word Sense Disambiguation. At a more abstract level, however, ontologies can also help us to model and reason about phenomena in natural language semantics. In addition, ontologies and taxonomies can also be used in the organisation and formalisation of linguistically relevant categories such as those used in tagsets for corpus annotation. Notably also, the fact that formal ontologies are being increasingly accessed by users with limited to no background in formal logic has led to a growing interest in developing accessible front ends that allow for easy querying and summarisation of ontologies. It has also led to work in developing natural language interfaces for authoring ontologies and evaluating their design. Additionally in recent years there has been a renewed interest in the linguistic aspects of accessing, extracting, representing, modelling and transferring knowledge. 
Numerous tools for the automatic extraction of terms, term variants, knowledge-rich contexts, definitions, semantic relations and taxonomies from specialized corpora have been developed for a number of languages, and new theoretical approaches have emerged as potential frameworks for the study of specialized communication. However, the building of adequate knowledge models for practitioners (e. g. experts, researchers, translators, teachers etc.), on the one hand, and NLP applications (including cross-language, cross-domain, cross-device, multi-modal, multi-platform applications), on the other hand, still remains a challenge. The papers included in the workshop range across a wide variety of different areas and reflect the strong inter-disciplinary approach, which characterises both areas of research. In addition we are very happy to include two invited talks in the program presented by authorities in their respective fields: Pamela Faber from the field of terminology, and John McCrae, an expert on linguistic linked data and the interface between NLP and ontologies},
KEYWORDS = {lexicons, ontologies},
URL = {http://www.lrec-conf.org/proceedings/lrec2016/index.html},
}
@EDITORIAL{MARZI_2016_EDITORIAL_MP_319239,
AUTHOR = {Marzi, C. and Pirrelli, V.},
TITLE = {Word knowledge and word usage: A foreword},
YEAR = {2016},
ABSTRACT = {This special issue, together with its companion issue to appear in Italian Journal of Linguistics, stems from the NetWordS Final Conference "Word knowledge and word usage: representations and processes in the mental lexicon". The conference, held on the 30th and 31st of March, and the 1st of April 2015 in Pisa, concluded the 4-year NetWordS project, the European Network of Word Structure funded by the European Science Foundation within the Research Networking Programme. In line with the highly multidisciplinary profile of NetWordS agenda, the conference offered a comprehensive and inclusive forum focussing on two main lines of lexical inquiry: (i) usage-based approaches to bootstrapping word form and structure (morpho-phonological and morpho-syntactic issues), including: acquisition of lexical categories, emergence of morphological structure, lexical memories, anticipatory prediction-based mechanisms of word recognition, word production, frequency-based models of lexical productivity, word encoding, models of lexical architecture, family-based effects in word processing, word reading and writing; (ii) usage-based approaches to word meanings (lexical semantics and pragmatics in morphologically simple and complex words), including: distributional semantics, compound interpretation, concept composition and coercion, conceptualization of perception and action, time and space in the lexicon, metonymy and metaphor, lexico-semantic relations, perceptual grounding and embodied cognition, context-based and encyclopedic knowledge, semantic association and categorization.
The multidisciplinary focus on word knowledge and word usage promoted by the Conference led participants to openly discuss an impressive range of approaches and empirical data: priming and lexical decision in a number of contexts, distributional semantics and models of semantic composition, neural networks, machine learning and mathematical modelling of empirical evidence, as well as their neuro-biological and neuro-functional correlates. It is widely acknowledged that looking at the same problem from different angles has an additive effect on the impact of current language research. Certainly more can be achieved, however, if, rather than simply adding more perspectives on the same subject, with individual research efforts staying within the boundaries of single knowledge domains, scholars manage to integrate them into a boundary-shifting methodological perspective. When psycholinguistic evidence from humans is successfully replicated algorithmically through a computational model implementing a few well-understood principles of time-series processing, we are in a position to empirically assess what input conditions favour memorisation and acquisition of symbolic strings by the model, and test these algorithmic predictions back on human subjects, thus going full circle. This may have a multiplicative effect on current research, providing not only mathematical modelling of present behavioural evidence, but amounting to fully explanatory mechanisms. Our current understanding of WHERE and WHEN some cognitive processes are implemented in the brain will be complemented by knowledge of WHAT information they rely on and HOW they integrate it. Other compelling examples of the full potential of cross-disciplinary integration can be found in the present volume and in the twin issue of Italian Journal of Linguistics.
As a general point, we contend that only by putting single-domain acquisitions into the wider context of human communication, and developing an interdisciplinary framework whereby each specialist will take advantage of insights from other disciplines, we can make substantial progress in our understanding of the lexical roots of human verbal communication in real contexts. The edited selection of papers presented here provides a representative sample of the range of approaches debated at the NetWordS Pisa Conference, by way of illustration of how aspects of knowledge integration and methodological innovation can be put at the service of a better understanding of broad lexical issues},
KEYWORDS = {word knowledge, word usage, interdisciplinary approach, mental lexicon, NetWordS},
PAGES = {3-6},
URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-84978285090\&origin=inward},
DOI = {10.1418/83651},
PUBLISHER = {Il Mulino (Bologna, ITA)},
ISSN = {1720-9331},
ISBN = {978-88-15-26226-4},
CONFERENCE_PLACE = {Bologna},
}
@EDITORIAL{MARZI_2016_EDITORIAL_MP_319238,
AUTHOR = {Marzi, C. and Pirrelli, V.},
TITLE = {Word knowledge and word usage: A Foreword},
YEAR = {2016},
ABSTRACT = {This special issue, together with its companion issue to appear in Lingue e Linguaggio, stems from the NetWordS Final Conference "Word knowledge and word usage: representations and processes in the mental lexicon". The conference, held on the 30th and 31st of March, and the 1st of April 2015 in Pisa, concluded the 4-year NetWordS project, the European Network of Word Structure funded by the European Science Foundation within the Research Networking Programme. In line with the highly multidisciplinary profile of NetWordS agenda, the conference offered a comprehensive and inclusive forum focussing on two main lines of lexical inquiry: (i) usage-based approaches to bootstrapping word form and structure (morpho-phonological and morpho-syntactic issues), including: acquisition of lexical categories, emergence of morphological structure, lexical memories, anticipatory prediction-based mechanisms of word recognition, word production, frequency-based models of lexical productivity, word encoding, models of lexical architecture, family-based effects in word processing, word reading and writing; (ii) usage-based approaches to word meanings (lexical semantics and pragmatics in morphologically simple and complex words), including: distributional semantics, compound interpretation, concept composition and coercion, conceptualization of perception and action, time and space in the lexicon, metonymy and metaphor, lexico-semantic relations, perceptual grounding and embodied cognition, context-based and encyclopedic knowledge, semantic association and categorization.
The multidisciplinary focus on word knowledge and word usage promoted by the Conference led participants to openly discuss an impressive range of approaches and empirical data: priming and lexical decision in a number of contexts, distributional semantics and models of semantic composition, neural networks, machine learning and mathematical modelling of empirical evidence, as well as their neuro-biological and neuro-functional correlates},
KEYWORDS = {word knowledge, word usage, mental lexicon, interdisciplinary approach, NetWordS},
PAGES = {3-6},
URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-84986558643\&origin=inward},
PUBLISHER = {Pacini (Pisa, ITA)},
ISSN = {2499-8117},
CONFERENCE_PLACE = {Pisa},
}
@EDITORIAL{MONTEMAGNI_2016_EDITORIAL_M_353676,
AUTHOR = {Montemagni, S.},
TITLE = {Proceedings CLiC-it 2016 and EVALITA 2016},
YEAR = {2016},
ABSTRACT = {Proceedings of Third Italian Conference on Computational Linguistics (CLiC-it 2016) \& Fifth Evaluation Campaign of Natural Language Processing and Speech Tools for Italian. Final Workshop (EVALITA 2016)},
KEYWORDS = {Computational Linguistic, Natural Language Processing, Speech Tools for Italian, CLiC-it, EVALITA},
URL = {http://ceur-ws.org/Vol-1749/},
PUBLISHER = {CEUR-WS.org (Aachen, DEU)},
CONFERENCE_PLACE = {Aachen},
}
@EDITORIAL{SORIA_2016_EDITORIAL_SPDMSE_324691,
AUTHOR = {Soria, C. and Pretorius, L. and Declerck, T. and Mariani, J. and Scannell, K. and Wandl-Vogt, E.},
TITLE = {CCURL 2016 Collaboration and Computing for Under-Resourced Languages: Towards an Alliance for Digital Language Diversity},
YEAR = {2016},
ABSTRACT = {Atti del Workshop "CCURL 2016 Collaboration and Computing for Under-Resourced Languages: Towards an Alliance for Digital Language Diversity"},
KEYWORDS = {Less-resourced languages, Language Technology, digital language vitality, digital language diversity},
PAGES = {1-103},
URL = {http://www.lrec-conf.org/proceedings/lrec2016/workshops/LREC2016Workshop-CCURL2016_Proceedings.pdf},
PUBLISHER = {European Language Resources Association ELRA (Paris, FRA)},
ISBN = {978-2-9517408-9-1},
CONFERENCE_PLACE = {Paris},
}
@EDITORIAL{BASILI_2016_EDITORIAL_BM_353693,
AUTHOR = {Basili, R. and Montemagni, S.},
TITLE = {Nota Editoriale},
YEAR = {2016},
KEYWORDS = {Computational Linguistic, CLiC-it, natural language processing},
PAGES = {7-10},
URL = {http://www.ai-lc.it/IJCoL/v2n1/00_nota_editoriale.pdf},
VOLUME = {2 (1)},
ISSN = {2499-4553},
}
@INPROCEEDINGS{ATTARDI_2016_INPROCEEDINGS_ASAS_493652,
AUTHOR = {Attardi, G. and Sartiano, D. and Alzetta, C. and Semplici, F.},
TITLE = {Convolutional neural networks for sentiment analysis on Italian tweets},
YEAR = {2016},
ABSTRACT = {The paper describes our submission to the task 2 of Sentiment Polarity Classification in Italian Tweets at Evalita 2016. Our approach is based on a convolutional neural network that exploits both word embeddings and Sentiment Specific word embeddings. We also experimented a model trained with a distant supervised corpus. Our submission with Sentiment Specific word embeddings achieved the first official score},
KEYWORDS = {convolutional networks, sentiment analysis},
PAGES = {156-160},
URL = {https://iris.cnr.it/handle/20.500.14243/493652},
VOLUME = {1749},
DOI = {10.4000/books.aaccademia.1995},
PUBLISHER = {CEUR-WS},
ISBN = {9788899982553},
CONFERENCE_NAME = {3rd Italian Conference on Computational Linguistics, CLiC-it 2016 and 5th Evaluation Campaign of Natural Language Processing and Speech Tools for Italian, EVALITA 2016},
BOOKTITLE = {CEUR Workshop Proceedings of the 5th Evaluation Campaign of Natural Language Processing and Speech Tools for Italian, EVALITA 2016},
}
@INPROCEEDINGS{BARBAGLI_2016_INPROCEEDINGS_BLDMV_325812,
AUTHOR = {Barbagli, A. and Lucisano, P. and Dell'Orletta, F. and Montemagni, S. and Venturi, G.},
TITLE = {CItA: an L1 Italian Learners Corpus to Study the Development of Writing Competence},
YEAR = {2016},
ABSTRACT = {In this paper, we present the CItA corpus (Corpus Italiano di Apprendenti L1), a collection of essays written by Italian L1 learners collected during the first and second year of lower secondary school. The corpus was built in the framework of an interdisciplinary study jointly carried out by computational linguistics and experimental pedagogists and aimed at tracking the development of written language competence over the years and students' background information},
KEYWORDS = {Italian Learner Corpus, Diachronic Evolution of Written Language Competence, Error Annotation},
PAGES = {88-95},
URL = {http://www.lrec-conf.org/proceedings/lrec2016/pdf/536_Paper.pdf},
PUBLISHER = {European Language Resources Association ELRA (Paris, FRA)},
ISBN = {978-2-9517408-9-1},
CONFERENCE_NAME = {Proceedings of the Tenth International Conference on Language Resources and Evaluation (LREC 2016)},
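CONFERENCE_PLACE = {Paris},
BOOKTITLE = {Proceedings of the Tenth International Conference on Language Resources and Evaluation (LREC 2016)},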
}
@INPROCEEDINGS{BELLANDI_2016_INPROCEEDINGS_BBDG_354708,
AUTHOR = {Bellandi, A. and Benotto, G. and Di Segni, G. and Giovannetti, E.},
TITLE = {Investigating the Application and Evaluation of Distributional Semantics in the Translation of Humanistic Texts: a Case Study},
YEAR = {2016},
ABSTRACT = {Digital Humanities are persisting ascending and the need for translating humanistic texts using Computer Assisted Translation (CAT) tools demands for a specific investigation both of the available technologies and of the evaluation techniques. Indeed, humanistic texts can present deep differences from texts that are usually translated with CAT tools, due to complex interpretative issues, the request of heavy rephrasing, and the addition of explicative parts in order to make the translation fully comprehensible to readers and, also, stylistically pleasant to read. In addition, these texts are often written in peculiar languages for which no linguistic analysis tool can be available. We faced this situation in the context of the project for the translation of the Babylonian Talmud from Ancient Hebrew and Aramaic into Italian. In this paper we describe a work in progress on the application of distributional semantics to the informing of the Translation Memory, and on the evaluation issues arising from its assessment},
KEYWORDS = {computer-assisted translation, distributional semantics, talmud},
PAGES = {6-11},
URL = {http://www.lrec-conf.org/proceedings/lrec2016/workshops/LREC2016Workshop-NLP4TM_Proceedings.pdf},
PUBLISHER = {European Language Resources Association ELRA (Paris, FRA)},
CONFERENCE_NAME = {2nd Workshop on Natural Language Processing for Translation Memories (NLP4TM 2016)},
CONFERENCE_PLACE = {Paris},
BOOKTITLE = {Proceedings of the 2nd Workshop on Natural Language Processing for Translation Memories (NLP4TM 2016)},
}
@INPROCEEDINGS{BENOTTO_2016_INPROCEEDINGS_BGM_354707,
AUTHOR = {Benotto, G. and Giovannetti, E. and Marchi, S.},
TITLE = {Investigating the Application of Distributional Semantics to Stylometry},
YEAR = {2016},
ABSTRACT = {The inclusion of semantic features in the stylometric analysis of literary texts appears to be poorly investigated. In this work, we experiment with the application of Distributional Semantics to a corpus of Italian literature to test if words distribution can convey stylistic cues. To verify our hypothesis, we have set up an Authorship Attribution experiment. Indeed, the results we have obtained suggest that the style of an author can reveal itself through words distribution too},
KEYWORDS = {NLP for Digital Humanities, Stylometry, Distributional Semantics},
PAGES = {61-65},
URL = {https://drive.google.com/open?id=0B0sEp2O7Oo7feVJLdHI3YXBxdTg},
PUBLISHER = {Accademia University Press (Torino, ITA)},
ISBN = {978-88-99982-08-9},
CONFERENCE_NAME = {Third Italian Conference on Computational Linguistics},
CONFERENCE_PLACE = {Torino},
BOOKTITLE = {Proceedings of Third Italian Conference on Computational Linguistics (CLiC-it 2016)},
}
@INPROCEEDINGS{BENOTTO_2016_INPROCEEDINGS_BGN_333396,
AUTHOR = {Benotto, G. and Giovannetti, E. and Nahli, O.},
TITLE = {An application of distributional semantics for the analysis of the Holy Quran},
YEAR = {2016},
ABSTRACT = {In this contribution we illustrate the methodology and the results of an experiment we conducted by applying Distributional Semantics Models to the analysis of the Holy Quran. Our aim was to gather information on the potential differences in meanings that the same words might take on when used in Modern Standard Arabic w.r.t. their usage in the Quran. To do so we used the Penn Arabic Treebank as a contrastive corpus},
KEYWORDS = {Distributional Semantics, the Holy Quran, Classical Arabic, Modern Standard Arabic, Contrastive Linguistics},
PAGES = {374-379},
URL = {http://ieeexplore.ieee.org/document/7805074/},
DOI = {10.1109/CIST.2016.7805074},
ISBN = {978-1-5090-0751-6},
CONFERENCE_NAME = {4th (IEEE) International Colloquium on Information Science and Technology, CiSt 2016},
BOOKTITLE = {2016 4th IEEE International Colloquium on Information Science and Technology (CiSt)},
EDITOR = {El Mohajir, M. and Chahhou, M. and Al Achhab, M. and El Mohajir, B. E.},
}
@INPROCEEDINGS{BERTI_2016_INPROCEEDINGS_BCYBBD_328799,
AUTHOR = {Berti, M. and Crane, G. and Yousef, T. and Bizzoni, Y. and Boschetti, F. and Del Gratta, R.},
TITLE = {Ancient Greek WordNet meets the Dynamic Lexicon: the example of the fragments of the Greek Historians},
YEAR = {2016},
ABSTRACT = {The Ancient Greek WordNet (AGWN) and the Dynamic Lexicon (DL) are multilingual resources to study the lexicon of Ancient Greek texts and their translations. Both AGWN and DL are works in progress that need accuracy improvement and manual validation. After a detailed description of the current state of each work, this paper illustrates a methodology to cross AGWN and DL data, in order to mutually score the items of each resource according to the evidence provided by the other resource. The training data is based on the corpus of the Digital Fragmenta Historicorum Graecorum (DFHG), which includes ancient Greek texts with Latin translations},
KEYWORDS = {wordnet},
PAGES = {34-38},
URL = {http://gwc2016.racai.ro/procedings.pdf},
ISBN = {978-606-714-239-6},
CONFERENCE_NAME = {Global WordNet Conference},
BOOKTITLE = {Global WordNet Conference},
}
@INPROCEEDINGS{BIBULI_2016_INPROCEEDINGS_BBCCORSZ_328321,
AUTHOR = {Bibuli, M. and Bruzzone, G. and Chiarella, D. and Caccia, M. and Odetti, A. and Ranieri, A. and Saggini, E. and Zereik, E.},
TITLE = {Underwater Robotics for Diver Operations Support: The CADDY Project},
YEAR = {2016},
ABSTRACT = {This paper describes the EU project "CADDY-Cognitive Autonomous Diving Buddy" which aims at developing a cooperative autonomous underwater robotic system to improve monitoring, assistance, and safety of the diver's operations. The paper presents key results related to the gesture recognition system, developed to enhance the interaction between diver and robot, and autonomous functionalities provided by the robotic framework to support the diver operations. Some experimental results obtained by field trials are also reported},
URL = {https://iris.cnr.it/handle/20.500.14243/328321},
ISBN = {978-3-89220-690-3},
}
@INPROCEEDINGS{BOMPOLAS_2016_INPROCEEDINGS_BMFCP_318149,
AUTHOR = {Bompolas, S. and Marzi, C. and Ferro, M. and Cardillo, F. A. and Pirrelli, V.},
TITLE = {Reassessing inflectional regularity in Modern Greek conjugation},
YEAR = {2016},
ABSTRACT = {Paradigm-based approaches to word processing/learning assume that word forms are not acquired in isolation, but through associative relations linking members of the same word family (e. g. a paradigm, or a set of forms filling the same paradigm cell). Principles of correlative learning offer a set of dynamic equations that are key to modelling this complex dynamic at a considerable level of detail. We use these dynamic equations to simulate acquisition of Modern Greek conjugation, and we compare the results with evidence from German and Italian. Simulations show that different Greek verb classes are processed and acquired differentially, depending on their degrees of formal transparency and predictability. We relate these results to psycholinguistic evidence on Modern Greek word processing, and interpret our findings as supporting a view of the mental lexicon as an emergent integrative system},
KEYWORDS = {word processing, paradigm-based learning, morphological processing, Greek stem allomorphy, Temporal Self-Organising Map},
PAGES = {72-77},
URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-85009242702\&origin=inward},
VOLUME = {1749},
DOI = {10.4000/books.aaccademia.1721},
PUBLISHER = {Accademia University Press (Torino, ITA)},
ISBN = {978-88-99982-08-9},
CONFERENCE_NAME = {Third Italian Conference on Computational Linguistics (CLiC-it 2016) \& Fifth Evaluation Campaign of Natural Language Processing and Speech Tools for Italian. Final Workshop (EVALITA 2016)},
CONFERENCE_PLACE = {Torino},
BOOKTITLE = {CLiC-it \& EVALITA 2016-Proceedings of Third Italian Conference on Computational Linguistics (CLiC-it 2016) \& Fifth Evaluation Campaign of Natural Language Processing and Speech Tools for Italian. Final Workshop (EVALITA 2016)},
EDITOR = {Basile, P. and Corazza, A. and Montemagni, S. and Nissim, M. and Patti, V. and Semeraro, G. and Sprugnoli, R.},
}
@INPROCEEDINGS{BRUNATO_2016_INPROCEEDINGS_BCDV_333951,
AUTHOR = {Brunato, D. and Cimino, A. and Dell'Orletta, F. and Venturi, G.},
TITLE = {PaCCSS-IT: A Parallel Corpus of Complex-Simple Sentences for Automatic Text Simplification},
YEAR = {2016},
ABSTRACT = {In this paper we present PaCCSS-IT, a Parallel Corpus of Complex-Simple Sentences for ITalian. To build the resource we develop a new method for automatically acquiring a corpus of complex-simple paired sentences able to intercept structural transformations and particularly suitable for text simplification. The method requires a wide amount of texts that can be easily extracted from the web making it suitable also for less-resourced languages. We test it on the Italian language making available the biggest Italian corpus for automatic text simplification},
KEYWORDS = {Automatic Text Simplification, Sentence alignment, Italian corpus},
PAGES = {351-361},
URL = {https://www.aclweb.org/anthology/D/D16/D16-1034.pdf},
DOI = {10.18653/v1/d16-1034},
PUBLISHER = {Association for Computational Linguistics (Stroudsburg, USA)},
ISBN = {978-1-945626-25-8},
CONFERENCE_NAME = {Conference on Empirical Methods in Natural Language Processing (EMNLP 2016)},
CONFERENCE_PLACE = {Stroudsburg},
}
@INPROCEEDINGS{CALZOLARI_2016_INPROCEEDINGS_C_328564,
AUTHOR = {Calzolari, N.},
TITLE = {Preface: General Chair},
YEAR = {2016},
ABSTRACT = {COLING is organised under the auspices of the International Committee on Computational Linguistics (ICCL, http://nlp.shef.ac.uk/iccl/index.html). ICCL is a very special committee, with no fixed rules and no funding, whose only function is to make sure that a COLING appears every two years and that it is a good and friendly conference},
URL = {https://iris.cnr.it/handle/20.500.14243/328564},
ISBN = {978-4-87974-702-0},
}
@INPROCEEDINGS{CARDILLO_2016_INPROCEEDINGS_C_331310,
AUTHOR = {Connor, R. and Cardillo, F. A.},
TITLE = {Quantifying the specificity of near-duplicate image classification functions},
YEAR = {2016},
ABSTRACT = {There are many published methods for detecting similar and near-duplicate images. Here, we consider their use in the context of unsupervised near-duplicate detection, where the task is to find a (relatively small) near-duplicate intersection of two large candidate sets. Such scenarios are of particular importance in forensic near-duplicate detection. The essential properties of a such a function are: performance, sensitivity, and specificity. We show that, as collection sizes increase, then specificity becomes the most important of these, as without very high specificity huge numbers of false positive matches will be identified. This makes even very fast, highly sensitive methods completely useless. Until now, to our knowledge, no attempt has been made to measure the specificity of near-duplicate finders, or even to compare them with each other. Recently, a benchmark set of near-duplicate images has been established which allows such assessment by giving a near-duplicate ground truth over a large general image collection. Using this we establish a methodology for calculating specificity. A number of the most likely candidate functions are compared with each other and accurate measurement of sensitivity vs. specificity are given. We believe these are the first such figures be to calculated for any such function},
URL = {https://iris.cnr.it/handle/20.500.14243/331310},
}
@INPROCEEDINGS{CIMINO_2016_INPROCEEDINGS_CD_333953,
AUTHOR = {Cimino, A. and Dell'Orletta, F.},
TITLE = {Building the state-of-the-art in POS tagging of Italian Tweets},
YEAR = {2016},
ABSTRACT = {In this paper we describe our approach to EVALITA 2016 POS tagging for Italian Social Media Texts (PoSTWITA). We developed a two-branch bidirectional Long Short Term Memory recurrent neural network, where the first bi-LSTM uses a typical vector representation for the input words, while the second one uses a newly introduced word-vector representation able to encode information about the characters in the words avoiding the increasing of computational costs due to the hierarchical LSTM introduced by the character-based LSTM architectures. The vector representations calculated by the two LSTM are then merged by the sum operation. Even if participants were allowed to use other annotated resources in their systems, we used only the distributed data set to train our system. When evaluated on the official test set, our system outperformed all the other systems achieving the highest accuracy score in EVALITA 2016 PoSTWITA, with a tagging accuracy of 93.19%. Further experiments carried out after the official evaluation period allowed us to develop a system able to achieve a higher accuracy. These experiments showed the central role played by the handcrafted features even when machine learning algorithms based on neural networks are used},
URL = {https://iris.cnr.it/handle/20.500.14243/333953},
}
@INPROCEEDINGS{CIMINO_2016_INPROCEEDINGS_CD_333954,
AUTHOR = {Cimino, A. and Dell'Orletta, F.},
TITLE = {Tandem LSTM-SVM approach for sentiment analysis},
YEAR = {2016},
ABSTRACT = {In this paper we describe our approach to EVALITA 2016 SENTIPOLC task. We participated in all the subtasks with constrained setting: Subjectivity Classification, Polarity Classification and Irony Detection. We developed a tandem architecture where Long Short Term Memory recurrent neural network is used to learn the feature space and to capture temporal dependencies, while the Support Vector Machines is used for classification. SVMs combine the document embedding produced by the LSTM with a wide set of general-purpose features qualifying the lexical and grammatical structure of the text. We achieved the second best accuracy in Subjectivity Classification, the third position in Polarity Classification, the sixth position in Irony Detection},
URL = {https://iris.cnr.it/handle/20.500.14243/333954},
}
@INPROCEEDINGS{CONNOR_2016_INPROCEEDINGS_CVCR_313938,
AUTHOR = {Connor, R. and Vadicamo, L. and Cardillo, F. and Rabitti, F.},
TITLE = {Supermetric search with the four-point property},
YEAR = {2016},
ABSTRACT = {Metric indexing research is concerned with the efficient evaluation of queries in metric spaces. In general, a large space of objects is arranged in such a way that, when a further object is presented as a query, those objects most similar to the query can be efficiently found. Most such mechanisms rely upon the triangle inequality property of the metric governing the space. The triangle inequality property is equivalent to a finite embedding property, which states that any three points of the space can be isometrically embedded in two-dimensional Euclidean space. In this paper, we examine a class of semimetric space which is finitely 4-embeddable in three-dimensional Euclidean space. In mathematics this property has been extensively studied and is generally known as the four-point property. All spaces with the four-point property are metric spaces, but they also have some stronger geometric guarantees. We coin the term supermetric space as, in terms of metric search, they are significantly more tractable. We show some stronger geometric guarantees deriving from the four-point property which can be used in indexing to great effect, and show results for two of the SISAP benchmark searches that are substantially better than any previously published},
KEYWORDS = {Similarity search, Metric Space, Supermetric Space, Metric Indexing, Four-point property, Hilbert Embedding, H.3.3 INFORMATION STORAGE AND RETRIEVAL. Information Search and Retrieval},
PAGES = {51-64},
URL = {https://link.springer.com/chapter/10.1007%2F978-3-319-46759-7_4},
DOI = {10.1007/978-3-319-46759-7_4},
CONFERENCE_NAME = {Similarity Search and Applications. 9th International Conference},
BOOKTITLE = {Similarity Search and Applications. SISAP 2016},
EDITOR = {Amsaleg, L. and Houle, M. and Schubert, E.},
}
@INPROCEEDINGS{DELGRATTA_2016_INPROCEEDINGS_DFMPRBKSC_324176,
AUTHOR = {Del Gratta, R. and Frontini, F. and Monachini, M. and Pardelli, G. and Russo, I. and Bartolini, R. and Khan, F. and Soria, C. and Calzolari, N.},
TITLE = {LREC as a Graph: People and Resources in a Network},
YEAR = {2016},
ABSTRACT = {This proposal describes a new way to visualise resources in the LREMap, a community-built repository of language resource descriptions and uses. The LREMap is represented as a force-directed graph, where resources, papers and authors are nodes. The analysis of the visual representation of the underlying graph is used to study how the community gathers around LRs and how LRs are used in research},
KEYWORDS = {Language Resources, Resources Documentation, Data Visualisation},
PAGES = {2529-2532},
URL = {http://www.lrec-conf.org/proceedings/lrec2016/index.html},
PUBLISHER = {European Language Resources Association ELRA (Paris, FRA)},
ISBN = {978-2-9517408-9-1},
CONFERENCE_NAME = {Tenth International Conference on Language Resources and Evaluation (LREC 2016)},
CONFERENCE_PLACE = {Paris},
BOOKTITLE = {Tenth International Conference on Language Resources and Evaluation (LREC 2016)},
EDITOR = {Calzolari, N. and Choukri, K. and Declerck, T. and Goggi, S. and Grobelnik, M. and Maegaard, B. and Mariani, J. and Mazo, H. and Moreno, A. and Odijk, J. and Piperidis, S.},
}
@INPROCEEDINGS{DELLORLETTA_2016_INPROCEEDINGS_DM_325820,
AUTHOR = {Dell'Orletta, F. and Montemagni, S. and Venturi, G.},
TITLE = {Esplorazioni computazionali nello spazio dell'interlingua: verso una nuova metodologia di indagine},
YEAR = {2016},
ABSTRACT = {Il presente contributo intende proporre un innovativo approccio all'identificazione delle caratteristiche linguistiche che aiutano a definire l'interlingua. Tale approccio consiste nella ricostruzione del profilo linguistico di corpora di produzioni scritte da apprendenti una lingua seconda basato su strumenti di trattamento automatico del linguaggio},
KEYWORDS = {interlingua, annotazione linguistica automatica, monitoraggio linguistico},
PAGES = {143-161},
URL = {https://www.bulzoni.it/it/catalogo/lingue-in-contatto-contact-linguistics.html},
PUBLISHER = {Bulzoni Editore (Roma, ITA)},
ISBN = {978-88-6897-029-1},
CONFERENCE_NAME = {XLVIII Congresso Internazionale di Studi della Società di Linguistica Italiana (SLI 2014)},
CONFERENCE_PLACE = {Roma},
}
@INPROCEEDINGS{DELLORLETTA_2016_INPROCEEDINGS_DV_325815,
AUTHOR = {Dell'Orletta, F. and Venturi, G.},
TITLE = {ULISSE: una strategia di adattamento al dominio per l'annotazione sintattica automatica},
YEAR = {2016},
ABSTRACT = {This paper deals with Domain Adaptation for automatic syntactic annotation. Until the half of the 1980s, automatic linguistic annotation was based on algorithms built on groups of hand-written rules, defined a priori on the basis of the knowledge of the system to formalise. Subsequently, thanks to the progress of research in the field of Artificial Intelligence and to the development of linguistic resources, algorithms based on machine learning techniques began to be employed. The major difficulties of those algorithms were due to certain aspects of natural language such as ambiguities, diachronic evolutions, or language variations from the original domain of knowledge. More specifically, the issue of Domain Adaptation can be put in the following terms: "can an annotated corpus [which is representative of a specific linguistic variety] be used for the syntactic analysis of a second corpus [which is representative of a different linguistic variety]?". The authors answer by presenting an algorithm called ULISSE (Unsupervised LInguistically-driven Selection of dEpendency parses), which selects in an optimal way the most representative sentences of a new target domain and feeds them to the parser in addition to the original training set},
KEYWORDS = {Domain Adaptation, annotazione sintattica automatica},
PAGES = {55-79},
URL = {http://www.italianlp.it/wp-content/uploads/2016/10/Compter_Parler_Soigner_ULISSE.pdf},
ISBN = {978-88-6952-038-9},
CONFERENCE_NAME = {Atti del convegno "Compter parler soigner: tra linguistica e intelligenza artificiale"},
}
@INPROCEEDINGS{FERRO_2016_INPROCEEDINGS_FCPGS_325153,
AUTHOR = {Ferro, M. and Cardillo, F. A. and Pirrelli, V. and Gagné, C. L. and Spalding, T. L.},
TITLE = {Written word production and lexical self-organisation: evidence from English (pseudo)compounds},
YEAR = {2016},
ABSTRACT = {Elevation in typing latency for the initial letter of the second constituent of an English compound, relative to the latency for the final letter of the first constituent of the same compound, provides evidence that implementation of a motor plan for written compound production involves smaller constituents, in both semantically transparent and semantically opaque compounds. We investigate here the implications of this evidence for algorithmic models of lexical organisation, to show that effects of differential perception of the internal structure of compounds and pseudo-compounds can also be simulated as peripheral stages of lexical access by a self-organising connectionist architecture, even in the absence of morphosemantic information. This complementary evidence supports a maximization-of-opportunity approach to lexical modelling, accounting for the integration of effects of pre-lexical and lexical access},
KEYWORDS = {compound, pseudo-compound, written word production, lexical self-organisation, temporal self organising map},
PAGES = {146-151},
URL = {http://ceur-ws.org/Vol-1749/},
VOLUME = {1749},
DOI = {10.4000/books.aaccademia.1775},
PUBLISHER = {Accademia University Press (Torino, ITA)},
ISBN = {9788899982546},
CONFERENCE_NAME = {Third Italian Conference on Computational Linguistics (CLiC-it 2016)},
CONFERENCE_PLACE = {Napoli},
BOOKTITLE = {Proceedings CLiC-it 2016},
EDITOR = {Basile, P. and Corazza, A. and Cutugno, F. and Montemagni, S. and Nissim, M. and Patti, V. and Semeraro, G. and Sprugnoli, R.},
}
@INPROCEEDINGS{GIANNINI_2016_INPROCEEDINGS_GBGP_312301,
AUTHOR = {Giannini, S. and Biagioni, S. and Goggi, S. and Pardelli, G.},
TITLE = {Grey Literature citations in the age of Digital Repositories and Open Access},
YEAR = {2016},
ABSTRACT = {The work measures grey citations in the years 2012, 2013 and 2014 and then describes the features of GL documents cited in different areas of knowledge: Computational Linguistics, Computer Science and Engineering. With the aim of surveying a wide and varied range of resources, we selected a sample data based on the bibliographical references of articles contained in four journals—all indexed by Scopus Citation Database and ISI Web of Science, with an Impact Factor (IF) over the last three years—and two proceedings of international conferences held in 2012 and 2014},
KEYWORDS = {Grey Literature, Citations},
PAGES = {137-145},
URL = {https://iris.cnr.it/handle/20.500.14243/312301},
ISSN = {1386-2316},
ISBN = {978-90-77484-27-2},
CONFERENCE_NAME = {Seventeenth International Conference on Grey Literature: A New Wave of Textual and Non-Textual Grey literature},
BOOKTITLE = {THE GL-CONFERENCE SERIES. CONFERENCE PROCEEDINGS},
}
@INPROCEEDINGS{GOGGI_2016_INPROCEEDINGS_GPBFMMDB_315259,
AUTHOR = {Goggi, S. and Pardelli, G. and Bartolini, R. and Frontini, F. and Monachini, M. and Manzella, G. and De Mattei, M. and Bustaffa, F.},
TITLE = {A semantic engine for grey literature retrieval in the oceanography domain},
YEAR = {2016},
ABSTRACT = {Here we present the final results of the MAPS (Marine Planning and Service Platform) project, an environment designed for gathering, classifying, managing and accessing marine scientific literature and data, making it available for search to Operative Oceanography researchers of various institutions by means of standard protocols. The system takes as input non-textual data (measurements) and text—both published papers and documentation—and it provides an advanced search facility thanks to the rich set of metadata and, above all, to the possibility of a refined and domain targeted key-word indexing of texts using Natural Language Processing (NLP) techniques. The paper describes the system in its details providing also evidence of evaluation},
KEYWORDS = {Information Extraction, Search Engine, Operative Oceanography},
PAGES = {104-111},
URL = {https://iris.cnr.it/handle/20.500.14243/315259},
ISBN = {978-90-77484-27-2},
CONFERENCE_NAME = {Seventeenth International Conference on Grey Literature. A New Wave of Textual and Non-Textual Grey Literature},
EDITOR = {Farace, D. and Frantzen, J.},
}
@INPROCEEDINGS{GUADAGNINI_2016_INPROCEEDINGS_GV_354818,
AUTHOR = {Guadagnini, E. and Vaccaro, G.},
TITLE = {L'OVI visto dal DiVo: due contributi alla discussione},
YEAR = {2016},
ABSTRACT = {Il saggio propone alcune considerazioni di lessicografia e filologia italiana, alla luce dell'esperienza del progetto DiVo},
KEYWORDS = {lessicografia, filologia italiana, storia della lingua italiana},
PAGES = {183-228},
URL = {https://iris.cnr.it/handle/20.500.14243/354818},
PUBLISHER = {Edizioni dell'Orso (Alessandria, ITA)},
ISBN = {9788862747462},
CONFERENCE_NAME = {Attorno a Dante, Petrarca, Boccaccio: la lingua italiana. I primi trent'anni dell'Istituto CNR Opera del Vocabolario Italiano},
CONFERENCE_PLACE = {Alessandria},
BOOKTITLE = {Attorno a Dante, Petrarca, Boccaccio: la lingua italiana. I primi trent'anni dell'Istituto CNR Opera del Vocabolario Italiano},
EDITOR = {Leonardi, L. and Maggiore, M.},
}
@INPROCEEDINGS{KHALFI_2016_INPROCEEDINGS_KNZ_346119,
AUTHOR = {Khalfi, M. and Nahli, O. and Zarghili, A.},
TITLE = {Classical Dictionary Al-Qamus in lemon},
YEAR = {2016},
ABSTRACT = {In order to enrich the digital content of Classical Arabic, we aim to propose and represent the Arabic dictionary "'Al-Qamus Al-Muhit" in the standard format LEMON. Printed transition to digital format requires various steps of work. This article describes the procedures that we followed to convert the dictionary in digitized and encoded format to apply automatic extractions and get the Lemon format used in semantic web. Furthermore, due to Arabic dictionary complexity, formalize lexical and semantic information involves morphosyntactic and derivational knowledge that we try to explain},
KEYWORDS = {Arabic Lexicon, lemon, Al Qamus Al Muhit},
PAGES = {325-330},
URL = {https://ieeexplore.ieee.org/document/7805065/},
DOI = {10.1109/CIST.2016.7805065},
ISBN = {978-1-5090-0751-6},
CONFERENCE_NAME = {4th IEEE International Colloquium on Information Science and Technology (CiSt)},
}
@INPROCEEDINGS{KHAN_2016_INPROCEEDINGS_KBBFGR_322088,
AUTHOR = {Khan, A. F. A. and Bellandi, A. and Benotto, G. and Frontini, F. and Giovannetti, E. and Reboul, M.},
TITLE = {Leveraging a narrative ontology to query a literary text},
YEAR = {2016},
ABSTRACT = {In this work we propose a model for the representation of the narrative of a literary text. The model is structured in an ontology and a lexicon constituting a knowledge base that can be queried by a system. This narrative ontology, as well as describing the actors, locations, situations found in the text, provides an explicit formal representation of the timeline of the story. We will focus on a specific case study, that of the representation of a selected portion of Homer's Odyssey, in particular of the knowledge required to answer a selection of salient queries, formulated by a literary scholar. This work is being carried out within the framework of the Semantic Web by adopting models and standards such as RDF, OWL, SPARQL, and lemon among others},
URL = {https://iris.cnr.it/handle/20.500.14243/322088},
DOI = {10.4230/OASIcs.CMN.2016.10},
ISBN = {9783959770200},
}
@INPROCEEDINGS{KHAN_2016_INPROCEEDINGS_KBM_331670,
AUTHOR = {Khan, A. F. and Bellandi, A. and Monachini, M.},
TITLE = {Tools and Instruments for Building and Querying Diachronic Computational Lexica},
YEAR = {2016},
ABSTRACT = {This article describes work on enabling the addition of temporal information to senses of words in linguistic linked open data lexica based on the lemonDia model. Our contribution in this article is twofold. On the one hand, we demonstrate how lemonDia enables the querying of diachronic lexical datasets using OWL-oriented Semantic Web based technologies. On the other hand, we present a preliminary version of an interactive interface intended to help users in creating lexical datasets that model meaning change over time},
KEYWORDS = {OWL-oriented Semantic Web based technologies},
PAGES = {164-171},
URL = {https://www.clarin-d.net/images/lt4dh/pdf/LT4DH22.pdf},
ISBN = {978-4-87974-708-2},
CONFERENCE_NAME = {Language Technology Resources and Tools for Digital Humanities (LT4DH 2016)},
}
@INPROCEEDINGS{KHAN_2016_INPROCEEDINGS_KDM_324221,
AUTHOR = {Khan, F. and Díaz-Vera, J. E. and Monachini, M.},
TITLE = {Representing Polysemy and Diachronic Lexico-Semantic Data on the Semantic Web},
YEAR = {2016},
ABSTRACT = {In this article we will outline two different vocabularies, both extensions of the lemon model, for representing diachronic lexico-semantic data on the Semantic Web. This is especially useful for representing the evolution of scientific terminologies where many terms are polysemous and/or imported from other languages. The first vocabulary, polyLemon, allows for the representation of data about polysemy; the second, lemonDIA, the representation of meaning shift over time},
KEYWORDS = {Language Resources, Resource Data Framework (RDF)},
PAGES = {37-45},
URL = {http://ceur-ws.org/Vol-1595/paper4.pdf},
VOLUME = {1595},
CONFERENCE_NAME = {Second International Workshop on Semantic Web for Scientific Heritage co-located with 13th Extended Semantic Web Conference (ESWC 2016)},
BOOKTITLE = {SWASH 2016 Semantic Web for Scientific Heritage Proceedings of the Second International Workshop on Semantic Web for Scientific Heritage co-located with 13th Extended Semantic Web Conference (ESWC 2016)},
EDITOR = {Draelants, I. and Zucker, C. F. and Monnin, A. and Zucker, A.},
}
@INPROCEEDINGS{KHAN_2016_INPROCEEDINGS_KDM_324193,
AUTHOR = {Khan, F. and Díaz-Vera, J. E. and Monachini, M.},
TITLE = {The Representation of an Old English Emotion Lexicon as Linked Open Data},
YEAR = {2016},
ABSTRACT = {We present the ongoing conversion of a lexicon of emotion terms in Old English (OE) into RDF using an extension of lemon called lemonDIA, which we briefly describe. We focus on the translation of the subset of the lexicon dealing with terms for shame and guilt and give a number of illustrative examples},
KEYWORDS = {Linguistic Linked Open Data, Old English, Lexicon},
PAGES = {73-76},
URL = {http://www.lrec-conf.org/proceedings/lrec2016/index.html},
PUBLISHER = {European Language Resources Association ELRA (Paris, FRA)},
ISBN = {978-2-9517408-9-1},
CONFERENCE_NAME = {Tenth International Conference on Language Resources and Evaluation (LREC 2016)},
CONFERENCE_PLACE = {Paris},
BOOKTITLE = {LDL 2016 5th Workshop on Linked Data in Linguistics: Managing, Building and Using Linked Language Resources},
EDITOR = {McCrae, J. P. and Chiarcos, C. and Ponsoda, E. M. and Declerck, T. and Osenova, P. and Hellmann, S.},
}
@INPROCEEDINGS{KHAN_2016_INPROCEEDINGS_KFBMM_322106,
AUTHOR = {Khan, F. and Frontini, F. and Boschetti, F. and Monachini, M.},
TITLE = {Converting the Liddell Scott Greek-English Lexicon into Linked Open Data using lemon},
YEAR = {2016},
ABSTRACT = {The emergence and growing popularity of Linked Open Data (LOD) offers researchers a new range of possibilities when it comes to publishing datasets online (Hyvönen 2012, Oomen et al 2012); indeed not only does the success of LOD greatly facilitate the process of making scholarly data accessible and to a wider community but it also permits the enrichment of individual datasets by linking them to the other datasets available on the so called Linked Open Data Cloud. The advantages of Linked Open Data for teachers, academics and students in the humanities are obvious and are indeed manifold. However there is currently a paucity of linked open datasets in fields such as philology and literary studies, and in particular of datasets that deal with classical languages such as ancient Greek, Sanskrit, and Latin. This seems strange given the rich abundance of surviving works, of both a religious and secular character, that exist in those languages. A salient consideration here relates to the fact that even when such works have been digitised and made available in a format such as TEI-XML, a format which renders the structure and content of such texts more amenable to computer processing, the conversion of these resources into the Resource Data Framework (RDF), the standardised data model that underpins the Semantic Web, is not always straightforward. In this article we describe ongoing work in the conversion of an important 19th century Ancient Greek resource the Liddell-Scott-Jones Lexicon, into RDF, part of a wider program of work that has been recently initiated at CNR-ILC in converting historical lexicons in languages such as Greek, Latin and Arabic into Linked Open Data},
URL = {https://iris.cnr.it/handle/20.500.14243/322106},
ISBN = {978-83-942760-3-4},
}
@INPROCEEDINGS{MONTEMAGNI_2016_INPROCEEDINGS_M_353682,
AUTHOR = {Montemagni, S.},
TITLE = {Preface},
YEAR = {2016},
ABSTRACT = {Our very warm welcome to CLiC-it 2016 (http://clic-it2016.dieti.unina.it/), the 3rd edition of the Italian Conference on Computational Linguistics, held on December 5th and 6th, in Naples, Italy, co-located with Evalita 2016 (http://www.evalita.it/2016), hosted and locally organized by Università Federico II, one of the oldest public and laic universities in the world. The organization of the conference is the result of a fruitful conjoint effort of different research groups (Istituto di Linguistica Computazionale "Antonio Zampolli" del CNR, Università degli Studi di Bari Aldo Moro and Università degli Studi di Napoli Federico II) showing the nationwide spreading of Computational Linguistics in Italy. The CLiC-it conference series is organized by the Italian Association for Computational Linguistics (AILC) and has clearly established itself as the premier national forum for research and development in the fields of Computational Linguistics (CL) and Natural Language Processing (NLP), where leading researchers and practitioners from academia and industry meet to share their challenges, solutions, research results, and experiences. CLiC-it covers all aspects of computational linguistics and natural language (both written and spoken) processing, and targets state-of-art theoretical results, experimental methodologies, technologies, as well as application perspectives, which may contribute to advance the field},
KEYWORDS = {Computational Linguistic, Natural Language Processing, Speech Tools for Italian, CLiC-it, EVALITA},
URL = {https://iris.cnr.it/handle/20.500.14243/353682},
VOLUME = {1749},
PUBLISHER = {CEUR-WS.org (Aachen, DEU)},
CONFERENCE_NAME = {CLiC-it \& EVALITA 2016},
CONFERENCE_PLACE = {Napoli},
BOOKTITLE = {Proceedings CLiC-it 2016 and EVALITA 2016},
EDITOR = {Montemagni, S.},
}
@INPROCEEDINGS{NAHLI_2016_INPROCEEDINGS_NFMKZK_324187,
AUTHOR = {Nahli, O. and Frontini, F. and Monachini, M. and Khan, F. and Zarghili, A. and Khalfi, M.},
TITLE = {Al Qamus al Muhit, a Medieval Arabic Lexicon in LMF},
YEAR = {2016},
ABSTRACT = {This paper describes the conversion into LMF, a standard lexicographic digital format, of 'al-qāmūs al-muḥīṭ, a Medieval Arabic lexicon. The lexicon is first described, then all the steps required for the conversion are illustrated. The work will produce a useful lexicographic resource for Arabic NLP, but is also interesting per se, to study the implications of adapting the LMF model to the Arabic language. Some reflections are offered as to the status of roots with respect to previously suggested representations. In particular, roots, in our opinion, are not to be treated as lexical entries, but modeled as lexical metadata for classifying and identifying lexical entries. In this manner, each root connects all entries that are derived from it},
KEYWORDS = {Arabic Lexicon, LMF, Al Qamus al Muhit},
PAGES = {943-950},
URL = {http://www.lrec-conf.org/proceedings/lrec2016/index.html},
PUBLISHER = {European Language Resources Association ELRA (Paris, FRA)},
ISBN = {978-2-9517408-9-1},
CONFERENCE_NAME = {Tenth International Conference on Language Resources and Evaluation (LREC 2016)},
CONFERENCE_PLACE = {Paris},
EDITOR = {Calzolari, N. and Choukri, K. and Declerck, T. and Goggi, S. and Grobelnik, M. and Maegaard, B. and Mariani, J. and Mazo, H. and Moreno, A. and Odijk, J. and Piperidis, S.},
}
@INPROCEEDINGS{ORLETTI_2016_INPROCEEDINGS_ODI_333948,
AUTHOR = {Orletti, F. and Dell'Orletta, F. and Iovino, R.},
TITLE = {La leggibilità dei testi di ambito medico rivolti al paziente: Il caso dei bugiardini di farmaci senza obbligo di prescrizione medica},
YEAR = {2016},
ABSTRACT = {In this paper we present the first results of an exploratory analysis of simplification of the package leaflets of medicines, considered representative texts of doctor-patient communication. It will be shown how natural language processing tools can be used to reconstruct the linguistic profile of these texts and to guide their simplification},
KEYWORDS = {leggibilità},
URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-85009291162\&origin=inward},
VOLUME = {1749},
CONFERENCE_NAME = {Third Italian Conference on Computational Linguistics (CLiC-it)},
}
@INPROCEEDINGS{PARDELLI_2016_INPROCEEDINGS_PGGB_324209,
AUTHOR = {Pardelli, G. and Goggi, S. and Giannini, S. and Biagioni, S.},
TITLE = {Two decades of terminology: European framework programmes titles},
YEAR = {2016},
ABSTRACT = {This work analyses a corpus made of the titles of research projects belonging to the last four European Commission Framework Programmes (FP4, FP5, FP6, FP7) during a time span of nearly two decades (1994-2012). The starting point is the idea of creating a corpus of titles which would constitute a terminological niche, a sort of "cluster map" offering an overall vision on the terms used and the links between them. Moreover, by performing a terminological comparison over a period of time it is possible to trace the presence of obsolete words in outdated research areas as well as of neologisms in the most recent fields. Within this scenario, the minimal purpose is to build a corpus of titles of European projects belonging to the several Framework Programmes in order to obtain a terminological mapping of relevant words in the various research areas: particularly significant would be those terms spread across different domains or those extremely tied to a specific domain. A term could actually be found in many fields and being able to acknowledge and retrieve this cross-presence means being able to linking those different domains by means of a process of terminological mapping},
KEYWORDS = {Terminology Extraction, Natural Language Processing, Terminological Comparison},
PAGES = {373-378},
URL = {http://www.lrec-conf.org/proceedings/lrec2016/index.html},
PUBLISHER = {European Language Resources Association ELRA (Paris, FRA)},
ISBN = {978-2-9517408-9-1},
CONFERENCE_NAME = {LREC 2016-Tenth International Conference on Language Resources and Evaluation},
CONFERENCE_PLACE = {Paris},
EDITOR = {Calzolari, N. and Choukri, K. and Declerck, T. and Goggi, S. and Grobelnik, M. and Maegaard, B. and Mariani, J. and Mazo, H. and Moreno, A. and Odijk, J. and Piperidis, S.},
}
@INPROCEEDINGS{PESINI_2016_INPROCEEDINGS_PDB_228562,
AUTHOR = {Pesini, L. and Del Grosso, A. M. and Bozzi, A.},
TITLE = {F. de Saussure e la linguistica romanza. Un'applicazione web per l'edizione elettronica dei manoscritti},
YEAR = {2016},
ABSTRACT = {Se il ruolo di F. de Saussure nella linguistica indoeuropea e nella linguistica generale è ben noto, il suo interesse nell'ambito della linguistica romanza è stato quasi del tutto trascurato dagli studiosi. Fino ad oggi è stato difficile valutare il contributo di Saussure alla romanistica, dato che i suoi lavori (riguardanti soprattutto i patois francesi e la toponomastica) restano in gran parte inediti. Soltanto nel quadro di una nuova edizione critica digitale di tutte le opere di Saussure sarà possibile apprezzare il suo profondo interesse per la filologia romanza e far luce sul ruolo che lo studio dell'evoluzione delle lingue neolatine ebbe nella riflessione generale di questo linguista, sia comparatista che romanista},
KEYWORDS = {Computational and collaborative philology, digital humanities, software engineering},
PAGES = {239-254},
URL = {http://www.atilf.fr/cilpr2013/actes/section-16/CILPR-2013-16-Pesini-Bozzi-Del_Grosso.pdf},
PUBLISHER = {Société de linguistique romane/ÉLiPhi (Strasbourg, FRA)},
ISBN = {979-10-91460-32-3},
CONFERENCE_NAME = {XXVIIe Congrès international de linguistique et de philologie romanes},
CONFERENCE_PLACE = {Strasbourg},
EDITOR = {Buchi, Éva and Chauveau, Jean-Paul and Pierrel, Jean-Marie},
}
@INPROCEEDINGS{PICCINI_2016_INPROCEEDINGS_P_401721,
AUTHOR = {Piccini, S.},
TITLE = {CLAVIUS: verso la modellazione di una risorsa termino-ontologica diacronica del dominio matematico-astronomico del XVII secolo},
YEAR = {2016},
ABSTRACT = {This article describes the termino-ontological resource, CLAVIUS, which models mathematical and astronomical terminology from the sixteenth century. It is being created on the basis of Clavius' commentaries on Euclid's Elements and on Sacrobosco's Sphaera. The resource has been built in Protégé, a free open-source ontology editor, using both OntologyWeb Language Description Logic (OWL DL) and Simple Knowledge Organization System (SKOS), the latter via a specifically designed Protégé plug-in, SkosEditor. OWL DL is used due to its expressivity and decidability. Instead, SKOS was chosen to formalize the evolution in knowledge and conceptualisation revealed in Clavius' works. This diachronic aspect was modeled using Chronos, a plug-in for Protégé to manage temporal ontologies. The two OWL and SKOS worlds are kept separate. An annotation property skos: as has been introduced to link OWL entities to particular SKOS concepts. An example of formalization in SKOS is provided, which describes how theories on the number of celestial spheres developed from Aristotle to Magini},
URL = {https://iris.cnr.it/handle/20.500.14243/401721},
DOI = {10.4399/97888548xxxxx11},
ISSN = {1121-0095},
ISBN = {978-88-548-9402-0},
BOOKTITLE = {AIDA INFORMAZIONI},
}
@INPROCEEDINGS{PICCINI_2016_INPROCEEDINGS_PBBG_371091,
AUTHOR = {Piccini, S. and Bellandi, A. and Benotto, G. and Giovannetti, E.},
TITLE = {La modellazione diacronica di risorse termino-ontologiche nell'ambito delle digital humanities: Esperimenti su clavius},
YEAR = {2016},
ABSTRACT = {In this work, we present an experiment in the modeling of a diachronic termino-ontological resource named CLAVIUS through both the N-ary relations model and the 4D-fluents approach. Some of the salient differences of these two models are discussed. The overall objective of this research is to illustrate the main advantages and disadvantages in the adoption of a given model to build diachronic resources},
KEYWORDS = {Diachronic terminology, termino-ontological resources, n-ary models, perdurantist models},
PAGES = {205-245},
URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-85009289234\&origin=inward},
VOLUME = {1749},
PUBLISHER = {Accademia University Press (Torino, ITA)},
ISBN = {9788899982089},
CONFERENCE_NAME = {Third Italian Conference on Computational Linguistics},
CONFERENCE_PLACE = {Napoli},
}
@INPROCEEDINGS{PICCINI_2016_INPROCEEDINGS_PGBR_264622,
AUTHOR = {Piccini, S. and Giovannetti, E. and Bellandi, A. and Ruimy, N.},
TITLE = {Le lexique électronique de la terminologie de Ferdinand de Saussure: une première},
YEAR = {2016},
ABSTRACT = {Le Projet italien intitulé "Per un'edizione digitale dei manoscritti di Ferdinand de Saussure" a pour objectif la création d'un prototype d'édition numérique des textes du grand linguiste genevois, réalisé à partir d'une sélection de ses documents autographes. Dans ce projet, l'un des volets novateurs est la création du premier thésaurus-lexique électronique de la terminologie linguistique Saussurienne. Afin de réaliser cette base de connaissance, nous nous sommes inspirés du modèle lexical SIMPLE qui a permis le développement de vastes lexiques sémantiques informatisés, et l'avons adapté aux exigences de notre domaine de la connaissance. Le lexique réalisé a été conçu dans le but d'offrir un outil performant pour les études saussuriennes. Il fournit en effet une représentation structurée de la terminologie de Saussure, une définition du contenu sémantique de chacun des termes ainsi qu'un cadre explicite de la nature et de l'importance des liens qui les unissent. Ce faisceau d'informations devrait donc contribuer de manière significative à mieux maîtriser le vocabulaire saussurien et, partant, à éclairer certains aspects originaux de la pensée du père de la linguistique moderne},
KEYWORDS = {Saussure, lessici computazionali, ontologie},
PAGES = {255-267},
URL = {http://www.atilf.fr/cilpr2013/actes/section-16/CILPR-2013-16-Piccini-Giovannetti-Bellandi-Ruimy.pdf},
ISBN = {979-10-91460-32-3},
CONFERENCE_NAME = {XXVIIe Congrès international de linguistique et de philologie romanes},
BOOKTITLE = {Section 16: Projets en cours; ressources et outils nouveaux},
EDITOR = {Trotter, D. and Bozzi, A. and Fairon, C.},
}
@INPROCEEDINGS{PIERI_2016_INPROCEEDINGS_PBD_333949,
AUTHOR = {Pieri, G. and Brunato, D. and Dell'Orletta, F.},
TITLE = {Studio sull'ordinamento dei costituenti nel confronto tra generi e complessità},
YEAR = {2016},
ABSTRACT = {In this paper we present a study on the order of constituents in Italian based on automatically dependency-parsed corpora. The comparative investigation has allowed us to evaluate the influence of the textual genre and the linguistic complexity on the distribution of phenomena of syntactic markedness},
KEYWORDS = {Complessità linguistica, Corpora annotati, Generi testuali},
PAGES = {5},
URL = {http://ceur-ws.org/Vol-1749/paper44.pdf},
VOLUME = {1749},
CONFERENCE_NAME = {Third Italian Conference on Computational Linguistics (CLiC-it 2016)},
EDITOR = {Basile, P. and Corazza, A. and Cutugno, F. and Montemagni, S. and Nissim, M. and Patti, V. and Semeraro, G. and Sprugnoli, R.},
}
@INPROCEEDINGS{PIERI_2016_INPROCEEDINGS_PBD_392599,
AUTHOR = {Pieri, G. and Brunato, D. and Dell'Orletta, F.},
TITLE = {Studio sull'ordinamento dei costituenti nel confronto tra generi e complessità},
YEAR = {2016},
ABSTRACT = {In questo articolo presentiamo uno studio sull'ordine dei costituenti in italiano basato su corpora annotati in maniera automatica fino all'analisi sintattica a dipendenze. L'indagine comparativa ha permesso di valutare l'influenza sia del genere testuale sia della complessità linguistica nella distribuzione dei fenomeni di marcatezza sintattica},
URL = {https://iris.cnr.it/handle/20.500.14243/392599},
ISBN = {978-88-99982-08-9},
}
@INPROCEEDINGS{POPESCU_2016_INPROCEEDINGS_PLDCC_328826,
AUTHOR = {Popescu, V. and Liu, L. and Del Gratta, R. and Choukri, K. and Calzolari, N.},
TITLE = {New Developments in the LRE Map},
YEAR = {2016},
ABSTRACT = {In this paper we describe the new developments brought to LRE Map, especially in terms of the user interface of the Web application, of the searching of the information therein, and of the data model updates. Thus, users now have several new search facilities, such as faceted search and fuzzy textual search, they can now register, log in and store search bookmarks for further perusal. Moreover, the data model now includes the notion of paper and author, which allows for linking the resources to the scientific works. Also, users can now visualise author-provided field values and normalised values. The normalisation has been manual and enables a better grouping of the entries. Last but not least, provisions have been made towards linked open data (LOD) aspects, by exposing an RDF access point allowing to query on the authors, papers and resources. Finally, a complete technological overhaul of the whole application has been undertaken, especially in terms of the Web infrastructure and of the text search backend},
KEYWORDS = {Language resource, LRE Map, Information search and retrieval, Data modelling},
PAGES = {4526-4530},
URL = {http://www.lrec-conf.org/proceedings/lrec2016/pdf/1256_Paper.pdf},
PUBLISHER = {European Language Resources Association ELRA (Paris, FRA)},
ISBN = {978-2-9517408-9-1},
CONFERENCE_NAME = {Tenth International Conference on Language Resources and Evaluation (LREC 2016)},
CONFERENCE_PLACE = {Paris},
BOOKTITLE = {Tenth International Conference on Language Resources and Evaluation (LREC 2016)},
}
@INPROCEEDINGS{PROIETTI_2016_INPROCEEDINGS_P_405497,
AUTHOR = {Proietti, C.},
TITLE = {Understanding Group Polarization with Bipolar Argumentation Frameworks},
YEAR = {2016},
ABSTRACT = {Group polarization occurs when an initial attitude or belief of individuals becomes more radical after group discussion. Polarization often leads subgroups towards opposite directions. Since the 1960s this effect has been observed and repeatedly confirmed in lab experiments by social psychologists. Persuasive Arguments Theory (PAT) emerged as the most convincing explanation for this phenomenon. This paper is a first attempt to frame the PAT explanation more formally by means of Bipolar Argumentation Frameworks (BAFs). In particular, I show that polarization may emerge in a BAF by simple and rational belief updates by participants},
KEYWORDS = {Group Polarization, Persuasive Arguments Theory, Bipolar Argumentation Frameworks, Value-Based Argumentation Frameworks},
PAGES = {41-52},
URL = {https://iris.cnr.it/handle/20.500.14243/405497},
VOLUME = {287},
DOI = {10.3233/978-1-61499-686-6-41},
CONFERENCE_NAME = {COMMA 2016},
}
@INPROCEEDINGS{RUSSO_2016_INPROCEEDINGS_RM_355296,
AUTHOR = {Russo, I. and Monachini, M.},
TITLE = {Samskara minimal structural features for detecting subjectivity and polarity in Italian tweets},
YEAR = {2016},
ABSTRACT = {Sentiment analysis classification tasks strongly depend on the properties of the medium that is used to communicate opinionated content. There are some limitations in Twitter that force the user to exploit structural properties of this social network with features that have pragmatic and communicative functions. Samskara is a system that uses minimal structural features to classify Italian tweets as instantiations of a textual genre, obtaining good results for subjectivity classification, while polarity classification needs substantial improvements},
KEYWORDS = {sentiment analysis, twitter},
URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-85009270160\&origin=inward},
VOLUME = {1749},
CONFERENCE_NAME = {Fifth Evaluation Campaign of Natural Language Processing and Speech Tools for Italian. Final Workshop EVALITA 2016},
}
@INPROCEEDINGS{RUSSO_2016_INPROCEEDINGS_RPS_355294,
AUTHOR = {Russo, I. and Pisano, S. and Soria, C.},
TITLE = {Sardinian on Facebook: Analysing Diatopic Varieties through Translated Lexical Lists},
YEAR = {2016},
ABSTRACT = {Presence of regional and minority languages over digital media is an indicator of their vitality. In this paper, we want to investigate quantitative aspects of the use on Facebook of the Sardinian language. In particular, we want to focus on the co-existence of diatopic varieties. We extracted linguistic data from public pages and, through the translation of the most frequent words, we find out similarities and differences between varieties},
KEYWORDS = {Sardinian, minority languages, digital vitality},
PAGES = {263-267},
URL = {https://iris.cnr.it/handle/20.500.14243/355294},
ISBN = {978-88-99982-08-9},
CONFERENCE_NAME = {Proceedings of the Third Italian Conference on Computational Linguistics CLiC-it 2016},
}
@INPROCEEDINGS{SORIA_2016_INPROCEEDINGS_SRQHGST_324686,
AUTHOR = {Soria, C. and Russo, I. and Quochi, V. and Hicks, D. and Gurrutxaga, A. and Sarhimaa, A. and Tuomisto, M.},
TITLE = {Fostering digital representation of EU regional and minority languages: the Digital Language Diversity Project},
YEAR = {2016},
ABSTRACT = {Poor digital representation of minority languages further prevents their usability on digital media and devices. The Digital Language Diversity Project, a three-year project funded under the Erasmus programme, aims at addressing the problem of low digital representation of EU regional and minority languages by giving their speakers the intellectual and practical skills to create, share, and reuse online digital content. Availability of digital content and technical support to use it are essential prerequisites for the development of language-based digital applications, which in turn can boost digital usage of these languages. In this paper we introduce the project, its aims, objectives and current activities for sustaining digital usability of minority languages through adult education},
KEYWORDS = {Less-resourced languages, Language Technology, digital language vitality, digital language diversity},
PAGES = {3256-3260},
URL = {http://www.lrec-conf.org/proceedings/lrec2016/index.html},
PUBLISHER = {European Language Resources Association ELRA (Paris, FRA)},
ISBN = {978-2-9517408-9-1},
CONFERENCE_NAME = {Tenth International Conference on Language Resources and Evaluation (LREC 2016)},
CONFERENCE_PLACE = {Paris},
}
@INPROCEEDINGS{TUSA_2016_INPROCEEDINGS_TDMV_325817,
AUTHOR = {Tusa, E. and Dell'Orletta, F. and Montemagni, S. and Venturi, G.},
TITLE = {Dieci sfumature di marcatezza sintattica: Verso una nozione computazionale di complessità},
YEAR = {2016},
ABSTRACT = {In this work, we will investigate whether and to what extent algorithms typically used to assess the reliability of the output of syntactic parsers can be used to study the correlation between processing complexity and the linguistic notion of markedness. Although still preliminary, achieved results show the key role of features such as dependency direction and length in defining the markedness degrees of a given syntactic construction},
KEYWORDS = {marcatezza sintattica, complessità linguistica, annotazione linguistica automatica},
PAGES = {1-6},
URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-85009279517\&origin=inward},
VOLUME = {1749},
CONFERENCE_NAME = {Italian Conference on Computational Linguistics (CLiC-it)},
}
@INPROCEEDINGS{VALSECCHI_2016_INPROCEEDINGS_VABMP_319109,
AUTHOR = {Valsecchi, F. and Abrate, M. and Bacciu, C. and Marchetti, A. and Piccini, S.},
TITLE = {Text Encoder and Annotator: an all-in-one editor for transcribing and annotating manuscripts with RDF},
YEAR = {2016},
ABSTRACT = {In the context of the digitization of manuscripts, transcription and annotation are often distinct, sequential steps. This could lead to difficulties in improving the transcribed text when annotations have already been defined. In order to avoid this, we devised an approach which merges the two steps into the same process. Text Encoder and Annotator (TEA) is a prototype application embracing this concept. TEA is based on a lightweight language syntax which annotates text using Semantic Web technologies. Our approach is currently being developed within the Clavius on the Web project, devoted to studying the manuscripts of Christophorus Clavius, an influential 16th century mathematician and astronomer},
KEYWORDS = {RDF, Semantic Annotation, Semantic Web},
PAGES = {399-407},
URL = {https://iris.cnr.it/handle/20.500.14243/319109},
DOI = {10.1007/978-3-319-47602-5_52},
CONFERENCE_NAME = {European Semantic Web Conference 2016},
BOOKTITLE = {The Semantic Web},
}
@INPROCEEDINGS{WEINGART_2016_INPROCEEDINGS_WG_354709,
AUTHOR = {Weingart, A. and Giovannetti, E.},
TITLE = {A lexicon for Old Occitan medico-botanical terminology in lemon},
YEAR = {2016},
ABSTRACT = {The article presents the adaptation of the lemon model (a model for lexica as RDF data) for a multilingual and multi-alphabetical lexicon of Old Occitan medico-botanical terminology. The lexicon is the core component of an ontology-based information system that will be constructed and implemented within the DFG-funded project "Dictionnaire de Termes Médico-botaniques de l'Ancien Occitan" (DiTMAO). The difficulties for the lemmatization raised by the particularities of the corpus (terms in Latin, Hebrew and Arabic script and corresponding terms in other ancient languages, mostly Hebrew and Arabic) can be perfectly solved by extending the basic properties of lemon and introducing domain specific vocabulary},
KEYWORDS = {lemon model, RDF, multilingual, multi-alphabetical, historical lexicon, medico-botanical terminology, Old Occitan, Hebrew, Arabic},
PAGES = {25-36},
URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-84978818653\&origin=inward},
VOLUME = {1595},
CONFERENCE_NAME = {Second International Workshop on Semantic Web for Scientific Heritage (SW4SH 2016)},
}
@INPROCEEDINGS{WIELING_2016_INPROCEEDINGS_WSCM_321018,
AUTHOR = {Wieling, M. and Sassolini, E. and Cucurullo, S. and Montemagni, S.},
TITLE = {ALT Explored: Integrating an Online Dialectometric Tool and an Online Dialect Atlas},
YEAR = {2016},
ABSTRACT = {In this paper, we illustrate the integration of an online dialectometric tool, Gabmap, together with an online dialect atlas, the Atlante Lessicale Toscano (ALT-Web). By using a newly created url-based interface to Gabmap, ALT-Web is able to take advantage of the sophisticated dialect visualization and exploration options incorporated in Gabmap. For example, distribution maps showing the distribution in the Tuscan dialect area of a specific dialectal form (selected via the ALT-Web website) are easily obtainable. Furthermore, the complete ALT-Web dataset as well as subsets of the data (selected via the ALT-Web website) can be automatically uploaded and explored in Gabmap. By combining these two online applications, macro- and micro-analyses of dialectal data (respectively offered by Gabmap and ALT-Web) are effectively and dynamically combined},
KEYWORDS = {Lexicon, Lexical Database, Tools, Systems, Applications},
PAGES = {3265-3272},
URL = {http://www.lrec-conf.org/proceedings/lrec2016/index.html},
ISBN = {978-2-9517408-9-1},
CONFERENCE_NAME = {LREC 2016},
}
@INPROCEEDINGS{ANDREINI_2016_INPROCEEDINGS_ADGGMR_381983,
AUTHOR = {Andreini, G. and Di Donato, F. and Giacomi, D. and Giusti, E. and Masotti, R.},
TITLE = {Pundit. Semantic Annotation for Digital Humanities},
YEAR = {2016},
ABSTRACT = {Students and researchers are used to study on books and printed articles, underlining and taking notes on the text itself in the meantime. Pundit (http://thepund.it/) allows to perform the same actions on any web page, being it an online magazine, a blog or a digital library. In fact, Pundit (Morbidoni et al., 2015) is an open source suite of applications that allows users to build semantic annotations with different levels of expressivity on web pages, collaborating in the meantime with others. The knowledge base created by annotations can be reused inside the Pundit applications or by external third party projects. Pundit implements a client-server architecture and is made up of several components which interact with each other, but, if needed, are able to work independently: Pundit Annotator: a simple and lightweight annotator tool that allows to highlight and comment text in web pages with ease. This tool is intended for general users, students and journalists. Pundit Annotator Pro: an advanced tool for web annotation that allows to create semantic annotations (built by one or more triples) using text fragments, web pages, Cultural Heritage Objects or Linked Data entities. This tool is intended for scholars and researchers. Pundit Annotations Manager: the Annotation Manager is a web application that allows users to review and manage their annotations as well as to export them in different formats. Pundit Server: it is where all annotations are stored in a graph format. The data model of annotations is an extension of the Web Annotation Data Model standard (http://www.w3.org/TR/2014/WD-annotation-model-20141211/), defined by the Web Annotation Working Group of W3C. Pundit Annotator Pro used in the project The European correspondence to Jacob Burckhardt. By using Pundit, users contribute to create a new knowledge layer on top of web pages, thus enriching the web of data.
Thanks to the possibility of sharing public annotations, adding comments to or evaluating existing annotations, Pundit can be portrayed as a collaborative platform, allowing the users to cooperate and share their results with workgroups, thus enabling revisions and a form of peer reviewing. Saved annotations are collected in notebooks that can be made public or private. Users are able to visualize and manage their annotations in the so-called 'Annotations Manager'. Besides browsing their notebooks and performing advanced research, there users can export their collected data in various standard formats. In this way, it is possible to save copies of collected data, to be potentially exported in different systems, compliant with the Web Annotation standard. The Pundit Annotations Manager is the application where users can manage their annotations. The Annotation Server implements a set of REST APIs, which allow to expose public resources through content negotiation. The knowledge base can be integrated in third party projects such as Digital Libraries and be used to build advanced research systems or advanced semantic data visualizations. In these last years the software underwent continuous refactoring with the objective to make it more and more modular and adaptable in several contexts. Besides the graphical interface flexibility, with its pro and light modes, the client allows the use of custom vocabularies and ontologies. Pundit can be customized for tailor made projects where requirements lie outside its standard features. Starting from open source code new features not present in the original version are developed. The first version of Pundit was developed from 2010 within the EU Semlib project (http://cordis.europa.eu/result/rcn/57391_en.html). Then in 2012 the development continued in the context of the EU DM2E project (http://dm2e.eu/).
In 2014 the StoM project (http://www.stom-project.eu) started with the aim of bringing Pundit in the market as a software-as-a-service platform. Specific features of Pundit are also under development within EU Europeana Sounds (http://www.europeanasounds.eu/) project. Pundit is used for semantic annotations in research projects such as the ERC AdG LOOKINGATWORDS (http://cordis.europa.eu/project/rcn/102545_en.html) and ERC AdG EUROCORR (http://www.burckhardtsource.org) funded projects. In both applications it is used by teams of researchers to semantically enrich the corpus of text of their digital library},
URL = {https://iris.cnr.it/handle/20.500.14243/381983},
}
@INPROCEEDINGS{ARRIGONI_2016_INPROCEEDINGS_AKMB_328803,
AUTHOR = {Arrigoni, S. and Khan, F. and Monachini, M. and Boschetti, F.},
TITLE = {Misurare Memorata Poetis: prime statistiche},
YEAR = {2016},
KEYWORDS = {intertestualità, temi e motivi},
PAGES = {151-155},
URL = {http://www.himeros.eu/aiucd2016/c47.pdf},
CONFERENCE_NAME = {Quinto Convegno Annuale AIUCD. Edizioni digitali: rappresentazione, interoperabilità, analisi del testo e infrastrutture},
BOOKTITLE = {AIUCD 2016-Book of Abstracts},
EDITOR = {Boschetti, F.},
}
@INPROCEEDINGS{BARTOLINI_2016_INPROCEEDINGS_BPGGB_320039,
AUTHOR = {Bartolini, R. and Pardelli, G. and Goggi, S. and Giannini, S. and Biagioni, S.},
TITLE = {A terminological "journey" in the Grey Literature domain},
YEAR = {2016},
ABSTRACT = {"When we read the articles or papers of a particular domain, we can recognize some lexical items in the texts as technical terms. In a domain where new knowledge is generated, new terms are constantly created to fulfil the needs of the domain, while others become obsolete. In addition, existing terms may undergo changes of meaning." (Kageura K., 1998/1999). According to Kageura, our aim with this work is to make a "journey" in the Grey Literature (GL) domain in order to offer an overall vision on the terms used and the links between them. Moreover, by performing a terminological comparison over a given period of time it could be possible to trace the presence of obsolete words as well as of neologisms in the most recent research fields. Within this scenario, the work analyzes a corpus constituted of the entire amount of full research papers published in the GL conference series over a time span of more than one decade (2003-2014) with the aim of creating a terminological map of relevant words. "... corpora used to extract terminological units can be further investigated to find semantic and conceptual information on terms or to represent conceptual relationships between terms" (Bourigault D. et al., 2001). Another interesting inquiry is the terminology used in the GL conferences for describing the types of documents (Pejšová P. et al., 2012). The work is split up in four sections: creation of the corpus by acquiring the digital papers of GL conference proceedings (GL5-GL16); data cleaning; data processing; terminological analysis and comparison. The corpus-made up of 231 research papers (for a total amount of 785.042 tokens)-was processed using a Natural Language Processing (NLP) tool for term extraction developed at the Institute of Computational Linguistics "Antonio Zampolli" of CNR (Goggi et al. 2015; 2016).
This tool is what is called a "pipeline" (that is, a sequence of different tools) which extracts lexical knowledge from texts: in short, this is a rule system tool for knowledge extraction and document indexing that combines NLP technologies for term extraction and techniques to measure the associative strength of multi-words. This tool extracts a list of single (monograms) and multi-word terms (bigrams and trigrams) ordered by frequency with respect to the context. The pipeline-used as semantic engine within the MAPS project-has been customized for the extraction of terms from our corpus. This survey on the results of the information extraction process performed by the described NLP tool has been a sort of linguistic path in the past and present of terminology used in GL proceedings. By means of samplings, it has been possible to obtain the terminological flow in GL domain and to determine if and how the lexicon was evolving over these twelve years and investigate on its dynamic nature},
KEYWORDS = {Grey Literature, Digital Repositories, Open Access},
PAGES = {79-84},
URL = {https://iris.cnr.it/handle/20.500.14243/320039},
ISBN = {978-90-77484-29-6},
CONFERENCE_NAME = {GL18-Eighteenth International Conference on Grey Literature: Leveraging Diversity in Grey Literature},
BOOKTITLE = {Leveraging Diversity in Grey Literature},
EDITOR = {Farace, D. and Frantzen, J.},
}
@INPROCEEDINGS{DELGROSSO_2016_INPROCEEDINGS_DAGM_316981,
AUTHOR = {Del Grosso, A. M. and Albanesi, D. and Giovannetti, E. and Marchi, S.},
TITLE = {Defining the Core Entities of an Environment for Textual Processing in Literary Computing},
YEAR = {2016},
KEYWORDS = {Digital Humanities, Literary Computing, Software Engineering, Object Oriented Design and Development},
URL = {http://dh2016.adho.org/abstracts/425},
ISBN = {978-83-942760-3-4},
CONFERENCE_NAME = {Digital Humanities Conference},
}
@INPROCEEDINGS{DELGROSSO_2016_INPROCEEDINGS_DBMG_316984,
AUTHOR = {Del Grosso, A. M. and Boschetti, F. and Marchi, S. and Giovannetti, E.},
TITLE = {Vantaggi dell'Astrazione attraverso l'Approccio Orientato agli Oggetti per il Digital Scholarly Editing},
YEAR = {2016},
KEYWORDS = {Object Oriented Design, ADT, Digital Textual Scholarship},
URL = {http://www.himeros.eu/aiucd2016/c33.pdf},
DOI = {10.6092/unibo/amsacta/5559},
ISBN = {978-88-942535-0-4},
CONFERENCE_NAME = {Quinto Convegno Annuale AIUCD. Edizioni digitali: rappresentazione, interoperabilità, analisi del testo e infrastrutture},
}
@INPROCEEDINGS{DOLOWYRYBINSKA_2016_INPROCEEDINGS_DS_316368,
AUTHOR = {Dolowyrybinska, N. and Soria, C.},
TITLE = {Surveying the ethnolinguistic vitality of two regional collateral languages: the case of Kashubian and Piedmontese},
YEAR = {2016},
ABSTRACT = {The paper presents the results of a Polish-Italian research project concerning the vitality of two regional collateral languages: Kashubian in Poland and Piedmontese in Italy. Despite their different status (Kashubian is a language recognised under the Polish law while Piedmontese is not), they are both perceived as dialects of the State language by the inhabitants of Poland and Italy. The status and prestige of both languages in their respective countries are low; consciousness about the importance of their maintenance within the communities and outside them is weakening. As they belong to the same language family as the dominant language they were/are treated as dialects of the State languages not worth of preservation. Current accounts of language vitality for Kashubian and Piedmontese are not entirely satisfactory in that they seem to overestimate the importance of the number of speakers over speakers' attitudes and stigma. In this paper, we will present the preliminary results of the survey, focussing on the interdependence between actual and perceived use of the two languages on the one side, and different ethnolinguistic vitality parameters, such as self-assessment of language proficiency, awareness of the language institutional status and policies, attitudes towards the language, and language ideology. This research is a pilot study that aims to raise the discussion on current assessment of ethnolinguistic vitality and to broaden it to other languages that are contested, unrecognized or treated as dialects of the State languages},
KEYWORDS = {regional and minority language, ethnolinguistic vitality study},
URL = {https://iris.cnr.it/handle/20.500.14243/316368},
CONFERENCE_NAME = {Contested Languages in the Old World #2},
}
@INPROCEEDINGS{GANASCIA_2016_INPROCEEDINGS_G_320495,
AUTHOR = {Ganascia, F. F. B.},
TITLE = {REDEN ONLINE: Disambiguation, Linking and Visualisation of References in TEI Digital Editions},
YEAR = {2016},
URL = {https://iris.cnr.it/handle/20.500.14243/320495},
}
@INPROCEEDINGS{MANZELLA_2016_INPROCEEDINGS_MBBDDFMMMNS_324227,
AUTHOR = {Manzella, G. and Bartolini, R. and Bustaffa, F. and D'Angelo, P. and De Mattei, M. and Frontini, F. and Maltese, M. and Medone, D. and Monachini, M. and Novellino, A. and Spada, A.},
TITLE = {Marine Planning and Service Platform: Specific Ontology Based semantic Search Engine Serving Data Management and Sustainable Development},
YEAR = {2016},
ABSTRACT = {The MAPS (Marine Planning and Service Platform) project is aiming at building a computer platform supporting a Marine Information and Knowledge System. One of the main objectives of the project is to develop a repository that should gather, classify and structure marine scientific literature and data thus guaranteeing their accessibility to researchers and institutions by means of standard protocols. In oceanography the cost related to data collection is very high and the new paradigm is based on the concept to collect once and re-use many times (for re-analysis, marine environment assessment, studies on trends, etc). This concept requires the access to quality controlled data and to information that is provided in reports (grey literature) and/or in relevant scientific literature. Hence, creation of new technology is needed by integrating several disciplines such as data management, information systems, knowledge management},
KEYWORDS = {Marine Information, Knowledge System},
PAGES = {2},
URL = {http://meetingorganizer.copernicus.org/EGU2016/orals/20144},
VOLUME = {18},
ISSN = {1607-7962},
CONFERENCE_NAME = {European Geosciences Union General Assembly (EGU 2016)},
}
@INPROCEEDINGS{MARCHETTI_2016_INPROCEEDINGS_MABBGMP_323894,
AUTHOR = {Marchetti, A. and Abrate, M. and Bacciu, C. and Bellandi, A. and Giovannetti, E. and Mancini, L. and Piccini, S.},
TITLE = {When Traditional Ontologies are not Enough: Modelling and Visualizing Dynamic Ontologies in Semantic-Based Access to Texts},
YEAR = {2016},
ABSTRACT = {The work described in this paper came about as a result of reflections made within the "Clavius on the web" Project, which studied the correspondence between the Jesuit mathematician and also astronomer and some important scientists of his century, such as Galileo and Brahe. One of the main aims of the project is to make it possible for students and scholars to access the texts on a semantic basis, in order to allow a deeper understanding of the often complex content, they convey. Texts are often the unique source that scholars have at their disposal in order to be able to reconstruct and more completely understand the past author's thought. In order for technology to come to the aid of scholars in this effort, the concepts evoked within the text, as well as the terms representing these concepts need to 1) have a structured organization 2) be explicitly and univocally represented and 3) be defined through the relationships that unite them. In order to achieve this, we chose to adopt an ontology based model, as ontologies are a de facto standard for knowledge representation. Interestingly, the choice to use ontologies raised some issues, also with regard to theoretical aspects: indeed, standard ontological formalisms usually static and crisp proved to be inadequate in modelling the complexity of the knowledge conveyed by the analysed texts. As a result, more refined models as well as appropriate graphical representations needed to be introduced so that computers would be able to process these ontologies and visualize them in a way that students and scholars could understand and work with them},
KEYWORDS = {Data Visualization, Information Visualization, knowledge engineering, Ontologies},
PAGES = {1-5},
URL = {http://dh2016.adho.org/abstracts/324},
CONFERENCE_NAME = {Digital Humanities 2016},
}
@INPROCEEDINGS{NAHLI_2016_INPROCEEDINGS_NBAT_328804,
AUTHOR = {Nahli, O. and Boschetti, F. and Arrigoni, S. and Tessarolo, L.},
TITLE = {Il corpus di testi arabi in Memorata Poetis},
YEAR = {2016},
KEYWORDS = {letteratura araba, temi e motivi},
PAGES = {157-162},
URL = {http://www.himeros.eu/aiucd2016/c03.pdf},
CONFERENCE_NAME = {Quinto Convegno Annuale AIUCD. Edizioni digitali: rappresentazione, interoperabilità, analisi del testo e infrastrutture},
BOOKTITLE = {AIUCD 2016-Book of Abstracts},
EDITOR = {Boschetti, F.},
}
@INPROCEEDINGS{PARDELLI_2016_INPROCEEDINGS_PGMBR_323831,
AUTHOR = {Pardelli, G. and Goggi, S. and Monachini, M. and Bartolini, R. and Russo, I.},
TITLE = {A Geographical Visualization of GL Community: a Snapshot},
YEAR = {2016},
ABSTRACT = {"Today, in the spirit of science, grey literature communities are called to demonstrate their know-how and merit to wider audiences" [Farace Dominic J., 2011]. This quotation stresses the important role of the several international organizations in producing and disseminating knowledge in the field of Grey Literature (GL): the paper aims to provide a first snapshot of the geographical distribution of GL organizations and their participation to the annual International Conference on Grey Literature over the time (in the period from 2003 to 2015). Nowadays a visual representation of data is often associated with the traditional statistical graphs, in particular for representing complex phenomena by means of maps and diagrams, which allow a deeper and more focused analysis of the data. In our case the geographical representation of stakeholders in government, academics, business and industry aims at visualizing the GL community across the globe: it concerns 675 organizations which over the years have contributed to the development of a common vision on the most pressing issues of the field by using new paradigms such as Open Access and the social networks},
KEYWORDS = {Geographical Visualization, Grey Literature},
PAGES = {67-67},
URL = {https://iris.cnr.it/handle/20.500.14243/323831},
ISBN = {978-90-77484-29-6},
CONFERENCE_NAME = {Eighteenth International Conference on Grey Literature: Leveraging Diversity in Grey Literature},
BOOKTITLE = {GL18 Program Book},
EDITOR = {Farace, D. and Frantzen, J.},
}
@INPROCEEDINGS{PETITTI_2016_INPROCEEDINGS_PDCPIMMBCCORZCB_358698,
AUTHOR = {Petitti, A. and Di Paola, D. and Colella, R. and Patruno, C. and Ianigro, M. and Milella, A. and Maglietta, R. and Bibuli, M. and Caviglione, L. and Chiarella, D. and Odetti, A. and Ranieri, A. and Zereik, E. and Caccia, M. and Bruzzone, G.},
TITLE = {The MAVIS System: Towards the Use of Marsupial Robotic Networks for Automatic Sensing in Polar Regions},
YEAR = {2016},
ABSTRACT = {A poster about the use of marsupial robots and vehicles for the next generation of missions in polar regions},
KEYWORDS = {autonomous robots, marsupial robotics, robotic networks},
URL = {https://iris.cnr.it/handle/20.500.14243/358698},
CONFERENCE_NAME = {IEEE International Conference on Robotics and Automation, Workshop on Fielded Multi-robot Systems Operating on Land, Sea, and Air},
}
@INPROCEEDINGS{RECCHIA_2016_INPROCEEDINGS_RFMD_325195,
AUTHOR = {Recchia, V. and Ferro, M. and Maglie, R. and Dodaro, A.},
TITLE = {Readability of current patient information leaflets for informed consent in UK radiotherapy centers},
YEAR = {2016},
ABSTRACT = {Background: Guidelines on informed consent recommend the use of plain language and readability standards to enhance patient's comprehension, engagement and shared decision making. Aim: To assess the readability of current patient information leaflets (PILs) used for informed consent in radiotherapy. Methods: We evaluated PILs (n=38) from three radiation therapy centers in UK. They regard the most common radiation therapy techniques for different kinds of cancer and body districts, such as bladder, bowel, colo-rectum, brain, breast-chest, female pelvis, prostate, lung, lymphomas, stomach. We analyzed each text with Flesch-Kincaid (F-K) grade level, with higher numbers indicating harder-to-read text (from 0 = easy, to 25 = difficult). Then, we compared the related grade levels to the health literacy recommended standard of US grade level 5, indicating that patient education texts might be understood by a typical student in the US primary school. Results: Readability is suboptimal for the analysed PILs (red, green and blue points in the figure) and should be improved with respect to the international standard score (red dotted line in the figure). The results show a mean grade level equal to 8.1 (std = 0.8), thus suggesting the need of a 3-points decrease on average. Conclusion: Current PILs for informed consent in the three analysed radiotherapy centers are hardly readable for the average patient. Although the readability scores achieved in the three centers are not very low, substantially higher readability scores should be achieved with novel PILs which explicitly discuss risks/benefits and other elements relevant for informed consent, and should be prepared by following standard recommendations of plain language},
KEYWORDS = {Ethics and communication, Communicating Risk and Uncertainty, Health Literacy},
PAGES = {1},
URL = {http://www.communication.aau.dk/research/dihm/events/comet2016/},
CONFERENCE_NAME = {COMMUNICATION, MEDICINE AND ETHICS CONFERENCE 2016},
}
@INPROCEEDINGS{RIZZETTO_2016_INPROCEEDINGS_RTFPTBS_328800,
AUTHOR = {Rizzetto, M. and Trevisiol, A. and Falcone, D. and Pilon, N. and Tomè, P. and Boschetti, F. and Springmann, U.},
TITLE = {Nuove frontiere delle Digital Humanities in classe: esperienze dal campo},
YEAR = {2016},
KEYWORDS = {didattica, ocr, latino umanistico},
PAGES = {119-122},
URL = {http://www.himeros.eu/aiucd2016/c32.pdf},
CONFERENCE_NAME = {Quinto Convegno Annuale AIUCD. Edizioni digitali: rappresentazione, interoperabilità, analisi del testo e infrastrutture},
BOOKTITLE = {AIUCD 2016-Book of Abstracts},
EDITOR = {Boschetti, F.},
}
@INPROCEEDINGS{SASSOLINI_2016_INPROCEEDINGS_SCC_335239,
AUTHOR = {Sassolini, E. and Cucurullo, S. and Cinini, A.},
TITLE = {I corpora digitali: dall'obsolescenza tecnologica, alla salvaguardia e alla condivisione},
YEAR = {2016},
ABSTRACT = {Il progetto di recupero, nato pochi anni fa come iniziativa fortemente voluta da ILC, prosegue oggi con la collaborazione di molte istituzioni pubbliche e private, impegnate sullo stesso fronte. Approccio al recupero a tappe: inizialmente lavorando su testi che erano stati prodotti per essere indicizzati con le prime procedure di analisi testuale presenti all'ILC sin dalla fine degli anni '70 del secolo scorso. Definizione di criteri da adottare per la scelta dei testi, basati sullo studio di casi significativi e sull'importanza dei materiali, spesso legati alla realizzazione di autorevoli progetti nazionali e internazionali},
KEYWORDS = {recupero testi, conversione in formato XML, valorizzazione dei risultati},
PAGES = {1-3},
URL = {https://www.eventi.garr.it/it/conf16/home/materiali-conferenza-2016/paper},
CONFERENCE_NAME = {Conferenza GARR 2016-The CreActive Network},
}
@INPROCEEDINGS{STANZIONE_2016_INPROCEEDINGS_SRMTBD_328801,
AUTHOR = {Stanzione, A. and Re, G. and Mugelli, G. and Taddei, A. and Boschetti, F. and Del Gratta, R.},
TITLE = {Homeric Greek WordNet: costruire una risorsa lessico-semantica fra ricerca e didattica},
YEAR = {2016},
KEYWORDS = {wordnet, semantica, greco antico},
PAGES = {129-132},
URL = {http://www.himeros.eu/aiucd2016/c40.pdf},
CONFERENCE_NAME = {Quinto Convegno Annuale AIUCD. Edizioni digitali: rappresentazione, interoperabilità, analisi del testo e infrastrutture},
BOOKTITLE = {AIUCD 2016-Book of Abstracts},
EDITOR = {Boschetti, F.},
}
@TECHREPORT{ALBANESI_2016_TECHREPORT_ABBGP_350498,
AUTHOR = {Albanesi, D. and Bellandi, A. and Benotto, G. and Giovannetti, E. and Pecchioli, A.},
TITLE = {Applicazione Web Linguistico-Computazionale per il Progetto di Traduzione del Talmud Babilonese-Rapporto tecnico 10},
YEAR = {2016},
ABSTRACT = {Il presente documento descrive lo stato di avanzamento del lavoro condotto dall'Istituto di Linguistica Computazionale "A. Zampolli" del CNR (ILC-CNR) nel contesto del progetto "Traduzione del Talmud Babilonese" (vedi sezione "Pubblicazioni relative al PTTB") in italiano nei mesi di luglio, agosto, settembre e ottobre 2016. Quanto qui descritto costituisce un "Rapporto sullo Stato di Avanzamento dei Lavori (SAL) dell'applicazione Web" unicamente da parte dell'ILC-CNR e si configura come il decimo dei fascicoli previsti a cadenza quadrimestrale},
URL = {https://iris.cnr.it/handle/20.500.14243/350498},
}
@TECHREPORT{ALBANESI_2016_TECHREPORT_ABBGP_350494,
AUTHOR = {Albanesi, D. and Bellandi, A. and Benotto, G. and Giovannetti, E. and Pecchioli, A.},
TITLE = {Applicazione Web Linguistico-Computazionale per il Progetto di Traduzione del Talmud Babilonese-Rapporto tecnico 9},
YEAR = {2016},
ABSTRACT = {Il presente documento descrive lo stato di avanzamento del lavoro condotto dall'Istituto di Linguistica Computazionale "A. Zampolli" del CNR (ILC-CNR) nel contesto del progetto "Traduzione del Talmud Babilonese" (vedi sezione "Pubblicazioni relative al PTTB") in italiano nei mesi di marzo, aprile, maggio e giugno 2016. Quanto qui descritto costituisce un "Rapporto sullo Stato di Avanzamento dei Lavori (SAL) dell'applicazione Web" unicamente da parte dell'ILC-CNR e si configura come il nono dei fascicoli previsti a cadenza quadrimestrale},
URL = {https://iris.cnr.it/handle/20.500.14243/350494},
}
@TECHREPORT{BOSCHETTI_2016_TECHREPORT_B_456574,
AUTHOR = {Boschetti, F.},
TITLE = {Relazione sulle attività dell'Unità di Pisa (CNR-ILC) per il progetto PRIN 2010/2011 "Memoria poetica e poesia della memoria" (Memorata Poetis)},
YEAR = {2016},
ABSTRACT = {Report finale delle attività svolte dall'Unità di Ricerca del CNR per il progetto PRIN 2010-2011 "Memorata Poetis". La relazione sintetizza le attività di Federico Boschetti (coordinamento generale, trattamento della lingua greca, OCR storico, progettazione di Ancient Greek WordNet), Marion Lamé (studio di documenti epigrafici), Ouafae Nahli (trattamento della lingua araba), Riccardo Del Gratta (creazione di servizi web per LEMLAT, interfaccia web di Ancient Greek WordNet), Anas Fahad Khan (riorganizzazione di ontologie), Angelo Mario Del Grosso (consulenza per la progettazione di componenti software)},
KEYWORDS = {annotazione, greco antico, latino, wordnet},
URL = {https://iris.cnr.it/handle/20.500.14243/456574},
}
@TECHREPORT{CARLINO_2016_TECHREPORT_C_459247,
AUTHOR = {Carlino, M.},
TITLE = {Rapporto annuale 2015 del CNR-ILC},
YEAR = {2016},
ABSTRACT = {CNR-ILC Activity Annual Report 2015},
KEYWORDS = {Annual Report, Activity report, CNR-ILC, Rapporto Annuale},
PAGES = {1-50},
URL = {https://iris.cnr.it/handle/20.500.14243/459247},
}
@TECHREPORT{DELGROSSO_2016_TECHREPORT_D_348345,
AUTHOR = {Del Grosso, A. M.},
TITLE = {Relazione progetto Clavius On the Web},
YEAR = {2016},
ABSTRACT = {La ricerca condotta dal Dott. Angelo Mario Del Grosso, di cui si sintetizzano i risultati in questo documento, si è svolta presso l'Istituto di Linguistica Computazionale "A. Zampolli" durante il periodo che va dal 11 Aprile 2015 al 10 Aprile 2016, in relazione al rinnovo dell'assegno di ricerca, bando n. 126.048/ASS.003.2013.PI del 07-03-2013 Protocollo ILC n. 0000285, sotto la responsabilità scientifica del Dott. Emiliano Giovannetti e nell'ambito del progetto "Clavius on The Web", finanziato da Registro.it. Il contratto stipulato tra l'ILC e il Dott. Del Grosso, per l'attività di collaboratore di ricerca, è stato formalmente protocollato con il numero 0000441 del 10/04/2015},
KEYWORDS = {Digital Humanities, Clavius On the Web, Software Engineering},
URL = {https://iris.cnr.it/handle/20.500.14243/348345},
}
@TECHREPORT{FERRETTI_2016_TECHREPORT_FMC_328856,
AUTHOR = {Ferretti, M. and Morgavi, G. and Confetti, D.},
TITLE = {L'anziano e il mondo dell'ICT: indagine sulle tecnologie accettabili},
YEAR = {2016},
ABSTRACT = {Il lavoro analizza i dati raccolti dalla dottoressa Daniela Confetti, nell'ambito del tirocinio post laurea magistrale, attraverso la somministrazione di un questionario di 98 domande ad un campione di 100 persone con fascia d'età compresa fra i sessantacinque e gli ottantun anni. Il questionario mirava a comprendere il grado di conoscenza e di accettazione delle nuove tecnologie da parte della popolazione anziana e si poneva quale obiettivo quello di analizzare quanto la tecnologia possa essere considerata dalla fascia più anziana della popolazione una risorsa per la vita quotidiana piuttosto che un qualche cosa di alieno di cui diffidare},
KEYWORDS = {Active Aging, ICT for elderly, Intervista strutturata},
PAGES = {1-19},
URL = {https://iris.cnr.it/handle/20.500.14243/328856},
}
@TECHREPORT{LUCENTINI_2016_TECHREPORT_LC_319712,
AUTHOR = {Lucentini, R. and Chiarella, D.},
TITLE = {ILCatalogo: archivio digitale per i beni culturali relativi al teatro},
YEAR = {2016},
ABSTRACT = {Il rapporto tecnico descrive le attività svolte in relazione al progetto di ricerca "Archivio digitale del patrimonio artistico di Emanuele Luzzati: il teatro"},
URL = {https://iris.cnr.it/handle/20.500.14243/319712},
}
@TECHREPORT{SASSI_2016_TECHREPORT_SCSC_344119,
AUTHOR = {Sassi, M. and Cinini, A. and Sassolini, E. and Cucurullo, S.},
TITLE = {La SALUTE MENTALE nel Web},
YEAR = {2016},
ABSTRACT = {Relazione annuale 2016 per la presentazione dei risultati raggiunti nell'ambito dell'Accordo di Collaborazione fra ILC-CNR e Coordinamento Toscano delle Associazioni per la Salute Mentale (Prot. ILC-CNR 0000856 del 4/10/2012) e del Contratto di sponsorizzazione Otsuka-Lundbeck del 2015, il cui Annesso Tecnico prevede le azioni descritte. Il progetto è articolato nei seguenti obiettivi, che verranno perseguiti mediante le Azioni dettagliate di seguito: 1. Realizzazione di un Sito dedicato alla Salute Mentale; 2. Servizio automatizzato di ricerca su Internet di informazioni e notizie che riguardano la salute mentale, con procedure di analisi linguistica. Tale relazione è stata presentata da Manuela Sassi al Corso finanziato dal CESVOT e organizzato dal Coordinamento Toscano delle Associazioni per la Salute Mentale a Lucca il 23 luglio 2016. Il sito realizzato viene aggiornato due volte al giorno e contiene i documenti recuperati in rete che hanno attinenza con la Salute Mentale tramite un dizionario di ricerca specializzato. Il periodo coperto inizia nel 2013 fino alla data odierna},
URL = {https://iris.cnr.it/handle/20.500.14243/344119},
}
@MISC{BARONI_2016_MISC_BA_461444,
AUTHOR = {Baroni, P. and Affè, F.},
TITLE = {ILC4CLARIN Web Site},
YEAR = {2016},
ABSTRACT = {Web Site of the ILC4CLARIN Centre at the Institute for Computational Linguistics, powered by WordPress, developed in Italian and English},
KEYWORDS = {CLARIN, Metadata Providing Centre, Service Providing Centre},
URL = {https://ilc4clarin.ilc.cnr.it},
}
@MISC{BELLANDI_2016_MISC_B_350508,
AUTHOR = {Bellandi, A.},
TITLE = {Controlled Natural Language Interface for querying the CLAVIUS resource},
YEAR = {2016},
ABSTRACT = {In the context of the project "Clavius on the Web" a diachronic termino-ontological resource, named CLAVIUS, has been developed, aimed at representing the evolution of astronomical concepts and theories from antiquity until the dawn of the modern age. The resource was built by means of existing tools allowing the scholars to formalize knowledge even though they are not familiar with the models and the languages underlying the representation. More specifically, Protégé, a free open-source ontology editor, which supports OWL (and OWL 2) and Chronos, a plug-in for Protégé to manage temporal aspect, were used. In order to facilitate access for scholars, a demo of a controlled natural language interface was developed to query the ontology. Query templates were created, and each of them is made up of a fixed part that typifies a specific querying model and a variable part that allows the user to select an element of the ontology from the drop-down list. Question templates are processed by the software into SPARQL queries. Queries can be made in controlled natural language by taking into account the lexical level ("What are the relations of a specific term ?"), the ontological level ("What are the relations of a concept denoted by a specific term ?") or both. The questions themselves could involve diachronic aspects, such as in "what relation exists between two concepts in a specific temporal interval?"},
URL = {https://iris.cnr.it/handle/20.500.14243/350508},
}
@MISC{DELGROSSO_2016_MISC_D_308093,
AUTHOR = {Del Grosso, A. M.},
TITLE = {Modelli concettuali e architetture Object-Oriented per la progettazione e lo sviluppo di una Digital Scholarly Platform},
YEAR = {2016},
ABSTRACT = {"OOP e DH": incontro possibile? E' possibile modellare il dominio relativo allo studio scientifico del testo attraverso l'approccio Object-Oriented? Cosa implica, dal punto di vista metodologico e tecnologico, progettare e sviluppare strumenti modulari e riusabili per l'analisi scientifica di risorse testuali? L'intervento esaminerà questi e altri temi di natura ingegneristica nell'ambito delle Digital Humanities. Il seminario, quindi, ripercorrerà alcuni risultati ottenuti all'interno della linea di ricerca presente presso l'ILC-CNR orientata allo sviluppo di componenti software per sistemi Web di linguistica e filologia computazionale volti al trattamento di testi di tradizione medievale, a stampa e di autori moderni e contemporanei. La progettazione di strumenti computazionali nel dominio delle Digital Humanities deve necessariamente rispondere alle esigenze di diverse tipologie di utenti: 1) l'utente generico, inteso come persona curiosa oppure pubblico poco esperto che ha comunque competenze per arricchire il prodotto digitale; 2) l'utente accademico, inteso come lo studente, il docente, o il ricercatore, in grado di aumentare la significatività, l'espressività e la rilevanza della risorsa digitale, 3) il programmatore, inteso come sviluppatore di applicazioni nel campo dell'Informatica Umanistica. Durante il seminario si introdurranno le basi della modellazione Object-Oriented a partire da concreti casi di studio ed esperienze maturate in progetti di ricerca nazionali ed internazionali. In particolare, si illustreranno gli esiti di alcune iniziative: o il progetto "Clavius On the Web", finanziato dal Registro.it, che vede coinvolti due istituti del CNR di Pisa (IIT-CNR e ILC-CNR) e l'Archivio Storico della Pontificia Università Gregoriana (APUG); o il progetto "Greek into Arabic", finanziato dall'European Research Council e diretto dalla Prof.ssa Cristina D'Ancona dell'Università di Pisa; o il progetto PRIN "Per un'edizione dei manoscritti di F. De Saussure", diretto dal Prof. Daniele Gambarara dell'Università della Calabria. o il progetto "Talmud" finanziato dal MIUR e partecipato dal CNR, dall'Unione delle Comunità Ebraiche e dal Collegio Rabbinico Italiano},
KEYWORDS = {Object-Oriented, UML, Filologia Computazionale, Literary Computing, Digital Humanities},
URL = {http://www.labcd.unipi.it/seminari/angelo-mario-del-grosso-modelli-concettuali-e-architetture-object-oriented-per-la-progettazione-e-lo-sviluppo-di-una-digital-scholarly-platform/},
}
@MISC{DELGROSSO_2016_MISC_D_308094,
AUTHOR = {Del Grosso, A. M.},
TITLE = {INTERNET, QUANTO CI PIACE!},
YEAR = {2016},
ABSTRACT = {Cultura digitale è stato progettato per far conoscere ed esplorare con spirito critico - il mondo di Internet e del Web; - Gli accorgimenti ed i sistemi di prevenzione atti a evitare quei pericoli nei quali spesso si imbattono gli internauti poco esperti ed informati; - Le tecnologie informatiche per l'approfondimento di temi legati alle attività di studio letterario intertestuale, attraverso il sistema ideato dall'ILC-CNR},
KEYWORDS = {Digital Humanities, Educational},
URL = {https://iris.cnr.it/handle/20.500.14243/308094},
}
@MISC{DELGROSSO_2016_MISC_D_344092,
AUTHOR = {Del Grosso, A. M.},
TITLE = {il progetto "Cultura Digitale": Promozione alla cittadinanza Digitale},
YEAR = {2016},
ABSTRACT = {Il contributo presenta il lavoro di allineamento e traduzione svolto con strumenti digitali dagli studenti del Liceo Classico Medi-Livatino di San Marco dei Cavoti (BN) su una selezione di passi tratti dall'opera di Ippocrate "Sulle Arie, Sulle Acque, e Sui Luoghi"},
KEYWORDS = {digital humanities, cultura digitale, tools, scuola digitale},
URL = {https://iris.cnr.it/handle/20.500.14243/344092},
}
@MISC{DELGROSSO_2016_MISC_DA_318698,
AUTHOR = {Del Grosso, A. M. and Abrate, M.},
TITLE = {Annotazioni collaborative di testi storici},
YEAR = {2016},
ABSTRACT = {Introduzione ai sistemi di annotazione e coinvolgimento degli intervenuti nell'uso di strumenti digitali per l'annotazione di documenti e testi storici},
URL = {https://iris.cnr.it/handle/20.500.14243/318698},
}
@MISC{DIDONATO_2016_MISC_D_408443,
AUTHOR = {Di Donato, F.},
TITLE = {Pundit. Web annotation for the Digital Humanities},
YEAR = {2016},
ABSTRACT = {Presentazione della suite di web annotation Pundit},
URL = {https://iris.cnr.it/handle/20.500.14243/408443},
}
@MISC{DIDONATO_2016_MISC_D_381987,
AUTHOR = {Di Donato, F.},
TITLE = {From the Past to the Future. Some reflections after DH2016},
YEAR = {2016},
ABSTRACT = {Report of the conference DH2016},
URL = {https://iris.cnr.it/handle/20.500.14243/381987},
}
@MISC{DIDONATO_2016_MISC_D_408446,
AUTHOR = {Di Donato, F.},
TITLE = {Data Reuse in the Humanities},
YEAR = {2016},
ABSTRACT = {Presentation of the project: Looking at words through images (ERC-AdG-2011)},
URL = {https://iris.cnr.it/handle/20.500.14243/408446},
}
@MISC{DOLOWYRYBINSKA_2016_MISC_DS_316367,
AUTHOR = {Dolowyrybinska, N. and Soria, C.},
TITLE = {Surveying the ethnolinguistic vitality of two regional collateral languages: the case of Kashubian and Piedmontese},
YEAR = {2016},
ABSTRACT = {The paper presents the results of a Polish-Italian research project concerning the vitality of two regional collateral languages: Kashubian in Poland and Piedmontese in Italy. Despite their different status (Kashubian is a language recognised under the Polish law while Piedmontese is not), they are both perceived as dialects of the State language by the inhabitants of Poland and Italy. The status and prestige of both languages in their respective countries are low; consciousness about the importance of their maintenance within the communities and outside them is weakening. As they belong to the same language family as the dominant language they were/are treated as dialects of the State languages not worthy of preservation. Current accounts of language vitality for Kashubian and Piedmontese are not entirely satisfactory in that they seem to overestimate the importance of the number of speakers over speakers' attitudes and stigma. In this paper, we will present the preliminary results of the survey, focussing on the interdependence between actual and perceived use of the two languages on the one side, and different ethnolinguistic vitality parameters, such as self-assessment of language proficiency, awareness of the language institutional status and policies, attitudes towards the language, and language ideology. This research is a pilot study that aims to raise the discussion on current assessment of ethnolinguistic vitality and to broaden it to other languages that are contested, unrecognized or treated as dialects of the State languages},
KEYWORDS = {regional and minority language, ethnolinguistic vitality study},
URL = {https://iris.cnr.it/handle/20.500.14243/316367},
CONFERENCE_NAME = {Contested Languages in the Old World #2},
}
@MISC{GUADAGNINI_2016_MISC_G_357029,
AUTHOR = {Guadagnini, E.},
TITLE = {\#2 Pictor ludens 2. 6. All'inferno con un Dante biondo},
YEAR = {2016},
KEYWORDS = {dante, fumetti},
URL = {http://www.arabeschi.it/collection/poemi-a-fumetti/},
VOLUME = {7},
ISSN = {2282-0876},
}
@MISC{MONACHINI_2016_MISC_M_333126,
AUTHOR = {Monachini, M.},
TITLE = {CLARIN-IT The Italian Common Language Resources and Technology Infrastructure CLARIN-IT: l'infrastruttura di ricerca per le scienze umane e sociali},
YEAR = {2016},
ABSTRACT = {The CLARIN-IT National Coordinator presented a keynote CLARIN-IT, l'Infrastruttura di Ricerca per le Scienze Umane e Sociali, in the 5th Annual Conference of the Associazione per l'Informatica Umanistica e la Cultura Digitale (AIUCD) held in Venezia from 7th to 9th September 2016. It is time for research infrastructures to be able to guarantee interoperability and integration between the instruments for philological studies and the instruments for the analysis of large textual corpora, breaking down the rigid barriers between digital and computational philology, on the one hand, and corpus linguistics on the other hand. Programma: https://docs.google.com/viewer?a=v\&pid=sites\&srcid=dW5pdmUuaXR8YWl1Y2QyMDE2fGd4OjIyMDhhMzk2ODk0MjUyNDQ},
KEYWORDS = {CLARIN-IT, scienze umane e sociali},
URL = {http://www.clarin-it.it/en/content/clarin-it-aiucd-2016},
CONFERENCE_NAME = {5th Annual Conference of the Associazione per l'Informatica Umanistica e la Cultura Digitale (AIUCD)},
}
@MISC{MONACHINI_2016_MISC_M_341689,
AUTHOR = {Monachini, M.},
TITLE = {Infrastrutture e ricerca nel settore umanistico},
YEAR = {2016},
ABSTRACT = {L'informatica applicata allo studio del testo ha una lunga storia che parte dagli anni '50 dello scorso secolo. Nel corso del tempo allo sviluppo di risorse e strumenti prevalentemente pensati per l'analisi linguistica, come ad esempio la lemmatizzazione, si sono affiancati metodi, risorse e strumenti più squisitamente filologici, come la codifica delle varianti, i repertori digitali di molteplici edizioni del medesimo testo e gli strumenti per l'allineamento automatico delle stesse. Tuttavia la conoscenza di queste tecniche ed il loro utilizzo è ancora piuttosto limitato nel panorama degli studi italiani di filologia classica, nonostante alcune acquisizioni concettuali e tecniche di prima grandezza nel settore siano dovute a studiosi italiani. Il workshop si propone di discutere temi e problematiche attinenti la filologia digitale sulla scorta di una rassegna del settore iniziata all'università di Parma con la collaborazione del CNR-ILC di Pisa: o Motivazioni per l'adozione di tecniche di filologia digitale nel campo della ricerca e dell'insegnamento. Barriere al loro utilizzo. o I risultati di una rassegna sull'impiego di tecniche di filologia digitale da parte di studiosi italiani sulla base di un questionario o Diffusione della conoscenza del settore in Italia o Correnti e future tematiche di ricerca},
KEYWORDS = {Digital Humanities, Computational Philology},
URL = {https://iris.cnr.it/handle/20.500.14243/341689},
CONFERENCE_NAME = {Utilizzo e diffusione di metodi, strumenti e tecnologie digitali per gli studi filologici: l'applicazione della filologia digitale al greco antico},
}
@MISC{MONACHINI_2016_MISC_MEF_333124,
AUTHOR = {Monachini, M. and Enea, A. and Frontini, F.},
TITLE = {CLARIN-IT: servizi per la comunità italiana delle scienze umane e sociali},
YEAR = {2016},
ABSTRACT = {CLARIN-IT-The Italian Common Language Resources and Technology Infrastructure: Monica Monachini-CLARIN Italian National Coordinator Alessandro Enea-Responsible of ILCforCLARIN \& contact person for IDEM Francesca Frontini-Standing Committee for CLARIN Technical Centres (SCCTC) ILC-CNR National Representative},
KEYWORDS = {CLARIN-IT, The Italian Common Language Resources and Technology Infrastructure},
URL = {http://www.clarin-it.it/en/content/clarin-it-idem-day-2016},
CONFERENCE_NAME = {CLARIN-IT @ IDEM Day 2016},
}
@MISC{NAHLI_2016_MISC_N_370085,
AUTHOR = {Nahli, O.},
TITLE = {Corpus dei testi arabi in "Memorata Poetis"},
YEAR = {2016},
ABSTRACT = {Corpus epigrafico arabo, per motivi didattici e scientifici, i testi sono stati vocalizzati e tradotti in italiano},
KEYWORDS = {Poesia, Epigrafi, Memorata Poetis, lingua araba},
URL = {http://www.memoratapoetis.it/public/},
}
@MISC{PICCINI_2016_MISC_PBB_370150,
AUTHOR = {Piccini, S. and Bellandi, A. and Benotto, G.},
TITLE = {Clavius' Ontology},
YEAR = {2016},
ABSTRACT = {Clavius' Ontology},
URL = {https://iris.cnr.it/handle/20.500.14243/370150},
}
@MISC{PRESENTING_2016_MISC_PGIPADGB_408445,
AUTHOR = {Presenting, H. M. and Gordea, S. and Isaac, A. and Piccioli, A. and Andreini, G. and Di Donato, F. and Gardien, R. and Brinkerink, M.},
TITLE = {Challenges on modeling annotations in the Europeana Sounds project},
YEAR = {2016},
ABSTRACT = {Presentation of the work done in the project Europeana Sounds},
URL = {https://iris.cnr.it/handle/20.500.14243/408445},
}
@MISC{SASSI_2016_MISC_S_324846,
AUTHOR = {Sassi, M.},
TITLE = {Cuestiones pertinentes e impertinentes de los diccionarios temáticos},
YEAR = {2016},
ABSTRACT = {Los diccionarios han representado el hilo conductor de mi carrera en el Istituto di Linguistica Computazionale del Consiglio Nazionale delle Ricerche (ILC-CNR) de Pisa desde sus orígenes (en los años 1965-1978 se denominaba Divisione Linguistica del CNUCE). En los años '70 en colaboración con el Parlamento Italiano, se produjo el Diccionario Máquina del Italiano. En los años 80 se comenzaron los primeros estudios de diccionarios organizados en Campos Léxicos a partir de las "intuiciones" de Julio Casares, aplicándose los mismos criterios al italiano. A partir de estas lejanas experiencias, a lo largo de 40 años, se desarrollaron diferentes estudios, aplicaciones y bancos de datos en varias disciplinas (Derecho, Justicia, Administración, Turismo, Medicina, etc.) y también sobre Autores (S. Teresa de Ávila, Cervantes, Unamuno, Borges, Vallejo, etc.) que serán ilustrados en este Congreso},
URL = {https://iris.cnr.it/handle/20.500.14243/324846},
}
@MISC{SASSI_2016_MISC_S_324859,
AUTHOR = {Sassi, M.},
TITLE = {Salute mentale: diritti e doveri},
YEAR = {2016},
ABSTRACT = {Corso di Formazione per Volontari organizzato dal Coordinamento Toscano delle Associazioni per la Salute Mentale e finanziato dal CESVOT con il Bando "Formazione". Si svolge durante tutto il 2016 ed è organizzato a Seminari di Esperti su vari temi collegati. In particolare ho presentato i risultati del progetto "Salute Mentale e Web" cofinanziato dal Coordinamento Toscano e da fondi esterni di sponsorizzazione},
URL = {https://iris.cnr.it/handle/20.500.14243/324859},
}
@ARTICLE{ATTARDI_2015_ARTICLE_ABBCDMPSS_333938,
AUTHOR = {Attardi, G. and Basile, V. and Bosco, C. and Caselli, T. and Dell'Orletta, F. and Montemagni, S. and Patti, V. and Simi, M. and Sprugnoli, R.},
TITLE = {State of the Art Language Technologies for Italian: The EVALITA 2014 Perspective},
YEAR = {2015},
ABSTRACT = {Shared task evaluation campaigns represent a well established form of competitive evaluation, an important opportunity to propose and tackle new challenges for a specific research area and a way to foster the development of benchmarks, tools and resources. The advantages of this approach are evident in any experimental field, including the area of Natural Language Processing. An outlook on state-of-the-art language technologies for Italian can be obtained by reflecting on the results of the recently held workshop "Evaluation of NLP and Speech Tools for Italian", EVALITA 2014. The motivations underlying individual shared tasks, the level of knowledge and development achieved within each of them, the impact on applications, society and economy at large as well as directions for future research will be discussed from this perspective},
KEYWORDS = {Evaluation Campaign, Natural Language Processing, Dependency Parsing, Sentiment Analysis, Temporal Processing},
PAGES = {43-61},
URL = {https://iris.cnr.it/handle/20.500.14243/333938},
VOLUME = {9 (1)},
DOI = {10.3233/IA-150076},
ISSN = {1724-8035},
JOURNAL = {INTELLIGENZA ARTIFICIALE},
}
@ARTICLE{BANTERLE_2015_ARTICLE_BCM_269786,
AUTHOR = {Banterle, F. and Cardillo, F. A. and Malomo, L.},
TITLE = {LecceAR: an augmented reality App for cultural heritage},
YEAR = {2015},
ABSTRACT = {Augmented Reality (AR)-the augmentation of a physical world's view with digital media-has recently gained popularity thanks to the increasing computational power and diffusion of mobile devices such as tablets, and smartphones. These developments allow many practical applications of AR technology, especially in the cultural heritage domain. LecceAR is an advanced app that allows tourists to view rich 3D reconstructions of cultural heritage sites within the city of Lecce in Italy. LecceAR is an iOS app for markerless AR that will be exhibited at the MUST museum in Lecce, Italy. The app shows a rich 3D reconstruction of the Lecce Roman amphitheatre, which is only partially unearthed (see Figure 1). The use of state-of-the-art algorithms in computer graphics and computer vision allows an ancient theatre to be viewed and explored in real-time},
KEYWORDS = {Augmented Reality, IMAGE PROCESSING AND COMPUTER VISION, Picture/Image Generation Display Algorithms},
PAGES = {16-17},
URL = {https://ercim-news.ercim.eu/en103/special/leccear-an-augmented-reality-app-for-cultural-heritage},
VOLUME = {103},
ISSN = {0926-4981},
JOURNAL = {ERCIM NEWS},
}
@ARTICLE{BARBAGLI_2015_ARTICLE_BLDMV_322610,
AUTHOR = {Barbagli, A. and Lucisano, P. and Dell'Orletta, F. and Montemagni, S. and Venturi, G.},
TITLE = {Il ruolo delle tecnologie del linguaggio nel monitoraggio dell'evoluzione delle abilità di scrittura: primi risultati},
YEAR = {2015},
ABSTRACT = {L'ultimo decennio ha visto l'affermarsi a livello internazionale dell'uso di tecnologie del linguaggio per lo studio dei processi di apprendimento. Questo contributo riporta i primi e promettenti risultati di uno studio interdisciplinare che si è avvalso di metodi e tecniche di analisi propri della linguistica computazionale, della linguistica e della pedagogia sperimentale. Lo studio, finalizzato al monitoraggio dell'evoluzione del processo di apprendimento della lingua italiana, è stato condotto a partire dalle produzioni scritte di studenti della scuola secondaria di primo grado con strumenti di annotazione linguistica automatica e di estrazione di conoscenza e ha portato all'identificazione di un insieme di tratti qualificanti il processo di apprendimento linguistico},
KEYWORDS = {evoluzione delle competenze linguistiche, Didattica Sperimentale, Estrazione di conoscenza, Annotazione linguistica automatica},
PAGES = {99-117},
URL = {https://journals.openedition.org/ijcol/326},
DOI = {10.4000/ijcol.326},
ISSN = {2499-4553},
JOURNAL = {IJCOL},
}
@article{BOSCHETTI_2015_ARTICLE_BD_228545,
  author   = {Boschetti, F. and Del Grosso, A. M.},
  title    = {TeiCoPhiLib: A Library of Components for the Domain of Collaborative Philology},
  journal  = {JOURNAL OF THE TEXT ENCODING INITIATIVE},
  volume   = {8},
  year     = {2015},
  doi      = {10.4000/jtei.1285},
  issn     = {2162-5603},
  url      = {http://jtei.revues.org/1285},
  keywords = {APIs, design patterns, library of components, collaborative philology},
  abstract = {The aim of this contribution is to illustrate a work in progress related to a library of software components devoted to editing, visualizing and processing TEI annotated documents in the domain of philological studies, in particular in the subdomain of collaborative philology. After a short introduction and a general overview, the second section is devoted to the technologies related to XML mark-up languages and how to process marked documents. The third section illustrates the method applied to design and implement the TeiCoPhiLib. General benefits of the overall architecture are discussed and the used design patterns are described. The fourth section is devoted to case studies in which some components of the ongoing TeiCoPhiLib have been used. The fifth section exposes the conclusions},
}
@article{CUTUGNO_2015_ARTICLE_CCLMM_289609,
  author   = {Cutugno, P. and Chiarella, D. and Lucentini, R. and Marconi, L. and Morgavi, G.},
  title    = {Language, communication and society: a gender based linguistics analysis},
  journal  = {RECENT ADVANCES IN ELECTRICAL ENGINEERING},
  year     = {2015},
  issn     = {1790-5117},
  url      = {https://iris.cnr.it/handle/20.500.14243/289609},
  abstract = {The purpose of this study is to find evidence for supporting the hypothesis that language is the mirror of our thinking, our prejudices and cultural stereotypes. In this analysis, a questionnaire was administered to 537 people. The answers have been analysed to see if gender stereotypes were present such as the attribution of psychological and behavioural characteristics. In particular, the aim was to identify, if any, what are the stereotyped images, which emerge in defining the roles of men and women in modern society. Moreover, the results given can be a good starting point to understand if gender stereotypes, and the expectations they produce, can result in penalization or inequality. If so, the language and its use would create inherently a gender bias, which influences evaluations both in work settings both in everyday life},
}
@ARTICLE{DELGRATTA_2015_ARTICLE_DFKM_222847,
AUTHOR = {Del Gratta, R. and Frontini, F. and Khan, F. and Monachini, M.},
TITLE = {Converting the PAROLE SIMPLE CLIPS Lexicon into RDF with lemon},
YEAR = {2015},
ABSTRACT = {This paper describes the publication and linking of (parts of) PAROLE SIMPLE CLIPS (PSC), a large scale Italian lexicon, to the Semantic Web and the Linked Data cloud using the lemon model. The main challenge of the conversion is discussed, namely the reconciliation between the PSC semantic structure which contains richly encoded semantic information, following the qualia structure of the Generative Lexicon theory and the lemon view of lexical sense as a reified pairing of a lexical item and a concept in an ontology. The result is two datasets: one consists of a list of lemon lexical entries with their lexical properties, relations and senses; the other consists of a list of OWL individuals representing the referents for the lexical senses. These OWL individuals are linked to each other by a set of semantic relations and mapped onto the SIMPLE OWL ontology of higher level semantic types},
KEYWORDS = {lemon, linked data, generative lexicon, RDF, OWL, lexical resource},
PAGES = {387--392},
URL = {http://www.semantic-web-journal.net/content/converting-parole-simple-clips-lexicon-rdf-lemon-0},
VOLUME = {6},
DOI = {10.3233/SW-140168},
ISSN = {1570-0844},
JOURNAL = {SEMANTIC WEB (PRINT)},
}
@ARTICLE{GIANNINI_2015_ARTICLE_GBGP_291577,
AUTHOR = {Giannini, S. and Biagioni, S. and Goggi, S. and Pardelli, G.},
TITLE = {Mapping Italian grey communities: what is there beyond the Academy?},
YEAR = {2015},
ABSTRACT = {This research aims at verifying whether-and eventually how much-the grey literature available on the web is actually structured, accessible or even managed by systems dealing with its organization and aiming at its retrieval and storing. The utmost goal is to build up a map of non-academic communities and their mechanisms for managing, presenting and disseminating this type of material. It is a sort of journey among the streams of the Web, which channel meeting minutes, manifests, fliers, pictures, newspapers articles, journalistic services and audio/video material on various topics. These "grey" products-by conveying basic information about social and popular culture-store, represent and spread knowledge},
KEYWORDS = {Italian Grey Literature, A.1 INTRODUCTORY AND SURVEY},
PAGES = {17--28},
URL = {http://www.greynet.org/thegreyjournal.html},
VOLUME = {11},
NUMBER = {1},
ISSN = {1574-1796},
JOURNAL = {THE GREY JOURNAL},
}
@ARTICLE{GOGGI_2015_ARTICLE_GMFBPDBM_296111,
AUTHOR = {Goggi, S. and Monachini, M. and Frontini, F. and Bartolini, R. and Pardelli, G. and De Mattei, M. and Bustaffa, F. and Manzella, G.},
TITLE = {Marine Planning and Service Platform (MAPS) An Advanced Research Engine for Grey Literature in Marine Science},
YEAR = {2015},
ABSTRACT = {The MAPS (Marine Planning and Service Platform) project is a development of the Marine project (Ricerca Industriale e Sviluppo Sperimentale Regione Liguria 2007-2013) aiming at building a computer platform for supporting a Marine Information and Knowledge System, as part of the data management activities. One of the main objectives of the project is to develop a repository that should gather, classify and structure marine scientific literature and data thus guaranteeing their accessibility to researchers and institutions by means of standard protocols. We will present the scenario of the Operative Oceanography together with the technologies used to develop an advanced search engine which aims at providing rapid and efficient access to a Digital Library of oceanographic data. The case-study is also highlighting how the retrieval of grey literature from this specific marine community could be reproduced for similar communities as well, thus revealing the great impact that the processing, re-use as well as application of grey data have on societal needs/problems and their answers},
KEYWORDS = {Marine Science, Search Engine, Source Data, Oceanography},
PAGES = {171--178},
URL = {https://iris.cnr.it/handle/20.500.14243/296111},
VOLUME = {11},
NUMBER = {3},
ISSN = {1574-1796},
JOURNAL = {THE GREY JOURNAL},
}
@ARTICLE{GOGGI_2015_ARTICLE_GPGBB_294907,
AUTHOR = {Goggi, S. and Pardelli, G. and Giannini, S. and Biagioni, S. and Battisti, M.},
TITLE = {La littérature grise des projets de recherche européens},
YEAR = {2015},
ABSTRACT = {Les projets scientifiques financés par la Commission européenne produisent de la littérature grise. Une étude menée en 2013 sur 226 projets CNR du 7e programme-cadre (2007-2013) a analysé la typologie, le format et la disponibilité des documents signalés sur le serveur Cordis (rapports de recherche et articles scientifiques) et les sites projets (contenant listes de partenaires, brochures, communiqués},
KEYWORDS = {Grey Literature, European Commission Projects},
PAGES = {34},
URL = {http://www.cairn.info/revue-i2d-information-donnees-et-documents-2015-1-p-34.htm},
VOLUME = {52},
NUMBER = {1},
DOI = {10.3917/i2d.151.0034},
ISSN = {0012-4508},
JOURNAL = {DOCUMENTALISTE},
}
@ARTICLE{GUADAGNINI_2015_ARTICLE_G_300886,
AUTHOR = {Guadagnini, E.},
TITLE = {Variazioni aborigene: note di lessicografia dell'italiano antico},
YEAR = {2015},
KEYWORDS = {lessicografia, italiano antico, volgarizzamenti},
PAGES = {389--403},
URL = {https://iris.cnr.it/handle/20.500.14243/300886},
VOLUME = {19-20},
ISSN = {1591-8254},
JOURNAL = {BOLLETTINO-OPERA DEL VOCABOLARIO ITALIANO},
}
@ARTICLE{GUADAGNINI_2015_ARTICLE_G_312045,
AUTHOR = {Guadagnini, E.},
TITLE = {Scelta di voci del Tesoro della Lingua Italiana delle Origini (diciottesima serie)},
YEAR = {2015},
ABSTRACT = {Voci abbruciaticcio s. m., arturo s. m., contradegnare v., giovanaglia s. f., gorgone (1) s. m., gorgoneo agg., gorgoni s. f. /s. m. pl., lasciva (1) s. f., lascivamente avv., lascivanza s. f., lascivare v., lascivia s. f., lasciviare v., lasciviente agg. /s. m., lascivio agg., lascivire v., lascività s. f., lascivo agg. /s. m., petulante agg., petulanza s. f., petulenzia s. f., radunaticcio agg. (pp. 23-24, 26-27, 45, 70-71, 74-75, 122-131, 155-156, 182)},
KEYWORDS = {TLIO},
PAGES = {23--24, 26--27, 45, 70--71, 74--75, 122--131, 155--156, 182},
URL = {https://iris.cnr.it/handle/20.500.14243/312045},
VOLUME = {19-20},
ISSN = {1591-8254},
JOURNAL = {BOLLETTINO-OPERA DEL VOCABOLARIO ITALIANO},
}
@ARTICLE{MANCINI_2015_ARTICLE_M_443997,
AUTHOR = {Mancini, L.},
TITLE = {Un ``increscioso ma non trascurabile argomento'': la fine del matrimonio di Aldo Manuzio il Giovane e la sua mancata ammissione agli ordini sacri},
YEAR = {2015},
ABSTRACT = {The supposed admission to the holy orders of Aldus Manutius the Younger (1547-1597) has been already a subject of debate a few years after his death. Some unknown letters by Aldus to Antonio Maria Graziani (1537-1611) allow to shed new light about this event. Through the review of already known documents and with the help of unpublished sources it can be argued that Aldus' decision was closely connected to the end of his marriage with Francesca Giunti. Niccolò Manassi, Aldus' associate and manager of the Venetian shop ad signum Aldi, had a considerable role in their separation; after Aldus' death he married Francesca and took the lead of what remained of the glorious Aldine Press},
KEYWORDS = {Aldo Manuzio il Giovane, storia del commercio librario},
PAGES = {27--43},
URL = {https://iris.cnr.it/handle/20.500.14243/443997},
VOLUME = {29},
ISSN = {1122-0775},
JOURNAL = {NUOVI ANNALI DELLA SCUOLA SPECIALE PER ARCHIVISTI E BIBLIOTECARI},
}
@ARTICLE{MANCINI_2015_ARTICLE_M_443998,
AUTHOR = {Mancini, L.},
TITLE = {``Et questo mi pare quanto agli studij vostri'': una lettera inedita di Juan de Polanco a Pedro de Ribadeneyra (1547) alle origini della pedagogia gesuita},
YEAR = {2015},
ABSTRACT = {This essay presents an analysis of a previously unpublished letter, sent by Juan de Polanco to Pedro de Ribadeneira on 9 July 1547, now preserved at the Historical Archives of the Pontifical Gregorian University. The document constitutes a valuable addition to the patrimony of available sources concerning the early history of Jesuit education. The first part of the essay outlines the circumstances of the letter's recovery, as well as its physical features. It then proceeds to an analysis of the text, which can be divided into two parts: Polanco's didactic instructions containing a list of specific authors-some of whom appear for the first time among the early sources on Jesuit education-and subjects recommended for deeper study, both to be compared here with similar extant Jesuit documentation from the same period. The second part of the letter, instead, contains spiritual considerations associated with a life of study. The article concludes with some reflections about the significance of this document, and an appendix containing a full transcription of the letter},
KEYWORDS = {Gesuiti, storia della pedagogia, Juan de Polanco, Pedro Ribadeneira},
PAGES = {187--219},
URL = {https://iris.cnr.it/handle/20.500.14243/443998},
VOLUME = {84},
ISSN = {0037-8887},
JOURNAL = {ARCHIVUM HISTORICUM SOCIETATIS IESU},
}
@ARTICLE{MANCINI_2015_ARTICLE_M_444034,
AUTHOR = {Mancini, L.},
TITLE = {``Amabo te, mi Murete'': le lettere di Paolo Manuzio a Marc'Antoine Muret e il gesuita Pietro Lazzari. Con documenti inediti},
YEAR = {2015},
ABSTRACT = {The discovery of 32 letters sent by Paolo Manuzio (1512-1574) to Marc'Antoine Muret (1526-1585) at the Historical Archives of the Pontifical Gregorian University could permit for the first time a comparison between the original text and that one published by the heir of Aldo Manuzio. A lot of the discrepancies was already reported by the Jesuit Pietro Lazzari (1711-1789), who in 1757 pointed in the one of his works dedicated to some texts of the Bibliotheca Maior, where the private library of the French Scholar arrived in 1601. This work was quite unknown until now and it is revived with the publication of other variants not reported by Lazzari and two unpublished letters},
KEYWORDS = {Paolo Manuzio, Marc'Antoine Muret, Pietro Lazzari, Ester Pastorello, Collegio, Bibliotheca Maior, Bibliotheca Secreta, Pontificia Università Gregoriana, Roma},
PAGES = {35--53},
URL = {https://iris.cnr.it/handle/20.500.14243/444034},
VOLUME = {4},
NUMBER = {1},
DOI = {10.6092/issn.2283-9364/5785},
ISSN = {2280-7934},
JOURNAL = {BIBLIOTHECAE.IT},
}
@ARTICLE{MARZI_2015_ARTICLE_MP_342523,
AUTHOR = {Marzi, C. and Pirrelli, V.},
TITLE = {A Neuro-Computational Approach to Understanding the Mental Lexicon},
YEAR = {2015},
ABSTRACT = {Human lexical knowledge does not appear to be organised to minimise storage, but rather to maximise processing efficiency. The way lexical information is stored reflects the way it is dynamically processed, accessed and retrieved. A detailed analysis of the way words are memorised, of the dynamic interaction between lexical representations and distribution and degrees of regularity in input data, can shed some light on the emergence of structures and relations within fully-stored words. We believe that a bottom-up investigation of low-level memory and processing functions can help understand the cognitive mechanisms that govern word processing in the mental lexicon. Neuro-computational models can play an important role in this inquiry, as they help understand the dynamic nature of lexical representations by establishing an explanatory connection between lexical structures and processing models dictated by the micro-functions of human brain. Starting from some linguistic, psycholinguistic and neuro-physiological evidence supporting a dynamic view of the mental lexicon as an integrative system, we illustrate Temporal Self Organising-Maps (TSOMs), artificial neural networks that can model such a view by memorising time series of symbolic units (words) as routinized patterns of short-term node activation. On the basis of a simple pool of principles of adaptive Hebbian synchronisation, TSOMs can perceive possible surface relations between word forms and store them by partially overlapping activation patterns, reflecting gradient levels of lexical specificity, from holistic to decompositional lexical representations. We believe that TSOMs offer an algorithmic model of the emergence of high-level, global and language-specific morphological structure through the working of low-level, language-aspecific processing functions, thus promising to bridge the persisting gap between high-level principles of grammar architecture (lexicon vs. rules), computational correlates (storage vs. processing) and low-level principles and localisations of brain functions. Extensions of the current TSOM architecture are envisaged and their theoretical implications are discussed},
KEYWORDS = {Mental lexicon, dynamic storage, parallel distributed processing, hebbian learning, temporal self-organising maps},
PAGES = {493--535},
URL = {http://jcs.snu.ac.kr/jcs/issue/vol16/no4/05+Marzi+and+Pirrelli.pdf},
VOLUME = {16},
NUMBER = {4},
ISSN = {1976-6939},
JOURNAL = {JOURNAL OF COGNITIVE SCIENCE},
}
@ARTICLE{PICCINI_2015_ARTICLE_P_395266,
AUTHOR = {Piccini, S.},
TITLE = {Transimpersonal constructions in Lithuanian: towards the emergence of Split Intransitivity},
YEAR = {2015},
ABSTRACT = {Transimpersonalines konstrukcijos pastaruoju metu yra patraukusios daugelio tyreju, ypac funkcines tipologijos specialistu, demesi, kadangi jos atlieka svarbu vaidmeni formuojantis dalinio intranzityvumo (ang. split intransitivity) modeliams ivairiose kalbose. Straipsnyje naujausiu pasiekimu sviesoje ivertinamos kai kurios lietuviu kalbos konstrukcijos, gramatikose laikomos beasmenemis (, impersonalinemis"), meginant interpretuoti jas kaip transimpersonalines. Tyrimas atliktas is sinchronines perspektyvos, didziausia demesi skiriant dabartinei bendrinei kalbai, taciau tam tikrais atvejais lyginama ir su senosios lietuviu kalbos ir ypac tarmiu duomenimis. Analize remiasi fizine bukle nusakanciais veiksmazodziais, kurie priklausomai nuo reiksmes gali buti vartojami ivairiose sintaksinese konstrukcijose. Sinchroniname lygmenyje matomas skirtingas siu eksperienciniu veiksmazodziu elgesys gali buti projektuojamas diachronineje perspektyvoje. Taip galima geriau isryskinti ivairius reanalizes proceso, rodancio laipsniska raida dalinio intranzityvumo atsiradimo kryptimi, etapus. Kai kurie veiksmazodziai, atrodo, reanalizes kelyje yra pazenge gana toli, taciau tikrieji dalinio intranzityvumo modeliai dar nesusiformave. Analizuojamuju veiksmazodziu eksperienciniu argumentu subjekto statusas sintakses poziuriu tebelieka problemiskas},
KEYWORDS = {verbi impersonali, codifica non canonica del soggetto, lituano, intransitività scissa},
PAGES = {19--55},
URL = {http://www.baltistica.lt/index.php/baltistica/article/view/2239/2214},
VOLUME = {50},
NUMBER = {1},
DOI = {10.15388/baltistica.50.1.2239},
ISSN = {0132-6503},
JOURNAL = {BALTISTICA},
}
@book{CHIARELLA_2015_BOOK_CCLM_306227,
  author   = {Chiarella, D. and Cutugno, P. and Lucentini, R. and Marconi, L.},
  title    = {Glossario Italiano-Spagnolo. Le parole dei servizi demografici},
  year     = {2015},
  isbn     = {9788880801610},
  url      = {https://iris.cnr.it/handle/20.500.14243/306227},
  abstract = {Il glossario è stato realizzato nell'ambito del progetto "Ascolto Accoglienza Azioni Offresi (AAA Offresi)", finanziato dal Fondo Europeo per l'Integrazione di cittadini di paesi terzi (FEI)-Ministero dell'Interno. Le lingue in cui il glossario è stato tradotto sono: albanese, arabo, cinese, spagnolo, ucraino. Il glossario è stato realizzato da ILC-CNR, U. O. S. di Genova e contiene 423 ingressi; è il risultato di elaborazioni effettuate nel corso del progetto e di successive selezioni effettuate dal gruppo di ricerca su parole ritenute di difficile comprensione presenti nella modulistica dei Servizi Demografici del Comune di Genova. Le parole o gli insiemi di parole sono dotate di una breve spiegazione collegata all'uso nella modulistica; l'informazione in ogni volume è fornita in italiano ed è seguita dalla traduzione in una delle lingue citate. Per facilitare il recupero delle parole è stato scelto di strutturare un indice che contiene, per ogni lemma del glossario, il riferimento alla pagina dove è possibile trovarlo con la relativa traduzione. Nell'indice compare, insieme al lemma, anche il plurale di alcune parole che sono presenti in tal forma nella modulistica. Il glossario ha due scopi principali: il primo, fornire un supporto, a un cittadino di un paese terzo, nella compilazione della modulistica dei servizi demografici del Comune di Genova; il secondo, agevolare il front office dei servizi demografici nella comunicazione con l'utente},
}
@book{CHIARELLA_2015_BOOK_CCLM_306225,
  author   = {Chiarella, D. and Cutugno, P. and Lucentini, R. and Marconi, L.},
  title    = {Glossario Italiano-Albanese. Le parole dei servizi demografici},
  year     = {2015},
  isbn     = {9788880801634},
  url      = {https://iris.cnr.it/handle/20.500.14243/306225},
  abstract = {Il glossario è stato realizzato nell'ambito del progetto "Ascolto Accoglienza Azioni Offresi (AAA Offresi)", finanziato dal Fondo Europeo per l'Integrazione di cittadini di paesi terzi (FEI)-Ministero dell'Interno. Le lingue in cui il glossario è stato tradotto sono: albanese, arabo, cinese, spagnolo, ucraino. Il glossario è stato realizzato da ILC-CNR, U. O. S. di Genova e contiene 423 ingressi; è il risultato di elaborazioni effettuate nel corso del progetto e di successive selezioni effettuate dal gruppo di ricerca su parole ritenute di difficile comprensione presenti nella modulistica dei Servizi Demografici del Comune di Genova. Le parole o gli insiemi di parole sono dotate di una breve spiegazione collegata all'uso nella modulistica; l'informazione in ogni volume è fornita in italiano ed è seguita dalla traduzione in una delle lingue citate. Per facilitare il recupero delle parole è stato scelto di strutturare un indice che contiene, per ogni lemma del glossario, il riferimento alla pagina dove è possibile trovarlo con la relativa traduzione. Nell'indice compare, insieme al lemma, anche il plurale di alcune parole che sono presenti in tal forma nella modulistica. Il glossario ha due scopi principali: il primo, fornire un supporto, a un cittadino di un paese terzo, nella compilazione della modulistica dei servizi demografici del Comune di Genova; il secondo, agevolare il front office dei servizi demografici nella comunicazione con l'utente},
}
@book{CHIARELLA_2015_BOOK_CCLM_306231,
  author   = {Chiarella, D. and Cutugno, P. and Lucentini, R. and Marconi, L.},
  title    = {Glossario Italiano-Arabo. Le parole dei servizi demografici},
  year     = {2015},
  isbn     = {9788880801641},
  url      = {https://iris.cnr.it/handle/20.500.14243/306231},
  abstract = {Il glossario è stato realizzato nell'ambito del progetto "Ascolto Accoglienza Azioni Offresi (AAA Offresi)", finanziato dal Fondo Europeo per l'Integrazione di cittadini di paesi terzi (FEI)-Ministero dell'Interno. Le lingue in cui il glossario è stato tradotto sono: albanese, arabo, cinese, spagnolo, ucraino. Il glossario è stato realizzato da ILC-CNR, U. O. S. di Genova e contiene 423 ingressi; è il risultato di elaborazioni effettuate nel corso del progetto e di successive selezioni effettuate dal gruppo di ricerca su parole ritenute di difficile comprensione presenti nella modulistica dei Servizi Demografici del Comune di Genova. Le parole o gli insiemi di parole sono dotate di una breve spiegazione collegata all'uso nella modulistica; l'informazione in ogni volume è fornita in italiano ed è seguita dalla traduzione in una delle lingue citate. Per facilitare il recupero delle parole è stato scelto di strutturare un indice che contiene, per ogni lemma del glossario, il riferimento alla pagina dove è possibile trovarlo con la relativa traduzione. Nell'indice compare, insieme al lemma, anche il plurale di alcune parole che sono presenti in tal forma nella modulistica. Il glossario ha due scopi principali: il primo, fornire un supporto, a un cittadino di un paese terzo, nella compilazione della modulistica dei servizi demografici del Comune di Genova; il secondo, agevolare il front office dei servizi demografici nella comunicazione con l'utente},
}
@book{CHIARELLA_2015_BOOK_CCLM_306233,
  author   = {Chiarella, D. and Cutugno, P. and Lucentini, R. and Marconi, L.},
  title    = {Glossario Italiano-Ucraino. Le parole dei servizi demografici},
  year     = {2015},
  isbn     = {9788880801627},
  url      = {https://iris.cnr.it/handle/20.500.14243/306233},
  abstract = {Il glossario è stato realizzato nell'ambito del progetto "Ascolto Accoglienza Azioni Offresi (AAA Offresi)", finanziato dal Fondo Europeo per l'Integrazione di cittadini di paesi terzi (FEI)-Ministero dell'Interno. Le lingue in cui il glossario è stato tradotto sono: albanese, arabo, cinese, spagnolo, ucraino. Il glossario è stato realizzato da ILC-CNR, U. O. S. di Genova e contiene 423 ingressi; è il risultato di elaborazioni effettuate nel corso del progetto e di successive selezioni effettuate dal gruppo di ricerca su parole ritenute di difficile comprensione presenti nella modulistica dei Servizi Demografici del Comune di Genova. Le parole o gli insiemi di parole sono dotate di una breve spiegazione collegata all'uso nella modulistica; l'informazione in ogni volume è fornita in italiano ed è seguita dalla traduzione in una delle lingue citate. Per facilitare il recupero delle parole è stato scelto di strutturare un indice che contiene, per ogni lemma del glossario, il riferimento alla pagina dove è possibile trovarlo con la relativa traduzione. Nell'indice compare, insieme al lemma, anche il plurale di alcune parole che sono presenti in tal forma nella modulistica. Il glossario ha due scopi principali: il primo, fornire un supporto, a un cittadino di un paese terzo, nella compilazione della modulistica dei servizi demografici del Comune di Genova; il secondo, agevolare il front office dei servizi demografici nella comunicazione con l'utente},
}
@book{CHIARELLA_2015_BOOK_CCLM_306229,
  author   = {Chiarella, D. and Cutugno, P. and Lucentini, R. and Marconi, L.},
  title    = {Glossario Italiano-Cinese. Le parole dei servizi demografici},
  year     = {2015},
  isbn     = {9788880801658},
  url      = {https://iris.cnr.it/handle/20.500.14243/306229},
  abstract = {Il glossario è stato realizzato nell'ambito del progetto "Ascolto Accoglienza Azioni Offresi (AAA Offresi)", finanziato dal Fondo Europeo per l'Integrazione di cittadini di paesi terzi (FEI)-Ministero dell'Interno. Le lingue in cui il glossario è stato tradotto sono: albanese, arabo, cinese, spagnolo, ucraino. Il glossario è stato realizzato da ILC-CNR, U. O. S. di Genova e contiene 423 ingressi; è il risultato di elaborazioni effettuate nel corso del progetto e di successive selezioni effettuate dal gruppo di ricerca su parole ritenute di difficile comprensione presenti nella modulistica dei Servizi Demografici del Comune di Genova. Le parole o gli insiemi di parole sono dotate di una breve spiegazione collegata all'uso nella modulistica; l'informazione in ogni volume è fornita in italiano ed è seguita dalla traduzione in una delle lingue citate. Per facilitare il recupero delle parole è stato scelto di strutturare un indice che contiene, per ogni lemma del glossario, il riferimento alla pagina dove è possibile trovarlo con la relativa traduzione. Nell'indice compare, insieme al lemma, anche il plurale di alcune parole che sono presenti in tal forma nella modulistica. Il glossario ha due scopi principali: il primo, fornire un supporto, a un cittadino di un paese terzo, nella compilazione della modulistica dei servizi demografici del Comune di Genova; il secondo, agevolare il front office dei servizi demografici nella comunicazione con l'utente},
}
@INCOLLECTION{BELLANDI_2015_INCOLLECTION_B_348541,
AUTHOR = {Bellandi, A.},
TITLE = {Towards a Translation Platform as a Bridge Between Ancient and Modern Languages. Part II: A Research Infrastructure for Translation and Interpretation of Ancient Texts},
YEAR = {2015},
ABSTRACT = {Il contributo presenta la definizione e la realizzazione di una piattaforma web collaborativa per il supporto alla traduzione di lingue antiche in lingue moderne, portando l'esempio del Progetto di Traduzione del Talmud Babilonese in Italiano},
URL = {https://iris.cnr.it/handle/20.500.14243/348541},
ISBN = {9788822263933},
}
@INCOLLECTION{BRANDO_2015_INCOLLECTION_BFG_292095,
AUTHOR = {Brando, C. and Frontini, F. and Ganascia, J.},
TITLE = {Disambiguation of Named Entities in Cultural Heritage Texts Using Linked Data Sets},
YEAR = {2015},
ABSTRACT = {This paper proposes a graph-based algorithm baptized REDEN for the disambiguation of authors' names in French literary criticism texts and scientific essays from the 19th century. It leverages knowledge from different Linked Data sources in order to select candidates for each author mention, then performs fusion of DBpedia and BnF individuals into a single graph, and finally decides the best referent using the notion of graph centrality. Some experiments are conducted in order to identify the best size of disambiguation context and to assess the influence on centrality of specific relations represented as edges. This work will help scholars to trace the impact of authors' ideas across different works and time periods},
KEYWORDS = {Named-entity disambiguation, Centrality, Linked data, Data fusion, Digital humanities},
PAGES = {505--514},
URL = {http://link.springer.com/chapter/10.1007%2F978-3-319-23201-0_51},
DOI = {10.1007/978-3-319-23201-0_51},
ISBN = {978-3-319-23200-3},
BOOKTITLE = {New Trends in Databases and Information Systems},
EDITOR = {Morzy, T. and Valduriez, P. and Bellatreche, L.},
}
@INCOLLECTION{BURGASSI_2015_INCOLLECTION_B_357042,
AUTHOR = {Burgassi, C.},
TITLE = {volgarizzamenti di Livio (già attribuiti a Boccaccio): appunti sul testo e sulla tradizione},
YEAR = {2015},
ABSTRACT = {The medieval translations of Livy's work are particularly interesting because of their doubtful provenance. Even if they aren't signed, certain scholars have attributed some of these weighty translations to the pen of Giovanni Boccaccio. This paper takes into consideration certain aspects of the language and style of the volgarizzamenti of Livy's Third Decade, paying special attention to the two different translations into volgare of the first four books. On one hand, we highlight the differences in language and style, underlying the two "philosophies" behind the practice of vulgarization. On the other hand, we demonstrate that each translation shows a different knowledge of Latin. Finally, we analyze the tradition of the original Latin text. Particular attention is dedicated to the spurious fragment (the so-called «additamentum Allifanum») which is translated in both vulgarizations. This allows us not only to identify the branch of the Latin tradition on which the two volgarizzamenti are based, but also to hypothesize that the original Latin text comes from the monastery of Monte Cassino},
KEYWORDS = {Volgarizzamenti, Tito Livio, Boccaccio},
PAGES = {139--147},
URL = {https://iris.cnr.it/handle/20.500.14243/357042},
PUBLISHER = {Longo},
ADDRESS = {Ravenna, Italy},
ISBN = {978-88-8063-827-8},
CONFERENCE_PLACE = {Ravenna},
BOOKTITLE = {Boccaccio 1313-2013},
EDITOR = {Ciabattoni, F. and Filosa, E. and Olson, K.},
}
@INCOLLECTION{GUADAGNINI_2015_INCOLLECTION_G_268593,
AUTHOR = {Guadagnini, E.},
TITLE = {«Secondo la forma del libro»: note sulla tradizione manoscritta della ``Rettorica'' di Brunetto Latini},
YEAR = {2015},
ABSTRACT = {This paper examines some neglected aspects of the textual tradition of Brunetto Latini's Rettorica. It deals first with some texts coming along with Brunetto's work in the manuscript tradition: this is particularly the case of the Fiore di rettorica. The mise en page is then considered: as usually happens when dealing with typical study books, the Rettorica presents a changing writing module (a major one for Cicero's words, and a minor one for the glosses) and a series of schemes ("trees") aiming to illustrate some of this treatise's key concepts. The analysis of such paratextual elements through the entire span of the textual tradition (eight manuscripts) shows a diachronic evolution eventually leading to the obliteration of Brunetto's original book model},
KEYWORDS = {Filologia italiana, Brunetto Latini},
PAGES = {355--367},
URL = {https://iris.cnr.it/handle/20.500.14243/268593},
PUBLISHER = {Edizioni del Galluzzo},
ADDRESS = {Impruneta, Italy},
ISBN = {9788884504777},
CONFERENCE_PLACE = {Firenze},
BOOKTITLE = {Il Ritorno dei Classici nell'Umanesimo. Studi in memoria di Gianvito Resta},
EDITOR = {Albanese, G. and Ciociola, C. and Cortesi, M. and Villa, C.},
}
@INCOLLECTION{MARCHETTI_2015_INCOLLECTION_MMM_308101,
AUTHOR = {Marchetti, A. and Marchi, S. and Maria Morales, M.},
TITLE = {Il progetto Clavius on the Web entra nelle scuole},
YEAR = {2015},
ABSTRACT = {Il progetto Clavius on the Web (CoW) costituisce il frutto della collaborazione tra l'Archivio storico della Pontificia Università Gregoriana (APUG), l'Istituto di Informatica e Telematica (IIT) e l'Istituto di Linguistica Computazionale "Antonio Zampolli" (ILC), questi ultimi due afferenti al Consiglio Nazionale delle Ricerche di Pisa. CoW è iniziato nel 2012, anno in cui ricorreva il quarto centenario della morte del matematico gesuita Christophorus Clavius (1537-1612). Tedesco di Bamberga, professore presso il Collegio Romano, Clavius era considerato una delle massime autorità dei suoi tempi per ciò che concerneva le scienze matematiche. Egli fu, infatti, il maestro dei primi quadri scientifici della Compagnia di Gesù e grazie al suo insegnamento alcuni missionari come Matteo Ricci (1552-1610) o Giovanni Antonio Rubino (1578-1643) riuscirono a condurre con mezzi non esclusivamente teologici la loro opera di missione in Asia. Oggi si ricorda Clavius principalmente per il suo contributo alla riforma gregoriana del calendario, approvata nel 1582 su un modello proposto da Luigi Lilio (1510-1576), successivamente perfezionato dal gesuita tedesco},
KEYWORDS = {Digital Humanities, Cultural Heritage, TEI, XML, Information Visualization, School},
PAGES = {74-84},
URL = {http://digitalia.sbn.it/article/download/1476/983},
PUBLISHER = {ICCU-Istituto Centrale per il Catalogo Unico (Roma, ITA)},
CONFERENCE_PLACE = {Roma},
BOOKTITLE = {Rivista del digitale nei beni culturali},
}
@INCOLLECTION{MARCHI_2015_INCOLLECTION_M_337084,
AUTHOR = {Marchi, S.},
TITLE = {GREEK INTO ARABIC, A RESEARCH INFRASTRUCTURE BASED ON COMPUTATIONAL MODULES TO ANNOTATE AND QUERY HISTORICAL AND PHILOSOPHICAL DIGITAL TEXTS Part ii. System components and features},
YEAR = {2015},
ABSTRACT = {Computer technology nowadays allows users to build simple and effective tools designed to meet the needs of researchers and institutions in various fields of research. Since its creation, the World Wide Web prompted the existence of an environment that breaks down the boundaries of time (i.e. synchronous activity) and space (i.e. location of activities), a prerequisite for the design of tools enabling the collaboration among users. Over the past years text processing systems have become part and parcel of the daily language of scholars working in the field of Humanities, despite some objections raised against this type of technology because of their apparent lack of simplicity of usage, appropriateness, and flexibility. Usage requires special attention with respect to the interface between the information system and the user, while appropriateness and flexibility have not been sufficiently taken into account, not to mention that these two desiderata almost seem to be in contrast to each other. Therefore, it is not easy to plan and implement a text processing system which is suitable for specific types of research and at the same time as flexible as to operate in various fields of research},
KEYWORDS = {textual scholarship, Collaborative Application, web application},
PAGES = {43-56},
URL = {http://www.olschki.it/libro/9788822263933},
PUBLISHER = {Leo S. Olschki (Firenze, ITA)},
ISBN = {9788822263933},
CONFERENCE_PLACE = {Firenze},
BOOKTITLE = {Digital texts, translations, lexicons in a multi-modular web application: methods and samples},
EDITOR = {Bozzi, A.},
}
@INCOLLECTION{MORGAVI_2015_INCOLLECTION_MNMCFCM_297268,
AUTHOR = {Morgavi, G. and Nerino, R. and Marconi, L. and Cutugno, P. and Ferraris, C. and Cinini, A. and Morando, M.},
TITLE = {An Integrated Approach to the Well-Being of the Elderly People at Home},
YEAR = {2015},
ABSTRACT = {The paper presents the outline and the preliminary developments of NINFA (iNtelligent Integrated Network For Aged people), a project for the well-being of the elderly people at home. This architecture is based on a service platform suited for elder people called the Virtual Village Network, whose user interface allows to deliver different services at home, namely: user supervision, communication and interaction among users for social inclusion, exergame delivering, monitoring of the wellness status},
KEYWORDS = {ICT platform, Wellness network services, 3D movement analysis, Linguistic and cognitive analysis, exergames, "at-home" technologies},
PAGES = {265-274},
URL = {https://iris.cnr.it/handle/20.500.14243/297268},
DOI = {10.1007/978-3-319-18374-9_25},
ISBN = {978-3-319-18373-2},
BOOKTITLE = {Springer-Ambient Assisted Living-Italian Forum 2014},
EDITOR = {Andò, B. and Siciliano, P. and Marletta, V. and Monteriù, A.},
}
@INCOLLECTION{PICCINI_2015_INCOLLECTION_PR_401726,
AUTHOR = {Piccini, S. and Ruimy, N.},
TITLE = {Plotiterm: Une Ressource Termino-Ontologique du Vocabulaire Plotinien},
YEAR = {2015},
ABSTRACT = {L'articolo presenta la risorsa termino-ontologica bilingue (greco-araba) PLOTITERM, dedicata alla terminologia delle Enneadi di Plotino e della loro traduzione in lingua araba, conosciuta sotto il nome di pseudo-Teologia di Aristotele. Sia il livello linguistico sia il livello concettuale hanno ricevuto una strutturazione formale nel linguaggio OWL-DL},
KEYWORDS = {lessicografia computazionale, lessico filosofico, Plotino, ontologie},
PAGES = {105-137},
URL = {https://iris.cnr.it/handle/20.500.14243/401726},
PUBLISHER = {Leo S. Olschki (Firenze, ITA)},
ISBN = {9788822263933},
CONFERENCE_PLACE = {Firenze},
BOOKTITLE = {Digital Texts, Translations, Lexicons in a Multi-Modular Web Application: Methods and Samples},
EDITOR = {Bozzi, A.},
}
@INCOLLECTION{PIRRELLI_2015_INCOLLECTION_PFM_290722,
AUTHOR = {Pirrelli, V. and Ferro, M. and Marzi, C.},
TITLE = {Computational complexity of abstractive morphology},
YEAR = {2015},
ABSTRACT = {Abstractive and constructive approaches to word structure make radically different assumptions concerning nature and role of the building blocks that make up a speaker's morphological competence. In this contribution, we show that the two views are also computationally different. In particular, we contend that a number of problems arising in connection with a subsymbolic implementation of the constructive view (as epitomised by classical multi-layered perceptrons) are tackled effectively, or disappear altogether, in a neurally-inspired implementation of associative networks, resting on key-notions such as self-organization and emergence. A particular variant of Kohonen's Self-Organizing Map is introduced as a model to explore and assess the implications of an abstractive approach in terms of its computational complexity. Details of the model (Temporal Self-Organizing Map, TSOM) and experimental data are shown to illustrate the interplay between processing and storage in language acquisition},
KEYWORDS = {Word processing, computational complexity, mental lexicon, dynamic memories, self-organisation, word structure, morphology},
PAGES = {141-166},
URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-84938781714\&origin=inward},
DOI = {10.1093/acprof:oso/9780198723769.003.0008},
PUBLISHER = {Oxford University Press (Oxford, GBR)},
ISBN = {978-0-19-872376-9},
CONFERENCE_PLACE = {Oxford},
BOOKTITLE = {Understanding and Measuring Morphological Complexity},
EDITOR = {Baerman, M. and Brown, D. and Corbett, G. G.},
}
@INCOLLECTION{RUSSO_2015_INCOLLECTION_RR_320885,
AUTHOR = {Russo, I. and Robaldo, L.},
TITLE = {From language to action: Extraction and disambiguation of affordances in ModelAct},
YEAR = {2015},
ABSTRACT = {In this paper we focus on how information about concrete actions performed on food should be provided to IoT devices in terms of affordances extracted from corpora. Natural language processing has a role in defining which kind of knowledge devices interacting with machines and appliances should handle when humans send requests through natural language interfaces. We propose a model for the extraction of affordances of food from corpora and their role in sequences of procedural (sub)actions. The food processor of the future can find helpful this knowledge to interact with users suggesting alternatives in food processing in recipes steps and basic reasoning about preconditions and consequences in making meals},
URL = {https://iris.cnr.it/handle/20.500.14243/320885},
DOI = {10.1007/978-3-319-19656-5_15},
ISBN = {978-3-319-19655-8},
}
@INCOLLECTION{SAGRI_2015_INCOLLECTION_STVM_340887,
AUTHOR = {Sagri, M. and Tiscornia, D. and Venturi, G. and Montemagni, S.},
TITLE = {Neuroscienze e genetica comportamentale in un corpus di sentenze italiane alla luce dei risultati di elaborazioni linguistico-computazionali},
YEAR = {2015},
ABSTRACT = {Il contributo intende illustrare i primi risultati di uno studio, tutt'ora in corso, finalizzato a monitorare evoluzione e mutamenti dell'uso della neurogenetica e delle neuroscienze all'interno del sistema della giustizia in Italia},
URL = {https://iris.cnr.it/handle/20.500.14243/340887},
ISBN = {9788849529326},
}
@INCOLLECTION{SIMI_2015_INCOLLECTION_SMB_297500,
AUTHOR = {Simi, M. and Montemagni, S. and Bosco, C.},
TITLE = {Harmonizing and merging Italian treebanks: Towards a merged Italian dependency treebank and beyond},
YEAR = {2015},
ABSTRACT = {In this paper we address the challenge of combining existing CoNLL-compliant dependency-annotated corpora with the final aim of constructing a bigger treebank for the Italian language. To this end, we defined a methodology for mapping different annotation schemes, based on: (i) The analysis of similarities and differences of considered source and target dependency annotation schemes; (ii) The analysis of the performance of state of the art dependency parsers trained on the source and target treebanks; (iii) The mapping of the source annotation scheme(s) onto a set of target (possibly underspecified) data categories. This methodology was applied in two different case studies. The first one was aimed at constructing a "Merged Italian Dependency Treebank" (MIDT) starting from existing Italian dependency treebanks, namely TUT and ISST-TANL. The second case study, still ongoing, consists in the conversion of the MIDT resource into the Stanford Dependencies de facto standard with the final aim of developing an "Italian Stanford Dependency Treebank" (ISDT)},
KEYWORDS = {Harmonization and merging of resources, Italian, Dependency Treebank},
PAGES = {3-23},
URL = {http://www.scopus.com/inward/record.url?eid=2-s2.0-84927143016\&partnerID=q2rCbXpz},
DOI = {10.1007/978-3-319-14206-7_1},
PUBLISHER = {Springer International Publishing (CH-6330 Cham (ZG), CHE)},
ISBN = {978-3-319-14205-0},
CONFERENCE_PLACE = {CH-6330 Cham (ZG)},
BOOKTITLE = {Harmonization and Development of Resources and Tools for Italian Natural Language Processing within the PARLI Project},
EDITOR = {Basili, R. and Bosco, C. and Delmonte, R. and Moschitti, A. and Simi, M.},
}
@INCOLLECTION{SORIA_2015_INCOLLECTION_S_420848,
AUTHOR = {Soria, C.},
TITLE = {Language Technologies for Digital Language Diversity},
YEAR = {2015},
ABSTRACT = {According to the research carried out by the META-NET European Excellence Network, 30 European languages are at risk of digital extinction. Such a risk occurs when usability of a language over digital tools and devices is seriously compromised, essentially because of a total or partial lack of sufficient language technologies. Insufficient support can rapidly put a language in a condition where the contexts of digital use are eroded, or are never accessible. Examples of digital use range from sheer availability of contents over the web, to the possibility to access contents written in a different language, thanks to machine translation applications; the availability of voice interfaces, ebooks, edu-tainment applications, etc. Shrinking contexts of uses can have a devastating effect, eventually leading to the abandonment of a language in favor of another, better supported one. Should this happen, the consequences for a language profile would be dramatic: any language that cannot be used over digital contexts will engage in a "digital diglossia" relationship with another, better supported language. In order to act and put preventive measures into place, it is of utmost importance to have an instrument that allows to evaluate the degree of digital vitality of a language, namely its functional capacity in the new contexts of use and the new media. In this paper we intend to make a reflection over the importance of language diversity in general and in the particular context of digital applications, by showing the breadth and depth of research and technology needed to support the actual usability of languages over digital devices. A preliminary agenda for fostering digital language vitality is then presented, together with preventive measures needed in order to ensure a safe level of digital language diversity},
KEYWORDS = {Digital language diversity, language technology, linguistic digital divide, non-dominant languages},
PAGES = {47-60},
URL = {https://dom.lndb.lv/data/obj/765930.html},
}
@INCOLLECTION{SORIA_2015_INCOLLECTION_S_297723,
AUTHOR = {Soria, C.},
TITLE = {Assessing the effect of official recognition on the vitality of minority and regional languages: a case study from Italy},
YEAR = {2015},
ABSTRACT = {In 1999, a rather controversial Italian law granted official recognition to twelve endangered regional and minority languages but denied it to others that were nevertheless also classed as endangered by UNESCO and the Ethnologue. This turn of events has produced a perfect scenario to assess the impact of language policies on protected languages and, at the same time, the effects of lack of official protection and recognition for languages that are denied such institutional support. This chapter presents the results of a survey carried out among speakers of these endangered languages. It assesses their vitality in terms of speaker numbers, domains of use, intergenerational transmission and speaker attitudes, arguing that a correlation can be established, on the one hand, between positive speaker attitudes and favourable language policies and, on the other, between lack of policy support and negative language attitudes. The chapter further argues language policy can actually alter linguistic behaviour},
KEYWORDS = {language policy, endangered languages, regional languages},
PAGES = {123-137},
URL = {https://iris.cnr.it/handle/20.500.14243/297723},
PUBLISHER = {Cambridge university press (Cambridge, GBR)},
ISBN = {978-1-107-09922-7},
CONFERENCE_PLACE = {Cambridge},
BOOKTITLE = {Policy and Planning for Endangered Languages},
EDITOR = {Jones, M. C.},
}
@EDITORIAL{PIRRELLI_2015_EDITORIAL_PMF_290958,
AUTHOR = {Pirrelli, V. and Marzi, C. and Ferro, M.},
TITLE = {Proceedings of the NetWordS Final Conference on Word Knowledge and Word Usage: Representations and Processes in the Mental Lexicon},
YEAR = {2015},
ABSTRACT = {The international conference "Word Knowledge and Word Usage: Representations and processes in the mental lexicon" is the final outcome of 4 years of intense multi-disciplinary research networking and cooperation funded by the European Science Foundation within the framework of the NetWordS programme (May 2011-April 2015). NetWordS' mission was to bring together experts of various research fields (from brain sciences and computing to cognition and linguistics) and of different theoretical inclinations, to advance the current awareness of theoretical, typological, psycholinguistic, computational and neurophysiological evidence on the structure and processing of words, with a view to developing novel research paradigms and bringing up a new generation of language scholars. The conference was intended to provide a first forum for assessing current progress of crossdisciplinary research on language architecture and usage, and discussing prospects of future synergy. People are known to memorise, parse and access words in a context-sensitive and opportunistic way, by caching their most habitual and productive processing patterns into routinized behavioural schemes. Speakers not only take advantage of token-based information such as frequency of individual, holistically stored words, but they are also able to organise stored words through paradigmatic structures (or word families) whose overall size and frequency is an important determinant of ease of lexical access and interpretation. Accordingly, lexical organisation is not necessarily functional to descriptive economy and minimisation of storage, but to more performance-oriented factors such as efficiency of memorisation, access and recall. 
Usage-based approaches to word processing lend support to this view, to promote explanatory frameworks that aim to investigate the stable correlation patterns linking distributional entrenchment of lexical units with productivity, internal structure and ease of interpretation. Ultimately, this is intended to establish a deep interconnection between performance-oriented, low-level lexical functions such as memorisation, rehearsal, access and recall, and their neuroanatomical correlates},
KEYWORDS = {mental lexicon, linguistics, brain sciences, psycholinguistics, computing, cognition},
PAGES = {1-189},
URL = {http://ceur-ws.org/Vol-1347/},
VOLUME = {1347},
PUBLISHER = {CEUR-WS.org (Aachen, DEU)},
CONFERENCE_PLACE = {Aachen},
}
@INPROCEEDINGS{ALBANESI_2015_INPROCEEDINGS_ABBDG_289694,
AUTHOR = {Albanesi, D. and Bellandi, A. and Benotto, G. and Di Segni, G. and Giovannetti, E.},
TITLE = {When Translation Requires Interpretation: Collaborative Computer-Assisted Translation of Ancient Texts},
YEAR = {2015},
ABSTRACT = {This paper introduces the main features of Traduco, a Web-based, collaborative Computer-Assisted Translation (CAT) tool developed to support the translation of ancient texts. In addition to the standard components offered by traditional CAT tools, Traduco includes a number of features designed to ease the translation of ancient texts, such as the Babylonian Talmud, posing specific structural, stylistic, linguistic and hermeneutical challenges},
KEYWORDS = {Computer-Assisted Translation, Babylonian Talmud},
PAGES = {84-88},
URL = {https://iris.cnr.it/handle/20.500.14243/289694},
ISBN = {978-1-941643-63-1},
CONFERENCE_NAME = {9th SIGHUM Workshop on Language Technology for Cultural Heritage, Social Sciences, and Humanities (LaTeCH 2015)},
BOOKTITLE = {Proceedings of the 9th SIGHUM Workshop on Language Technology for Cultural Heritage, Social Sciences, and Humanities},
}
@INPROCEEDINGS{ANGIOLINI_2015_INPROCEEDINGS_ARDSRV_381996,
AUTHOR = {Angiolini, A. and Rossi, F. and Di Donato, F. and Salvatori, E. and Rosati, L. and Vitali, S.},
TITLE = {Digital humanities: Crafts and occupations},
YEAR = {2015},
ABSTRACT = {This panel aims at discussing about new crafts and occupations in the Digital Humanities domain. Some experts in different contexts (publishing house, computer agency, freelance professional, library, archive, and university) are asked to reflect on the role of Digital Humanities in refining traditional working practices and methods},
URL = {https://iris.cnr.it/handle/20.500.14243/381996},
DOI = {10.1145/2802612.2802630},
}
@INPROCEEDINGS{BANTERLE_2015_INPROCEEDINGS_BCMPGAS_296082,
AUTHOR = {Banterle, F. and Cardillo, F. A. and Malomo, L. and Pingi, P. and Gabellone, F. and Amato, G. and Scopigno, R.},
TITLE = {LecceAR: an augmented reality App},
YEAR = {2015},
ABSTRACT = {This paper discusses a case study on the use of augmented reality (AR) within the context of cultural heritage. We implemented an iOS app for markerless AR that will be exhibited at the MUST museum in Lecce, Italy. The app shows a rich 3D reconstruction of the Roman amphitheater, which is nowadays only partially visible. The use of state-of-the-art algorithms in computer graphics and computer vision allows the viewing and the exploration of the ancient theater in real-time},
KEYWORDS = {Augmented Reality, Image processing and Computer vision, Picture/Image generation display algorithms},
PAGES = {99-108},
URL = {https://www.ceeol.com/search/article-detail?id=283512},
VOLUME = {5},
DOI = {10.55630/dipp.2015.5.9},
PUBLISHER = {Institute of Mathematics and Informatics at the Bulgarian Academy of Sciences (Sofia, Bulgaria)},
ISSN = {2535-0366},
CONFERENCE_NAME = {Digital Presentation and Preservation of Cultural and Scientific Heritage},
CONFERENCE_PLACE = {Sofia, Bulgaria},
BOOKTITLE = {Digital Presentation and Preservation of Cultural and Scientific Heritage},
EDITOR = {Pavlov, R. and Stanchev, P.},
}
@INPROCEEDINGS{BARBAGLI_2015_INPROCEEDINGS_BLDMV_322147,
AUTHOR = {Barbagli, A. and Lucisano, P. and Dell'Orletta, F. and Montemagni, S. and Venturi, G.},
TITLE = {CItA: un Corpus di Produzioni Scritte di Apprendenti l'Italiano L1 Annotato con Errori},
YEAR = {2015},
ABSTRACT = {In questo articolo presentiamo CItA il primo corpus di produzioni scritte di apprendenti l'italiano L1 del primo e del secondo anno della scuola secondaria di primo grado annotato con errori grammaticali, ortografici e lessicali. Le specificità del corpus e la sua natura diacronica lo rendono particolarmente utile sia per applicazioni linguistico-computazionali sia per studi socio-pedagogici},
KEYWORDS = {Apprendimento della lingua madre, evoluzione delle competenze linguistiche},
PAGES = {31-35},
URL = {http://www.italianlp.it/wp-content/uploads/2016/03/CItA_errori.pdf},
PUBLISHER = {Accademia University Press (Torino, ITA)},
ISBN = {978-88-99200-62-6},
CONFERENCE_NAME = {2nd Italian Conference on Computational Linguistics (CLiC-it)},
CONFERENCE_PLACE = {Torino},
}
@INPROCEEDINGS{BELLANDI_2015_INPROCEEDINGS_BBG_264615,
AUTHOR = {Bellandi, A. and Bellusci, A. and Giovannetti, E.},
TITLE = {Computer Assisted Translation of Ancient Texts: the Babylonian Talmud Case Study},
YEAR = {2015},
ABSTRACT = {In this paper we introduce some of the features of the Computer Assisted Translation web application developed to support the translation of the Babylonian Talmud (BT) in Italian. The BT is a late antique Jewish anthological corpus, which, as other ancient texts, presents a number of hurdles related to its intrinsic linguistic and philological nature. In this work, we illustrate the solutions we adopted in the system, with particular emphasis on the Translation Memory and the translation suggestion component},
KEYWORDS = {computer-assisted translation, Babylonian Talmud, Translation Memory},
PAGES = {287-302},
URL = {https://www.degruyter.com/view/book/9781501501289/10.1515/9781501501289.287.xml},
DOI = {10.1515/9781501501289.287},
PUBLISHER = {De Gruyter Saur (Berlin/Munich, DEU)},
ISBN = {9781501501289},
CONFERENCE_NAME = {NLPCS 2014: 11th International Workshop on Natural Language Processing and Cognitive Science},
CONFERENCE_PLACE = {Berlin/Munich},
BOOKTITLE = {Natural Language Processing and Cognitive Science, Proceedings 2014},
EDITOR = {Sharp, B. and Delmonte, R.},
}
@INPROCEEDINGS{BIZZONI_2015_INPROCEEDINGS_BBDR_403996,
AUTHOR = {Bizzoni, Y. and Boschetti, F. and Del Gratta, R. and Reboul, M.},
TITLE = {Enhancing the Accuracy of Ancient Greek WordNet by Multilingual Distributional Semantics},
YEAR = {2015},
ABSTRACT = {We discuss a method to enhance the accuracy of a subset of the Ancient Greek WordNet based on the Homeric lexicon and the related conceptual network, by using multilingual semantic spaces built from aligned corpora},
KEYWORDS = {Distributional Semantics, WordNet, Ancient Greek},
URL = {https://books.openedition.org/aaccademia/1312},
ISBN = {978-88-99200-62-6},
CONFERENCE_NAME = {Second Italian Conference on Computational Linguistics CLiC-it 2015},
BOOKTITLE = {Second Italian Conference on Computational Linguistics CLiC-it 2015},
}
@INPROCEEDINGS{BOSCHETTI_2015_INPROCEEDINGS_BDDMDN_255756,
AUTHOR = {Boschetti, F. and Del Gratta, R. and Del Grosso, A. M. and Monachini, M. and Diakoff, H. and Nahli, O.},
TITLE = {Collaborative Philology on the way to Web Services: the case of CoPhiWordnet},
YEAR = {2015},
ABSTRACT = {Starting from previous initiatives of the CoPhiLab, we show how they can be reinterpreted as Web Services, especially when they become part of a wider scenario: Web Services are used to make connections between lexicons, semantic resources and a fine grained text management. Linked Open Data is chosen to be the paradigm used to link the different resources, but also as the modality of data presentation},
KEYWORDS = {Collaborative Philology, Web Services, Linked Open Data, Text Services, Text Interpretation},
URL = {https://iris.cnr.it/handle/20.500.14243/255756},
CONFERENCE_NAME = {The Second International Workshop on Worldwide Language Service Infrastructure, WLSI 2015},
BOOKTITLE = {The Second International Workshop on Worldwide Language Service Infrastructure, WLSI 2015},
}
@INPROCEEDINGS{BOSCHETTI_2015_INPROCEEDINGS_BDFKM_305311,
AUTHOR = {Boschetti, F. and Del Gratta, R. and Frontini, F. and Khan, F. and Monachini, M.},
TITLE = {(Re)thinking the BLARK for Ancient Greek},
YEAR = {2015},
ABSTRACT = {The paper discusses the Basic LAnguage Resource Kit (BLARK) for Ancient Greek, measuring the BLARK matrix against what is actually available for this language, and assessing its applicability to ancient languages in general. In addition, the BLARK and the FLaReNet recommendations are used to define priorities in the sector in close collaboration between philologists and the broader LRT community},
URL = {https://iris.cnr.it/handle/20.500.14243/305311},
ISBN = {978-83-932640-8-7},
}
@INPROCEEDINGS{BOUKHALED_2015_INPROCEEDINGS_BFG_297255,
AUTHOR = {Boukhaled, M. and Frontini, F. and Ganascia, J.},
TITLE = {A Peculiarity-based Exploration of Syntactical Patterns: a Computational Study of Stylistics},
YEAR = {2015},
ABSTRACT = {In this contribution, we present a computational stylistic study and comparison of classic French literary texts based on a data-driven approach where discovering interesting linguistic patterns is done without any prior knowledge. We propose an objective measure capable of capturing and extracting meaningful stylistic syntactic patterns from a given author's work. Our hypothesis is based on the fact that the most relevant syntactic patterns should significantly reflect the author's stylistic choice and thus they should exhibit some kind of peculiar overrepresentation behavior controlled by the author's purpose with respect to a linguistic norm. The analyzed results show the effectiveness in extracting interesting syntactic patterns from novels, and seem particularly promising for the analysis of such particular texts},
KEYWORDS = {Computational Stylistics, Interestingness Measure, Sequential Pattern Mining, Syntactic Style},
PAGES = {31-39},
URL = {http://ceur-ws.org/Vol-1410/paper5.pdf},
VOLUME = {1410},
CONFERENCE_NAME = {Workshop on Interactions between Data Mining and Natural Language Processing 2015 co-located with European Conference on Machine Learning and Principles and Practice of Knowledge Discovery in Databases (ECML PKDD 2015)},
}
@INPROCEEDINGS{BOUKHALED_2015_INPROCEEDINGS_BFG_294757,
AUTHOR = {Boukhaled, M. and Frontini, F. and Ganascia, J.},
TITLE = {Une mesure d'intérêt à base de surreprésentation pour l'extraction des motifs syntaxiques stylistiques},
YEAR = {2015},
ABSTRACT = {Dans cette contribution, nous présentons une étude sur la stylistique computationnelle des textes de la littérature classiques française fondée sur une approche conduite par données, où la découverte des motifs linguistiques intéressants se fait sans aucune connaissance préalable. Nous proposons une mesure objective capable de capturer et d'extraire des motifs syntaxiques stylistiques significatifs à partir d'un oeuvre d'un auteur donné. Notre hypothèse de travail est fondée sur le fait que les motifs syntaxiques les plus pertinents devraient refléter de manière significative le choix stylistique de l'auteur, et donc ils doivent présenter une sorte de comportement de surreprésentation contrôlé par les objectifs de l'auteur. Les résultats analysés montrent l'efficacité dans l'extraction de motifs syntaxiques intéressants dans le texte littéraire français classique, et semblent particulièrement prometteurs pour les analyses de ce type particulier de texte},
KEYWORDS = {Computational stylistic, text mining, syntactic patterns, interestingness measure},
PAGES = {391-396},
URL = {http://www.atala.org/taln_archives/TALN/TALN-2015/taln-2015-court-012.html},
CONFERENCE_NAME = {22e Conférence Sur Le Traitement Automatique Des Langues Naturelles (TALN 2015)},
BOOKTITLE = {Actes de La 22e Conférence Sur Le Traitement Automatique Des Langues Naturelles},
}
@INPROCEEDINGS{BRANDO_2015_INPROCEEDINGS_BFG_340774,
AUTHOR = {Brando, C. and Frontini, F. and Ganascia, J.},
TITLE = {Linked data for toponym linking in French literary texts},
YEAR = {2015},
ABSTRACT = {The present article discusses first experiments in toponym linking of Modern French digital editions aiming to provide an external referent to Linked Data sources. We have so far focused on testing two knowledge bases-French DBpedia and Geonames-for recall. Results highlight quality issues in these data sets for usage in NLP-tasks in domain-specific heritage texts},
KEYWORDS = {Named-Entity Linking, Linked Data, Digital Humanities},
URL = {https://iris.cnr.it/handle/20.500.14243/340774},
DOI = {10.1145/2837689.2837699},
ISBN = {978-1-4503-3937-7},
CONFERENCE_NAME = {GIR'15 9th Workshop on Geographic Information Retrieval},
BOOKTITLE = {GIR '15 Proceedings of the 9th Workshop on Geographic Information Retrieval},
EDITOR = {Purves, R. S. and Jones, C. B.},
}
@INPROCEEDINGS{BRUNATO_2015_INPROCEEDINGS_BD_321093,
AUTHOR = {Brunato, D. and Dell'Orletta, F.},
TITLE = {ISACCO: a corpus for investigating spoken and written language development in Italian school-age children},
YEAR = {2015},
ABSTRACT = {We present ISACCO (Italian school-age children corpus), a new corpus of oral and written retellings of Italian speaking children attending the primary school. All texts were digitalized and automatically enriched with linguistic information allowing preliminary explorations based on NLP features. Written retellings were also manually annotated with a typology of linguistic errors. The resource is conceived to support research and computational modeling of "later language acquisition", with an emphasis for comparative assessment of oral and written language skills across early school grades},
KEYWORDS = {Child language acquisition, Oral and written language, multi-level linguistic analysis},
PAGES = {62-66},
URL = {http://www.italianlp.it/wp-content/uploads/2016/03/IsaccoCorpus.pdf},
PUBLISHER = {Accademia University Press (Torino, ITA)},
ISBN = {978-88-99200-62-6},
CONFERENCE_NAME = {Second Italian Conference on Computational Linguistics (CLiC-it 2015)},
CONFERENCE_PLACE = {Torino},
BOOKTITLE = {Proceedings of the Second Italian Conference on Computational Linguistics (CLiC-it 2015)},
EDITOR = {Bosco, C. and Tonelli, S. and Zanzotto, F. M.},
}
@INPROCEEDINGS{BRUNATO_2015_INPROCEEDINGS_BDVM_296574,
AUTHOR = {Brunato, D. and Dell'Orletta, F. and Venturi, G. and Montemagni, S.},
TITLE = {Design and Annotation of the First Italian Corpus for Text Simplification},
YEAR = {2015},
ABSTRACT = {In this paper, we present design and construction of the first Italian corpus for automatic and semi-automatic text simplification. In line with current approaches, we propose a new annotation scheme specifically conceived to identify the typology of changes an original sentence undergoes when it is manually simplified. Such a scheme has been applied to two aligned Italian corpora, containing original texts with corresponding simplified versions, selected as representative of two different manual simplification strategies and addressing different target reader populations. Each corpus was annotated with the operations foreseen in the annotation scheme, covering different levels of linguistic description. Annotation results were analysed with the final aim of capturing peculiarities and differences of the different simplification strategies pursued in the two corpora},
KEYWORDS = {Annotation Scheme, Automatic Text Simplification},
PAGES = {31-34},
URL = {https://aclweb.org/anthology/W/W15/W15-1604.pdf},
ISBN = {978-1-941643-47-1},
CONFERENCE_NAME = {LAW IX-The 9th Linguistic Annotation Workshop},
BOOKTITLE = {Proceedings of LAW IX-The 9th Linguistic Annotation Workshop},
}
@INPROCEEDINGS{CHIARELLA_2015_INPROCEEDINGS_CBBCRZMC_302858,
  AUTHOR          = {Chiarella, D. and Bibuli, M. and Bruzzone, G. and Caccia, M. and Ranieri, A. and Zereik, E. and Marconi, L. and Cutugno, P.},
  TITLE           = {Gesture-based Language for Diver-Robot Underwater Interaction},
  CONFERENCE_NAME = {OCEANS 2015 MTS/IEEE-Genova},
  YEAR            = {2015},
  PAGES           = {9},
  DOI             = {10.1109/OCEANS-Genova.2015.7271710},
  URL             = {http://ieeexplore.ieee.org/xpl/articleDetails.jsp?arnumber=7271710\&filter=AND%28p_Publication_Number:7227859%29},
  KEYWORDS        = {gesture language, human robot interaction, mobile robots, underwater environment, marine systems},
  ABSTRACT        = {Underwater environment is characterized by harsh conditions and is difficult to monitor. The CADDY project deals with the development of a companion robot devoted to support and to monitor human operations and activities during the dive. In this scenario the communication and correct reception of messages between the diver and the robot are essential for success of the dive goals. However, the underwater environment poses a set of technical constraints hardly limiting the communication possibilities. For such reasons the solution proposed is to develop a communication language based on the consolidated and standardized diver gestures, commonly employed during professional and recreational dives, thus leading to the definition of a CADDY language, called CADDIAN, and a communication protocol. This article focuses on the creation of the language providing alphabet, syntax and semantics: future work will explain the part of recognition of gestures that is still in progress},
}
@INPROCEEDINGS{CHIARELLA_2015_INPROCEEDINGS_CCML_374035,
AUTHOR = {Chiarella, D. and Cutugno, P. and Marconi, L. and Lucentini, R.},
TITLE = {Domain-specific languages: a gesture-based approach for Human Robot Interaction in underwater environments},
YEAR = {2015},
ABSTRACT = {This paper introduces a gesture-based language for Human Robot Interaction (HRI) specifically aimed to divers. Divers generally operate in environments with harsh conditions and, at the same time, difficult to monitor; in this scenario, any sudden event can create an emergency situation that may compromise the immersion or even turns into worse consequences involving the safety of divers themselves. To cope with such situations, standard procedures suggest to dive in pairs and to follow well-defined rules to avoid the risk of accidents. However, these procedures may not be sufficient to avoid dangerous events such as failure in the breathing apparatus, burst eardrum, decompression sickness and nitrogen narcosis. FP7 CADDY project was developed to overcome these problems, with the idea to transfer robotics technology in diving: the main aim is improving the level of safety during diving. CADDY project focuses, in fact, on the development of a companion robot designed to support human operations and activities during the dive, as well as to monitor the status of the diver and in such a way to prevent harmful events. Various problems have to be confronted to provide the diver a reliable and useful supporting robotic vehicle: one of them is the development of a communication and interaction methodology that allows the diver and the robot to cooperate actively for the fulfilment of tasks required when diving. Communication and correct reception of messages between the diver and underwater robot are essential for the success of the objectives of immersion. However, the underwater environment poses a number of difficult technical constraints limiting the possibilities of communication (electro-magnetic waves strong attenuation and signal scattering and dispersion). The most reliable solution for underwater communication is acoustic technology, with two main drawbacks: high prices of devices and very low data rates. 
To solve these issues, the solution proposed is the development of a communication language (called CADDIAN) based, partly, on the consolidated and standardized diver gestures that are commonly employed during professional and recreational dives},
KEYWORDS = {domain-specific languages, human robot interaction, gesture-based language, underwater communication},
PAGES = {12},
URL = {https://iris.cnr.it/handle/20.500.14243/374035},
ISBN = {9789597152347},
CONFERENCE_NAME = {IX Conferencia Científica Internacional Lingüística},
}
@INPROCEEDINGS{CIGNONI_2015_INPROCEEDINGS_CFF_290986,
  AUTHOR          = {Cignoni, L. and Fornaciari, G. and Fornaciari, A.},
  TITLE           = {Many hands make light work: collaborative CLIL activities for University courses in Medieval funerary archaeology},
  CONFERENCE_NAME = {9th International Technology, Education and Development Conference},
  YEAR            = {2015},
  PAGES           = {2271-2279},
  ISBN            = {978-84-606-5763-7},
  URL             = {https://iris.cnr.it/handle/20.500.14243/290986},
  KEYWORDS        = {CLIL, collaborative learning, medieval funerary archaeology, computer technology, archaeological field work},
  ABSTRACT        = {This paper describes the activities performed by the students of the course of funerary archaeology held at the Division of Palaeopathology of Pisa University in collaboration with the Institute for Computational Linguistics (ILC) of the National Research Council (CNR) in Pisa in the period April-June 2014. The lessons, which used a Content and Language Integrated Learning (CLIL) approach, were aimed at studying the funerary beliefs and burial practices in Italy and England in the Middle Ages. The 2014 course followed on from the courses of the year 2012 (focused on the more general issue of taphonomy; primary and secondary burials; single, double, or multiple burials), and 2013 (which examined the world of the ancient Romans and their burial customs of cremation and inhumation). The lessons were conducted by using extracts from self-contained specialized texts that were simple to read and that offered the basic concepts of medieval funerary archaeology. The students were supported by a reference text for funerary archaeology, which established the correct nomenclature to use when describing bodies, grave goods and tombs. Powerpoint slide presentations helped students break up the monotony of the text work and made the material more interesting and engaging. The slides were used to illustrate different types of burials in filled or empty spaces; the position of burials in both rural and urban environments; the disposition of the limbs in the burial; the rise of the Monasteries in the early Middle Ages and of the religious Orders of the Dominicans and Franciscans in the late Middle Ages. Each student was responsible for researching and reporting on a particular topic, and was supported by the use of information and communication techniques. 
Particular attention was devoted to the Books of Hours, important illuminated medieval manuscripts (containing psalms, short prayers and biblical quotations) that marked the different parts of the day and that were specifically composed for wealthy people. Classroom activities ranged from the simpler multi-matching and gap-filling exercises to the more complex tasks of providing definitions for given words, creating mind-maps, enriching a bilingual English-Italian glossary and providing contextualized examples for an English grammar book. Educational videos from the BBC or other channels and pertaining to the topics treated during the lessons were projected each time and were followed by direct questioning and more general conversation, to help students gain proficiency in oral communication. In the last three years, the Italian students from Pisa University have been working in collaboration with those of Ohio University on an excavation project carried out at the Field School in Medieval Archaeology and Bioarchaeology at Badia Pozzeveri (Lucca, Italy), to which the prestigious International journal SCIENCE dedicated a special issue and cover in December 2013. Finally, multidisciplinary elements were also included in the courses, by exploiting the information extracted from videos related to disciplines other than funerary archaeology, for example a BBC Channel 4 video describing the British meals of the day, the origins of which date back to medieval times},
}
@INPROCEEDINGS{CRESCI_2015_INPROCEEDINGS_CCDT_303899,
  AUTHOR          = {Cresci, S. and Cimino, A. and Dell'Orletta, F. and Tesconi, M.},
  TITLE           = {Crisis Mapping during Natural Disasters via Text Analysis of Social Media Messages},
  CONFERENCE_NAME = {Web Information Systems Engineering-WISE 2015},
  YEAR            = {2015},
  PAGES           = {1-8},
  URL             = {https://iris.cnr.it/handle/20.500.14243/303899},
  KEYWORDS        = {crisis informatics, Emergency Management, geoparsing, social media mining, Twitter},
  ABSTRACT        = {Recent disasters demonstrated the central role of social media during emergencies thus motivating the exploitation of such data for crisis mapping. We propose a crisis mapping system that addresses limitations of current state-of-the-art approaches by analyzing the textual content of disaster reports from a twofold perspective. A damage detection component employs a SVM classifier to detect mentions of damage among emergency reports. A novel geoparsing technique is proposed and used to perform message geolocation. We report on a case study to show how the information extracted through damage detection and message geolocation can be combined to produce accurate crisis maps. Our crisis maps clearly detect both highly and lightly damaged areas, thus opening up the possibility to prioritize rescue efforts where they are most needed},
}
@INPROCEEDINGS{CRESCI_2015_INPROCEEDINGS_CTCD_271161,
AUTHOR = {Cresci, S. and Tesconi, M. and Cimino, A. and Dell'Orletta, F.},
TITLE = {A Linguistically-driven Approach to Cross-Event Damage Assessment of Natural Disasters from Social Media Messages},
YEAR = {2015},
ABSTRACT = {This work focuses on the analysis of Italian social media messages for disaster management and aims at the detection of messages carrying critical information for the damage assessment task. A main novelty of this study consists in the focus on out-domain and cross-event damage detection, and on the investigation of the most relevant tweet-derived features for these tasks. We devised different experiments by resorting to a wide set of linguistic features qualifying the lexical and grammatical structure of a text as well as ad-hoc features specifically implemented for this task. We investigated the most effective features that allow to achieve the best results. A further result of this study is the construction of the first manually annotated Italian corpus of social media messages for damage assessment},
KEYWORDS = {crisis informatics, Damage assessment, Emergency Management, feature selection, social media mining, Social Sensing},
PAGES = {6},
URL = {https://iris.cnr.it/handle/20.500.14243/271161},
PUBLISHER = {ACM},
CONFERENCE_NAME = {24th International Conference on World Wide Web},
BOOKTITLE = {Proceedings of the 24th international conference companion on World Wide Web},
}
@INPROCEEDINGS{CUTUGNO_2015_INPROCEEDINGS_CLMC_276344,
AUTHOR = {Cutugno, P. and Lucentini, R. and Marconi, L. and Chiarella, D.},
TITLE = {Relaciones sin violencia: lenguaje, estereotipos y sexismo benévolo},
YEAR = {2015},
PAGES = {200-204},
URL = {https://iris.cnr.it/handle/20.500.14243/276344},
VOLUME = {I},
PUBLISHER = {Centro de Lingüística Aplicada, Ministerio de Ciencia, Tecnología y Medio Ambiente (Santiago de Cuba, CUB)},
ISBN = {9789597174295},
CONFERENCE_NAME = {XIV Simposio Internacional de Comunicación Social: retos y perspectivas},
CONFERENCE_PLACE = {Santiago de Cuba},
BOOKTITLE = {Comunicación Social: retos y perspectivas Vol. I°},
EDITOR = {Miyares, L. R. and Alvarado, A. M. and Silva, M. R. A. and Joa, Y. P. and Rodríguez, D. J.},
}
@INPROCEEDINGS{DEFELICE_2015_INPROCEEDINGS_D_288825,
  AUTHOR          = {De Felice, I.},
  TITLE           = {GraDes: a corpus of grasp descriptions},
  CONFERENCE_NAME = {AISV 2015},
  YEAR            = {2015},
}
@INPROCEEDINGS{DELGRATTA_2015_INPROCEEDINGS_DFMPRBGKQSC_307390,
AUTHOR = {Del Gratta, R. and Frontini, F. and Monachini, M. and Pardelli, G. and Russo, I. and Bartolini, R. and Goggi, S. and Khan, F. and Quochi, V. and Soria, C. and Calzolari, N.},
TITLE = {Visualising Italian Language Resources: a Snapshot},
YEAR = {2015},
ABSTRACT = {This paper aims to provide a first snapshot of Italian Language Resources (LRs) and their uses by the community, as documented by the papers presented at two different conferences, LREC2014 and CLiC-it 2014. The data of the former were drawn from the LOD version of the LRE Map, while those of the latter come from manually analyzing the proceedings. The results are presented in the form of visual graphs and confirm the initial hypothesis that Italian LRs require concrete actions to enhance their visibility},
KEYWORDS = {Italian Language Resources},
PAGES = {100-104},
URL = {https://books.openedition.org/aaccademia/1277?lang=it},
PUBLISHER = {Accademia University Press (Torino, ITA)},
ISBN = {978-88-99200-62-6},
CONFERENCE_NAME = {Second Italian Conference on Computational Linguistics (CLiC-it 2015)},
CONFERENCE_PLACE = {Torino},
BOOKTITLE = {Proceedings of the Second Italian Conference on Computational Linguistics (CLiC-it 2015)},
EDITOR = {Bosco, C. and Tonelli, S. and Zanzotto, F. M.},
}
@INPROCEEDINGS{FERRARI_2015_INPROCEEDINGS_FSGD_310030,
  AUTHOR          = {Ferrari, A. and Spagnolo, G. O. and Gnesi, S. and Dell'Orletta, F.},
  TITLE           = {CMT and FDE: tools to bridge the gap between natural language documents and feature diagrams},
  CONFERENCE_NAME = {19th International Conference on Software Product Line},
  YEAR            = {2015},
  PAGES           = {402-410},
  DOI             = {10.1145/2791060.2791117},
  ISBN            = {978-1-4503-3613-0},
  URL             = {http://dl.acm.org/citation.cfm?doid=2791060.2791117},
  KEYWORDS        = {Software Product Lines, Variability Mining, Tools},
  ABSTRACT        = {A business subject who wishes to enter an established technological market is required to accurately analyse the features of the products of the different competitors. Such features are normally accessible through natural language (NL) brochures, or NL Web pages, which describe the products to potential customers. Building a feature model that hierarchically summarises the different features available in competing products can bring relevant benefits in market analysis. A company can easily visualise existing features, and reason about aspects that are not covered by the available solutions. However, designing a feature model starting from publicly available documents of existing products is a time consuming and error-prone task. In this paper, we present two tools, namely Commonality Mining Tool (CMT) and Feature Diagram Editor (FDE), which can jointly support the feature model definition process. CMT allows mining common and variant features from NL descriptions of existing products, by leveraging a natural language processing (NLP) approach based on contrastive analysis, which allows identifying domain-relevant terms from NL documents. FDE takes the commonalities and variabilities extracted by CMT, and renders them in a visual form. Moreover, FDE allows the graphical design and refinement of the final feature model, by means of an intuitive GUI},
}
@INPROCEEDINGS{FERRO_2015_INPROCEEDINGS_FMP_299099,
AUTHOR = {Ferro, M. and Marzi, C. and Pirrelli, V.},
TITLE = {Lexical parsability and morphological structure},
YEAR = {2015},
ABSTRACT = {A classical tenet in the psycholinguistic literature on the mental lexicon is that a parsed affix presents high activation levels (and thus contributes to activation spreading to other words with the same affix), and that such levels are tightly correlated with the affix productivity. In a number of influential papers, it has been suggested that parsability criteria interact with frequency to define morphological productivity in the lexicon. For example, the frequency of a derivative (e. g. government) relative to its base (govern) is shown to be a good predictor for parsability/productivity. The higher the frequency ratio, the more likely the morphological structure to be perceived, and the associated affix to be used productively. The present contribution intends to offer a computational explanatory basis for this correlational evidence, and assess its applicability to the acquisition of complex inflectional paradigms. In those languages, like Italian and German, whose inflection is stem-based rather than word-based, there is often no single paradigmatic form which can act as a base by being properly contained in all other inflected variants. Yet, it seems intuitive to suggest that verbs that are inflected for one paradigm cell only (e. g. neighbouring), are learned earlier and more easily but exhibit lower levels of perceived inflectional structure than verbs with richer paradigms. This appears to be in good accord with experimental evidence of time latencies in lexical decision, which are shown to correlate negatively with token frequency, paradigm size and paradigm entropy. Our simulations, based on Temporal Self-Organizing Maps (TSOMs) allow us to establish an interesting connection between inflectional parsability, frequency-based paradigm structure, and acquisitional constraints on the interaction between the human processor and working memory. 
Self-organising topological models of the mental lexicon can mimic the spatial and temporal organization of memory structures supporting the processing of symbolic sequences, and can provide an interesting framework for testing integrative accounts of lexical processing/acquisition as the complex result of general-purpose operations on word stimuli (e. g. working memory, long-term storage, sensory-motor mapping, rehearsal, unit integration, unit analysis, executive control, time-series processing), in line with recent acquisitions on the neuro-functional architecture of the perisylvian language network in the left hemisphere of human brain. Simulations of the incremental acquisition of "mini-paradigms" (small islands of morphological contrast encompassing up to three different forms for the same verb) support the hypothesis that perception of structure (parsability) and morphological productivity strongly correlate in the inflectional lexica of German and Italian. In particular, by monitoring longitudinal progress in storage and generalisation of differently distributed inflectional paradigms in the two languages, we show that: i) high-frequency forms are stored and accessed significantly earlier than low-frequency forms; ii) deeply entrenched but paradigmatically isolated forms tend to block usage of other forms in the same paradigm; iii) low-frequency evenly distributed (highly entropic) intra-paradigmatic forms are acquired later but are easily extended. Our investigation credits the proposed computational framework with psycholinguistic plausibility, and grounds parsability-based models of morphological productivity on a specific, explicit proposal of lexical architecture. This provides an explanatory basis for both psycholinguistic and linguistic accounts of morphological structure, and offers an intermediate framework for scientific inquiry bridging the gap between linguistic units and functional units in neurosciences. 
Finally, it makes the interesting suggestion that principles of morpheme-based organisation of the mental lexicon are compatible with a learning strategy requiring memorisation of full forms},
KEYWORDS = {morphological structure, word processing, token/type frequency},
PAGES = {22-37},
URL = {http://mmm.lis.upatras.gr/index.php/mmm/issue/view/293/showToc},
ISSN = {1826-7491},
CONFERENCE_NAME = {Morphology and Semantics-Ninth Mediterranean Morphology Meeting},
BOOKTITLE = {ONLINE PROCEEDINGS OF THE MEDITERRANEAN MORPHOLOGY MEETINGS},
EDITOR = {Audring, J. and Koutsoukos, N. and Masini, F. and Raffaelli, I.},
}
@INPROCEEDINGS{FRONTINI_2015_INPROCEEDINGS_FAG_276113,
AUTHOR = {Frontini, F. and Boukhaled, M. A. and Ganascia, J.},
TITLE = {Linguistic Pattern Extraction and Analysis for Classic French Plays},
YEAR = {2015},
ABSTRACT = {Great authors of fiction and theatre have the capacity of creating memorable characters that take life and become almost as real as living persons to the readers/audience. The study of characterization, namely of how this is achieved, is a well-researched topic in corpus stylistics: for instance (Mahlberg, 2012) attempts to identify typical lexical patterns for memorable Dickens' characters by extracting those lexical bundles that stand out (namely are overrepresented) in comparison to a general corpus. In other works, authorship attribution methods are applied to the different characters of a play to identify whether the author has been able to provide each of them with a "distinct" voice. For instance (Vogel \& Lynch, 2008) compare individual Shakespeare characters against the whole play or even against all plays of the same author. The purpose of this paper is to propose a methodology for the study characterization of several characters in French plays of the classical period. The tools developed are meant to support textual analysis by: 1) Verifying the degree of characterization of each character with respect to others. 2) Automatically inducing a list of linguistic features that are significant, representative for that character. Preliminary investigations have been conducted on plays by Moliere, cross-comparing four protagonists from four different plays. The proposed methodology relies on sequential data mining for the extraction of linguistic patterns and on correspondence analysis for comparison of patterns frequencies in each character and for the visual representation of such differences},
KEYWORDS = {computational stylometry, theatre, sequential pattern mining},
PAGES = {3},
URL = {http://lipn.univ-paris13.fr/~charnois/conscilaGenres/resumes/frontini.pdf},
CONFERENCE_NAME = {Journée ConSciLa (Confrontations en Sciences du Langage) Grammaire des genres et des styles: quelles approches privilégier ?},
}
@INPROCEEDINGS{FRONTINI_2015_INPROCEEDINGS_FBG_290872,
AUTHOR = {Frontini, F. and Brando, C. and Ganascia, J.},
TITLE = {Semantic Web based Named Entity Linking for Digital Humanities and Heritage Texts},
YEAR = {2015},
ABSTRACT = {This paper proposes a graph based methodology for automatically disambiguating authors' mentions in a corpus of French literary criticism. Candidate referents are identified and evaluated using a graph based named entity linking algorithm, which exploits a knowledge-base built out of two different resources (DBpedia and the BnF linked data). The algorithm expands previous ones applied for word sense disambiguation and entity linking, with good results. Its novelty resides in the fact that it successfully combines a generic knowledge base such as DBpedia with a domain specific one, thus enabling the efficient annotation of minor authors. This will help specialists to follow mentions of the same author in different works of literary criticism, and thus to investigate their literary appreciation over time},
KEYWORDS = {named-entity linking, linked data, digital humanities},
PAGES = {77-88},
URL = {http://ceur-ws.org/Vol-1364/paper9.pdf},
VOLUME = {1364},
SERIES = {CEUR Workshop Proceedings},
CONFERENCE_NAME = {SW4SH 2015 Semantic Web for Scientific Heritage 2015},
BOOKTITLE = {SW4SH 2015 Semantic Web for Scientific Heritage 2015},
EDITOR = {Zucker, A. and Draelants, I. and Faron-Zucker, C. and Monnin, A.},
}
@INPROCEEDINGS{FRONTINI_2015_INPROCEEDINGS_FBG_295464,
AUTHOR = {Frontini, F. and Brando, C. and Ganascia, J.},
TITLE = {Domain-adapted named-entity linker using Linked Data},
YEAR = {2015},
ABSTRACT = {We present REDEN, a tool for graph-based Named Entity Linking that allows for the disambiguation of entities using domain-specific Linked Data sources and different configurations (e. g. context size). It takes TEI-annotated texts as input and outputs them enriched with external references (URIs). The possibility of customizing indexes built from various knowledge sources by defining temporal and spatial extents makes REDEN particularly suited to handle domain-specific corpora such as enriched digital editions in the Digital Humanities},
KEYWORDS = {named-entity disambiguation, evaluation, linked data, digital humanities},
PAGES = {10},
URL = {http://ceur-ws.org/Vol-1386/named_entity.pdf},
VOLUME = {1386},
SERIES = {CEUR Workshop Proceedings},
CONFERENCE_NAME = {Workshop on NLP Applications: Completing the Puzzle co-located with the 20th International Conference on Applications of Natural Language to Information Systems (NLDB 2015)},
BOOKTITLE = {Proceedings of the Workshop on NLP Applications: Completing the Puzzle},
EDITOR = {Izquierdo, R.},
}
@INPROCEEDINGS{FRONTINI_2015_INPROCEEDINGS_FQM_267184,
AUTHOR = {Frontini, F. and Quochi, V. and Monachini, M.},
TITLE = {Generative Lexicon and polysemy: inducing logical alternations},
YEAR = {2015},
ABSTRACT = {The current paper brings together the results of a series of experiments for inducing regular sense alternations, or regular/logical polysemy, from a computational lexicon based on the Generative Lexicon theory. The results are discussed in light of the potential benefits and uses of the amended algorithm},
KEYWORDS = {Polysemy, Generative Lexicon, Logical Alternations},
PAGES = {7},
URL = {https://iris.cnr.it/handle/20.500.14243/267184},
PUBLISHER = {MAPLEX2015 Multiple Approaches to Lexicon Conference (Yamagata, JPN)},
CONFERENCE_NAME = {MAPLEX2015 Multiple Approaches to Lexicon Conference},
CONFERENCE_PLACE = {Yamagata},
EDITOR = {Hsieh, S. K. and Kanzaki, K.},
}
@INPROCEEDINGS{GIANNINI_2015_INPROCEEDINGS_GBGP_290975,
  AUTHOR           = {Giannini, S. and Biagioni, S. and Goggi, S. and Pardelli, G.},
  TITLE            = {Mapping Italian grey communities: what is there beyond the Academy?},
  BOOKTITLE        = {THE GL-CONFERENCE SERIES. CONFERENCE PROCEEDINGS},
  EDITOR           = {Farace, D. and Frantzen, J.},
  CONFERENCE_NAME  = {GL16-Sixteenth International Conference on Grey Literature Grey Literature Lobby: Engines and Requesters for Change},
  CONFERENCE_PLACE = {Amsterdam},
  PUBLISHER        = {TextRelease (Amsterdam, NLD)},
  YEAR             = {2015},
  PAGES            = {17-29},
  ISSN             = {1386-2316},
  ISBN             = {978-90-77484-23-4},
  URL              = {http://www.textrelease.com/publications/proceedings.html},
  KEYWORDS         = {Italian Grey Literature, A.1 INTRODUCTORY AND SURVEY},
  ABSTRACT         = {This research aims at verifying whether-and eventually how much-the grey literature available on the web is actually structured, accessible or even managed by systems dealing with its organization and aiming at its retrieval and storing. The utmost goal is to build up a map of non-academic communities and their mechanisms for managing, presenting and disseminating this type of material. It is a sort of journey among the streams of the Web, which channel meeting minutes, manifests, fliers, pictures, newspapers articles, journalistic services and audio/video material on various topics. These "grey" products-by conveying basic information about social and popular culture-store, represent and spread knowledge},
}
@INPROCEEDINGS{GOGGI_2015_INPROCEEDINGS_GMFBPDBM_290971,
AUTHOR = {Goggi, S. and Monachini, M. and Frontini, F. and Bartolini, R. and Pardelli, G. and De Mattei, M. and Bustaffa, F. and Manzella, G.},
TITLE = {Marine Planning and Service Platform (MAPS): An Advanced Research Engine for Grey Literature in Marine Science},
YEAR = {2015},
ABSTRACT = {The MAPS (Marine Planning and Service Platform) project is a development of the Marine project (Ricerca Industriale e Sviluppo Sperimentale Regione Liguria 2007-2013) aiming at building a computer platform for supporting a Marine Information and Knowledge System, as part of the data management activities. One of the main objectives of the project is to develop a repository that should gather, classify and structure marine scientific literature and data thus guaranteeing their accessibility to researchers and institutions by means of standard protocols. We will present the scenario of the Operative Oceanography together with the technologies used to develop an advanced search engine which aims at providing rapid and efficient access to a Digital Library of oceanographic data. The case-study is also highlighting how the retrieval of grey literature from this specific marine community could be reproduced for similar communities as well, thus revealing the great impact that the processing, re-use as well as application of grey data have on societal needs/problems and their answers},
KEYWORDS = {Marine Science, Search Engine, Source Data, Oceanography},
PAGES = {108-114},
URL = {http://www.textrelease.com/gl16program.html},
PUBLISHER = {TextRelease (Amsterdam, NLD)},
ISSN = {1386-2316},
ISBN = {978-90-77484-23-4},
CONFERENCE_NAME = {Sixteenth International Conference on Grey Literature Grey Literature Lobby: Engines and Requesters for Change},
CONFERENCE_PLACE = {Amsterdam},
BOOKTITLE = {THE GL-CONFERENCE SERIES. CONFERENCE PROCEEDINGS},
EDITOR = {Farace, D. and Frantzen, J.},
}
@INPROCEEDINGS{GOGGI_2015_INPROCEEDINGS_GPSGB_287902,
AUTHOR = {Goggi, S. and Pardelli, G. and Sassi, M. and Giannini, S. and Biagioni, S.},
TITLE = {A terminological survey on the titles of the Seventh Framework Programme (FP7)},
YEAR = {2015},
ABSTRACT = {This paper focuses on the automatic extraction of domain-specific knowledge from the European Commission projects of the 7th Framework Programme, hereinafter referred as FP7. The study is divided in three parts: the first part introduces the work starting from the building up of a corpus containing the titles of European Projects of the whole FP7 in order to obtain a relevant terminological sample for the different domains; the second describes software and methods while the third part focuses on the evaluation of results. Finally, we conclude by suggesting possible directions for further development of a comparison between terminological extraction from FP7 and FP5/FP6},
KEYWORDS = {7th Framework Programme (FP7), Natural Language Processing, Terminology, Knowledge extraction, Grey Literature, I.2.7 Natural Language Processing. Text analysis, I.2.1 Applications and Expert Systems. Natural language interfaces},
PAGES = {223-227},
URL = {https://iris.cnr.it/handle/20.500.14243/287902},
ISBN = {978-959-7174-28-8},
CONFERENCE_NAME = {Fourteenth International Symposium on Comunicación Social: retos y perspectivas},
EDITOR = {Miyares, L. R. and Silva, M. R. A. and Alvarado, A. M.},
}
@INPROCEEDINGS{KHAN_2015_INPROCEEDINGS_KF_295959,
AUTHOR = {Khan, F. and Frontini, F.},
TITLE = {Using Ontologies to Model Polysemy in Lexical Resources},
YEAR = {2015},
ABSTRACT = {In this article we look at how the use of ontologies can assist in analysing polysemy in natural languages. We develop a model, the Lexical-Sense-Ontology model (LSO), to represent the interaction between a lexicon and ontology, based on lemon. We use the LSO model to show how default rules can be used to represent semi-productivity in polysemy as well as discussing the kinds of ontological information that are useful for studying polysemy},
KEYWORDS = {Polysemy, Ontology, Default Logic},
URL = {http://www.aclweb.org/anthology/W/W15/W15-0404.pdf},
CONFERENCE_NAME = {Workshop on Language and Ontologies},
BOOKTITLE = {Proceedings of the Workshop on Language and Ontologies},
}
@INPROCEEDINGS{MARCONI_2015_INPROCEEDINGS_MCCL_354387,
AUTHOR = {Marconi, L. and Cutugno, P. and Chiarella, D. and Lucentini, R.},
TITLE = {Glosario: las palabras de los Servicios Demográficos de la ciudad de Génova},
YEAR = {2015},
ABSTRACT = {Uno de los objetivos del proyecto ha sido la construcción de un glosario de palabras difíciles en los formularios de los Servicios Demográficos de la ciudad de Génova. ¿Por qué crear un glosario de términos difíciles que están presentes en los formularios? Las palabras casi nunca tienen un significado simple, fijo y único, sino más bien complejo, en el sentido de que a cada signo corresponden más significados, a menudo similares, a veces totalmente diferentes; por esta razón, el verdadero significado de una palabra se puede captar sólo en el contexto específico. El lenguaje de la burocracia se basa, en general, en el vocabulario de otras lenguas especiales (el lenguaje jurídico, económico, etc.); en este proyecto hemos hecho referencia al lenguaje de los formularios de los servicios demográficos que los ciudadanos de la ciudad de Génova deben completar para obtener documentos o servicios. Se pueden distinguir tres fases principales en las que se llevaron a cabo algunas actividades específicas: 1. recolección y lematización de los formularios-elección de palabras que pertenecen a algunas categorías gramaticales-verificación de la pertenencia de los lemas a los léxicos de frecuencia (vocabulario básico y vocabulario elemental); 2. realización de un cuestionario que contiene las entradas, que en parte, pertenece a los léxicos y, que en parte, no pertenecen a los léxicos-distribución del cuestionario a 720 personas de diferentes nacionalidades-análisis lingüístico y estadístico sobre los datos del cuestionario; 3. diseño e implementación del glosario. Los idiomas en los que el glosario se ha traducido son: albanés, árabe, chino, español, ucraniano. El glosario fué desarrollado por el Instituto Lingüística Computacional-Consejo Nacional de Investigaciones, Unidad de Génova y contiene 423 entradas. 
Las palabras o conjuntos de palabras se proporcionan con una breve explicación relativa a la utilización de los formularios; la información de cada volumen se ofrece en italiano y es seguida por la traducción en uno de los idiomas mencionados. Con el fin de facilitar la recuperación de las frases se escogió estructurar un índice que contiene, para cada voz del glosario, la referencia a la página en la que se puede encontrar su traducción. Aparece en el índice, junto a la frase, también el plural de algunas palabras que están presentes de esa misma manera en el formulario},
URL = {https://iris.cnr.it/handle/20.500.14243/354387},
ISBN = {9789597152347},
}
@INPROCEEDINGS{MARCONI_2015_INPROCEEDINGS_MCLCMM_276372,
AUTHOR = {Marconi, L. and Cutugno, P. and Lucentini, R. and Chiarella, D. and Morgavi, G. and Morando, M.},
TITLE = {La tecnología como sostén de la organización de datos lingüísticos concernientes a las plantas medicinales},
YEAR = {2015},
PAGES = {605-609},
URL = {https://iris.cnr.it/handle/20.500.14243/276372},
VOLUME = {II},
PUBLISHER = {Centro de Lingüística Aplicada, Ministerio de Ciencia, Tecnología y Medio Ambiente (Santiago de Cuba, CUB)},
ISBN = {9789597174301},
CONFERENCE_NAME = {XIV Simposio Internacional de Comunicación Social: retos y perspectivas},
CONFERENCE_PLACE = {Santiago de Cuba},
BOOKTITLE = {Comunicación Social: retos y perspectivas Vol. II°},
EDITOR = {Miyares, L. R. and Alvarado, A. M. and Silva, M. R. A. and Joa, Y. P. and Rodríguez, D. J.},
}
@INPROCEEDINGS{MARZI_2015_INPROCEEDINGS_MFP_290953,
AUTHOR = {Marzi, C. and Ferro, M. and Pirrelli, V.},
TITLE = {Lexical emergentism and the "frequency-by-regularity" interaction},
YEAR = {2015},
ABSTRACT = {In spite of considerable converging evidence of the role of inflectional paradigms in word acquisition and processing, little efforts have been put so far into providing detailed, algorithmic models of the interaction between lexical token frequency, paradigm frequency, paradigm regularity. We propose a neurocomputational account of this interaction, and discuss some theoretical implications of preliminary experimental results},
KEYWORDS = {morphological structure, frequency distribution, temporal self-organising maps},
PAGES = {37-41},
URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-84927156830\&origin=inward},
VOLUME = {1347},
CONFERENCE_NAME = {NetWordS Final Conference on Word Knowledge and Word Usage: Representations and Processes in the Mental Lexicon},
BOOKTITLE = {Word Knowledge and Word Usage 2015},
EDITOR = {Pirrelli, V. and Marzi, C. and Ferro, M.},
}
@INPROCEEDINGS{NAHLI_2015_INPROCEEDINGS_NM_300996,
AUTHOR = {Nahli, O. and Marchi, S.},
TITLE = {Improved Written Arabic Word Parsing through Orthographic, Syntactic and Semantic constraints},
YEAR = {2015},
ABSTRACT = {Le convenzioni ortografiche della lingua araba consentono l'omissione dei diacritici, introducendo così numerosi casi di omografia tra forme flesse e la conseguente proliferazione di analisi morfologiche contestualmente spurie. Un analizzatore morfologico che utilizzi i vincoli ortografici, morfo-sintattici e semantici che operano a livello lessicale, può tuttavia ridurre drasticamente il livello di ambiguità morfologica del testo scritto, producendo analisi più efficienti e accurate},
KEYWORDS = {Arabic Language, Arabic NLP, Orthography, Morpho-syntax, Semantics},
PAGES = {210-214},
URL = {http://www.aaccademia.it/elenco-libri?aaref=CLIC_2015},
PUBLISHER = {Accademia University Press (Torino, ITA)},
ISBN = {9788899200626},
CONFERENCE_NAME = {Second Italian Conference on Computational Linguistics CLiC-it 2015},
CONFERENCE_PLACE = {Torino},
}
@INPROCEEDINGS{PICCIOLI_2015_INPROCEEDINGS_PDGZA_381992,
AUTHOR = {Piccioli, A. and Di Donato, F. and Giacomi, D. and Zitarosa, R. and Aiola, C.},
TITLE = {Linked open data portal how to make use of linked data to generate serendipity},
YEAR = {2015},
ABSTRACT = {The Linked Open Data Portal (LODPortal) is an open source application for the Digital Humanities which has been developed within the European Project (CIP-ICT-PSP) Agora-Scholarly Open Access Research in European Philosophy. Although it is in a prototypal stage of development, it presents an innovative use of Linked data technologies applied to the Digital Humanities domain. By combining thousands of resources coming from different Digital Libraries, thanks to the use of Semantic Web technologies it offers to Scholars novel tools to create, reuse and visualize research data and results. In particular, the LODPortal gathers and indexes resources coming from twelve Digital Libraries and the Linked Data cloud (such as DBPedia and Freebase) and includes a module based on Pundit, enabling automatic entity extraction, thanks to the service DANDELION, and manual semantic enrichment. Based on the semantic indexing, the navigation interface offers advanced visualizations such as the Timeline, the people graph and a map of places},
URL = {https://iris.cnr.it/handle/20.500.14243/381992},
DOI = {10.1145/2802612.2802642},
}
@INPROCEEDINGS{PIRRELLI_2015_INPROCEEDINGS_PNBDM_293690,
AUTHOR = {Pirrelli, V. and Nahli, O. and Boschetti, F. and Del Gratta, R. and Marzi, C.},
TITLE = {Computational Linguistics and Language Physiology: Insights from Arabic NLP and Cooperative Editing},
YEAR = {2015},
ABSTRACT = {Computer processing of written Arabic raises a number of challenges to traditional parsing architectures on many levels of linguistic analysis. In this contribution, we review some of these core issues and the demands they make, to suggest different strategies to successfully tackle them. In the end, we assess these issues in connection with the behaviour of neuro-biologically inspired lexical architectures known as Temporal Self-Organising Maps. We show that, far from being language-specific problems, issues in Arabic processing can shed light on some fundamental characteristics of the human language processor, such as structure-based lexical recoding, concurrent, competitive activation of output candidates and dynamic selection of optimal solutions},
KEYWORDS = {Non-concatenative morphology, Optical Character Recognition, WordNet, Temporal Self-organising Maps, Mental Lexicon, Language neuro-physiology},
PAGES = {1-8},
URL = {http://dl.acm.org/citation.cfm?id=2802612},
DOI = {10.1145/2802612.2802637},
ISBN = {978-1-4503-3295-8},
CONFERENCE_NAME = {Third AIUCD Annual Conference-Humanities and Their Methods in the Digital Ecosystem},
BOOKTITLE = {Third AIUCD Annual Conference-Humanities and Their Methods in the Digital Ecosystem},
EDITOR = {Tomasi, F. and Rosselli Del Turco, R. and Tammaro, A. M.},
}
@INPROCEEDINGS{RICHTER_2015_INPROCEEDINGS_RCDV_322145,
AUTHOR = {Richter, S. and Cimino, A. and Dell'Orletta, F. and Venturi, G.},
TITLE = {Tracking the Evolution of Written Language Competence: an NLP-based Approach},
YEAR = {2015},
ABSTRACT = {In this paper, we present an NLP-based innovative approach for tracking the evolution of written language competence relying on different sets of linguistic features that predict text quality. This approach was tested on a corpus of essays written by Italian L1 learners of the first and second year of the lower secondary school},
KEYWORDS = {Evolution of Written Language Competence, multi-level linguistic analysis},
PAGES = {236-240},
URL = {http://www.italianlp.it/wp-content/uploads/2016/03/tracking-language-competence.pdf},
PUBLISHER = {Accademia University Press (Torino, ITA)},
ISBN = {978-88-99200-62-6},
CONFERENCE_NAME = {2nd Italian Conference on Computational Linguistics (CLiC-it)},
CONFERENCE_PLACE = {Torino},
}
@INPROCEEDINGS{RUSSO_2015_INPROCEEDINGS_RCM_294132,
AUTHOR = {Russo, I. and Caselli, T. and Monachini, M.},
TITLE = {Extracting and Visualising Biographical Events from Wikipedia},
YEAR = {2015},
ABSTRACT = {This work presents a proposal for the development of a natural language processing module for event and temporal analysis of biographies as available in Wikipedia. At the current level of development, we restricted the extraction to temporally anchored events as they represent salient information which can be further used to extract additional events and facilitate their chronological ordering and the representation of a person's timeline. Visualising data about basic facts concerning groups of people helps with historical reasoning and enables comparisons among them},
KEYWORDS = {mining biographies for structured information, visualising biographical data, temporal information},
PAGES = {111-115},
URL = {http://ceur-ws.org/Vol-1399/paper17.pdf},
CONFERENCE_NAME = {BD2015 Biographical Data in a Digital World 2015},
BOOKTITLE = {BD2015 Biographical Data in a Digital World 2015},
EDITOR = {ter Braake, S. and Fokkens, A. and Sluijter, R. and Declerck, T. and Wandl Vogt, E.},
}
@INPROCEEDINGS{RUSSO_2015_INPROCEEDINGS_RCS_299129,
AUTHOR = {Russo, I. and Caselli, T. and Strapparava, C.},
TITLE = {SemEval-2015 Task 9: CLIPEval Implicit Polarity of Events},
YEAR = {2015},
ABSTRACT = {Sentiment analysis tends to focus on the polarity of words, combining their values to detect which portion of a text is opinionated. CLIPEval wants to promote a more holistic approach, looking at psychological researches that frame the connotations of words as the emotional values activated by them. The implicit polarity of events is just one aspect of connotative meaning and we address it with a task that is based on a dataset of sentences annotated as instantiations of pleasant and unpleasant events previously collected in psychological research as the ones on which human judgments converge},
KEYWORDS = {sentiment analysis},
PAGES = {443-450},
URL = {http://alt.qcri.org/semeval2015/cdrom/pdf/SemEval077.pdf},
ISBN = {978-1-941643-40-2},
CONFERENCE_NAME = {Proceedings of SemEval-2015},
}
@INPROCEEDINGS{SORIA_2015_INPROCEEDINGS_S_294062,
AUTHOR = {Soria, C.},
TITLE = {Towards a notion of "Digital Language Diversity"},
YEAR = {2015},
ABSTRACT = {This paper introduces the concept of digital language diversity and advocates for its increase in order to foster the digital vitality of languages, and secure their overall vitality},
KEYWORDS = {digital language diversity, NLP, less-resourced languages, regional languages, minority languages, digital rights},
PAGES = {111-125},
URL = {https://iris.cnr.it/handle/20.500.14243/294062},
CONFERENCE_NAME = {3rd International Conference on Linguistic and Cultural Diversity in Cyberspace},
BOOKTITLE = {Linguistic and Cultural Diversity in Cyberspace-Proceedings of the 3rd International Conference},
EDITOR = {Kuzmin, E. and Parshakova, A. and Ignatova, D.},
}
@INPROCEEDINGS{SORIA_2015_INPROCEEDINGS_SR_301026,
AUTHOR = {Soria, C. and Russo, I.},
TITLE = {The Digital Language Diversity Project},
YEAR = {2015},
ABSTRACT = {In this paper we introduce The Digital Language Diversity Project, a three-year project funded under EC Erasmus programme started in September 2015. The project addresses the problem of the scarce use and usability of EU regional and minority languages over digital devices by developing a training programme for adult speakers of regional and minority languages to empower them with the know-how for creating and sharing digital content. Availability of digital content and technical support to collect it are essential prerequisites for the development of language-based digital applications, which in turn will boost digital usage of these languages},
KEYWORDS = {Less-resourced languages, Language Technology, digital language vitality, digital language diversity},
PAGES = {329-332},
URL = {https://iris.cnr.it/handle/20.500.14243/301026},
ISBN = {978-83-932640-8-7},
CONFERENCE_NAME = {7th Language \& Technology Conference},
BOOKTITLE = {Proceedings of the 7th Language \& Technology Conference},
EDITOR = {Vetulani, Z. and Mariani, J.},
}
@INPROCEEDINGS{SPRUGNOLI_2015_INPROCEEDINGS_SDCMB_333943,
AUTHOR = {Sprugnoli, R. and Dell'Orletta, F. and Caselli, T. and Montemagni, S. and Bosco, C.},
TITLE = {Parsing Events: a New Perspective on Old Challenges},
YEAR = {2015},
ABSTRACT = {The paper proposes a new evaluation exercise, meant to shed light on the syntax-semantics interface for the analysis of written Italian and resulting from the combination of the EVALITA 2014 dependency parsing and event extraction tasks. It aims at investigating the cross-fertilization of tasks, generating a new resource combining dependency and event annotations, and devising metrics able to evaluate the applicative impact of the achieved results},
URL = {https://iris.cnr.it/handle/20.500.14243/333943},
ISBN = {978-88-99200-62-6},
}
@INPROCEEDINGS{VENTURI_2015_INPROCEEDINGS_VBDM_304237,
AUTHOR = {Venturi, G. and Bellandi, T. and Dell'Orletta, F. and Montemagni, S.},
TITLE = {NLP-Based Readability Assessment of Health-Related Texts: a Case Study on Italian Informed Consent Forms},
YEAR = {2015},
ABSTRACT = {The paper illustrates the results of a case study aimed at investigating and enhancing the accessibility of Italian health-related documents by relying on advanced NLP techniques, with particular attention to informed consent forms. Results achieved show that the features automatically extracted from the linguistically annotated text and ranging across different levels of linguistic description have a high discriminative power in order to guarantee a reliable readability assessment},
KEYWORDS = {Readability assessment, health-related information},
PAGES = {131-141},
URL = {http://www.aclweb.org/anthology/W15-2618},
ISBN = {978-1-941643-32-7},
CONFERENCE_NAME = {Sixth International Workshop on Health Text Mining and Information Analysis (Louhi)},
}
@INPROCEEDINGS{ALBANESI_2015_INPROCEEDINGS_ABBG_302509,
AUTHOR = {Albanesi, A. and Bellandi, A. and Benotto, G. and Giovannetti, E.},
TITLE = {Translation, Annotation and Knowledge Modelling of the Babylonian Talmud: the Traduco System},
YEAR = {2015},
ABSTRACT = {In this work, we are going to present the Traduco System, a collaborative web-based application for the translation of the Babylonian Talmud (BT) into Italian. The System has been designed around a Computer-Assisted Translation (CAT) component, constituting its core. However, Traduco is not limited to assist the translation process and to provide printing functionalities. In fact, it allows linguistic and semantic annotations and advanced searches, paving the way to the construction of a talmudic knowledge base. In order to achieve these results, the Traduco development process abided by a model that took into account aspects of Natural Language Processing and Knowledge Engineering. The component based architectural structure was implemented using the object oriented Java 2 Enterprise Edition framework},
KEYWORDS = {Computer-Assisted Translation, Interpretation, Semantic Annotation, Babylonian Talmud},
URL = {https://dh-abstracts.library.virginia.edu/works/2399},
CONFERENCE_NAME = {Digital Humanities 2015},
}
@INPROCEEDINGS{BIZZONI_2015_INPROCEEDINGS_BDR_308102,
AUTHOR = {Bizzoni, Y. and Del Grosso, A. M. and Reboul, M.},
TITLE = {Diachronic Trends in Homeric translations},
YEAR = {2015},
ABSTRACT = {This field of study is part of the more general "Classical Receptions" studies that try to analyse the influence and adaptation of classical texts in modern and contemporary literature, theater, cinema, and so on. While scholastic analyses of Greek texts are practiced since more than two thousand years, research about classical translations is a relatively unexplored area. In recent years this theme has raised a growing interest in the academic community. With this intent, we built a program that can align in blocks texts of extended length, such as one book of the Odyssey, without need of previous training, segmentation, or textual tagging. Furthermore, it behaves with reasonable results also on very free and literary translations, a problem that wasn't generally considered by textual aligners since recent studies. While other programs allow an upper bound for 1-to-many alignments (for example with a maximum of 4 translated elements aligned to the same original element) this algorithm allows n-to-n alignments, with no limit to the number of translated elements that can be aligned to an original, or vice versa. The aligner is based on a implementation of Needleman-Wunsch algorithm and on a string-based similarity approach between textual segments. The aligner works finding anchor words in proper names, that are a relatively stable feature through different translations and generally don't become unrecognizable from one language to the other. Thanks to the alignments thus obtained, we can explore Homeric translations in a number of ways. We will illustrate the creation of an interface to visualize French Homeric translations making it possible to highlight aligned portions of texts and the translation of single words. 
We will finally show some resulting syntactic analyses carried out on a small sample of texts taken from a corpus of one hundred unabridged French translations of the Odyssey and we will try to demonstrate that the study of diachronic translations throughout algorithms of computational linguistics can produce interesting results for literary and linguistics studies},
URL = {https://iris.cnr.it/handle/20.500.14243/308102},
}
@INPROCEEDINGS{BOSCHETTI_2015_INPROCEEDINGS_BDFKM_305309,
AUTHOR = {Boschetti, F. and Del Gratta, R. and Frontini, F. and Khan, A. F. and Monachini, M.},
TITLE = {Strumenti, Risorse e Linguistic Linked Open Data per le lingue antiche},
YEAR = {2015},
ABSTRACT = {Strumenti e metodi dell'Informatica Umanistica hanno portato e portano ad una ridefinizione di processi teorici, metodologici e tecnici, fino a una vera e propria ri-concettualizzazione dei saperi nell'ambito dei beni culturali. L'Istituto di Linguistica Computazionale è attivo con varie iniziative sul fronte delle Digital Humanities per la creazione di strumenti e risorse linguistiche per il mondo classico. La direzione intrapresa si inserisce nel paradigma che si va consolidando nel settore delle tecnologie del linguaggio e che prevede la fruizione di servizi linguistici attraverso infrastrutture di ricerca, secondo un modello già operativo per le lingue moderne. Tale paradigma è in connessione con l'emergere degli standard e dei formati del web semantico per le tecnologie del linguaggio e per la pubblicazione di dati linguistici},
URL = {https://iris.cnr.it/handle/20.500.14243/305309},
}
@INPROCEEDINGS{DELGROSSO_2015_INPROCEEDINGS_DDB_308100,
AUTHOR = {Del Grosso, A. M. and Del Gratta, R. and Boschetti, F.},
TITLE = {The role of digital scholarly editors in the design of components for cooperative philology},
YEAR = {2015},
ABSTRACT = {This contribution is focused on the role of the digital scholarly editor in the continuous process of analysis, development and evaluation of libraries of components for cooperative philology. By following a general trend, in the domain of digital humanities developers are progressively shifting from the project-driven approach to the new community-driven paradigm. This shift is solicited by the increasing aggregation of scholars in communities of practice that are expressing common requirements and sharing best practices. In most cases, service providers are responding to these needs by offering web services quickly developed by taking into account the specific functionality that they expose or, worse, by wrapping legacy code. Although a pipeline of web services devoted to linguistic analysis and collaborative annotation provides many advantages in terms of flexibility, we are concerned by the impact of the main drawbacks, in order to study alternative or complementary solutions for our domain. Maintainability, performance and atomicity are the principal issues in which we are interested. In a chain of web services, the overall system depends by the status of the singles nodes and medium or small projects not always are able to grant the necessary level of redundancy or caching strategies. Performance is affected by the trade-off among challenging conditions (e. g. memory resources, computational overload, bandwidth). Atomicity influences the reusability and the extension of services (e. g. from many points of view, Latin metrical analysis is very similar to ancient Greek metrical analysis, but a web service that atomically provides the former could be totally unusable for the latter). At the Cooperative Philology Lab (Institute of Computational Linguistics "A. Zampolli", CNR, Pisa) we try to address these issues by designing and developing a library of components for the domain of scholarly editing. 
A library can be installed locally or remotely and it provides multiple choices for maintenance and performance tuning. But above all a library of components provides the building blocks to shape local or remote services at the adequate level of atomicity, in order to ensure reusability and extendibility. The role of the digital scholarly editors with which we have collaborated in pilot and funded projects at the CNR-ILC is crucial, because they are providing the necessary use cases that we are generalizing for the design of our library. During the workshop, we would like to stress the importance of a new generation of digital scholars that are not only creators of digital resources and consumers of computational tools or web infrastructures, but also actors in the analysis of requirements and in the evaluation of the libraries of components devoted to their activities. References: Bozzi, "Computer-assisted scholarly editing of manuscript sources," in New publication cultures in the humanities: exploring the paradigm shift, Davidhazi, Ed. Amsterdam: Amsterdam University Press, 2014, pp. 99-115. [Online]. Available: http://www.oapen.org/record/515678. McGann, "From text to work: Digital tools and the emergence of the social text," Variants: The Journal of the European Society for Textual Scholarship, vol. 4, pp. 225-240, 2005. Robinson, "Towards a scholarly editing system for the next decades," in Sanskrit Computational Linguistics, ser. Lecture Notes in Computer Science, G. Huet, A. Kulkarni, and P. Scharf, Eds. Springer Berlin Heidelberg, 2009, vol. 5402, pp. 346-357. [Online]. Available: http://dx.doi.org/10.1007/978-3-642-00155-0\_18. Robinson, "Towards a theory of digital editions," Variants, no. 10, 105-131, 2013. Siemens, M. Timney, C. Leitch, C. Koolen, A. 
Garnett et al., "Toward modeling the social edition: An approach to understanding the electronic scholarly edition in the context of new and emerging social media," Literary and Linguistic Computing, vol. 27, no. 4, pp. 445-461, 2012},
KEYWORDS = {Digital Scholarly Editing, Digital Humanities, Digital Philology, Literary Computing},
URL = {http://dixit.huygens.knaw.nl/?page_id=138#boschetti},
VOLUME = {4},
CONFERENCE_NAME = {Technology, Software, Standards for the Digital Scholarly Edition},
BOOKTITLE = {Technology, Software, Standards for the Digital Scholarly Edition},
}
@INPROCEEDINGS{FRONTINI_2015_INPROCEEDINGS_FBG_289592,
AUTHOR = {Frontini, F. and Boukhaled, M. A. and Ganascia, J. G.},
TITLE = {Moliere's Raisonneurs: a quantitative study of distinctive linguistic patterns},
YEAR = {2015},
KEYWORDS = {Computational Stylistics, Correspondence analysis, Corpus linguistics, Molière},
PAGES = {114-117},
URL = {http://ucrel.lancs.ac.uk/cl2015/doc/CL2015-AbstractBook.pdf},
CONFERENCE_NAME = {Corpus Linguistics 2015},
BOOKTITLE = {Corpus Linguistics 2015-Abstract Book},
EDITOR = {Formato, F. and Hardie, A.},
}
@INPROCEEDINGS{GIANNINI_2015_INPROCEEDINGS_GBGP_307872,
AUTHOR = {Giannini, S. and Biagioni, S. and Goggi, S. and Pardelli, G.},
TITLE = {Grey Literature citations in the age of Digital Repositories and Open Access},
YEAR = {2015},
ABSTRACT = {The work measures grey citations in the years 2012, 2013 and 2014 and then describes the features of GL documents cited in different areas of knowledge: Computational Linguistics, Computer Science and Engineering. With the aim to survey a wide and varied range of resources, we selected a sample data based on the bibliographic references of articles contained in 4 journals-all indexed by the ISI Web of Science and with an Impact Factor over the last three years-and two proceedings of international conferences held in 2012 and 2014},
KEYWORDS = {Grey Literature, Digital Repositories, Open Access},
PAGES = {109-110},
URL = {http://greyguide.isti.cnr.it/attachments/category/27/GL17_Program_Book.pdf},
ISBN = {978-90-77484-26-5},
CONFERENCE_NAME = {Seventeenth International Conference on Grey Literature. A New Wave of Textual and Non-Textual Grey Literature},
BOOKTITLE = {GL17 Program Book},
EDITOR = {Farace, D. and Frantzen, J.},
}
@INPROCEEDINGS{GOGGI_2015_INPROCEEDINGS_GPBFMMDB_307398,
AUTHOR = {Goggi, S. and Pardelli, G. and Bartolini, R. and Frontini, F. and Monachini, M. and Manzella, G. and De Mattei, M. and Bustaffa, F.},
TITLE = {A semantic engine for grey literature retrieval in the oceanography domain},
YEAR = {2015},
ABSTRACT = {Here we present the final results of MAPS (Marine Planning and Service Platform), an environment designed for gathering, classifying, managing and accessing marine scientific literature and data, making it available for search to Operative Oceanography researchers of various institutions by means of standard protocols. In previous publications the general architecture of the system as well as the set of metadata (Common Data Index) used to describe the documents were presented [3]; it was shown how individual oceanographic data-sets could be indexed within the MAPS library by types of measure, measurement tools, geographic areas, and also linked to specific textual documentation. Documentation is described using the current international standards: Title, Authors, Publisher, Language, Date of publication, Body/Institution, Abstract, etc.; serial publications are described in terms of ISSN, while books are assigned ISBN; content of various types on electronic networks is described by means of doi and url. Each description is linked to the document. Thanks to this, the MAPS library already enables researchers to go from structured oceanographic data to documents describing it. But this was not enough: documents may contain important information that has not been encoded in the metadata. Thus an advanced Search Engine was put in place that uses semantic-conceptual technologies in order to extract key concepts from unstructured text such as technical documents (reports and grey literature) and scientific papers and to make them indexable and searchable by the end user in the same way as the structured data (such as oceanographic observations and metadata) is. More specifically once a document is uploaded in the MAPS library, key domain concepts in documents are extracted via a natural language processing pipeline and used as additional information for its indexing. 
The key term identification algorithm is based on marine concepts that were pre-defined in a domain ontology, but crucially it also allows for the discovery of new related concepts. So for instance starting from the domain term salinity, related terms such as sea salinity and average sea salinity will also be identified as key terms and used for indexing and searching documents. A hybrid search system is then put in place, where users can search the library by metadata or by free text queries. In the latter case, the NLP pipeline performs an analysis of the text of the query, and when key concepts are matched, the relevant documents are presented. The results may be later refined by using other structured information (e. g. date of publication, area,.). Currently a running system has been put in place, with data from satellites, buoys and sea stations; such data is documented and searchable by its relevant metadata and documentation. Results of quantitative evaluation in terms of information retrieval measures will be presented in the poster; more specifically, given an evaluation set defined by domain experts and composed of pre-defined queries together with documents that answer such queries, it will be shown how the system is highly accurate in retrieving the correct documents from the library. Though this work focuses on oceanography, its results may be easily extended to other domains; more generally, the possibility of enhancing the visibility and accessibility of grey literature via its connection to the data it describes and to an advanced full text indexing are of great relevance for the topic of this conference},
KEYWORDS = {Information Extraction, Search Engine, Oceanography},
PAGES = {76-77},
URL = {https://iris.cnr.it/handle/20.500.14243/307398},
ISBN = {978-90-77484-26-5},
CONFERENCE_NAME = {Seventeenth International Conference on Grey Literature. A New Wave of Textual and Non-Textual Grey Literature},
BOOKTITLE = {GL17 Program Book},
EDITOR = {Farace, D. and Frantzen, J.},
}
@INPROCEEDINGS{MONTEMAGNI_2015_INPROCEEDINGS_MWN_353725,
AUTHOR = {Montemagni, S. and Wieling, M. and Nerbonne, J.},
TITLE = {The contribution of dialectometry to the study of the dialects of Italy. A case study on Tuscan},
YEAR = {2015},
ABSTRACT = {We will illustrate the extent to which the recent advances of dialectometry can help to gain insight into the nature of linguistic variation—both synchronically and diachronically—in the study of the dialects of Tuscany, which have a special status in the complex puzzle of Italian dialects. This will be done by discussing the results achieved in a case study carried out over the last five years based on the corpus of dialectal data of the Atlante Lessicale Toscano ('Lexical Atlas of Tuscany', henceforth ALT, Giacomelli et al., 2000), a regional linguistic atlas focusing on dialectal variation throughout Tuscany, a region where both Tuscan and non-Tuscan dialects are spoken},
KEYWORDS = {dialectometry, lexical atlas, italian dialects, Tuscany, Atlante Lessicale Toscano},
URL = {http://media.leidenuniv.nl/legacy/montemagni-wieling-nerbonne.pdf},
CONFERENCE_NAME = {Italian Dialect Meeting 2015 \& CIDSM X},
}
@INPROCEEDINGS{PICCIOLI_2015_INPROCEEDINGS_PDGZA_382000,
AUTHOR = {Piccioli, A. and Di Donato, F. and Giacomi, D. and Zitarosa, R. and Aiola, C.},
TITLE = {Linked Open Data per le Digital Humanities: l'esempio del Linked Open Data PORTAL},
YEAR = {2015},
ABSTRACT = {Il Linked Open Data PORTAL (o LODPORTAL) è stato sviluppato all'interno del progetto europeo (CIP-ICT-PSP) Agorà-Scholarly Open Access Research in European Philosophy. Pur essendo ancora un prototipo, l'applicazione, rilasciata con licenze open source, presenta un uso innovativo delle tecnologie Linked Data applicate all'ambito delle Digital Humanities. Associata all'impiego di tecnologie del Semantic Web, la combinazione di risorse provenienti da diversi content provider offre al ricercatore strumenti innovativi per la creazione, il riuso, la fruizione e la visualizzazione dei contenuti. In particolare, il LODPORTAL raccoglie e indicizza risorse provenienti da dieci biblioteche digitali, create dai gruppi di ricerca afferenti al progetto Agorà e dalla cosiddetta Linked Open Data Cloud (dbpedia e freebase) e include un modulo, basato su Pundit, per l'estrazione automatica di entità e l'arricchimento semantico manuale. Grazie all'indicizzazione semantica, l'interfaccia di navigazione offre alcune visualizzazioni avanzate, tra cui la timeline, il grafo delle persone e una mappa dei luoghi citati e associati alle risorse delle biblioteche digitali},
URL = {https://iris.cnr.it/handle/20.500.14243/382000},
}
@INPROCEEDINGS{VENTURI_2015_INPROCEEDINGS_VRMSTFB_304238,
AUTHOR = {Venturi, G. and Rinnone, S. and Montemagni, S. and Sassi, M. and Terranova, G. and Flore, E. and Bellandi, T.},
TITLE = {Language technologies for automatic readability assessment of health-related Information: a preliminary investigation into the informed consent forms used in a regional health service},
YEAR = {2015},
ABSTRACT = {Rationale: Within an information society, where everyone should be able to access all available information, improving access to written language is becoming more and more a central issue. This is the case for health-related information which should be accessible to all members of the society, including people who have reading difficulties as a result of a low education level or of language-based learning disabilities or because the language of the text is not their native language. Moreover, the breakdown of doctor-patient communication is one of the most frequent causes of adverse events. Research questions: We conducted a preliminary investigation to assess the readability of a corpus of informed consent forms used before a clinical procedure in the hospitals of a Regional Healthcare Service. Secondary goals include the comparison of readability across specialties and healthcare trusts. Methods: Providing complex scientific information in a way that is comprehensible to a lay person is a challenge that nowadays can be addressed by resorting to advanced Natural Language Processing (NLP) techniques, which make it possible to monitor the linguistic complexity of texts at the syntactic and lexical levels and to support their simplification, whenever needed. The study has been carried out by combining NLP-enabled feature extraction and state-of-the-art machine learning algorithms. To this end we used READ-IT, the first NLP-based readability assessment tool for Italian. Results: We analysed 584 documents, covering 29 specialties, for a total of 607,790 word tokens, currently used at the 36 public hospitals in Tuscany. Although the readability level of all documents in the corpus is low, both at the lexical and syntactic level, significant differences can be observed between specialties and healthcare trusts releasing the forms. 
With the readability level ranging between 0 (easy-to-read) and 100 (difficult-to-read), it resulted that the pediatric informed consent documents are the most easy-to-read forms (with an average score of 75) while the most difficult-to-read documents are documents of the surgical area (whose average score is 80) (standard deviation 2). Discussion: The state of the art resulting from this preliminary study shows that NLP-based readability assessment tools can help to measure the linguistic complexity of informed consent forms and guide the editor to identify linguistically complex passages that need to be simplified, either syntactically or lexically. The use of an assessment tool designed for the general language is the main limitation of the study and should be addressed through the customization of the tool to assess the readability of the healthcare jargon. A further step of the research will also consider the design of guidance to prepare readable informed consent forms},
KEYWORDS = {Readability assessment, health-related information},
URL = {http://static1.squarespace.com/static/561c0d01e4b0b5ad2e65cc48/t/561d44dfe4b089431662d174/1444758751213/LibrettoProgramma.pdf},
CONFERENCE_NAME = {ISCOME 2015 Conference: "The Golden Bridge: Communication and Patient Safety"},
}
@TECHREPORT{ALBANESI_2015_TECHREPORT_ABBG_350492,
AUTHOR = {Albanesi, D. and Bellandi, A. and Benotto, G. and Giovannetti, E.},
TITLE = {Applicazione Web Linguistico-Computazionale per il Progetto di Traduzione del Talmud Babilonese-Rapporto tecnico 7},
YEAR = {2015},
ABSTRACT = {Il presente documento descrive lo stato di avanzamento del lavoro condotto dall'Istituto di Linguistica Computazionale "A. Zampolli" del CNR (ILC-CNR) nel contesto del progetto "Traduzione del Talmud Babilonese" (vedi sezione "Pubblicazioni relative al PTTB") in italiano nei mesi di luglio, agosto, settembre e ottobre 2015. Quanto qui descritto costituisce un "Rapporto sullo Stato di Avanzamento dei Lavori (SAL) dell'applicazione Web" unicamente da parte dell'ILC-CNR e si configura come il settimo dei fascicoli previsti a cadenza quadrimestrale},
URL = {https://iris.cnr.it/handle/20.500.14243/350492},
}
@TECHREPORT{ALBANESI_2015_TECHREPORT_ABBG_350489,
AUTHOR = {Albanesi, D. and Bellandi, A. and Benotto, G. and Giovannetti, E.},
TITLE = {Applicazione Web Linguistico-Computazionale per il Progetto di Traduzione del Talmud Babilonese-Rapporto tecnico 5},
YEAR = {2015},
ABSTRACT = {Il presente documento descrive lo stato di avanzamento del lavoro condotto dall'Istituto di Linguistica Computazionale "A. Zampolli" del CNR (ILC-CNR) nel contesto del progetto "Traduzione del Talmud Babilonese" in italiano. Quanto qui descritto costituisce un "Rapporto sullo Stato di Avanzamento dei Lavori (SAL) dell'applicazione Web" unicamente da parte dell'ILC-CNR e si configura come il quinto dei fascicoli previsti a cadenza quadrimestrale},
URL = {https://iris.cnr.it/handle/20.500.14243/350489},
}
@TECHREPORT{ALBANESI_2015_TECHREPORT_ABBG_350491,
AUTHOR = {Albanesi, D. and Bellandi, A. and Benotto, G. and Giovannetti, E.},
TITLE = {Applicazione Web Linguistico-Computazionale per il Progetto di Traduzione del Talmud Babilonese-Rapporto tecnico 6},
YEAR = {2015},
ABSTRACT = {Il presente documento descrive lo stato di avanzamento del lavoro condotto dall'Istituto di Linguistica Computazionale "A. Zampolli" del CNR (ILC-CNR) nel contesto del progetto "Traduzione del Talmud Babilonese" in italiano [1, 2, 3]. Quanto qui descritto costituisce un "Rapporto sullo Stato di Avanzamento dei Lavori (SAL) dell'applicazione Web" unicamente da parte dell'ILC-CNR e si configura come il sesto dei fascicoli previsti a cadenza quadrimestrale},
URL = {https://iris.cnr.it/handle/20.500.14243/350491},
}
@TECHREPORT{CARLINO_2015_TECHREPORT_CMPPT_317819,
AUTHOR = {Carlino, M. and Moroni, D. and Pardini, F. and Pieri, G. and Tampucci, M.},
TITLE = {MobiWallet-Dissemination pack (2nd Generation)},
YEAR = {2015},
ABSTRACT = {This deliverable is an update of the first dissemination pack and describes all the activities carried out towards an optimal dissemination of project aims and achievements. In addition, it contains and discusses the second generation of all the dissemination material that has been prepared during the second ten months of project life},
KEYWORDS = {Intelligent Transportation System, Integrated fare management, Dissemination},
PAGES = {96},
URL = {https://iris.cnr.it/handle/20.500.14243/317819},
}
@TECHREPORT{CARLINO_2015_TECHREPORT_CMPPT_324586,
AUTHOR = {Carlino, M. and Moroni, D. and Pardini, F. and Pieri, G. and Tampucci, M.},
TITLE = {Mobility and Transport Digital Wallet},
YEAR = {2015},
ABSTRACT = {This deliverable is an update of the first dissemination pack and describes all the activities carried out towards an optimal dissemination of project aims and achievements. In addition, it contains and discusses the second generation of all the dissemination material that has been prepared during the second ten months of project life},
KEYWORDS = {Intelligent Transportation System, Integrated fare management, Dissemination},
URL = {https://iris.cnr.it/handle/20.500.14243/324586},
}
@TECHREPORT{CARLINO_2015_TECHREPORT_CMPTFA_286592,
AUTHOR = {Carlino, M. and Moroni, D. and Pardini, F. and Tampucci, M. and Fell, M. and Arrazola, J.},
TITLE = {MobiWallet-Dissemination Pack (1st Generation)},
YEAR = {2015},
ABSTRACT = {This deliverable describes all the activities carried out towards an optimal dissemination of project aims and achievements. In addition, it contains and discusses the first generation of all the dissemination material that has been prepared during the first ten months of project life; Progetto: Mobility and Transport Digital Wallet Acronimo: MobiWallet Tipo Progetto: EU},
KEYWORDS = {Intelligent Transportation System, Integrated fare management, Dissemination},
PAGES = {1-43},
URL = {https://iris.cnr.it/handle/20.500.14243/286592},
}
@TECHREPORT{CUCURULLO_2015_TECHREPORT_C_316210,
AUTHOR = {Cucurullo, S.},
TITLE = {Sviluppo di funzioni software per il recupero di testi dell'Archivio Testuale dell'ILC e conversione in un formato di rappresentazione XML/TEI},
YEAR = {2015},
ABSTRACT = {This report describes the activities carried out under the Operating Agreement on the development of software functions for the recovery of Archives Textual ILC texts and conversion to a format of XML /TEI representation, stipulated in the Agreement Scientific Collaboration ILC-CNR-Accademia della Crusca. In particular, the report focuses on the following subject of the Operating Agreement: 1. definition of a format of XML /TEI representation that takes into account on the one hand the type of annotations in the source text and the other of the analysis and processing to which the converted text will have to be subjected; 2. development of procedures for converting the format of "Periodici Milanesi" to the XML format / TEI and verification of the results by parsing XML. The report traces the different phases of the work, with a focus archive textual analysis of departure and the results achieved, to get to a discussion of the issues that remain open at the time and the developments that can be envisaged for such activities},
KEYWORDS = {banca-dati testuale, Periodici Milanesi},
PAGES = {43},
URL = {https://iris.cnr.it/handle/20.500.14243/316210},
}
@TECHREPORT{CUCURULLO_2015_TECHREPORT_C_316211,
AUTHOR = {Cucurullo, S.},
TITLE = {Sviluppo di funzioni software per il recupero di testi dell'Archivio Testuale dell'ILC e conversione in un formato di rappresentazione XML/TEI Fase 2},
YEAR = {2015},
ABSTRACT = {This report documenting the activities under the Operating Agreement on the development of software functions for the recovery of Archives Textual ILC texts and conversion to a format of XML/TEI representation, stipulated in the Agreement Scientific Collaboration ILC-CNR-Accademia della Crusca. In particular, this report focuses on the following object of the Operating Agreement: "Development of conversion procedures from DBT format to XML / TEI format, according to the indications contained in the Report on the Phase 1 and verification of the results by parsing XML consists of the corpus 800 and '900 of extract text from Heritage Textual ILC, the Its composition has been agreed upon with Accademia della Crusca. Many of the solutions adopted for that type of texts has been chosen to be used in texts lemmatized, as in the case of works by Italian authors of the nineteenth and twentieth centuries. The general structure of the TEI XML document header and body and the definition of the main TAG used is shared by both the text of this Corpus that those lemmatized Periodici Milanesi, where we started because they were significantly more cases of encodings and simultaneously a format earliest time origin. It is indeed formats and storage media prior to the era of personal computers and who have already undergone the transformation from EBCDIC to ASCII},
KEYWORDS = {Archivi Testuali},
PAGES = {21},
URL = {https://iris.cnr.it/handle/20.500.14243/316211},
}
@TECHREPORT{DELGROSSO_2015_TECHREPORT_D_350039,
AUTHOR = {Del Grosso, A. M.},
TITLE = {Relazione attività di ricerca Clavius on The Web},
YEAR = {2015},
ABSTRACT = {La ricerca condotta dal Dott. Angelo Mario Del Grosso, di cui si sintetizzano i risultati in questo documento, è stata svolta presso l'Istituto di Linguistica Computazionale "A. Zampolli" durante il periodo Marzo 2013-Marzo 2015 in relazione all'assegno di ricerca bando n. 126.048/ASS.003.2013.PI del 07-03-2013 Protocollo ILC n. 0000285, sotto la responsabilità scientifica del Dott. Emiliano Giovannetti e nell'ambito del progetto "Clavius on The Web" finanziato da Registro.it},
KEYWORDS = {digital humanities, computational philology, software engineering, Clavius on The Web},
URL = {http://claviusontheweb.it},
}
@TECHREPORT{DELGROSSO_2015_TECHREPORT_D_348344,
AUTHOR = {Del Grosso, A. M.},
TITLE = {Attività e ricerche svolte nell'ambito del dottorato},
YEAR = {2015},
ABSTRACT = {L'attività di ricerca scientifica, effettuata dall'Ing. Angelo Mario Del Grosso nell'ambito del corso di dottorato di ricerca in Ingegneria dell'Informazione, si è svolta nel settore della progettazione e dello sviluppo di metodologie e di sistemi software in grado di soddisfare le necessità degli studiosi di risorse documentarie. In particolare, il lavoro si inserisce nel contesto degli studi di Digital Humanities per la produzione di edizioni digitali e per la critica del testo, in ambito computazionale e collaborativo},
KEYWORDS = {Digital Humanities, Software Engineering},
URL = {https://iris.cnr.it/handle/20.500.14243/348344},
}
@TECHREPORT{MARZI_2015_TECHREPORT_M_290723,
AUTHOR = {Marzi, C.},
TITLE = {Word knowledge and word usage-Representations and processes in the mental lexicon},
YEAR = {2015},
ABSTRACT = {The final NetWordS Conference, held on the 30th and 31st of March, and 1st of April 2015 in Pisa, was convened by Prof. Pier Marco Bertinetto, Dr. Vito Pirrelli and Dr. Claudia Marzi, and brought together 91 participants (scholars, Post-Docs, PhD students) from numerous European, and some non-European, countries. A 3-day schedule involved all participants in a focused, cross-disciplinary discussion on representations and processes in the mental lexicon. People are known to understand, memorise and parse words in a context-sensitive, opportunistic way, by caching their most habitual and productive processing patterns into routinized behavioural schemes, similarly to what we observe for sequences of coordinated motor acts. Speakers, however, do not only take advantage of token-based information such as frequency of individual, holistically stored words, or episodic memories of word usage, but they are also able to organise stored word forms through abstract paradigmatic structures (or word families) whose overall size and distribution are important determinants of lexical categorisation, inference and productivity. Lexical organisation is, in fact, not necessarily functional to descriptive economy and minimisation of storage, but appears to be influenced by more dynamic, communication-oriented functions such as memorisation, prediction-based recognition and production. Lending support to this view, usage-based approaches to word processing have recently offered novel explanatory frameworks that capitalise on the stable correlation patterns between lexical representations on the one hand and process-based operations that make representations functional to communicative exchanges on the other hand. 
By focusing on the battery of cognitive functions supporting verbal communication (ranging from input recoding to rehearsal, access, recall and coactivation) and by exploring their psycholinguistic correlates and neuroanatomical substrates, these approaches promote a new view of language architecture as an emergent property of the interaction between language-specific input conditions and low-level, domain-specific cognitive predispositions},
KEYWORDS = {word knowledge, word usage, mental lexicon, interdisciplinary approach},
PAGES = {2-12},
URL = {http://www.networds-esf.eu/uploads/NetWordS/Science_Meeting_Scientific_Report_5810.pdf},
}
@TECHREPORT{SASSOLINI_2015_TECHREPORT_S_335264,
AUTHOR = {Sassolini, E.},
TITLE = {Strategie per la conversione in XML-TEI dei testi della biblioteca di Galileo},
YEAR = {2015},
ABSTRACT = {Descrizione delle attività svolte nell'ambito dell'accordo di collaborazione scientifica tra ILC-CNR e Museo Galileo di Firenze, per la conversione di tutti i testi presenti nella biblioteca Galileiana in Edizione FAVARO, in un formato standard di rappresentazione (XML TEI)},
URL = {https://iris.cnr.it/handle/20.500.14243/335264},
}
@THESIS{DELGROSSO_2015_THESIS_D_308098,
AUTHOR = {Del Grosso, A. M.},
TITLE = {Designing a Library of Components for Textual Scholarship},
YEAR = {2015},
ABSTRACT = {The present work is the result of the research activity carried out during my PhD studies. This thesis addresses the application of new technologies, computer science methodologies, and software design principles in the interdisciplinary and evolving field of DH-in other contexts known as Humanities Computing. In particular, this contribution highlights the specific needs entailed in collaborative literary computing and in digital textual scholarship. The source context especially concentrates on documents written in Latin, Greek and Arabic, or on documents in modern languages concerning historical and philological topics. In the specific, the research activity focuses on the design of a modular library (TSLib) dealing with scholarly sources for what regards their editing, processing, comparison, analysis, visualization and searching. The thesis explores the aforementioned topics across five chapters. Chapter 1 tracks the context of the digital textual scholarship and gives a summary of the objectives and the benefits of this research. Chapter 2 illustrates related works and similar initiatives, along with worth mentioning projects and outcomes in the area of Digital Humanities. Chapter 3 thoroughly describes and motivates the design process implemented. The process starts by describing well-known engineering principles and shows how they are applied for the digital textual domain and for the computational scholarly needs. Then, it continues introducing requirements, architecture and models of the proposed method. Design issues with regards to patterns and APIs are highlighted. The final part of this work (chapter 4) illustrates concrete results deriving from a number of research projects that, on the one hand, have contributed to the design of the library and, on the other hand, have based their work on it. Several topics have been discussed: (a) acquisition and text encoding, (b) alignment and variant annotation, and (c) multi-level annotation. 
In the conclusion, a few reflections and considerations are presented, together with suggestions for further studies (chapter 5)},
URL = {https://iris.cnr.it/handle/20.500.14243/308098},
}
@MISC{BARONI_2015_MISC_B_312490,
AUTHOR = {Baroni, P.},
TITLE = {2015-1-IT02-KA204-015090 DLDP: Interactive Web Site},
YEAR = {2015},
ABSTRACT = {Interactive Web site of DLDP-Digital Language Diversity Project (Erasmus Programme | Grant Agreement No. 2015-1-IT02-KA204-015090), powered by Drupal, developed in English, Italian, Basque, Finnish, French, German and Spanish},
KEYWORDS = {Sito web},
URL = {http://www.dldp.eu},
}
@MISC{BARONI_2015_MISC_B_461445,
AUTHOR = {Baroni, P.},
TITLE = {CLARIN-IT Web Site},
YEAR = {2015},
ABSTRACT = {Web Site of the CLARIN-IT National Consortium, powered by Drupal, developed in English and Italian},
KEYWORDS = {CLARIN, National Consortium},
URL = {https://www.clarin-it.it},
}
@MISC{BARONI_2015_MISC_B_461458,
AUTHOR = {Baroni, P.},
TITLE = {LaRI Web Site},
YEAR = {2015},
ABSTRACT = {Web site of CNR-ILC Research Group "LaRI-Language Resources and Infrastructures", powered by WordPress, developed in Italian and English},
KEYWORDS = {risorse linguistiche, infrastrutture linguistiche},
URL = {http://lari.ilc.cnr.it},
}
@MISC{BRANDO_2015_MISC_BFAG_300554,
AUTHOR = {Brando, C. and Frontini, F. and Abi Haidar, A. and Ganascia, J.},
TITLE = {Reconnaissance d'entités nommées: adaptation au domaine de la littérature française du XIXe siècle},
YEAR = {2015},
ABSTRACT = {La reconnaissance d'entités nommées (REN) est un enjeu fondamental pour la recherche en humanités numériques (HN). En littérature française, il est particulièrement important de repérer des entités telles que les auteurs, les personnages fictifs, les lieux géographiques et imaginaires, les titres d'ouvrages, les marqueurs temporels, entre autres. Actuellement, il existe peu de corpus de littérature française du passé annotés et disponibles en ligne. Le coût élevé de l'annotation manuelle motive donc l'utilisation de méthodes automatiques. Les approches REN de l'état de l'art fonctionnent efficacement sur des corpus journalistiques et de littérature scientifique en biologie [1]. Néanmoins, l'adaptation à un nouveau domaine semble affecter négativement la performance de ces approches [5]. La diversité des textes en littérature (fiction, critique, théâtre...) et la spécificité des époques prises en compte représentent un travail considérable d'adaptation des ressources linguistiques et des algorithmes à un domaine particulier. En général, les thèmes traités sont hétérogènes et les textes possèdent un style fréquemment caractérisé par un bas degré de standardisation et de prédictibilité. Il est par exemple difficile d'identifier des mentions candidates car les conventions typographiques et le registre linguistique varient selon le domaine (textes journalistiques vs. littérature française)},
KEYWORDS = {entités nommées, littérature française},
URL = {https://iris.cnr.it/handle/20.500.14243/300554},
CONFERENCE_NAME = {8es Journées Internationales de Linguistique de Corpus (JLC2015)},
}
@MISC{CININI_2015_MISC_CCM_370637,
AUTHOR = {Cinini, A. and Cutugno, P. and Marconi, L.},
TITLE = {Sviluppo di una banca dati strutturata di trascrizioni di parlato di singoli soggetti anziani monitorati nel tempo},
YEAR = {2015},
ABSTRACT = {The Institute of Computational Linguistics "Antonio Zampolli" of the National Research Council, ILC-CNR, as a partner of the Ninfa project "iNtelligent Integrated Network for Aged People" and within the WP3 "Analysis and test of implementation of cognitive deficit through the analysis of the language ", has created a structured database consisting of a body of recordings and transcripts of the individual elderly subjects monitored over time},
KEYWORDS = {Natural Language Processing, Cognitive Impairment, trattamento automatico del linguaggio, analisi del linguaggio},
URL = {https://iris.cnr.it/handle/20.500.14243/370637},
}
@MISC{DANCONA_2015_MISC_DBNFCBDM_344598,
AUTHOR = {D'Ancona, C. and Bozzi, A. and Nahli, O. and Farina, M. and Coda, E. and Boschetti, F. and Del Grosso, A. M. and Marchi, S.},
TITLE = {Banca dati testuale Greek into Arabic},
YEAR = {2015},
ABSTRACT = {Banca dati testuale con la codifica XML della pericopatura dei testi Greco-Arabo di alcuni trattati delle Enneadi di Plotino},
KEYWORDS = {Digital Humanities, Computational Philology, Greek into Arabic, http://g2a.ilc.cnr.it},
URL = {http://g2a.ilc.cnr.it/},
}
@MISC{DELGROSSO_2015_MISC_D_344096,
AUTHOR = {Del Grosso, A. M.},
TITLE = {Una applicazione Web per lo studio specialistico dei testi. Il modello adottato e i risultati fino ad oggi ottenuti},
YEAR = {2015},
ABSTRACT = {Il lavoro si concentra sulla realizzazione di una libreria di moduli software relativi ad una applicazione Web per la Textual Scholarship. Tale libreria è basata su un modello che considera la molteplicità degli approcci per analizzare un testo, soprattutto, ma non esclusivamente, antico. In questo quadro il modello prende in considerazione elementi di carattere filologico e linguistico fra i quali anche quelli che derivano dalla Linguistica computazionale. Dal momento che è impensabile che un sistema, sia pure complesso e articolato in sottosistemi, possa ambire a intervenire in qualunque punto della filiera delle analisi scientifiche sui testi, il lavoro è particolarmente apprezzabile perché impostato sulla base di una architettura informatica multi-modulare. In tal modo è possibile inserire nel sistema un cospicuo numero di moduli software ed è aperto alla possibilità di inserirne (o farne inserire) molti altri a seconda di specifiche necessità. Fra i moduli più significativi, sono già attivi quelli per: 1) l'annotazione di parti di testo (dalla singola parola ad una espressione completa, ecc.); 2) la classificazione delle annotazioni stesse secondo una tipologia indicata dall'utente (per esempio, annotazione di tipo semantico, morfologico, ontologico, ecc.); 3) la produzione di indici e concordanze; 4) l'allineamento fra testo e eventuale traduzione (antica o moderna); 5) l'estrazione di named entity (NER). Il modello e i moduli realizzati hanno mostrato grande efficacia in almeno 3 progetti: 1) Progetto PRIN 2008 "Edizione digitale dei manoscritti di F. de Saussure"; 2) Progetto ERC advanced grant "Greek into Arabic: Philosophical Concepts and Linguistic Bridges"; 3) Progetto "Traduzione Italiana del Talmud Babilonese". 
L'applicazione parzialmente già realizzata prevede un auspicabile sviluppo nei prossimi anni con sperimentazioni su testi manoscritti di autori moderni e contemporanei, oltre che su opere antiche e medievali per finalità di critica testuale, è interamente open source e sviluppata con l'utilizzo di standard internazionali, quali, tra l'altro, il sistema di mark-up TEI},
KEYWORDS = {computational philology, digital humanities, software engineering},
URL = {https://iris.cnr.it/handle/20.500.14243/344096},
}
@MISC{DELGROSSO_2015_MISC_D_350036,
AUTHOR = {Del Grosso, A. M.},
TITLE = {ClaviusLemmata},
YEAR = {2015},
ABSTRACT = {Software di lemmatizzazione per l'analisi linguistica delle lettere scritte in lingua latina, sviluppato in seno al progetto ClaviusOnTheWeb finanziato dal Registro.it e partecipato dal CNR attraverso due istituti (IIT e ILC) e dall'Archivio Storico della Pontificia Università Gregoriana (APUG)},
KEYWORDS = {digital humanities, computational philology, software engineering, computational linguistics},
URL = {https://github.com/angelodel80/ClaviusLemmata},
}
@MISC{DIDONATO_2015_MISC_D_408437,
AUTHOR = {Di Donato, F.},
TITLE = {Verso una scienza aperta? Nuovi modelli di comunicazione della ricerca},
YEAR = {2015},
ABSTRACT = {Presentazione alla Scuola Normale Superiore},
URL = {https://iris.cnr.it/handle/20.500.14243/408437},
}
@MISC{DIDONATO_2015_MISC_D_407995,
AUTHOR = {Di Donato, F.},
TITLE = {Rethinking the Role of Social Sciences and Humanities (SSH) in Horizon 2020: Towards a Reflective and Generative Perspective},
YEAR = {2015},
ABSTRACT = {Europeana e l'open science per il cultural heritage: un'introduzione},
URL = {https://iris.cnr.it/handle/20.500.14243/407995},
}
@MISC{DIDONATO_2015_MISC_D_408442,
AUTHOR = {Di Donato, F.},
TITLE = {Riusare i dati: limiti, possibilità, incentivi},
YEAR = {2015},
ABSTRACT = {Che cosa significa riusare i dati in ambito umanistico? Un esempio di ricerca},
URL = {https://iris.cnr.it/handle/20.500.14243/408442},
}
@MISC{FRONTINI_2015_MISC_F_295465,
AUTHOR = {Frontini, F.},
TITLE = {Indexing names in digital editions},
YEAR = {2015},
ABSTRACT = {This presentation outlines the work done on Named Entity Recognition and Linking in texts of French Literary criticism, highlighting the points of interest for what concerns the creation of enriched digital editions},
URL = {https://iris.cnr.it/handle/20.500.14243/295465},
}
@MISC{FRONTINI_2015_MISC_F_300594,
AUTHOR = {Frontini, F.},
TITLE = {Trattamento automatico del linguaggio per le Digital Humanities. Riconoscimento e disambiguazione di menzioni di autori in testi di critica letteraria},
YEAR = {2015},
ABSTRACT = {L'intervento scaturisce da una collaborazione tra ILC-CNR e il Labex OBVIL di Parigi. Lo scopo del progetto è quello di adattare ed estendere algoritmi di riconoscimento, classificazione e disambiguazione di entità nominate (in particolare menzioni di autori) nel "Corpus Critique", un insieme di testi di critica letteraria francese che il Labex OBVIL sta pubblicando in edizione digitale (formato TEI). Tali algoritmi si basano su approcci TAL supervisionati e non supervisionati e sfruttano massicciamente le basi di conoscenza, sia generiche (DBpedia) che di dominio, disponibili online sotto forma di linked data; lo scopo di tali lavori è di produrre risorse testuali annotate per facilitare la ricerca nell'ambito della storia della critica letteraria e della storia delle idee in generale. Durante il seminario verranno introdotti i formati e le risorse utilizzate, i criteri e le problematiche di annotazione emersi, e gli algoritmi di riconoscimento e disambiguazione di entità nominate sviluppati. Più in generale si cercherà di mostrare con alcuni casi di utilizzo quali siano i vantaggi di arricchire risorse testuali con questo livello di annotazione, nel più ampio contesto delle convergenze tra digital humanities e trattamento automatico del linguaggio. Link http://obvil.paris-sorbonne.fr/ https://github.com/cvbrandoe/REDEN/blob/master/README.md},
KEYWORDS = {Named-entity disambiguation, Centrality, Linked data, Data fusion, Digital humanities},
URL = {https://iris.cnr.it/handle/20.500.14243/300594},
CONFERENCE_NAME = {Seminario di Cultura Digitale},
}
@MISC{FRONTINI_2015_MISC_F_289092,
AUTHOR = {Frontini, F.},
TITLE = {What makes them different: the extraction of distinctive linguistic patterns for the protagonists of Molière's plays},
YEAR = {2015},
ABSTRACT = {Quantitative approaches to the study of style in literature are far from a modern novelty. They have however recently gained more and more popularity, not only among computer scientists and corpus linguistics, but also among some influential literary critics. The present panorama of quantitative techniques is very rich, but often confusing, with a plethora of denominations and methodologies often difficult to reconcile; computer scientists classify their work as stylometry or computational stylistics, while linguists may use the label corpus stylistics, and finally critics like Franco Moretti will talk about macro-analysis and distant reading. This talk will try first to identify the differences between these trends, distinguishing between corpus based and corpus driven approaches on the methodological side (Quiniou et al 2012), and (following Ramsey 2011) between experimental and hermeneutical approaches. Finally we will present ongoing work conducted at Labex OBVIL on syntactic pattern extraction from theatrical characters. The proposed approach, using correspondence analysis to extract distinctive traits for each character, is imagined rather as an hermeneutical tool, in the sense that it does not seek to demonstrate that two different characters have been endowed with significantly different stylistic traits by the playwright, but it does enable the visualisation of their relative distances and the extraction of those elements that make them distinct},
URL = {https://iris.cnr.it/handle/20.500.14243/289092},
CONFERENCE_NAME = {Cycle des séminaires ILES LIMSI},
}
@MISC{FRONTINI_2015_MISC_F_296549,
AUTHOR = {Frontini, F.},
TITLE = {Mining for characterising patterns in literature using correspondence analysis: an experiment on French novels},
YEAR = {2015},
ABSTRACT = {The talk presents and describes a bottom up methodology for the detection of stylistic traits in the syntax of literary texts. The extraction of syntactic patterns is performed blindly by a sequential pattern mining algorithm, while the identification of significant and interesting features is performed later by using correspondence analysis and filtering for the most contributive patterns},
KEYWORDS = {computational stylistics, French},
URL = {https://iris.cnr.it/handle/20.500.14243/296549},
CONFERENCE_NAME = {Göttingen Dialog in Digital Humanities},
}
@MISC{FRONTINI_2015_MISC_F_295960,
AUTHOR = {Frontini, F.},
TITLE = {Analyse et extraction des motifs syntaxiques dans la prose de Robert Challe et de ses apocryphes},
YEAR = {2015},
ABSTRACT = {Cette contribution présente une extraction et une analyse des motifs syntaxiques dans la prose de Robert Challe et de ses apocryphes. En particulier nous analysons les différences dans la syntaxe des contes originaux des Illustres Françaises et celle des contes apocryphes},
KEYWORDS = {Robert Challe, authorship attribution, stilistica computazionale},
URL = {http://obvil.paris-sorbonne.fr/sites/default/files/projets/analyse_motifs_syntaxiques_if_et_apocryphes.pdf},
CONFERENCE_NAME = {Robert Challe: approches numériques des questions d'auctorialité},
}
@MISC{GUADAGNINI_2015_MISC_G_268598,
AUTHOR = {Guadagnini, E.},
TITLE = {recensione: Denis Foulechat, Ethique chrétienne et philosophies antiques. Le Policratique de Jean de Salisbury, livres VI et VII, Édition critique par Charles Brucker, Genève, Droz, 2013, pp. 750 («Publications romanes et françaises», 260)},
YEAR = {2015},
KEYWORDS = {Filologia romanza, Volgarizzamenti},
URL = {https://iris.cnr.it/handle/20.500.14243/268598},
ISSN = {0390-0711},
}
@MISC{GUADAGNINI_2015_MISC_G_312041,
AUTHOR = {Guadagnini, E.},
TITLE = {Recensione: Andrea Bocchi, Il glossario di Cristiano da Camerino. Introduzione, edizione sinottica dei testimoni di Assisi, Fabriano, Fermo, Firenze, Londra e indici delle forme, 2 voll., Premessa di Alfredo Stussi, Padova, Libreriauniversitaria.it Edizioni, 2015, III 994},
YEAR = {2015},
KEYWORDS = {Linguistica italiana},
PAGES = {168-178},
URL = {https://iris.cnr.it/handle/20.500.14243/312041},
VOLUME = {61},
ISSN = {0585-4962},
}
@MISC{KHAN_2015_MISC_KB_298719,
AUTHOR = {Khan, A. F. A. and Boschetti, F.},
TITLE = {Restructuring a Taxonomy of Literary Themes and Motifs for More Efficient Querying},
YEAR = {2015},
ABSTRACT = {We present ongoing work on the restructuring of a taxonomy of literary themes and motifs on the basis of ontology design principles. The original taxonomy is part of a project in which epigraphic texts are tagged with items from the taxonomy, either on a line by line basis or on the basis of whole epigraphs at a time. These tags, then, describe the different themes or motifs that are contained within the text. The taxonomy was originally devised by domain experts and based on long standing traditions in literary analysis. Our work aims to make it easier to query these tagged texts by altering the structure of the taxonomy in order to make it more efficient for querying; while, at the same time, maintaining its ease of use by potential users. First of all we describe some of the features of the original taxonomy that make it difficult to use in querying. We go on to describe how we used principles from ontology design and informatics research to suggest ways to ameliorate these difficulties, and our efforts to preserve as much of the initial, intuitive, structure as possible. Finally, we discuss further work},
URL = {https://iris.cnr.it/handle/20.500.14243/298719},
}
@MISC{MANCINI_2015_MISC_MPDL_344597,
AUTHOR = {Mancini, L. and Pedretti, I. and Del Grosso, A. M. and Luzzi, D.},
TITLE = {Banca dati testuale codifica delle lettere Cristoforo Clavius},
YEAR = {2015},
ABSTRACT = {Banca dati testuale delle lettere di Cristoforo Clavio derivante dal lavoro di codifica fatto adottando il vocabolario XML e le linee guida della text encoding initiative (TEI). L'attività è frutto del progetto Clavius on The Web},
KEYWORDS = {digita, Cristoforo Clavio, computational philology, TEI-XML},
URL = {http://claviusontheweb.it},
}
@MISC{MARCHI_2015_MISC_MD_344191,
AUTHOR = {Marchi, S. and Del Grosso, A. M.},
TITLE = {Greek into Arabic philological Web platform},
YEAR = {2015},
ABSTRACT = {Piattaforma filologico-computazionale sviluppata nell'ambito del progetto ERC 2009 Advanced Grant n. 249431. Titolo: Greek into Arabic. Philosophical concepts and linguistic bridges},
KEYWORDS = {computational philology, digital humanities, ERC, Greek into Arabic},
URL = {http://g2a.ilc.cnr.it/},
}
@MISC{NAHLI_2015_MISC_N_370088,
AUTHOR = {Nahli, O.},
TITLE = {Aggiornamenti banca dati del Motore morfologico Aramorph},
YEAR = {2015},
ABSTRACT = {AraMorph's components are essentially two: the rule engine for morphological analysis and a repository of linguistic resources mainly composed of three lexicons: i) the dictStems lexicon, which contains 38,600 lemmas; ii) the dictPrefixes lexicon, which consists of sequences of proclitics and inflectional prefixes; iii) the dictSuffixes lexicon, which consists of sequences of inflectional suffixes and enclitics. These lexica are accompanied by three compatibility tables used for checking combinations of A (proclitics prefixes), B (stems) and C (suffixes enclitics). To cut down on Arabic parse overgeneration, one has to enforce further restrictions in compatibility tables, e.g. the verb's ability to accept nominative and accusative pronouns, and to select a rational subject. We then augmented verb entries with subcategorization information such as case assignment and the restriction on rational subjects. At the same time, it was necessary to update compatibility tables},
KEYWORDS = {analisi morfo-sintattica, Lingua araba, Aramorph},
URL = {https://iris.cnr.it/handle/20.500.14243/370088},
}
@MISC{NAHLI_2015_MISC_N_370083,
AUTHOR = {Nahli, O.},
TITLE = {Banca dati dell'analisi morfo-sintattica del testo "Aflūṭīn ʻinda al-ʻArab", ʻAbd al-Raḥmān Badawī, Cairo 1955, 1966},
YEAR = {2015},
ABSTRACT = {Banca dati testuali con l'analisi morfo-sintattica del testo "Aflūṭīn ʻinda l-ʻArab"; editore ʻA. Badawī, Dār al-Nahḍat al-ʻarabiyya, Cairo 1966},
KEYWORDS = {analisi morfo-sintattica, Lingua araba, Greek Into Arabic},
URL = {http://g2a.ilc.cnr.it:8080/Teologia_Wapp/Home.xhtml?centerPage=teologia},
}
@MISC{PICCINI_2015_MISC_PB_370148,
AUTHOR = {Piccini, S. and Bellandi, A.},
TITLE = {Saussure's Lexicon-RDF version},
YEAR = {2015},
ABSTRACT = {Ferdinand de Saussure's Lexicon},
URL = {https://iris.cnr.it/handle/20.500.14243/370148},
}
@MISC{SORIA_2015_MISC_S_294066,
AUTHOR = {Soria, C.},
TITLE = {Towards an Alliance for Digital Language Diversity: Vision, Goals, and Challenges},
YEAR = {2015},
ABSTRACT = {In order to foster the world's digital language diversity, and to ensure equal digital opportunities for languages, we encourage the creation of an Alliance for Digital Language Diversity, i. e. a network of different stakeholders involved in the creation and deployment of data. The Alliance needs-and presupposed-educational activities aimed at building the necessary digital skills and creating the psychological self-confidence necessary for speakers to produce data using their mother tongue},
KEYWORDS = {digital language diversity, less-resourced languages, minority languages, digital rights, data production},
URL = {https://iris.cnr.it/handle/20.500.14243/294066},
CONFERENCE_NAME = {Ugra Global Expert Meeting on Multilingualism in Cyberspace},
}
@ARTICLE{BRUNATO_2014_ARTICLE_BV_245146,
AUTHOR = {Brunato, D. and Venturi, G.},
TITLE = {Le tecnologie linguistico-computazionali nella misura della leggibilità di testi giuridici},
YEAR = {2014},
ABSTRACT = {This paper presents an innovative NLP-based methodology for automatically assessing the readability of legal documents, with a view to their simplification. As part of a broader research field investigating the accessibility of the language of the law, we consider the specific domain of the bureaucratic language through an analysis of real texts; the accessibility to this typology of texts is indeed a crucial requisite of the communication between institutions and citizens. To the best of our knowledge, this is the first attempt aimed at showing that state-of-the-art language technologies are nowadays mature not only to enable the automatic readability evaluation of legal texts but also to support their simplification. For these purposes, we adopted READ-IT, the first advanced readability assessment tool for the Italian language},
PAGES = {111-142},
URL = {https://iris.cnr.it/handle/20.500.14243/245146},
VOLUME = {XXIII (1)},
ISSN = {0390-0975},
JOURNAL = {INFORMATICA E DIRITTO},
}
@ARTICLE{BURGASSI_2014_ARTICLE_B_284555,
AUTHOR = {Burgassi, C.},
TITLE = {Le projet DiVo et ses corpus: une base de données italo-latine de traductions médiévales},
YEAR = {2014},
ABSTRACT = {Il contributo espone i criteri guida per la costituzione delle due banche dati del progetto DiVo ("Dizionario dei volgarizzamenti") e mette in luce, anche attraverso l'esemplificazione di casi emblematici, l'impatto del progetto nell'ambito degli studi sul lessico dell'Italiano antico},
KEYWORDS = {Lessicologia, Volgarizzamenti, Digital Humanities},
URL = {https://iris.cnr.it/handle/20.500.14243/284555},
VOLUME = {18 (1)},
ISSN = {1954-3093},
JOURNAL = {BULLETIN DU CENTRE D'ÉTUDES MÉDIÉVALES D'AUXERRE},
}
@ARTICLE{BURGASSI_2014_ARTICLE_BG_256342,
AUTHOR = {Burgassi, C. and Guadagnini, E.},
TITLE = {Prima dell'«indole». Latinismi latenti dell'italiano},
YEAR = {2014},
ABSTRACT = {This contribution is one of the studies that are part of the DiVo project (Dizionario dei Volgarizzamenti), hosted by the Opera del vocabolario italiano (CNR) and by the Scuola normale superiore di Pisa, and aims at recognizing the special kind of latinisms that are found in the Italian language. The definition of "hidden" (latenti) applies to loanwords from Latin that are, on the one hand, common in contemporary Italian and that, on the other hand, were generally speaking poorly attested or even unknown in the past. These latinisms are therefore in the medieval vernacular language a minor and deliberate lexical choice, which reached, in the modern age, the linguistic standard currently in use. The data concerning the first attestation of a word is therefore examined in close connection with the stylistic change of the word itself over time, according to the results of an analysis of the available documentation. The class of "hidden" latinisms, defined in this way, is then described in its inner articulations. Three lexical sub-categories can be singled out: the essay examines one in particular, retracing the history of the word indole. Specifically, starting from the valuable evidence testimony of the translations in vernacular language, archeological research on the word indole focuses on the phases before its lexical confirmation and its modern semantic definition},
KEYWORDS = {Lessico, Lessicografia, Lingua Italiana, Latinismi, Progetto DiVo},
PAGES = {5-43},
URL = {https://iris.cnr.it/handle/20.500.14243/256342},
VOLUME = {31},
ISSN = {0392-5218},
JOURNAL = {STUDI DI LESSICOGRAFIA ITALIANA},
}
@ARTICLE{CHERSI_2014_ARTICLE_CFPP_256840,
AUTHOR = {Chersi, F. and Ferro, M. and Pezzulo, G. and Pirrelli, V.},
TITLE = {Topological Self-Organization and Prediction Learning Support Both Action and Lexical Chains in the Brain},
YEAR = {2014},
ABSTRACT = {A growing body of evidence in cognitive psychology and neuroscience suggests a deep interconnection between sensory-motor and language systems in the brain. Based on recent neurophysiological findings on the anatomo-functional organization of the fronto-parietal network, we present a computational model showing that language processing may have reused or co-developed organizing principles, functionality, and learning mechanisms typical of premotor circuit. The proposed model combines principles of Hebbian topological self-organization and prediction learning. Trained on sequences of either motor or linguistic units, the network develops independent neuronal chains, formed by dedicated nodes encoding only context-specific stimuli. Moreover, neurons responding to the same stimulus or class of stimuli tend to cluster together to form topologically connected areas similar to those observed in the brain cortex. Simulations support a unitary explanatory framework reconciling neurophysiological motor data with established behavioral evidence on lexical acquisition, access, and recall},
KEYWORDS = {Motor chains, Lexical chains, Serial working memory, Computational modeling, Self-organizing maps, Somatotopic organization, Prediction},
PAGES = {476-491},
URL = {http://onlinelibrary.wiley.com/doi/10.1111/tops.12094/abstract?deniedAccessCustomisedMessage=\&userIsAuthenticated=false},
VOLUME = {6 (3)},
DOI = {10.1111/tops.12094},
ISSN = {1756-8757},
JOURNAL = {TOPICS IN COGNITIVE SCIENCE},
}
@ARTICLE{CUTUGNO_2014_ARTICLE_CMGCM_245096,
AUTHOR = {Cutugno, P. and Marconi, L. and Morgavi, G. and Chiarella, D. and Morando, M.},
TITLE = {Analysis of new collaborative writing within Web 2.0},
YEAR = {2014},
ABSTRACT = {In recent years, the transition from Web 1.0 to Web 2.0 enabled the creation of content by the users of the Network: social networks, blogs, forums, chats and wikis have arisen. Phenomena, such as collaborative/collective writing, already born at the beginning of the 20th century, found their natural setting, a wide audience of reference of writers and readers in multiple languages within the Web 2.0. In this paper our goal is to verify if and how the characteristics of the textual analysis of narrative plots can be used for the analysis of collaborative narrative texts. In particular, we will check if features like correctness, completeness, consistency and coherence together with tools for statistical analysis of language suitable for analysing the new collaborative writing 2.0},
PAGES = {91-97},
URL = {https://iris.cnr.it/handle/20.500.14243/245096},
VOLUME = {22},
ISSN = {1790-5109},
JOURNAL = {RECENT ADVANCES IN COMPUTER ENGINEERING},
}
@ARTICLE{DEFELICE_2014_ARTICLE_D_257265,
AUTHOR = {De Felice, I.},
TITLE = {«Possibilities of action» in language: affordances and verbal polysemy},
YEAR = {2014},
PAGES = {179-191},
VOLUME = {1},
JOURNAL = {RETI SAPERI LINGUAGGI},
}
@ARTICLE{DEFELICE_2014_ARTICLE_D_257266,
AUTHOR = {De Felice, I.},
TITLE = {La sinestesia linguistica nella poesia latina},
YEAR = {2014},
ABSTRACT = {The main purpose of this study is to explore linguistic synaesthesia in Latin poetic language. Through the analysis of a poetic corpus, which consists of works of Catullus, Horace, Lucretius, Ovid, Vergil, all occurrences of twenty Latin synaesthetic adjectives (previously extracted by Aeneid and De Rerum Natura) were retrieved; all lemmas co-occurring with these adjectives in nominal phrases were then classified into the following categories according to their meaning in context: monoaesthetic, synaesthetic (touch, temperature perception, taste, smell, sight, motion perception, hearing), pseudo-synaesthetic (i. e. psycho-moral), abstract. The research not only shows how much linguistic synaesthesia is present in Latin poetry, but also demonstrates that Latin synaesthesias comply with cross-linguistic tendencies, especially with regard to the hypothesis of directional hierarchy},
PAGES = {61-107},
VOLUME = {52 (1)},
JOURNAL = {STUDI E SAGGI LINGUISTICI},
}
@ARTICLE{DEFELICE_2014_ARTICLE_D_265428,
AUTHOR = {De Felice, I.},
TITLE = {From hands to handles: How objects' orientation affects grasp descriptions},
YEAR = {2014},
PAGES = {109-115},
URL = {http://www.neapolisanit.eu/neascience/wp-content/uploads/2014/12/ATTI_AISC_2014_ROMA2.pdf},
VOLUME = {5},
JOURNAL = {NEA SCIENCE},
}
@ARTICLE{DELLORLETTA_2014_ARTICLE_DMV_260898,
AUTHOR = {Dell'Orletta, F. and Montemagni, S. and Venturi, G.},
TITLE = {Assessing document and sentence readability in less resourced languages and across textual genres},
YEAR = {2014},
ABSTRACT = {In this paper, we tackle three underresearched issues of the automatic readability assessment literature, namely the evaluation of text readability in less resourced languages, with respect to sentences (as opposed to documents) as well as across textual genres. Different solutions to these issues have been tested by using and refining READ-IT, the first advanced readability assessment tool for Italian, which combines traditional raw text features with lexical, morpho-syntactic and syntactic information. In READ-IT readability assessment is carried out with respect to both documents and sentences, with the latter constituting an important novelty of the proposed approach: READ-IT shows a high accuracy in the document classification task and promising results in the sentence classification scenario. By comparing the results of two versions of READ-IT, adopting a classification-versus ranking-based approach, we also show that readability assessment is strongly influenced by textual genre; for this reason a genre-oriented notion of readability is needed. With classification-based approaches, reliable results can only be achieved with genre-specific models: Since this is far from being a workable solution, especially for less resourced languages, a new ranking method for readability assessment is proposed, based on the notion of distance},
KEYWORDS = {readability assessment, less resourced languages, multi-level linguistic annotation, textual genres},
PAGES = {163-193},
URL = {http://www.ingentaconnect.com/content/jbp/itl/2014/00000165/00000002/art00005},
VOLUME = {165 (2)},
DOI = {10.1075/itl.165.2.03del},
}
@ARTICLE{DIDONATO_2014_ARTICLE_DM_381999,
AUTHOR = {Di Donato, F. and Müller, S.},
TITLE = {Burckhardtsource.org: The Unpublished Correspondence to Jacob Burckhardt},
YEAR = {2014},
ABSTRACT = {Burckhardtsource.org is the semantic Digital Library designed and developed by EUROCORR ERC Advanced Grant Project, which hosts the on-going critical edition work on the correspondence of over 300 European intellectuals with the Swiss cultural historian Jacob Burckhardt over a period of more than half a century. Aim of this article is to outline an introduction to EUROCORR by describing content and tools of Burckhardtsource.org platform},
URL = {https://iris.cnr.it/handle/20.500.14243/381999},
ISSN = {2283-7833},
JOURNAL = {LEXICON PHILOSOPHICUM. INTERNATIONAL JOURNAL FOR THE HISTORY OF TEXTS AND IDEAS},
}
@ARTICLE{GOGGI_2014_ARTICLE_GPGB_257204,
AUTHOR = {Goggi, S. and Pardelli, G. and Giannini, S. and Biagioni, S.},
TITLE = {Grey Literature in European Commission Projects},
YEAR = {2014},
ABSTRACT = {The survey is focused on the documentation produced by the European Commission (EC) projects involved in the Framework Programme for Research and Technological Development (hereafter FP7) and managed by the Italian National Research Council (hereafter CNR). In particular, the Grey Literature (GL) available on CORDIS and European Projects websites was analysed. In order to verify how it is managed and whether it is compliant with EC recommendations, some categories were introduced to identify, measure and evaluate the usability and availability of projects production. Data was obtained from a sample of European projects websites},
KEYWORDS = {Grey Literature, European Commission Projects},
PAGES = {133-144},
URL = {http://www.greynet.org/thegreyjournal/previousissues.html},
VOLUME = {10 (3)},
ISSN = {1574-1796},
JOURNAL = {THE GREY JOURNAL},
}
@ARTICLE{GUADAGNINI_2014_ARTICLE_G_275422,
AUTHOR = {Guadagnini, E.},
TITLE = {Voce RUDDURA s. f. del Tesoro della Lingua Italiana delle Origini},
YEAR = {2014},
ABSTRACT = {Francesismo: dal francese antico "radeur", 'impeto'},
KEYWORDS = {Lessico, Lessicografia, Lingua Italiana, Francesismi, Progetto DiVo},
URL = {http://tlio.ovi.cnr.it/voci/031509.htm},
VOLUME = {18},
ISSN = {2240-5216},
JOURNAL = {TESORO DELLA LINGUA ITALIANA DELLE ORIGINI},
}
@ARTICLE{GUADAGNINI_2014_ARTICLE_G_272461,
AUTHOR = {Guadagnini, E.},
TITLE = {Voce RIGIDO agg. del Tesoro della Lingua Italiana delle Origini},
YEAR = {2014},
ABSTRACT = {Latinismo. 1 Che non si può piegare né flettere, che permane stabile, fermo e immoto; che manca di elasticità, scioltezza o mutevolezza. 1. 1 [Di un corpo o un arto: ] che manca di elasticità e scioltezza, intorpidito o contratto (per il freddo, la morte incombente). 2 Fig. Che denota estrema fermezza nel tenere un det. comportamento, atteggiamento, disposizione; che mostra instransigenza e indisponibilità al compromesso. [Con sfumatura neg.: ] che denota durezza o inflessibilità (eccessiva). 3 Che comporta delle forti difficoltà o delle gravi conseguenze; che appare o risulta difficile da sopportare o da superare},
KEYWORDS = {Lessico, Lessicografia, Lingua Italiana, Progetto DiVo},
URL = {http://tlio.ovi.cnr.it/voci/031507.htm},
VOLUME = {18},
ISSN = {2240-5216},
JOURNAL = {TESORO DELLA LINGUA ITALIANA DELLE ORIGINI},
}
@ARTICLE{GUADAGNINI_2014_ARTICLE_G_272455,
AUTHOR = {Guadagnini, E.},
TITLE = {Voce REDDO agg. del Tesoro della Lingua Italiana delle Origini},
YEAR = {2014},
ABSTRACT = {Probabile francesismo che completa la famiglia del latinismo "rigido"},
KEYWORDS = {Lessico, Lessicografia, Lingua Italiana, Francesismi, Progetto DiVo},
URL = {http://tlio.ovi.cnr.it/voci/031503.htm},
VOLUME = {18},
ISSN = {2240-5216},
JOURNAL = {TESORO DELLA LINGUA ITALIANA DELLE ORIGINI},
}
@ARTICLE{GUADAGNINI_2014_ARTICLE_G_275429,
AUTHOR = {Guadagnini, E.},
TITLE = {Voce RUGGITO s. m. del Tesoro della Lingua Italiana delle Origini},
YEAR = {2014},
ABSTRACT = {Notevole il significato medico, che costituisce un forte latinismo semantico: 1 Verso rauco, sonoro e possente caratteristico del leone. 1. 1 Estens. Suono fragoroso. 2 [Med. ] Forte gorgoglio (del ventre, degli intestini), borborigmo},
KEYWORDS = {Lessico, Lessicografia, Lingua Italiana, Progetto DiVo},
URL = {http://tlio.ovi.cnr.it/voci/031515.htm},
VOLUME = {18},
ISSN = {2240-5216},
JOURNAL = {TESORO DELLA LINGUA ITALIANA DELLE ORIGINI},
}
@ARTICLE{GUADAGNINI_2014_ARTICLE_G_272445,
AUTHOR = {Guadagnini, E.},
TITLE = {Voce IRRIGIDIRE v. del Tesoro della Lingua Italiana delle Origini},
YEAR = {2014},
ABSTRACT = {Completa la famiglia del latinismo "rigido"},
KEYWORDS = {Lessico, Lessicografia, Lingua Italiana, Progetto DiVo},
URL = {http://tlio.ovi.cnr.it/voci/031488.htm},
VOLUME = {18},
ISSN = {2240-5216},
JOURNAL = {TESORO DELLA LINGUA ITALIANA DELLE ORIGINI},
}
@ARTICLE{GUADAGNINI_2014_ARTICLE_G_275438,
AUTHOR = {Guadagnini, E.},
TITLE = {Voce RUVIDO agg. del Tesoro della Lingua Italiana delle Origini},
YEAR = {2014},
ABSTRACT = {Interessante con riferimento a un passo boccacciano (punto 3. 1 della voce): 1 La cui superficie presenta irregolarità o asperità al tatto. 2 [Rif. a una persona: ] duro, vigoroso e rigido; privo di ricercatezza, mollezza e artificio. 3 Che comporta delle forti difficoltà o delle gravi conseguenze; che appare o risulta difficile da sopportare o da superare. 3. 1 [Rif. specif. agli effetti del freddo sull'acqua: ] insopportabilmente gelido?},
KEYWORDS = {Lessico, Lessicografia, Lingua Italiana, Progetto DiVo},
URL = {http://tlio.ovi.cnr.it/voci/031519.htm},
VOLUME = {18},
ISSN = {2240-5216},
JOURNAL = {TESORO DELLA LINGUA ITALIANA DELLE ORIGINI},
}
@ARTICLE{GUADAGNINI_2014_ARTICLE_G_275416,
AUTHOR = {Guadagnini, E.},
TITLE = {Voce ROIDAMENTE avv. del Tesoro della Lingua Italiana delle Origini},
YEAR = {2014},
ABSTRACT = {Francesismo che completa la famiglia di "rigido"},
KEYWORDS = {Lessico, Lessicografia, Lingua Italiana, Francesismi, Progetto DiVo},
URL = {http://tlio.ovi.cnr.it/voci/031508.htm},
VOLUME = {18},
ISSN = {2240-5216},
JOURNAL = {TESORO DELLA LINGUA ITALIANA DELLE ORIGINI},
}
@ARTICLE{MARZI_2014_ARTICLE_MFK_229241,
AUTHOR = {Marzi, C. and Ferro, M. and Keuleers, E.},
TITLE = {Perception of typicality in the lexicon: Wordlikeness, lexical density and morphonotactic constraints},
YEAR = {2014},
ABSTRACT = {The extent to which a symbolic time-series (a sequence of sounds or letters) is a typical word of a language, referred to as WORDLIKENESS, has been shown to have effects in speech perception and production, reading proficiency, lexical development and lexical access, short-term and long-term verbal memory. Two quantitative models have been suggested to account for these effects: serial phonotactic probabilities (the likelihood for a given symbolic sequence to appear in the lexicon) and lexical density (the extent to which other words can be obtained from a target word by changing, deleting or inserting one or more symbols in the target). The two measures are highly correlated and thus easy to be confounded in measuring their effects in lexical tasks. In this paper, we propose a computational model of lexical organisation, based on Self-Organising Maps with Hebbian connections defined over a temporal layer (TSOMs), providing a principled algorithmic account of effects of lexical acquisition, processing and access, to further investigate these issues. In particular, we show that (morpho-)phonotactic probabilities and lexical density, though correlated in lexical organisation, can be taken to focus on different aspects of speakers' word processing behaviour and thus provide independent cognitive contributions to our understanding of the principles of perception of typicality that govern lexical organisation},
KEYWORDS = {wordlikeness, lexical access, word processing, frequency, memory},
PAGES = {171-191},
URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-84919701117\&origin=inward},
VOLUME = {40 (78)},
ISSN = {0586-0296},
JOURNAL = {SUVREMENA LINGVISTIKA},
}
@ARTICLE{MARZI_2014_ARTICLE_MFP_226384,
AUTHOR = {Marzi, C. and Ferro, M. and Pirrelli, V.},
TITLE = {Morphological structure through lexical parsability},
YEAR = {2014},
ABSTRACT = {The emergence of morphological structure in lexical acquisition is analysed in the computational framework of Temporal Self-Organising Maps (TSOMs), to provide an explanatory basis for both psycholinguistic and linguistic accounts of lexical parsability. The investigation we propose is grounded on the hypothesis that perception of morphological structure (parsability) and frequency strongly correlate in the acquisition of inflectional paradigms. Analysis of experimental results of word acquisition obtained by artificially varying training conditions, allows us to understand developmental competition between fully-inflected word forms, and to investigate a hierarchy of frequency effects. The computational and theoretical implications of such a memory-based view of the relationship between frequency and perception, and its potential to account},
KEYWORDS = {inflectional paradigms, morphological structure, token/type frequency, word processing},
PAGES = {263-290},
URL = {http://www.rivisteweb.it/doi/10.1418/78410},
VOLUME = {XIII (2)},
DOI = {10.1418/78410},
ISSN = {1720-9331},
JOURNAL = {LINGUE E LINGUAGGIO},
}
@ARTICLE{PROIETTI_2014_ARTICLE_PO_405480,
AUTHOR = {Proietti, C. and Olsson, E. J.},
TITLE = {A DDL Approach to Pluralistic Ignorance and Collective Belief},
YEAR = {2014},
ABSTRACT = {A group is in a state of pluralistic ignorance (PI) if, roughly speaking, every member of the group thinks that his or her belief or desire is different from the beliefs or desires of the other members of the group. PI has been invoked to explain many otherwise puzzling phenomena in social psychology. The main purpose of this article is to shed light on the nature of PI states—their structure, internal consistency and opacity—using the formal apparatus of Dynamic Doxastic Logic, and also to study the sense in which such states are "fragile", i.e. to identify plausible conditions under which a PI state cascades into a state of shared belief as the result of announcement},
KEYWORDS = {Pluralistic ignorance, Informational cascades, Dynamic logic, Social epistemology},
PAGES = {499-515},
URL = {https://iris.cnr.it/handle/20.500.14243/405480},
VOLUME = {43 (2-3)},
DOI = {10.1007/s10992-013-9277-3},
ISSN = {0022-3611},
JOURNAL = {JOURNAL OF PHILOSOPHICAL LOGIC},
}
@ARTICLE{SASSI_2014_ARTICLE_SBP_255583,
AUTHOR = {Sassi, M. and Biagioni, S. and Pardelli, G.},
TITLE = {A Linguistic and Gender Approach to 1841 Tuscany Population Census},
YEAR = {2014},
ABSTRACT = {The Census of 1841 in Tuscany was the first official data registry which tried to describe Tuscan population as a whole on the basis of the Granducato's territory. With the use of special ad-hoc created forms, all demographic and socioeconomic characteristics of families and single persons in "Granducato di Toscana" were described. Work is developed in five points: (1) informatics retrieval of linguistic information from Tuscany of 1800 focused by the arts and craftsmanship more in use in families of that time; (2) gender division of works and craftsmanship; (3) observation of lexical disparity in the four communities and terminological curiosities of that historical period; (4) actually no longer existing craftsmanship; and (5) diachronic analysis of communities, where possible. In this scenario, the authors will introduce the methodology they used for data analysis. Tables and figures will be used to better focus different moments and results of the work. A Glossary in Appendix will contain the English translation of the Italian terms extracted from the Corpus},
KEYWORDS = {Tuscany Population Census, sociological analysis, gender analysis, the 19th work terminology, linguistic statistics},
PAGES = {318-329},
URL = {http://www.davidpublishing.com/show.html?16049},
VOLUME = {12 (4)},
ISSN = {1539-8080},
JOURNAL = {US-CHINA FOREIGN LANGUAGE},
}
@ARTICLE{SORIA_2014_ARTICLE_SCMQBCMOP_260814,
AUTHOR = {Soria, C. and Calzolari, N. and Monachini, M. and Quochi, V. and Bel, N. and Choukri, K. and Mariani, J. and Odijk, J. and Piperidis, S.},
TITLE = {The language resource Strategic Agenda: the FLaReNet synthesis of community recommendations},
YEAR = {2014},
ABSTRACT = {The main purpose of this paper is to serve as a landmark for future research and in particular for future strategic, infrastructural and coordination initiatives. It presents a preliminary plan for actions and infrastructures that could become the basis for future initiatives in the sector of Language Resources and Technologies (LRTs). The FLaReNet Language Resource Strategic Agenda presents a set of recommendations for the development and progress of LRT in Europe, as issued from a three-year consultation of the FLaReNet European project. Recommendations cover a broad range of topics and activities, spanning over production and use of language resources, licensing, maintenance and preservation issues, infrastructures for language resources, resource identification and sharing, evaluation and validation, interoperability and policy issues. The intended recipients belong to a large set of players and stakeholders in LRT, ranging from individuals to research and education institutions, to policy-makers, funding agencies, SMEs and large companies, service and media providers},
KEYWORDS = {Strategic agenda, Language resources planning, Recommended priority actions},
PAGES = {753-775},
URL = {https://iris.cnr.it/handle/20.500.14243/260814},
VOLUME = {48 (4)},
DOI = {10.1007/s10579-014-9279-y},
ISSN = {1574-020X},
JOURNAL = {LANGUAGE RESOURCES AND EVALUATION},
}
@ARTICLE{WIELING_2014_ARTICLE_WMNB_260804,
AUTHOR = {Wieling, M. and Montemagni, S. and Nerbonne, J. and Baayen, R. H.},
TITLE = {Lexical differences between Tuscan dialects and standard Italian: Accounting for geographic and socio-demographic variation using generalized additive mixed modeling},
YEAR = {2014},
ABSTRACT = {This study uses a generalized additive mixed-effects regression model to predict lexical differences in Tuscan dialects with respect to standard Italian. We used lexical information for 170 concepts used by 2,060 speakers in 213 locations in Tuscany. In our model, geographical position was found to be an important predictor, with locations more distant from Florence having lexical forms more likely to differ from standard Italian. In addition, the geographical pattern varied significantly for low- versus high-frequency concepts and older versus younger speakers. Younger speakers generally used variants more likely to match the standard language. Several other factors emerged as significant. Male speakers as well as farmers were more likely to use lexical forms different from standard Italian. In contrast, higher-educated speakers used lexical forms more likely to match the standard. The model also indicates that lexical variants used in smaller communities are more likely to differ from standard Italian. The impact of community size, however, varied from concept to concept. For a majority of concepts, lexical variants used in smaller communities are more likely to differ from the standard Italian form. For a minority of concepts, however, lexical variants used in larger communities are more likely to differ from standard Italian. Similarly, the effect of the other community- and speaker-related predictors varied per concept. These results clearly show that the model succeeds in teasing apart different forces influencing the dialect landscape and helps us to shed light on the complex interaction between the standard Italian language and the Tuscan dialectal varieties. In addition, this study illustrates the potential of generalized additive mixed-effects regression modeling applied to dialect data},
KEYWORDS = {Tuscan dialects, lexical variation, generalized additive modeling, mixed-effects regression modeling, geographical variation},
PAGES = {669-692},
URL = {http://www.linguisticsociety.org/files/wieling.pdf},
VOLUME = {90 (3)},
ISSN = {0097-8507},
JOURNAL = {LANGUAGE},
}
@INCOLLECTION{BOSCHETTI_2014_INCOLLECTION_B_276504,
AUTHOR = {Boschetti, F.},
TITLE = {Strumenti on-line per l'analisi e l'annotazione di testi letterari ed epigrafici bilingui},
YEAR = {2014},
ABSTRACT = {Methods and tools for the study of bilingual texts in parallel are illustrated. The granularity of the alignments is discussed, distinguishing in particular among document by document, sentence by sentence and word by word alignment. The concept of pericope is defined as a syntactic and semantic unity for the parallelization of consistent and continuous segments. Automated techniques of alignment used by the Perseus Project and tools for the dynamic division of texts in parallel pericopes developed at the ILC-CNR are illustrated and criticized. Eventually, the system for the visualization and interrogation of the Latin and Greek version of the RGDA edited by Mommsen is described, focusing on the study of the complementarity between the texts},
KEYWORDS = {Digital Epigraphy, Cooperative Philology},
PAGES = {1-9},
URL = {http://www.edizionicafoscari.unive.it/col/exp/30/59/Archivistica/3},
PUBLISHER = {Edizioni Ca' Foscari (Venezia, ITA)},
ISBN = {978-88-97735-94-6},
CONFERENCE_PLACE = {Venezia},
BOOKTITLE = {Memoria poetica e poesia della memoria-La versificazione epigrafica dall'antichità all'umanesimo},
EDITOR = {Pistellato, A.},
}
@INCOLLECTION{BOZZI_2014_INCOLLECTION_B_287419,
AUTHOR = {Bozzi, A.},
TITLE = {Computer-assisted Scholarly Editing of Manuscript Sources},
YEAR = {2014},
ABSTRACT = {The contribution will concentrate on the specific aspect of textual criticism. I realize this is a discipline that could be defined as being 'very exclusive,' as the scholars are not numerically equivalent to the community of people working in other Humanities disciplines; for example historians, philosophers, or those dealing with the history and criticism of literature. However, if we consider that textual criticism covers a very large period (Ancient, Medieval and Modern times) and many languages, there is also an increase in the population of specialists},
KEYWORDS = {Computer-aided Textual Scholarship, Textual Criticism, Computational Philology},
PAGES = {99-115},
URL = {http://www.oapen.org/search?identifier=515678},
PUBLISHER = {Amsterdam University Press (Amsterdam, NLD)},
ISBN = {978-90-8964-564-7},
CONFERENCE_PLACE = {Amsterdam},
BOOKTITLE = {New Publication Cultures in the Humanities. Exploring the Paradigm Shift},
EDITOR = {Dávidházi, P.},
}
@INCOLLECTION{CALZOLARI_2014_INCOLLECTION_CMQST_259412,
AUTHOR = {Calzolari, N. and Monachini, M. and Quochi, V. and Soria, C. and Toral, A.},
TITLE = {Lexicons, Terminologies, Ontologies: Reflections from Experiences in Resource Construction},
YEAR = {2014},
ABSTRACT = {This contribution aims at highlighting the strong interconnection between lexicons, terminologies and ontologies and especially the fundamental role that ontologies and lexica mutually play. Our view is that lexical resources are evolving in nature, from ontologically based lexicons we are going towards lexically based ontologies. We explore different instantiations of the current trend of using formal ontologies as a core module of computational lexicons, presenting the advantages especially in multilingual and terminological contexts. We present work showing that the lexical knowledge already present in non formal computational lexicons can be exploited to derive or enrich a formal ontology without much manual effort. In the terminology domain, we describe the construction of a resource for biology, directly linked to a parallel domain-ontology, that combines characteristics of both lexicons and terminologies, so that it can allow for intelligent access to content. Finally, we describe our experience in two projects in which formal ontologies play a central role in the context of multilingual computational lexicons, where the ontology is what acts as the glue among the different monolingual lexicons and what provides cross-lingual reasoning capabilities},
KEYWORDS = {Computational Lexicons, Ontology, Terminology, Interoperability, Standards},
PAGES = {103-121},
URL = {http://www.springer.com/computer/ai/book/978-3-642-45326-7},
DOI = {10.1007/978-3-642-45327-4_7},
PUBLISHER = {Springer (Berlin Heidelberg, DEU)},
ISBN = {978-3-642-45326-7},
CONFERENCE_PLACE = {Berlin Heidelberg},
BOOKTITLE = {Language, Culture, Computation. Computational Linguistics and Linguistics. Essays Dedicated to Yaacov Choueka on the Occasion of His 75th Birthday, Part III},
EDITOR = {Dershowitz, N. and Nissan, E.},
}
@INCOLLECTION{MARCONI_2014_INCOLLECTION_M_339253,
AUTHOR = {Marconi, L.},
TITLE = {L'italiano scritto nelle scuole: analisi e creazione di corpora},
YEAR = {2014},
ABSTRACT = {La Linguistica Computazionale è un settore di ricerca interdisciplinare che, negli ultimi anni, è cresciuto in molte direzioni; ha attinto contributi e sviluppato collaborazioni in ambiti diversi con altre scienze quali la linguistica, la psicologia, la statistica, la matematica, l'informatica. L'essere umano si relaziona con gli altri parlando o scrivendo; attraverso il linguaggio l'uomo elabora concetti, esprime sentimenti e trasferisce agli altri le sue conoscenze. È, di conseguenza, importante capire come evolve la lingua, misurare o rilevare un dato fenomeno linguistico. I corpora hanno un ruolo fondamentale per poter riconoscere e classificare un determinato fenomeno linguistico, per effettuare studi sull'evoluzione della lingua, per contribuire alla costruzione di tools di analisi linguistica desumendo le informazioni dai dati empirici. La costruzione di modelli e strumenti di elaborazione del linguaggio naturale di un dato fenomeno, realizzati con procedure basate su regole o con metodologie di tipo statistico, fa riferimento a basi di conoscenza costituite dai dati dei corpora di riferimento},
URL = {https://iris.cnr.it/handle/20.500.14243/339253},
ISBN = {9788880801269},
}
@INCOLLECTION{RUSSO_2014_INCOLLECTION_RC_228532,
AUTHOR = {Russo, I. and Caselli, T.},
TITLE = {Converging evidences on the eventivity of Italian nouns},
YEAR = {2014},
ABSTRACT = {This paper aims at shedding light on the complex semantic concept of "event noun". Starting with the working hypothesis that linguistic context and corpus-based distributional information can be decisive, we propose a measure for eventivity that relies on syntagmatic cues. By means of a comparison between syntagmatic evidence obtained from a corpus study and speakers' judgments, we have identified a measure of eventivity for nouns. The comparison with annotated data proves its soundness},
KEYWORDS = {event nominals, syntagmatic cues, degree of eventivity},
PAGES = {179-200},
URL = {https://iris.cnr.it/handle/20.500.14243/228532},
PUBLISHER = {Düsseldorf University Press (Düsseldorf, DEU)},
ISBN = {978-3-943460-87-2},
CONFERENCE_PLACE = {Düsseldorf},
BOOKTITLE = {Meaning, frames, and conceptual representation},
EDITOR = {Gamerschlag, T. and Gerland, D. and Osswald, R. and Petersen, W.},
}
@EDITORIAL{BOSCO_2014_EDITORIAL_BCDFMS_297502,
AUTHOR = {Bosco, C. and Cosi, P. and Dell'Orletta, F. and Falcone, M. and Montemagni, S. and Simi, M.},
TITLE = {Proceedings of the Fourth International Workshop EVALITA 2014},
YEAR = {2014},
KEYWORDS = {Trattamento Automatico del Linguaggio, Speech Processing, Lingua Italiana},
PAGES = {167},
URL = {http://clic.humnet.unipi.it/proceedings/Proceedings-EVALITA-2014.pdf},
PUBLISHER = {Pisa University Press (Pisa, ITA)},
ISBN = {978-88-6741-472-7},
CONFERENCE_PLACE = {Pisa},
}
@EDITORIAL{ELMOHAJIR_2014_EDITORIAL_EACAEPZE_290901,
AUTHOR = {El Mohajir, M. and Al Achhab, M. and Chahhou, M. and Arioua, M. and El Mohajir, B. and Pirrelli, V. and Zarghili, A. and Elfar, M.},
TITLE = {Proceedings of IEEE-CiST14-Third IEEE International Colloquium in Information Science and Technology (CIST)},
YEAR = {2014},
ABSTRACT = {The 3rd international IEEE Colloquium on Information Science and Technology (CIST'14) is part of the IEEE CONFERENCE SERIES that are held in Morocco, and is sponsored by the IEEE Morocco Section and the IEEE Morocco Computer \& Communication Joint Chapter, and the UAE IEEE Student Branch. The 2014 edition was organized in collaboration with the Faculty of Sciences of Tetuan, the national school of applied sciences of Tetuan and the University of Abdelmalek Essaadi. IEEE CIST is emerging as a key annual event that aims to serve as a forum to promote the exchange of the latest advances achieved by IT researchers, IT decision makers, IT managers, application designers and software engineers in the domain of information science and related technology. Computing challenges, models, applications and IT solutions will be discussed from the perspectives of academia, industry and government. In addition to the main conference topics, IEEE CIST will also provide a platform for supporting innovative and original contributions in three complementary disciplines that are: Arabic natural language processing, Information and multimedia processing and Internet of Things. We would like to extend our most sincere thanks and gratitude to the keynote speakers of IEEE CIST'14 for their important added value to this edition and to the Scientific Committee Members who helped us in the review process. We would like also to express our thanks to the IEEE Computer Society for their support through their Distinguished Lecturers Programs. We are also very glad to express our most sincere gratitude for the organizing committee members for their full dedication and professional organization of this edition. The success of this colloquium will be mainly attributed to the authors who contributed with their posters and talks. 
We hope that CIST will continue to offer a privileged context for participants to develop new ways and methods to achieve our objectives in advancing our research and projects. We can together achieve more and face more efficiently the challenges of the current millennium},
PAGES = {440},
URL = {http://ieeexplore.ieee.org/xpl/mostRecentIssue.jsp?punumber=6996097},
DOI = {10.1109/CIST.2014.7016582},
PUBLISHER = {IEEE (New York, USA)},
ISBN = {978-1-4799-5979-2},
CONFERENCE_PLACE = {New York},
}
@EDITORIAL{FRANCESCONI_2014_EDITORIAL_FMPVW_280049,
AUTHOR = {Francesconi, E. and Montemagni, S. and Peters, W. and Venturi, G. and Wyner, A.},
TITLE = {Proceedings of the Fourth Workshop on Semantic Processing of Legal Texts},
YEAR = {2014},
PAGES = {33},
URL = {http://www.lrec-conf.org/proceedings/lrec2014/workshops/LREC2014Workshop-SPLeT%20Proceedings.pdf},
ISBN = {978-2-9517408-8-4},
CONFERENCE_PLACE = {Parigi},
}
@EDITORIAL{LEONARDI_2014_EDITORIAL_LLSABBDFFFGGIMMMRRRVVZ_298144,
AUTHOR = {Leonardi, L. D. and Larson, P. C. and Squillacioti, P. C. and Artale, E. and Boccellari, A. and Burgassi, C. and Dotto, D. and Felici, A. and Ferroni, G. and Fortunato, M. and Giuliani, M. and Guadagnini, E. and Iorio Fili, D. and Maggiore, M. and Morlino, L. and Mosti, R. and Ravani, S. and Ricotta, V. and Rinaldin, A. and Vaccaro, G. and Verlato, Z. and Zamuner, I.},
TITLE = {TESORO DELLA LINGUA ITALIANA DELLE ORIGINI-Edizione online: www.vocabolario.org (ISSN 2240-5216)-Versione dicembre 2014},
YEAR = {2014},
ABSTRACT = {A pdf copy of the «Tesoro della Lingua Italiana delle Origini» (TLIO), a dictionary of early Italian in progress, published online, as it was at the end of December 2014 (29,425 entries). TLIO is the first section of the Italian Historical Dictionary which is the mission of the OVI Institute},
KEYWORDS = {Lessico, Lessicografia, Lingua italiana},
PAGES = {12787},
URL = {http://tlio.ovi.cnr.it/TLIO/},
ISSN = {2240-5216},
}
@EDITORIAL{PIRRELLI_2014_EDITORIAL_PR_274740,
AUTHOR = {Pirrelli, V. and Raffaelli, I.},
TITLE = {Special Issue of Suvremena Lingvistika},
YEAR = {2014},
PAGES = {127-235},
URL = {https://iris.cnr.it/handle/20.500.14243/274740},
PUBLISHER = {Croatian Philological Society (Zagreb, HRV)},
CONFERENCE_PLACE = {Zagreb},
}
@EDITORIAL{PRETORIUS_2014_EDITORIAL_PSB_257905,
AUTHOR = {Pretorius, L. and Soria, C. and Baroni, P.},
TITLE = {Proceedings of the Workshop on Collaboration and Computing for Under-Resourced Languages in the Linked Open Data Era (CCURL 2014)},
YEAR = {2014},
ABSTRACT = {Proceedings del Workshop su Collaborazione e Computazione per le Lingue con Risorse Insufficienti nell'era dei Dati Aperti Collegati (CCURL 2014 | Reykjavik, 26/05/2014)},
KEYWORDS = {under-resourced languages},
PAGES = {107},
URL = {http://www.lrec-conf.org/proceedings/lrec2014/index.html},
PUBLISHER = {European Language Resources Association ELRA (Paris, FRA)},
ISBN = {978-2-9517408-8-4},
CONFERENCE_PLACE = {Paris},
}
@EDITORIAL{VV_2014_EDITORIAL_V_404023,
AUTHOR = {{AA. VV.}},
TITLE = {Social Dynamics and Collective Rationality},
YEAR = {2014},
ABSTRACT = {This issue collects ten papers selected from five international Copenhagen Lund Workshops in Social Epistemology, held between December 2010 and December 2012, that were made possible through a research grant to Vincent F. Hendricks and Erik J. Olsson by the Einar Hansen Research Fond and RQ8-funds from Lund University. Besides providing a platform for basic-level research, workshops focused on applied research related to social dynamics that lead group members to influence each other's beliefs and choices in ways that can produce not only suboptimal but genuinely catastrophic, and thus pathological, collective outcomes},
URL = {https://iris.cnr.it/handle/20.500.14243/404023},
ISSN = {0039-7857},
}
@EDITORIAL{ZENKER_2014_EDITORIAL_ZP_405498,
AUTHOR = {Zenker, F. and Proietti, C.},
TITLE = {Editors' introduction: social dynamics and collective rationality},
YEAR = {2014},
KEYWORDS = {Belief polarization, Belief merging, Debiasing, Doxastic disagreement, Dynamic epistemic logic, Echo chambers, Group topology, Informational cascades, Pluralistic ignorance, Truth approximation},
PAGES = {2353-2358},
URL = {https://iris.cnr.it/handle/20.500.14243/405498},
VOLUME = {191 (11)},
DOI = {10.1007/s11229-014-0430-5},
ISSN = {0039-7857},
}
@INPROCEEDINGS{ABRATE_2014_INPROCEEDINGS_AMGLLMMPP_264619,
AUTHOR = {Abrate, M. and Del Grosso, A. M. and Giovannetti, E. and Lo Duca, A. and Luzzi, D. and Mancini, L. and Marchetti, A. and Pedretti, I. and Piccini, S.},
TITLE = {Sharing Cultural Heritage: the Clavius on the Web Project},
YEAR = {2014},
ABSTRACT = {In the last few years the amount of manuscripts digitized and made available on the Web has been constantly increasing. However, there is still a considerable lack of results concerning both the explicitation of their content and the tools developed to make it available. The objective of the Clavius on the Web project is to develop a Web platform exposing a selection of Christophorus Clavius letters along with three different levels of analysis: linguistic, lexical and semantic. The multilayered annotation of the corpus involves an XML-TEI encoding followed by a tokenization step where each token is univocally identified through a CTS urn notation and then associated to a part-of-speech and a lemma. The text is lexically and semantically annotated on the basis of a lexicon and a domain ontology, the former structuring the most relevant terms occurring in the text and the latter representing the domain entities of interest (e.g. people, places, etc.). Moreover, each entity is connected to linked and non linked resources, including DBpedia and VIAF. Finally, the results of the three layers of analysis are gathered and shown through interactive visualization and storytelling techniques. A demo version of the integrated architecture was developed},
KEYWORDS = {language technologies for digital cultural heritage, lexica and ontologies, data visualization},
PAGES = {8},
URL = {https://iris.cnr.it/handle/20.500.14243/264619},
ISBN = {978-2-9517408-8-4},
CONFERENCE_NAME = {LREC 2014-The 9th edition of the Language Resources and Evaluation Conference},
BOOKTITLE = {LREC 2014 Proceedings},
}
@INPROCEEDINGS{ANTICO_2014_INPROCEEDINGS_AQMM_259425,
AUTHOR = {Antico, G. and Quochi, V. and Monachini, M. and Martinelli, M.},
TITLE = {Marrying Technical Writing with LRT},
YEAR = {2014},
ABSTRACT = {In the last years the Technical Writer operational scenarios and the workflow sensibly changed; specifically, "free style" writing – or manual writing – has become outdated and technical writing is now much more concerned with structured management of content than in the past. Technical writing has become more demanding due to a number of factors among which the rise and spread of mobile devices usage. This paper discusses the new needs of technical writing and content management business and how LRT can help it improve quality and productivity},
KEYWORDS = {controlled language, technical writing, content management systems},
PAGES = {19-25},
URL = {http://www.lrec-conf.org/proceedings/lrec2014/index.html},
PUBLISHER = {European Language Resources Association ELRA (Paris, FRA)},
ISBN = {978-2-9517408-8-4},
CONFERENCE_NAME = {9th International Conference on Language Resources and Evaluation (LREC)},
CONFERENCE_PLACE = {Paris},
EDITOR = {Isahara, H. and Lee, K. S. C. S. and Nam, S.},
}
@INPROCEEDINGS{BARBAGLI_2014_INPROCEEDINGS_BLDMV_266268,
AUTHOR = {Barbagli, A. and Lucisano, P. and Dell'Orletta, F. and Montemagni, S. and Venturi, G.},
TITLE = {Tecnologie del linguaggio e monitoraggio dell'evoluzione delle abilità di scrittura nella scuola secondaria di primo grado},
YEAR = {2014},
ABSTRACT = {Over the last ten years, the use of language technologies was successfully extended to the study of learning processes. The paper reports the first results of a study, which is part of a broader experimental pedagogy project, aimed at monitoring the evolution of the learning process of the Italian language based on a corpus of written productions by students and exploiting automatic linguistic annotation and knowledge extraction tools},
PAGES = {23-27},
URL = {http://www.italianlp.it/wp-content/uploads/2014/12/Tecnologie-del-linguaggio-per-la-scuola.pdf},
DOI = {10.12871/CLICIT201415},
PUBLISHER = {Pisa University Press srl (Pisa, ITA)},
ISBN = {978-88-6741-472-7},
CONFERENCE_NAME = {First Italian Conference on Computational Linguistics (CLiC-it 2014)},
CONFERENCE_PLACE = {Pisa},
BOOKTITLE = {Proceedings of the First Italian Conference on Computational Linguistics (CLiC-it 2014)},
EDITOR = {Basili, R. and Lenci, A. and Magnini, B.},
}
@INPROCEEDINGS{BARTOLINI_2014_INPROCEEDINGS_BQDRM_228452,
AUTHOR = {Bartolini, R. and Quochi, V. and De Felice, I. and Russo, I. and Monachini, M.},
TITLE = {From Synsets to Videos: Enriching ItalWordNet Multimodally},
YEAR = {2014},
ABSTRACT = {The paper describes the multimodal enrichment of ItalWordNet action verbs' entries by means of an automatic mapping with a conceptual ontology of action types instantiated by video scenes (ImagAct). The two resources present significative differences as well as interesting complementary features, such that a mapping of these two resources can lead to an enrichment of IWN, through the connection between synsets and videos apt to illustrate the meaning described by glosses. Here, we describe an approach inspired by ontology matching methods for the automatic mapping of ImagAct video scenes onto ItalWordNet. The experiments described in the paper are conducted on Italian, but the same methodology can be extended to other languages for which WordNets have been created, since ImagAct is available also for English, Chinese and Spanish. This source of multimodal information can be exploited to design second language learning tools, as well as for language grounding in action recognition in video sources and potentially for robotics},
KEYWORDS = {Action ontology, Multimodality, WordNet},
PAGES = {3110-3117},
URL = {http://www.lrec-conf.org/proceedings/lrec2014/index.html},
PUBLISHER = {European Language Resources Association ELRA (Paris, FRA)},
ISBN = {978-2-9517408-8-4},
CONFERENCE_NAME = {LREC 2014. European Language Resources Association ELRA: Paris (Francia)},
CONFERENCE_PLACE = {Paris},
EDITOR = {Calzolari, N. and Choukri, K. and Declerck, T. and Loftsson, H. and Maegaard, B. and Mariani, J. and Moreno, A. and Odijk, J. and Piperidis, S.},
}
@INPROCEEDINGS{BELLANDI_2014_INPROCEEDINGS_BABBG_253556,
AUTHOR = {Bellandi, A. and Albanesi, D. and Bellusci, A. and Bozzi, A. and Giovannetti, E.},
TITLE = {The Talmud System: a Collaborative Web Application for the Translation of the Babylonian Talmud Into Italian},
YEAR = {2014},
URL = {https://iris.cnr.it/handle/20.500.14243/253556},
PUBLISHER = {Pisa University Press srl (Pisa, ITA)},
ISBN = {978-88-6741-472-7},
CONFERENCE_NAME = {First Italian Conference on Computational Linguistics (CLiC-it 2014)},
CONFERENCE_PLACE = {Pisa},
BOOKTITLE = {Proceedings of the First Italian Conference on Computational Linguistics (CLiC-it 2014)},
EDITOR = {Basili, R. and Lenci, A. and Magnini, B.},
}
@INPROCEEDINGS{BELLANDI_2014_INPROCEEDINGS_BBCG_264618,
AUTHOR = {Bellandi, A. and Bellusci, A. and Cappelli, A. and Giovannetti, E.},
TITLE = {Graphic visualization in literary text interpretation},
YEAR = {2014},
ABSTRACT = {We here illustrate a possible approach combining existing technologies for Natural Language Processing (NLP), Knowledge Representation and Reasoning (KRR) and Data Visualization in a coherent Decision Support System (DSS). The approach to the development of the system we are working on can be articulated in two main steps: the customization and integration of existing tools for automatic text annotation (at least linguistic, lexicographic and semantic) and the construction of a user-friendly and highly expressive GUI. The interface should allow a user to: upload her/his own text, run the desired annotation tools, visually interact with the resulting multilayered network to: i) proof-read the results of the automatic annotations, ii) manually add missing elements and/or relations between elements and, finally, iii) formulate and verify specific interpretative hypotheses},
KEYWORDS = {Computational hermeneutics, Text processing, Knowledge representation and reasoning, Data visualization},
PAGES = {392-397},
URL = {https://ieeexplore.ieee.org/document/6902939},
DOI = {10.1109/IV.2014.62},
PUBLISHER = {IEEE (New York, USA)},
ISBN = {978-1-4799-4103-2},
CONFERENCE_NAME = {IV 2014-18th International Conference on Information Visualisation},
CONFERENCE_PLACE = {New York},
BOOKTITLE = {2014 18th International Conference on Information Visualisation-IV 2014. Proceedings},
EDITOR = {Banissi, E. and Bannatyne, M. W. M. and Marchese, F. T. and Sarfraz, M. and Ursyn, A. and Venturini, G. and Wyeld, T. G. and Cvek, U. and Trutschl, M. and Grinstein, G. and Geroimenko, V. and Kenderdine, S. and Bouali, F.},
}
@INPROCEEDINGS{BELLANDI_2014_INPROCEEDINGS_BBCG_264621,
AUTHOR = {Bellandi, A. and Bellusci, A. and Carniani, E. and Giovannetti, E.},
TITLE = {Content Elicitation: Towards a New Paradigm for the Analysis and Interpretation of Texts},
YEAR = {2014},
ABSTRACT = {In this paper we show how semantic technologies can be exploited, with the help of user friendly interfaces, to identify and structure the knowledge embedded in literary texts. The proposed approach, that we have called Content Elicitation, supports the experts in defining hierarchical and associative relationships between semantically annotated chunks of text denoting relevant entities, allowing visual structuring of knowledge, which can be edited by different experts in a collaborative way. This knowledge, formally coded as an ontology, can then be used by scholars and students as a guide for the analysis of the text and for the discovery of potential novel interpretations. We are testing and evaluating this approach on the Babylonian Talmud, due to its historical, linguistic, semantic and structural richness},
KEYWORDS = {semantic annotation, knowledge representation, text ontology, content elicitation, literary computing, da},
URL = {https://iris.cnr.it/handle/20.500.14243/264621},
DOI = {10.2316/P.2014.810-031},
PUBLISHER = {Acta press (Calgary, CAN)},
CONFERENCE_NAME = {The 13th IASTED International Conference on Software Engineering},
CONFERENCE_PLACE = {Calgary},
EDITOR = {Hamza, M. H.},
}
@INPROCEEDINGS{BELLUSCI_2014_INPROCEEDINGS_BBBCGM_253555,
AUTHOR = {Bellusci, A. and Bellandi, A. and Benotto, G. and Cappelli, A. and Giovannetti, E. and Marchi, S.},
TITLE = {Towards a decision support system for text interpretation},
YEAR = {2014},
ABSTRACT = {This article illustrates the first steps towards the implementation of a Decision Support System aimed to recreate a research environment for scholars and provide them with computational tools to assist in the processing and interpretation of texts. While outlining the general characteristics of the system, the paper presents a minimal set of user requirements and provides a possible use case on Dante's Inferno},
KEYWORDS = {DSS, XML, Text interpretation, Literary computing},
PAGES = {58-62},
URL = {http://clic.humnet.unipi.it/proceedings/vol1/CLICIT2014112.pdf},
VOLUME = {I},
DOI = {10.12871/CLICIT2014118},
ISBN = {9788867414727},
CONFERENCE_NAME = {CLiC-it 2014-First Italian Conference on Computational Linguistics},
BOOKTITLE = {Proceedings of the First Italian Conference on Computational Linguistics (CLiC-it 2014)},
EDITOR = {Basili, R. and Lenci, A. and Magnini, B.},
}
@INPROCEEDINGS{BOSCHETTI_2014_INPROCEEDINGS_B_228539,
AUTHOR = {Boschetti, F.},
TITLE = {Acquisizione e Creazione di Risorse Plurilingui per gli Studi di Filologia Classica in Ambienti Collaborativi},
YEAR = {2014},
ABSTRACT = {Questo articolo illustra metodi e strumenti per l'acquisizione e l'estensione di risorse digitali plurilingui per gli studi classici, sviluppati in collaborazione tra il CoPhiLab dell'Ilc-Cnr e il Perseus Project della Tufts University. Si descrivono tre linee di intervento: a) la progettazione e l'implementazione di un sistema di correzione dell'output dell'Ocr applicato al Greco antico; b) la creazione e la valutazione di un nucleo di synsets per Ancient Greek WordNet e c) l'allineamento di un campione di testi greci e latini con le relative traduzioni italiane},
KEYWORDS = {Greco Antico, OCR, WordNet, Allineamento},
PAGES = {55-67},
URL = {https://iris.cnr.it/handle/20.500.14243/228539},
PUBLISHER = {CLEUP (Padova, ITA)},
ISBN = {9788867872602},
CONFERENCE_NAME = {AIUCD 2013},
CONFERENCE_PLACE = {Padova},
BOOKTITLE = {Collaborative Research Practices and Shared Infrastructures for Humanities Computing-2nd Aiucd Annual Conference, Aiucd 2013 Padua, Italy, 11-12 December 2013-Proceedings of Revised Papers},
EDITOR = {Agosti, M. and Tomasi, F.},
}
@INPROCEEDINGS{BOSCHETTI_2014_INPROCEEDINGS_B_228543,
AUTHOR = {Boschetti, F.},
TITLE = {La localizzazione del Perseus Project in lingua italiana},
YEAR = {2014},
ABSTRACT = {Si illustra il progetto di localizzazione in lingua italiana dell'infrastruttura per lo studio dei classici greci e latini costituita dal Perseus Project (Tufts University, Medford, MA), usando risorse per l'analisi della nostra lingua sviluppate presso l'ILC-CNR di Pisa e mettendo a disposizione nuovi componenti software per la visualizzazione e l'annotazione di testi bilingui},
KEYWORDS = {filologia computazionale, allineamento, lessico dinamico},
PAGES = {221-234},
URL = {http://digilab2.let.uniroma1.it/ojs/index.php/Quaderni_DigiLab/issue/view/12},
DOI = {10.13133/978-88-98533-27-5},
ISBN = {978-88-98533-27-5},
CONFERENCE_NAME = {AIUCD 2012},
BOOKTITLE = {Digital Humanities: progetti italiani ed esperienze di convergenza multidisciplinare-Atti del convegno annuale dell'Associazione per l'Informatica Umanistica e la Cultura Digitale (AIUCD) Firenze, 13-14 dicembre 2012},
EDITOR = {Ciotti, F.},
}
@INPROCEEDINGS{BOSCHETTI_2014_INPROCEEDINGS_BCDLPPVM_228541,
AUTHOR = {Boschetti, F. and Cimino, A. and Dell'Orletta, F. and Lebani, G. E. and Passaro, L. and Picchi, P. and Venturi, G. and Montemagni, S. and Lenci, A.},
TITLE = {Computational Analysis of Historical Documents: An Application to Italian War Bulletins in World War I and II},
YEAR = {2014},
ABSTRACT = {World War (WW) I and II represent crucial landmarks in the history of mankind: They have affected the destiny of whole generations and their consequences are still alive throughout Europe. In this paper we present an ongoing project to carry out a computational analysis of Italian war bulletins in WWI and WWII, by applying state-of-the-art tools for NLP and Information Extraction. The annotated texts and extracted information will be explored with a dedicated Web interface, allowing for multidimensional access and exploration of historical events through space and time},
KEYWORDS = {World War I},
PAGES = {70-75},
URL = {http://www.lrec-conf.org/proceedings/lrec2014/workshops/LREC2014Workshop-LRT4HDA%20Proceedings.pdf},
PUBLISHER = {European language resources association (ELRA) (Paris, FRA)},
CONFERENCE_NAME = {LREC 2014},
CONFERENCE_PLACE = {Paris},
BOOKTITLE = {Proceedings of workshop on Language resources and technologies for processing and linking historical documents and archives-Deploying Linked Open Data in Cultural Heritage-LREC 2014, 26 May, Reykjavik, Iceland},
}
@INPROCEEDINGS{BOSCHETTI_2014_INPROCEEDINGS_BDL_228558,
AUTHOR = {Boschetti, F. and Del Gratta, R. and Lamé, M.},
TITLE = {Computer Assisted Annotation of Themes and Motifs in Ancient Greek Epigrams: First Steps},
YEAR = {2014},
ABSTRACT = {This paper aims at illustrating some tools to assist the manual annotation of themes and motifs in literary and epigraphic epigrams for the PRIN 2010/2011 Memorata Poetis Project},
KEYWORDS = {Filologia collaborativa},
PAGES = {83-86},
URL = {http://clic.humnet.unipi.it/it/atti.html},
VOLUME = {1},
DOI = {10.12871/CLICIT2014158},
PUBLISHER = {Pisa University Press (Pisa, ITA)},
ISBN = {978-88-6741-472-7},
CONFERENCE_NAME = {First Italian Conference on Computational Linguistics},
CONFERENCE_PLACE = {Pisa},
BOOKTITLE = {Proceedings of the First Italian Conference on Computational Linguistics (CLiC-it 2014)},
EDITOR = {Basili, R. and Lenci, A. and Magnini, B.},
}
@INPROCEEDINGS{BRUNATO_2014_INPROCEEDINGS_B_253611,
AUTHOR = {Brunato, D.},
TITLE = {Complessità necessaria o stereotipi del "burocratese"? Un'indagine sulla leggibilità del linguaggio amministrativo da una prospettiva linguistico-computazionale},
YEAR = {2014},
ABSTRACT = {Questo contributo intende presentare una metodologia di ricostruzione del profilo linguistico di un corpus di testi amministrativi basata sull'uso delle tecnologie linguistico-computazionali e finalizzata alla specializzazione di un indice di leggibilità "avanzato" sulle caratteristiche di questi testi. Tale metodologia, documentata in [3], si propone di indagare la variazione linguistica tramite il monitoraggio di parametri estratti automaticamente dal testo sottoposto ad analisi linguistica multi-livello. La complessità della lingua della pubblica amministrazione, soprattutto nei documenti rivolti al cittadino, è un problema ben noto e, malgrado le molteplici iniziative in favore di un linguaggio più chiaro ed efficace, tratti tipici del "burocratese" continuano a persistere, anche quando non imposti da requisiti di legittimità e precisione. Un ausilio alla semplificazione può venire dai sistemi per la misurazione della leggibilità del testo, come suggerito anche dai manuali di stile ispirati alla letteratura del Plain Language. Tuttavia le formule tradizionali, quali Gulpease [2], si limitano ad approssimare la complessità testuale, in quanto considerano esclusivamente parametri del testo superficiali, come la lunghezza della frase e della parola. Più recentemente, è emersa una nuova generazione di indici di leggibilità, fondati su metodologie di Trattamento Automatico del Linguaggio, che riescono a intercettare i luoghi di complessità del testo in maniera più granulare, computando un ampio spettro di parametri linguistici, che risultano anche maggiormente implicati nei processi di comprensione. È il caso di READ-IT [1], lo strumento utilizzato in questo studio. 
L'analisi linguistica ha esplorato la distribuzione di caratteristiche lessicali, morfo-sintattiche e sintattiche, estratte automaticamente da un "corpus parallelo monolingue" di testi amministrativi, ovvero internamente suddiviso in due sotto-corpora: uno costituito da testi autentici delle pubbliche amministrazioni e uno dalle relative versioni semplificate, frutto di un lavoro di riscrittura coordinato da linguisti. Queste caratteristiche, già risultate predittive del livello di leggibilità di testi giornalistici, sono state selezionate allo scopo di verificare l'incidenza delle peculiarità della scrittura amministrativa nella caratterizzazione della leggibilità. I risultati hanno permesso infatti di discriminare tra aspetti di complessità "ineliminabile" e tratti tipici del burocratese: i primi sono rappresentati da quei parametri che, pur indicativi di maggior complessità nella lingua comune, risultano similmente distribuiti nelle due sottovarietà; i secondi sono invece quelli che contraddistinguono solo la varietà dei testi originali, dunque quelli su cui hanno agito le riscritture. Questi dati potranno supportare tanto lo sviluppo di indici di leggibilità adattati alle peculiarità del linguaggio amministrativo, quanto le ricerche più attuali sulla semplificazione semiautomatica del testo},
URL = {http://www.csfls.it/silfi2014/wp-content/uploads/2014/08/Atti-SILFI-2014-Riassunti.pdf},
ISBN = {978-88-96312-56-8},
CONFERENCE_NAME = {XIII Congresso della SILFI (Società Internazionale di Linguistica e Filologia Italiana)},
BOOKTITLE = {La lingua variabile nei testi letterari, artistici e funzionali contemporanei. Analisi, interpretazione, traduzione},
EDITOR = {{Centro di Studi Filologici e Linguistici Siciliani} and {Dipartimento di Scienze Umanistiche, Università degli Studi di Palermo}},
}
@INPROCEEDINGS{BRUNATO_2014_INPROCEEDINGS_BDVM_266263,
AUTHOR = {Brunato, D. and Dell'Orletta, F. and Venturi, G. and Montemagni, S.},
TITLE = {Defining an annotation scheme with a view to automatic text simplification},
YEAR = {2014},
ABSTRACT = {This paper presents the preliminary steps of ongoing research in the field of automatic text simplification. In line with current approaches, we propose here a new annotation scheme specifically conceived to identify the typologies of changes an original sentence undergoes when it is manually simplified. Such a scheme has been tested on a parallel corpus available for Italian, which we have first aligned at sentence level and then annotated with simplification rules},
PAGES = {87-92},
URL = {http://www.italianlp.it/wp-content/uploads/2014/12/Text-simplification.pdf},
DOI = {10.12871/CLICIT2014118},
PUBLISHER = {Pisa University Press srl (Pisa, ITA)},
ISBN = {978-88-6741-472-7},
CONFERENCE_NAME = {First Italian Conference on Computational Linguistics (CLiC-it 2014)},
CONFERENCE_PLACE = {Pisa},
BOOKTITLE = {Proceedings of the First Italian Conference on Computational Linguistics (CLiC-it 2014)},
EDITOR = {Basili, R. and Lenci, A. and Magnini, B.},
}
@INPROCEEDINGS{BURGASSI_2014_INPROCEEDINGS_B_265642,
AUTHOR = {Burgassi, C.},
TITLE = {Il lessico delle antiche traduzioni e il progetto DiVo (Dizionario dei volgarizzamenti)},
YEAR = {2014},
ABSTRACT = {Il contributo espone i criteri guida per la costituzione delle due banche dati del progetto DiVo ("Dizionario dei volgarizzamenti") e mette in luce, anche attraverso l'esemplificazione di casi emblematici, l'impatto del progetto nell'ambito degli studi sul lessico dell'Italiano antico},
PAGES = {183-189},
URL = {https://iris.cnr.it/handle/20.500.14243/265642},
PUBLISHER = {Il Calamo (Roma, ITA)},
CONFERENCE_NAME = {XXXVII Convegno della Società Italiana di Glottologia},
CONFERENCE_PLACE = {Roma},
BOOKTITLE = {Il lessico nella teoria e nella storia linguistica. Atti del XXXVII Convegno della Società Italiana di Glottologia},
EDITOR = {Marchese, M. P. and Nocentini, A.},
}
@INPROCEEDINGS{CHIARELLA_2014_INPROCEEDINGS_CCMMM_245100,
AUTHOR = {Chiarella, D. and Cutugno, P. and Marconi, L. and Morando, M. and Morgavi, G.},
TITLE = {La pesca, la caza, la agricultura y el bosque: una organización de datos lingüísticos por un léxico con referencia al mundo fang},
YEAR = {2014},
ABSTRACT = {El lenguaje es una forma privilegiada de desarrollo de ideas, expresión de sentimientos y conocimientos, enfrentarse con otros y también de cohesión social; el saber es generalmente procesado y transmitido a través del lenguaje. Cada persona está tan acostumbrada a vivir en su propia realidad cultural que la cree universal; cada cultura tiende a ponerse al centro del mundo y considerarse como un punto de referencia y medida de todas las otras. Un fenómeno evidente de la lengua fang es la falta de "palabras-conceptos" en sentido occidental, o palabras que abarcan una cantidad de objetos que tienen características en común. En la estructuración del diccionario hemos elegido algunos elementos de la cultura fang como organización y jerarquía social, constitución de la familia, ámbito económico, ámbito artístico, ámbito literario, ámbito de la medicina; además hemos examinado unos aspectos de la representación del tiempo y del espacio, algunas topologías de danza y juegos y unos elementos descriptivos del bosque},
KEYWORDS = {Fang, Spagnolo, lessici specifici},
PAGES = {16},
URL = {https://iris.cnr.it/handle/20.500.14243/245100},
PUBLISHER = {Centro Cultural Africano "Fernando Ortiz" (Santiago de Cuba, CUB)},
ISBN = {9789592840195},
CONFERENCE_NAME = {XIII Conferencia Internacional de Cultura Africana y Afroamericana},
CONFERENCE_PLACE = {Santiago de Cuba},
}
@INPROCEEDINGS{CIGNONI_2014_INPROCEEDINGS_CGMF_228523,
AUTHOR = {Cignoni, L. and Giuffra, V. and Minozzi, S. and Fornaciari, G.},
TITLE = {CLIL Funerary Archaeology Courses for First-Cycle and Second-Cycle Degree Students},
YEAR = {2014},
ABSTRACT = {This paper reports on the differences between two specialized funerary archaeology courses conducted by a native language teacher from the Institute for Computational Linguistics of the National Research Council in Pisa and a subject specialist in paleopathology and funerary archaeology from the Division of Palaeopathology, Department of Translational Research on New Technologies in Medicine and Surgery of Pisa University. Lessons addressed to first cycle three-year Bachelor's degree undergraduates who were studying archaeology, art history, natural and environmental sciences took place in the second semester of the year 2012-2013. Classes in the same discipline and addressed to students from the same faculties had been held a year earlier for a second cycle two-year Master's degree course. The classes were delivered in English using CLIL (exploitation of a vehicular foreign language to teach a special subject) associated with blended learning methodology (combination of face-to-face instructor-led training with web-based technology). Appropriate teaching materials selected by the two teachers covered a wide range of topics, from the study of death to ancient burials, rites, and dynamics of human settlements, as well as evidence of past human societies recovered by excavations. In particular, ancient Roman funerary customs (inhumation, cremation) and Medieval mortuary practices and burials were studied, alongside artifacts such as weapons, jewellery, and pottery vessels recovered from archaeological sites both in Italy and in Britain. Collaboration between language teacher and subject specialist was crucial for the selection of the reading and listening materials, for the correction of the oral and written work assigned to the students, and for the intervention on the part of the subject teacher to clarify points that had been raised, to assist the students during the individual presentations, pairwork or group discussions, and to encourage their work. 
Two researchers collaborating with the subject specialist also contributed to the lessons by presenting studies they had performed in their area of expertise and by assisting the students during the discussions. These student-centred tasks were aimed at accomplishing important educational goals such as student motivation, improved cognitive and academic performance, enhanced access to online learning resources, peer learning and collaboration. The 2012-2013 course proved to be much more interactive and challenging than the previous one, owing to the major emphasis given to the more practical aspects, in preparation for the fieldwork in archaeology and bioarchaeology, which was carried out in the summer of 2013, working with their peers from Ohio State University and other Universities in the USA, Canada and Australia. Particular attention was devoted to the language of funerary archaeology, and the trainees extracted definitions from the texts they were using to enrich an ongoing English-Italian glossary of funerary archaeology terms. The most important items and sentence structures of the English language were studied and revised, and an English grammar containing contextualized examples drawn from specialized works in that domain was enriched with new material. Student exchanges under different European and international programmes have emphasized on the need for specialist knowledge in specific thematic areas, alongside an oral and written command of a foreign language},
KEYWORDS = {funerary archaeology, CLIL, Roman and Medieval archaeology, University education, collaborative learning},
URL = {https://iris.cnr.it/handle/20.500.14243/228523},
PUBLISHER = {International Association of Technology, Education and Development (IATED) (Valencia, ESP)},
ISBN = {978-84-616-8412-0},
CONFERENCE_NAME = {INTED (International Technology, Education and Development Conference)},
CONFERENCE_PLACE = {Valencia},
}
@INPROCEEDINGS{CIGNONI_2014_INPROCEEDINGS_CMS_254626,
AUTHOR = {Cignoni, L. and Marinelli, R. and Spadoni, G. P.},
TITLE = {A CLIL/blended learning approach for cruise tourism courses in Italy using lexical/semantic databases and information technology resources},
YEAR = {2014},
ABSTRACT = {In this paper we discuss the possibility of exploiting specialized texts for cruise shipping, hotel and catering management courses in English to be held in nautical and other senior high schools in Italy, more and more involved in the promising and strongly developing field of tourism. The courses will be carried out using a content and language integrated (CLIL) approach, and will be run by native language teachers working alone or in collaboration with instructional supporting experts in the different sectors. The aims of the courses are to study the maritime terminology related to ships and navigation (crew members, safety and security systems on board, etc.) and, in particular, to the cruise ship industry and hospitality operations environment (passenger mobility on board and ashore during excursions, etc.). Students will become acquainted with the language of routine operations, giving directions, understanding commands in emergency situations, reporting on weather forecasts, and with the terms and definitions belonging to the tourist activity specialized in the management of cruise ships and passengers. The scarce number of text books available for maritime English makes it necessary to supply Italian students with a variety of material in paper and computer format, so as to help them expand their vocabulary in the foreign language with greater confidence and proficiency. The texts will include shipping and cruise shipping books and magazines, manuals, contracts, technical documents, cruise line and tour operator websites, passenger blogs, and other texts of the cruise community. The trainees, constantly exposed to the language, will work individually, in pairs and in groups, at the presence of English teachers and operators in the field of cruise tourism, and will perform activities that cover the four communication skills of reading, writing, listening and speaking (gap filling, matching, summarizing, etc.). 
They will use modern technological equipment including computers, ipads, and other devices, incorporated in the classrooms according to a blended learning approach, which combines face-to-face and on-line education. Students can explore the meanings of single words by consulting the English lexical semantic database WordNet implemented at Princeton University, alongside the Italian terminological database Mariterm containing data belonging to the navigation and sea transport domains, as well as visualized images. Both databases are managed by user-friendly tools that can be easily accessed by teachers and students. Mariterm can be constantly enriched and updated with new information in the different sectors of maritime English. Finally, a grammar illustrating the most important items of the English language will be made available to the students, who can copy it on a file and expand it with contextualized examples extracted from the texts they will be reading and share the outcomes with their peers. English has been internationally accepted as the language for communication, and is therefore particularly important for exchanges among those who wish to work in the tourism industry},
KEYWORDS = {maritime English, tourism, CLIL, lexical semantic databases, blended learning},
PAGES = {6552-6559},
URL = {https://iris.cnr.it/handle/20.500.14243/254626},
PUBLISHER = {International Association of Technology, Education and Development (IATED) (Valencia, ESP)},
ISBN = {978-84-616-8412-0},
CONFERENCE_NAME = {INTED2014. 8th International Technology, Education and Development Conference},
CONFERENCE_PLACE = {Valencia},
BOOKTITLE = {INTED2014. 8th International Technology, Education and Development Conference. Valencia (Spain), 10th-12th of March, 2014. Proceedings},
EDITOR = {Chova, L. G. and Martínez, A. L. and Torres, I. C.},
}
@INPROCEEDINGS{CIMINO_2014_INPROCEEDINGS_CCDT_255596,
AUTHOR = {Cimino, A. and Cresci, S. and Dell'Orletta, F. and Tesconi, M.},
TITLE = {Linguistically-motivated and Lexicon Features for Sentiment Analysis of Italian Tweets},
YEAR = {2014},
ABSTRACT = {In this paper we describe our approach to EVALITA 2014 SENTIment POLarity Classification (SENTIPOLC) task. We participated only in the Polarity Classification sub-task. By resorting to a wide set of general-purpose features qualifying the lexical and grammatical structure of a text, automatically created ad-hoc lexicons and existing free available resources, we achieved the second best accuracy},
KEYWORDS = {Lexicons resources},
URL = {https://iris.cnr.it/handle/20.500.14243/255596},
CONFERENCE_NAME = {The 4th Conference for Evaluation of NLP and Speech Tools for Italian (EVALITA)},
}
@INPROCEEDINGS{DEFELICE_2014_INPROCEEDINGS_D_227083,
AUTHOR = {De Felice, I.},
TITLE = {The Affordance of grasping. A Psycholinguistic Study},
YEAR = {2014},
CONFERENCE_NAME = {Experimental Psycholinguistics Conference},
}
@INPROCEEDINGS{DEFELICE_2014_INPROCEEDINGS_D_288822,
AUTHOR = {De Felice, I.},
TITLE = {Pragmatics and Semantics in Grasp Events},
YEAR = {2014},
CONFERENCE_NAME = {AISV 2014},
}
@INPROCEEDINGS{DEFELICE_2014_INPROCEEDINGS_D_288820,
AUTHOR = {De Felice, I.},
TITLE = {Quanti oggetti possiamo "prendere" e come? Un solo verbo, tante azioni e tante traduzioni},
YEAR = {2014},
CONFERENCE_NAME = {Seminario rivolto agli alunni dell'Istituto Tecnico Economico "F. Carrara" di Lucca, organizzato dall'Istituto di Linguistica Computazionale "A. Zampolli" del CNR di Pisa},
}
@INPROCEEDINGS{DEFELICE_2014_INPROCEEDINGS_DBRQM_224510,
AUTHOR = {De Felice, I. and Bartolini, R. and Russo, I. and Quochi, V. and Monachini, M.},
TITLE = {Evaluating ImagAct-WordNet mapping for English and Italian through videos},
YEAR = {2014},
ABSTRACT = {In this paper we present the results of the evaluation of an automatic mapping between two lexical resources, WordNet/ItalWordNet and ImagAct, a conceptual ontology of action types instantiated by video scenes. Results are compared with those obtained from a previous experiment performed only on Italian data. Differences between the two evaluation strategies, as well as between the quality of the mappings for the two languages considered in this paper, are discussed},
KEYWORDS = {Language Resources (LRs)},
PAGES = {128-131},
URL = {http://clic.humnet.unipi.it/proceedings/Proceedings-CLICit-2014.pdf},
DOI = {10.12871/CLICIT2014126},
PUBLISHER = {Pisa University Press srl (Pisa, ITA)},
ISBN = {978-88-6741-472-7},
CONFERENCE_NAME = {First Italian Conference on Computational Linguistics (CLiC-it 2014)},
CONFERENCE_PLACE = {Pisa},
BOOKTITLE = {Proceedings of the First Italian Conference on Computational Linguistics CLiC-it 2014 \& the Fourth International Workshop EVALITA 2014},
EDITOR = {Basili, R. and Lenci, A. and Magnini, B.},
}
@INPROCEEDINGS{DEFELICE_2014_INPROCEEDINGS_DDM_257774,
AUTHOR = {De Felice, I. and Donati, M. and Marotta, G.},
TITLE = {CLaSSES: a new digital resource for Latin epigraphy},
YEAR = {2014},
ABSTRACT = {CLaSSES (Corpus for Latin Sociolinguistic Studies on Epigraphic textS) è un corpus annotato finalizzato all'analisi sociolinguistica quantitativa e qualitativa delle epigrafi latine. Permette di analizzare i fenomeni fonologici e morfofonologici che caratterizzano le forme latine non standard, in relazione alla tipologia testuale, all'area geografica di provenienza e alla datazione delle iscrizioni. L'articolo presenta la prima macrosezione di CLaSSES, incentrata sulle iscrizioni risalenti al periodo preletterario e arcaico},
PAGES = {132-137},
URL = {http://clic.humnet.unipi.it/proceedings/Proceedings-CLICit-2014.pdf},
PUBLISHER = {Pisa University Press (Pisa, ITA)},
CONFERENCE_NAME = {CLiC-it. La Prima Conferenza Italiana di Linguistica Computazionale},
CONFERENCE_PLACE = {Pisa},
BOOKTITLE = {Proceedings of the First Italian Conference on Computational Linguistics CLiC-it 2014 and the Fourth International Workshop EVALITA 2014},
EDITOR = {Basili, R. and Lenci, A. and Magnini, B.},
}
@INPROCEEDINGS{DELGRATTA_2014_INPROCEEDINGS_DFKMS_257904,
AUTHOR = {Del Gratta, R. and Frontini, F. and Khan, F. and Mariani, J. and Soria, C.},
TITLE = {The LREMap for Under-Resourced Languages},
YEAR = {2014},
ABSTRACT = {A complete picture of currently available language resources and technologies for the under-resourced languages of Europe is still lacking. Yet this would help policy makers, researchers and developers enormously in planning a roadmap for providing all languages with the necessary instruments to act as fully equipped languages in the digital era. In this paper we introduce the LRE Map and show its utility for documenting available language resources and technologies for under-resourced languages. The importance of the serialization of the LREMap into (L)LOD along with the possibility of its connection to a wider world is also introduced},
KEYWORDS = {language resources, less-resourced languages, linguistic linked open data},
PAGES = {78-83},
URL = {http://www.lrec-conf.org/proceedings/lrec2014/index.html},
CONFERENCE_NAME = {Workshop on Collaboration and Computing for Under-Resourced Languages in the Linked Open Data Era (CCURL 2014)},
BOOKTITLE = {Proceedings of the Workshop on Collaboration and Computing for Under-Resourced Languages in the Linked Open Data Era (CCURL 2014)},
EDITOR = {Pretorius, L. and Soria, C. and Baroni, P.},
}
@INPROCEEDINGS{DELGRATTA_2014_INPROCEEDINGS_DN_284932,
AUTHOR = {Del Gratta, R. and Nahli, O.},
TITLE = {Enhancing Arabic WordNet with the use of Princeton WordNet and a bilingual dictionary},
YEAR = {2014},
ABSTRACT = {This paper describes an heuristic-based approach to enhance existing WordNets with freely available bilingual resources. The approach has been applied to the Arabic WordNet using the AraMorph bilingual dictionary as bilingual resource, but its guidelines are quite general to be effectively applied to other languages. The English words extracted from the bilingual resource are checked against Princeton WordNet in order to quantify their coverage and to select only those words which share the same set of synsets. This strongly reduces the number of Arabic words of the pairs. These latter are then checked against the Arabic WordNet to make new words emerge and—possibly—add new synonyms},
KEYWORDS = {WordNet, Arabic, English, Bilingual Resource, Enhancement},
PAGES = {278-284},
URL = {http://ieeexplore.ieee.org/stamp/stamp.jsp?tp=\&arnumber=7016632},
DOI = {10.1109/CIST.2014.7016632},
PUBLISHER = {IEEE Communications Society (Piscataway, USA)},
ISBN = {978-1-4799-5978-5},
CONFERENCE_NAME = {ANLP IEEE CIST14},
CONFERENCE_PLACE = {Tetuan},
BOOKTITLE = {3rd International IEEE Colloquium on Information Science and Technology; From 20th to 22nd of October 2014 Tetuan-Chefchaouen Morocco},
}
@INPROCEEDINGS{DELGRATTA_2014_INPROCEEDINGS_DPG_244705,
AUTHOR = {Del Gratta, R. and Pardelli, G. and Goggi, S.},
TITLE = {The LRE Map disclosed},
YEAR = {2014},
ABSTRACT = {This paper describes a serialization of the LRE Map database according to the RDF model. Due to the peculiar nature of the LRE Map, many ontologies are necessary to model the map in RDF, including newly created and reused ontologies. The importance of having the LRE Map in RDF and its connections to other open resources is also addressed},
KEYWORDS = {Language Resource, LOD, Metadata},
PAGES = {3534-3541},
URL = {http://www.lrec-conf.org/proceedings/lrec2014/index.html},
PUBLISHER = {European Language Resources Association (ELRA) (Paris, FRA)},
ISBN = {978-2-9517408-8-4},
CONFERENCE_NAME = {Ninth International Conference on Language Resources and Evaluation (LREC'14)},
CONFERENCE_PLACE = {Reykjavik},
BOOKTITLE = {Proceedings of the Ninth International Conference on Language Resources and Evaluation (LREC'14)},
EDITOR = {Calzolari, N. and Choukri, K. and Declerck, T. and Loftsson, H. and Maegaard, B. and Mariani, J. and Moreno, A. and Odijk, J. and Piperidis, S.},
}
@INPROCEEDINGS{DELGROSSO_2014_INPROCEEDINGS_DMMP_228557,
AUTHOR = {Del Grosso, A. M. and Marchi, S. and Murano, F. and Pesini, L.},
TITLE = {A collaborative tool for philological research: experiments on Ferdinand de Saussure's manuscripts},
YEAR = {2014},
ABSTRACT = {The present paper describes a philological-computational tool developed by the Istituto di Linguistica Computazionale (ilc-cnr) of Pisa, aimed at creating a digital edition of Ferdinand de Saussure's unpublished manuscripts. Since the use of a digital edition and of the most modern computer technology allows a more in-depth research, the ilc is developing a set of digital tools in order to take advantage of both the documents and the related information added by the scientific community. The integration exploits the Java enterprise platform by organizing the different features in modules. Thus, the tool meets the following requirements: (i) converting legacy digital resources into valid Xml documents (tei compliant); (ii) parallel visualization among imported texts and related images; (iii) search and indexing; (iv) handling of variant readings; and (v) collaborative annotation},
KEYWORDS = {Computational and collaborative philology},
PAGES = {163-175},
URL = {https://iris.cnr.it/handle/20.500.14243/228557},
PUBLISHER = {CLEUP (Padova, ITA)},
ISBN = {978-88-6787-260-2},
CONFERENCE_NAME = {AIUCD},
CONFERENCE_PLACE = {Padova},
BOOKTITLE = {Collaborative Research Practices and Shared Infrastructures for Humanities Computing},
EDITOR = {Agosti, M. and Tomasi, F.},
}
@INPROCEEDINGS{DELGROSSO_2014_INPROCEEDINGS_DN_221676,
AUTHOR = {Del Grosso, A. M. and Nahli, O.},
TITLE = {Towards a flexible open-source software library for multi-layered scholarly textual studies: An Arabic case study dealing with semi-automatic language processing},
YEAR = {2014},
ABSTRACT = {This paper presents both the general model and a case study of the Computational and Collaborative Philology Library (CoPhiLib), an ongoing initiative underway at the Institute for Computational Linguistics (ILC) of the National Research Council (CNR), Pisa, Italy. The library, designed and organized as a reusable, abstract and open-source software component, aims at solving the needs of multi-lingual and cross-lingual analysis by exposing common Application Programming Interfaces (APIs). The core modules, coded by the Java programming language, constitute the groundwork of a Web platform designed to deal with textual scholarly needs. The Web application, implemented according to the Java Enterprise specifications, focuses on multi-layered analysis for the study of literary documents and related multimedia sources. This ambitious challenge seeks to obtain the management of textual resources, on the one hand by abstracting from current language, on the other hand by decoupling from the specific requirements of single projects. This goal is achieved thanks to methodologies declared by the "agile process", and by putting into effect suitable use case modeling, design patterns, and component-based architectures. The reusability and flexibility of the system have been tested on an Arabic case study: the system allows users to choose the morphological engine (such as AraMorph or Al-Khalil), along with linguistic granularity (i. e. with or without declension). Finally, the application enables the construction of annotated resources for further statistical engines (training set)},
KEYWORDS = {Design, Information Engineering, Design Patterns, Text Processing, Arabic Natural Language Processing},
PAGES = {285-290},
URL = {http://ieeexplore.ieee.org/xpl/articleDetails.jsp?tp=\&arnumber=7016633\&queryText=del+grosso+philology},
DOI = {10.1109/CIST.2014.7016633},
PUBLISHER = {IEEE (New York, USA)},
ISBN = {978-1-4799-5978-5},
CONFERENCE_NAME = {Third IEEE International Colloquium in Information Science and Technology (CIST)},
CONFERENCE_PLACE = {Tetuan},
BOOKTITLE = {Third IEEE International Colloquium in Information Science and Technology (CIST)},
EDITOR = {El Mohajir, M. and Al Achhab, M. and Chahhou, M. and Mounir, A. and El Mohajir, B. and Pirrelli, V. and Zarghili, A. and Elfar, M.},
}
@INPROCEEDINGS{DELLORLETTA_2014_INPROCEEDINGS_DVCM_226944,
AUTHOR = {Dell'Orletta, F. and Venturi, G. and Cimino, A. and Montemagni, S.},
TITLE = {T2K: a System for Automatically Extracting and Organizing Knowledge from Texts},
YEAR = {2014},
ABSTRACT = {In this paper, we present T2K, a suite of tools for automatically extracting domain-specific knowledge from collections of Italian and English texts. T2K (Text-To-Knowledge v2) relies on a battery of tools for Natural Language Processing (NLP), statistical text analysis and machine learning which are dynamically integrated to provide an accurate and incremental representation of the content of vast repositories of unstructured documents. Extracted knowledge ranges from domain-specific entities and named entities to the relations connecting them and can be used for indexing document collections with respect to different information types. T2K also includes "linguistic profiling" functionalities aimed at supporting the user in constructing the acquisition corpus, e. g. in selecting texts belonging to the same genre or characterized by the same degree of specialization or in monitoring the "added value" of newly inserted documents. T2K is a web application which can be accessed from any browser through a personal account which has been tested in a wide range of domains},
KEYWORDS = {Natural Language Processing, Information Extraction, Knowledge Management},
PAGES = {2062-2070},
URL = {http://www.lrec-conf.org/proceedings/lrec2014/pdf/590_Paper.pdf},
ISBN = {978-2-9517408-8-4},
CONFERENCE_NAME = {International Conference on Language Resources and Evaluation (LREC)},
}
@INPROCEEDINGS{DELLORLETTA_2014_INPROCEEDINGS_DWCVM_266274,
AUTHOR = {Dell'Orletta, F. and Wieling, M. and Cimino, A. and Venturi, G. and Montemagni, S.},
TITLE = {Assessing the readability of sentences: which corpora and features?},
YEAR = {2014},
ABSTRACT = {The paper investigates the problem of sentence readability assessment, which is modelled as a classification task, with a specific view to text simplification. In particular, it addresses two open issues connected with it, i. e. the corpora to be used for training, and the identification of the most effective features to determine sentence readability. An existing readability assessment tool developed for Italian was specialized at the level of training corpus and learning algorithm. A maximum entropy-based feature selection and ranking algorithm (grafting) was used to identify the most relevant features: it turned out that assessing the readability of sentences is a complex task, requiring a high number of features, mainly syntactic ones},
PAGES = {163-173},
URL = {http://acl2014.org/acl2014/W14-18/pdf/W14-1820.pdf},
PUBLISHER = {Association for Computational Linguistics (Stroudsburg, USA)},
ISBN = {978-1-941643-03-7},
CONFERENCE_NAME = {9th Workshop on Innovative Use of NLP for Building Educational Applications (BEA 2014)},
CONFERENCE_PLACE = {Stroudsburg},
BOOKTITLE = {Proceedings of 9th Workshop on Innovative Use of NLP for Building Educational Applications (BEA 2014)},
}
@INPROCEEDINGS{FERRARI_2014_INPROCEEDINGS_FDSG_261380,
AUTHOR = {Ferrari, A. and Dell'Orletta, F. and Spagnolo, G. and Gnesi, S.},
TITLE = {Measuring and improving the completeness of natural language requirements},
YEAR = {2014},
ABSTRACT = {[Context and motivation] System requirements specifications are normally written in natural language. These documents are required to be complete with respect to the input documents of the requirements definition phase, such as preliminary specifications, transcripts of meetings with the customers, etc. In other terms, they shall include all the relevant concepts and all the relevant interactions among concepts expressed in the input documents. [Question/Problem] Means are required to measure and improve the completeness of the requirements with respect to the input documents. [Principal idea/results] To measure this completeness, we propose two metrics that take into account the relevant terms of the input documents, and the relevant relationships among terms. Furthermore, to improve the completeness, we present a natural language processing tool named Completeness Assistant for Requirements (CAR), which supports the definition of the requirements: the tool helps the requirements engineer in discovering relevant concepts and interactions. [Contribution] We have performed a pilot test with CAR, which shows that the tool can help improving the completeness of the requirements with respect to the input documents. The study has also shown that CAR is actually useful in the identification of specific/alternative system behaviours that might be overseen without the tool. © 2014 Springer International Publishing Switzerland},
KEYWORDS = {natural language processing, relation extraction, Requirements analysis},
PAGES = {23--38},
URL = {https://link.springer.com/chapter/10.1007%2F978-3-319-05843-6_3#citeas},
DOI = {10.1007/978-3-319-05843-6_3},
ISBN = {978-3-319-05843-6},
CONFERENCE_NAME = {REFSQ 2014, Requirements Engineering: Foundation for Software Quality. 20th International Working Conference},
BOOKTITLE = {Requirements Engineering: Foundation for Software Quality 20th International Working Conference, REFSQ 2014, Essen, Germany, April 7-10, 2014. Proceedings},
EDITOR = {Salinesi, C. and Van De Weerd, I.},
}
@INPROCEEDINGS{FRONTINI_2014_INPROCEEDINGS_FQM_259129,
AUTHOR = {Frontini, F. and Quochi, V. and Monachini, M.},
TITLE = {Polysemy alternations extraction using the PAROLE SIMPLE CLIPS Italian lexicon},
YEAR = {2014},
ABSTRACT = {This paper presents the results of an experiment of polysemy alternations induction from a lexicon (Utt and Padó, 2011; Frontini et al., 2014), discussing the results and proposing an amendment in the original algorithm},
KEYWORDS = {Language Resources and Technologies},
PAGES = {175--179},
URL = {http://clic.humnet.unipi.it/proceedings/Proceedings-CLICit-2014.pdf},
DOI = {10.12871/CLICIT2014134},
PUBLISHER = {Pisa University Press srl (Pisa, ITA)},
ISBN = {978-88-67-41472-7},
CONFERENCE_NAME = {Proceedings of the First Italian Conference on Computational Linguistics CLiC-it 2014 \& the Fourth International Workshop EVALITA 2014},
CONFERENCE_PLACE = {Pisa},
BOOKTITLE = {Proceedings of the First Italian Conference on Computational Linguistics CLiC-it 2014 \& the Fourth International Workshop EVALITA 2014},
EDITOR = {Basili, R. and Lenci, A. and Magnini, B.},
}
@INPROCEEDINGS{FRONTINI_2014_INPROCEEDINGS_FQPUM_222781,
AUTHOR = {Frontini, F. and Quochi, V. and Padó, S. and Utt, J. and Monachini, M.},
TITLE = {Polysemy Index for Nouns: an Experiment on Italian using the PAROLE SIMPLE CLIPS Lexical Database},
YEAR = {2014},
ABSTRACT = {An experiment is presented to induce a set of polysemous basic type alternations (such as ANIMAL-FOOD, or BUILDING-INSTITUTION) by deriving them from the sense alternations found in an existing lexical resource. The paper builds on previous work and applies those results to the Italian lexicon PAROLE SIMPLE CLIPS. The new results show how the set of frequent type alternations that can be induced from the lexicon is partly different from the set of polysemy relations selected and explicitly applied by lexicographers when building it. The analysis of mismatches shows that frequent type alternations do not always correspond to prototypical polysemy relations, nevertheless the proposed methodology represents a useful tool offered to lexicographers to systematically check for possible gaps in their resource},
KEYWORDS = {Polysemy, lexical resources, semantics},
PAGES = {2955--2963},
URL = {http://www.lrec-conf.org/proceedings/lrec2014/index.html},
PUBLISHER = {European Language Resources Association ELRA (Paris, FRA)},
ISBN = {978-2-9517408-8-4},
CONFERENCE_NAME = {9th International Conference on Language Resources and Evaluation, LREC 2014},
CONFERENCE_PLACE = {Paris},
BOOKTITLE = {LREC 2014 Ninth International Conference on Language Resources and Evaluation Proceedings},
EDITOR = {Calzolari, N. and Choukri, K. and Declerck, T. and Loftsson, H. and Maegaard, B. and Mariani, J. and Moreno, A. and Odijk, J. and Piperidis, S.},
}
@INPROCEEDINGS{GAGGIOLI_2014_INPROCEEDINGS_GCSPTBCFCTDGTRR_256842,
AUTHOR = {Gaggioli, A. and Cipresso, P. and Serino, S. and Pioggia, G. and Tartarisco, G. and Baldus, G. and Corda, D. and Ferro, M. and Carbonaro, N. and Tognetti, A. and De Rossi, D. and Giakoumis, D. and Tzovaras, D. and Riera, A. and Riva, G.},
TITLE = {A decision support system for real-time stress detection during virtual reality exposure},
YEAR = {2014},
ABSTRACT = {Virtual Reality (VR) is increasingly being used in combination with psycho-physiological measures to improve assessment of distress in mental health research and therapy. However, the analysis and interpretation of multiple physiological measures is time consuming and requires specific skills, which are not available to most clinicians. To address this issue, we designed and developed a Decision Support System (DSS) for automatic classification of stress levels during exposure to VR environments. The DSS integrates different biosensor data (ECG, breathing rate, EEG) and behavioral data (body gestures correlated with stress), following a training process in which self-rated and clinical-rated stress levels are used as ground truth. Detected stress events for each VR session are reported to the therapist as an aggregated value (ranging from 0 to 1) and graphically displayed on a diagram accessible by the therapist through a web-based interface},
KEYWORDS = {Psychological Stress, Psychophysiology, Virtual Reality, Decision Support System, Biosensors},
PAGES = {114--120},
URL = {https://iris.cnr.it/handle/20.500.14243/256842},
VOLUME = {196},
DOI = {10.3233/978-1-61499-375-9-114},
CONFERENCE_NAME = {Medicine Meets Virtual Reality (MMVR21)},
BOOKTITLE = {Medicine Meets Virtual Reality},
EDITOR = {Westwood, J. D.},
}
@INPROCEEDINGS{GOGGI_2014_INPROCEEDINGS_GPGB_263924,
AUTHOR = {Goggi, S. and Pardelli, G. and Giannini, S. and Biagioni, S.},
TITLE = {Grey Literature in European Commission Projects},
YEAR = {2014},
ABSTRACT = {The survey is focused on the documentation produced by the European Commission (EC) projects involved in the Framework Programme for Research and Technological Development (hereafter FP7) and managed by the Italian National Research Council (hereafter CNR). In particular, the Grey Literature (GL) available on CORDIS and European Projects websites was analysed. In order to verify how it is managed and whether it is compliant with EC recommendations, some categories were introduced to identify, measure and evaluate the usability and availability of projects production. Data was obtained from a sample of European projects websites},
KEYWORDS = {Grey Literature, European Commission Projects, A.1 INTRODUCTORY AND SURVEY},
PAGES = {98--109},
URL = {https://iris.cnr.it/handle/20.500.14243/263924},
ISSN = {1386-2316},
ISBN = {978-90-77484-22-7},
CONFERENCE_NAME = {GL15-Fifteenth International Conference on Grey Literature. The Grey Audit: a Field Assessment in Grey Literature},
BOOKTITLE = {THE GL-CONFERENCE SERIES. CONFERENCE PROCEEDINGS},
EDITOR = {Farace, D. J. and Frantzen, J. and Service, G. I. L. N.},
}
@INPROCEEDINGS{GUADAGNINI_2014_INPROCEEDINGS_GV_256344,
AUTHOR = {Guadagnini, E. and Vaccaro, G.},
TITLE = {Un contributo allo studio del «volgarizzare e tradurre»: il progetto DiVo},
YEAR = {2014},
ABSTRACT = {L'intervento vuole focalizzare il genere "volgarizzamento" come canale di innovazione linguistica, oltre che di appropriazione culturale. L'ipotesi che si intende argomentare è che sia ricostruibile un'evoluzione in diacronia che oppone i primi volgarizzamenti, duecenteschi, alla ricca attività traduttiva del secolo successivo. Nel Duecento il volgarizzamento dai classici è (anche) un importante canale di arricchimento linguistico – in virtù soprattutto di una "posizione mentale" del volgarizzatore che vede spesso nel latino una sorta di variante diafasica alta del volgare scritto, o comunque un modello sulla base del quale si possa innalzare stilisticamente e lessicalmente il volgare. Nel corso del Trecento invece la traduzione dei classici sembra evolversi principalmente con la finalità al rendere accessibili dei contenuti: i volgarizzatori sembrano preferire rese traduttive genuinamente volgari, i nuovi conî linguistici si fanno più rari e sembrano stentare ad attecchire nella lingua. L'intervento, che si inscrive in una serie di lavori derivati da un progetto di studio complessivo dei volgarizzamenti italoromanzi medievali dei classici latini, si fonderà sui dati raccolti da un corpus digitale on line, che sarà oggetto di una breve presentazione, e dal loro confronto con il corpus dei testi italiani antichi costituiti e resi disponibili alla consultazione dall'Istituto Opera del Vocabolario Italiano (Corpus OVI dell'Italiano antico) e con le voci del TLIO (Tesoro della Lingua Italiana delle Origini)},
KEYWORDS = {Volgarizzamenti, Lessicografia italiana, Storia della tradizione, Dizionario dei Volgarizzamenti},
PAGES = {91--105},
URL = {https://iris.cnr.it/handle/20.500.14243/256344},
PUBLISHER = {Esedra (Padova, ITA)},
CONFERENCE_NAME = {Lingua testi culture. L'eredità di Folena vent'anni dopo},
CONFERENCE_PLACE = {Padova},
BOOKTITLE = {Lingua testi culture. L'eredità di Folena vent'anni dopo. Atti del XL Convegno Interuniversitario (Bressanone, 12-15 luglio 2012)},
EDITOR = {Paccagnella, I. and Gregori, E.},
}
@inproceedings{KHAN_2014_INPROCEEDINGS_KBF_259370,
  author   = {Khan, F. and Boschetti, F. and Frontini, F.},
  title    = {Using lemon to Model Lexical Semantic Shift in Diachronic Lexical Resources},
  year     = {2014},
  abstract = {In this paper we propose a model, called lemonDIA, for representing lexical semantic change using the lemon framework and based on the ontological notion of the perdurant. Namely we extend the notion of sense in lemon by adding a temporal dimension and then define a class of perdurant entities that represents a shift in meaning of a word and which contains different related senses. We start by discussing the general problem of semantic shift and the utility of being able to easily access and represent such information in diachronic lexical resources. We then describe our model and illustrate it with examples},
  url      = {https://iris.cnr.it/handle/20.500.14243/259370},
}
@INPROCEEDINGS{LYDING_2014_INPROCEEDINGS_LSBBCDDLP_261825,
AUTHOR = {Lyding, V. and Stemle, E. and Borghetti, C. and Brunello, M. and Castagnoli, S. and Dell'Orletta, F. and Dittmann, H. and Lenci, A. and Pirrelli, V.},
TITLE = {The PAISÀ Corpus of Italian Web Texts},
YEAR = {2014},
ABSTRACT = {PAISÀ is a Creative Commons licensed, large web corpus of contemporary Italian. We describe the design, harvesting, and processing steps involved in its creation},
KEYWORDS = {Corpus annotation, Tree-bank, Corpus design, Corpus harvesting},
PAGES = {36--43},
URL = {http://aclweb.org/anthology/W14-04},
PUBLISHER = {Association for Computational Linguistics (Stroudsburg, USA)},
CONFERENCE_NAME = {9th Web as Corpus Workshop (WaC-9)},
CONFERENCE_PLACE = {Stroudsburg},
BOOKTITLE = {Proceedings of the 9th Web as Corpus Workshop (WaC-9)},
EDITOR = {Bildhauer, F. and Schäfer, R.},
}
@INPROCEEDINGS{MARCONI_2014_INPROCEEDINGS_M_228341,
AUTHOR = {Marconi, L.},
TITLE = {La tecnología como auxilio en la creación de un diccionario de una lengua oral de Africa},
YEAR = {2014},
ABSTRACT = {Questo studio, riferito alla lingua fang della Guinea Equatoriale, intende mostrare come la tecnologia possa fornire un valido aiuto nello sviluppo di strumenti per la salvaguardia di lingue orali. Il fang, parlato da più di 1000000 di persone, è parlato soprattutto in Gabon, Camerun, Guinea Equatoriale e nell'estremo nordest del Congo e a Sao Tomé. Si considera suddiviso in sei dialetti principali: ntumu, okak, achí, meké, mveñ, nzaman. In Guinea Equatoriale risulta la più parlata tra le lingue nazionali e quella più omogenea, ciò nonostante si possono individuare due varietà: l'oka e l'ntumu. Il fang, lingua quasi esclusivamente orale, nonostante i numerosi parlanti è in pericolo di estinzione poiché non sta realizzando una evoluzione autonoma e usa lo spagnolo per descrivere elementi della società attuale; il fang è la lingua della comunicazione quotidiana, usata nelle comunicazioni private, in famiglia e nelle situazioni di lavoro non intellettuale. Il fattore più potente nella salvaguardia di una lingua è quello di utilizzarla, anche se in modo non perfetto, la sua introduzione in ogni occasione della vita fino a che il suo uso sia percepito come qualcosa di naturale e non percepito come artificiale; è essenziale quindi dirigere gli sforzi della trasmissione della lingua e della cultura alle generazioni più giovani realizzando strumenti (dizionari, file audio, ecc.) per proteggere la lingua e la cultura. Nell'articolo vengono fatte considerazioni sui dizionari cartacei ed elettronici, descritti gli scopi per la realizzazione di un dizionario elettronico, individuati i possibili destinatari del dizionario bilingue e descritte le linee guida per la progettazione, l'implementazione e la consultazione. 
Viene infine descritto sommariamente il dizionario realizzato fornendo informazioni sull'alfabeto adottato, sulla categorizzazione delle parole, sul tono, sulle varietà considerate e su elementi inclusi nella parte elettronica quali il suono e infine una descrizione degli ingressi sia per la parte fang-spagnolo che per la parte spagnolo-fang},
KEYWORDS = {diccionarios electrónicos, lengua fang, español},
URL = {https://iris.cnr.it/handle/20.500.14243/228341},
PUBLISHER = {Ediciones Catedra 2014 (Santiago de Cuba, CUB)},
ISBN = {9789592840195},
CONFERENCE_NAME = {XIII° Conferencia Internacional de Cultura Africana y Afroamericana},
CONFERENCE_PLACE = {Santiago de Cuba},
}
@INPROCEEDINGS{MARZI_2014_INPROCEEDINGS_MNF_221667,
AUTHOR = {Marzi, C. and Nahli, O. and Ferro, M.},
TITLE = {Word Processing for Arabic Language: A reappraisal of morphology induction through adaptive memory self-organisation strategies},
YEAR = {2014},
ABSTRACT = {Modelling the mental lexicon focuses on processing and storage dynamics, since lexical organisation relies on the process of input recoding and adaptive strategies for long-term memory organisation. A fundamental issue in word processing is represented by the emergence of the morphological organisation level in the lexicon, based on paradigmatic relations between fully-stored word forms. Morphology induction can be defined as the task of identifying morphological formatives within morphologically complex word forms. In the computational framework we propose here (TSOMs), based on Self-Organising Maps with Hebbian connections defined over a temporal layer, the identification/perception of surface morphological relations involves the alignment of recoded representations of morphologically-related input words. Facing a non-concatenative morphology such as the Arabic inflectional system prompts a reappraisal of morphology induction through adaptive organisation strategies, which affect both lexical representations and long-term storage. We will show how a strongly adaptive self-organisation during training is conducive to emergent relations between stored word forms, and to high accuracy rates in generalising knowledge of stored words to unknown forms},
KEYWORDS = {Non-concatenative morphological structure, lexical storage and access, SOMs, word recoding and processing, adaptive strategies, morphology},
PAGES = {241--247},
URL = {http://ieeexplore.ieee.org/xpl/articleDetails.jsp?arnumber=7016626\&punumber=6996097},
DOI = {10.1109/CIST.2014.7016626},
PUBLISHER = {IEEE (New York, USA)},
ISBN = {978-1-4799-5979-2},
CONFERENCE_NAME = {Third IEEE International Colloquium in Information Science and Technology (CIST)},
CONFERENCE_PLACE = {New York},
BOOKTITLE = {IEEE Conference Publications-Catalog Number: CFP1467R-ART},
EDITOR = {El Mohajir, M. and Al Achhab, M. and Chahhou, M. and Mounir, A. and El Mohajir, B. and Pirrelli, V. and Zarghili, A. and Elfar, M.},
}
@INPROCEEDINGS{MONEGLIA_2014_INPROCEEDINGS_MBFGKMP_222787,
AUTHOR = {Moneglia, M. and Brown, S. and Frontini, F. and Gagliardi, G. and Khan, F. and Monachini, M. and Panunzi, A.},
TITLE = {The IMAGACT Visual Ontology. An Extendable Multilingual Infrastructure for the Representation of Lexical Encoding of Action},
YEAR = {2014},
ABSTRACT = {Action verbs have many meanings, covering actions in different ontological types. Moreover, each language categorizes action in its own way. One verb can refer to many different actions and one action can be identified by more than one verb. The range of variations within and across languages is largely unknown, causing trouble for natural language processing tasks. IMAGACT is a corpus-based ontology of action concepts, derived from English and Italian spontaneous speech corpora, which makes use of the universal language of images to identify the different action types extended by verbs referring to action in English, Italian, Chinese and Spanish. This paper presents the infrastructure and the various linguistic information the user can derive from it. IMAGACT makes explicit the variation of meaning of action verbs within one language and allows comparisons of verb variations within and across languages. Because the action concepts are represented with videos, extension into new languages beyond those presently implemented in IMAGACT is done using competence-based judgments by mother-tongue informants without intense lexicographic work involving underdetermined semantic description},
URL = {https://iris.cnr.it/handle/20.500.14243/222787},
ISBN = {978-2-9517408-8-4},
BOOKTITLE = {LREC 2014 Ninth International Conference on Language Resources and Evaluation Proceedings},
}
@INPROCEEDINGS{MONTEMAGNI_2014_INPROCEEDINGS_M_297501,
AUTHOR = {Montemagni, S.},
TITLE = {DH@ILC: linee di attività e ricerca},
YEAR = {2014},
ABSTRACT = {Le principali linee di ricerca e sviluppo dell'ILC nel settore delle DH possono essere ricondotte ai seguenti filoni: acquisizione e conservazione di testi; progettazione e sviluppo di risorse e strumenti per il trattamento automatico di lingue classiche e varietà storiche della lingua; progettazione e sviluppo di strumenti per l'analisi del testo; costruzione di un'infrastruttura italiana per la ricerca nell'ambito delle scienze umane e sociali},
KEYWORDS = {Digital Humanities, Trattamento Automatico del Linguaggio, Risorse Linguistiche},
PAGES = {101--111},
URL = {https://iris.cnr.it/handle/20.500.14243/297501},
PUBLISHER = {CLEUP (Padova, ITA)},
ISBN = {9788867872602},
CONFERENCE_NAME = {2nd AIUCD Annual Conference},
CONFERENCE_PLACE = {Padova},
BOOKTITLE = {Collaborative Research Practices and Shared Infrastructures for Humanities Computing},
EDITOR = {Agosti, M. and Tomasi, F.},
}
@INPROCEEDINGS{MORGAVI_2014_INPROCEEDINGS_MNMCFCM_254209,
AUTHOR = {Morgavi, G. and Nerino, R. and Marconi, L. and Cutugno, P. and Ferraris, C. and Cinini, A. and Morando, M.},
TITLE = {NINFA iNtelligent Integrated Network For Aged people},
YEAR = {2014},
ABSTRACT = {In this paper we present the NINFA project outline and its preliminary developments. The project is based on a service platform suited for elder people called the Virtual Village Network, whose user interface allows to deliver at home different services, i.e.: user supervision, communication and interaction among users for social inclusion, exergame delivering, monitoring of the wellness status. The preliminary work done on ICT technologies acceptability issues and on the implementation of the User Interface (UI) and of the Human Computer Interface (HCI) is presented. The HCI we developed is particularly suited for elderly people and motor impaired patients because the interaction is managed only by finger/hand gestures and vocal control. Furthermore, the relationship between a set of motor, linguistic and cognitive parameters evaluated during exergame execution and the wellness status of the user is investigated},
KEYWORDS = {service platform, elder people, at home services, exergame delivering, tele-monitoring, wellness status, human computer interface},
URL = {https://iris.cnr.it/handle/20.500.14243/254209},
DOI = {10.1007/978-3-319-18374-9_25},
PUBLISHER = {Springer (London, GBR)},
ISBN = {978-3-319-18374-9},
CONFERENCE_NAME = {5° Forum Italiano per l'Ambient Assisted Living-ForitAAL},
CONFERENCE_PLACE = {London},
BOOKTITLE = {Ambient assisted living, Italian Forum 2014},
EDITOR = {Andò, P. B. and Siciliano, P. P.},
}
@INPROCEEDINGS{PALLOTTI_2014_INPROCEEDINGS_PFAMF_222825,
AUTHOR = {Pallotti, G. and Frontini, F. and Affè, F. and Monachini, M. and Ferrari, S.},
TITLE = {Presenting a System of Human-Machine Interaction for Performing Map Tasks},
YEAR = {2014},
ABSTRACT = {A system for human machine interaction is presented, that offers second language learners of Italian the possibility of assessing their competence by performing a map task, namely by guiding a virtual follower through a map with written instructions in natural language. The underlying natural language processing algorithm is described, and the map authoring infrastructure is presented},
KEYWORDS = {Language learning, human machine interaction, map tasks},
PAGES = {3963--3966},
URL = {http://www.lrec-conf.org/proceedings/lrec2014/index.html},
PUBLISHER = {European Language Resources Association ELRA (Paris, FRA)},
ISBN = {978-2-9517408-8-4},
CONFERENCE_NAME = {9th International Conference on Language Resources and Evaluation, LREC 2014},
CONFERENCE_PLACE = {Paris},
BOOKTITLE = {LREC 2014 Ninth International Conference on Language Resources and Evaluation Proceedings},
EDITOR = {Calzolari, N. and Choukri, K. and Declerck, T. and Loftsson, H. and Maegaard, B. and Mariani, J. and Moreno, A. and Odijk, J. and Piperidis, S.},
}
@INPROCEEDINGS{PANUNZI_2014_INPROCEEDINGS_PDGJMMQR_257368,
AUTHOR = {Panunzi, A. and De Felice, I. and Gregori, L. and Jacoviello, S. and Monachini, M. and Moneglia, M. and Quochi, V. and Russo, I.},
TITLE = {Translating action verbs using a dictionary of images: the IMAGACT ontology},
YEAR = {2014},
ABSTRACT = {Action verbs have many meanings, covering actions in different ontological types. Moreover, each language categorizes action in its own way. One verb can refer to many different actions and one action can be identified by more than one verb. The range of variations within and across languages is largely unknown, causing trouble in all translation tasks. IMAGACT is a corpus-based ontology of action concepts, derived from English and Italian spontaneous speech corpora, which makes use of the universal language of images to identify the different action types extended by verbs referring to action in English, Italian, Chinese and Spanish. This paper presents the IMAGACT search interface and the various kinds of linguistic information the user can derive from it. IMAGACT makes explicit the variation of meaning of action verbs within one language and allows comparisons of verb variations within and across languages. Because the action concepts are represented with videos, extension into new languages beyond those presently implemented in IMAGACT is done using competence-based judgments by mother-tongue informants, without intense lexicographic work involving underdetermined semantic descriptions},
KEYWORDS = {Action verbs, Image ontology, Multilingual dictionary, Computer-aided translation},
PAGES = {1163--1170},
URL = {http://euralex2014.eurac.edu/en/callforpapers/Documents/EURALEX%202014_gesamt.pdf},
DOI = {10.13140/2.1.3719.2320},
PUBLISHER = {EURAC (Bolzano, ITA)},
ISBN = {978-88-88906-97-3},
CONFERENCE_NAME = {XVI EURALEX International Congress: The User in Focus},
CONFERENCE_PLACE = {Bolzano},
BOOKTITLE = {Proceedings of the XVI EURALEX International Congress: The User in Focus},
EDITOR = {Abel, A. and Vettori, C. and Ralli, N.},
}
@inproceedings{PEDRETTI_2014_INPROCEEDINGS_PDGMPALM_300283,
  author           = {Pedretti, I. and Del Grosso, A. and Giovannetti, E. and Mancini, L. and Piccini, S. and Abrate, M. and Lo Duca, A. and Marchetti, A.},
  title            = {The Clavius on the Web Project: Digitization, Annotation and Visualization of Early Modern Manuscripts},
  year             = {2014},
  abstract         = {This paper describes the full procedure adopted in the context of the Clavius on the Web project, which aims to help Web users to appraise the importance of specific manuscripts by going beyond their digital reproduction. The proposed approach is based on the multilayered explication of linguistic, lexical and semantic data representing the innermost nature of the analyzed manuscripts. The final purpose of the project is to gather and display the results of the three layers of analysis through interactive visualization techniques and export them as Linked Data. All the analyses rely on the XML/TEI encoding of the text, followed by a CTS-based tokenization. As a working example for this paper, the analysis of a portion of a manuscript provided by Historical Archives of the Pontifical Gregorian University will be illustrated. The text is a letter written in Latin and sent by Botvitus Nericius to Christophorus Clavius in 1598 from Madrid},
  keywords         = {Clavius, Data Visualization, Early Modern Manuscripts, Lexica and Ontologies, Linked Open Data, NLP for Latin, Promotion of Cultural Heritage},
  pages            = {7},
  url              = {http://dl.acm.org/citation.cfm?id=2802636},
  doi              = {10.1145/2802612.2802636},
  publisher        = {ACM, Association for computing machinery (New York, USA)},
  isbn             = {978-1-4503-3295-8},
  conference_name  = {Third AIUCD Annual Conference on Humanities and Their Methods in the Digital Ecosystem (AIUCD '14)},
  conference_place = {New York},
  booktitle        = {Proceedings of the Third AIUCD Annual Conference on Humanities and Their Methods in the Digital Ecosystem (AIUCD '14)},
  editor           = {Tomasi, F. and Del Turco, R. R.},
}
@INPROCEEDINGS{PICCINI_2014_INPROCEEDINGS_PRG_264633,
AUTHOR = {Piccini, S. and Ruimy, N. and Giovannetti, E.},
TITLE = {Il primo lessico elettronico della terminologia saussuriana},
YEAR = {2014},
ABSTRACT = {Il lavoro che intendiamo presentare si iscrive all'interno di un Progetto di Ricerca Nazionale finanziato dal governo italiano, intitolato "Per una edizione digitale dei manoscritti di Ferdinand de Saussure", e volto a creare un prototipo di edizione digitale degli scritti autografi del grande linguista ginevrino. A tal fine, ogni manoscritto è stato digitalizzato, classificato e dotato di un link ipertestuale che rimanda alla sua trascrizione. Un sistema di gestione dei testi permette di consultare e annotare il singolo manoscritto e di effettuare studi filologici e critici sul corpus digitalizzato. Le concordanze per forma e per lemma prodotte per l'insieme dei testi forniscono un insieme di termini caratteristici dei quali viene descritta la semantica. Accanto alla realizzazione di tale piattaforma filologica digitale, uno degli aspetti innovativi del progetto consiste nella creazione del primo thesaurus-lessico elettronico della terminologia linguistica saussuriana. Quest'ultima riceve per la prima volta una rappresentazione strutturata, con una definizione del contenuto semantico di ciascuno dei termini chiave del pensiero del maestro ginevrino ed un quadro esplicito della natura e dell'importanza dei legami che li uniscono. Tale fascio di informazioni dovrebbe contribuire in modo significativo a meglio conoscere ed interpretare il pensiero del padre della linguistica moderna. L'architettura del lessico è ispirata al modello lessicale SIMPLE. Tra i modelli lessicali di maggior rilievo (WordNet, EuroWordNet, ItalWordNet, FrameNet, Pattern Dictionary, SIMPLE e Brandeis Semantic Ontology) esso è apparso essere il più adeguato, in quanto si distingue per alcuni importanti ed innovativi aspetti. Il modello SIMPLE, infatti, ha permesso la realizzazione di lessici elettronici multilivello armonizzati per dodici lingue europee, imponendosi così come standard de facto nell'ambito della Lessicografia Computazionale. 
Successivamente ha fortemente ispirato lo standard ISO per i lessici del TAL Lexical Markup Framework. La strutturazione del lessico ha necessitato anzitutto della creazione di una ontologia lessicale di dominio. A tal fine è stato adottato un approccio centrifugo: in un primo momento sono stati identificati i concetti centrali del dominio di interesse, i quali sono stati poi generalizzati o specificati. L'ontologia così modellizzata è attualmente costituita da 43 tipi semantici ed ha una profondità di 4 livelli. Alcune classi semantiche sono state poi ulteriormente "specificate" in termini di tratti e/o relazioni semantiche obbligatorie (definitorie). Un insieme di cinquantotto relazioni semantiche permette di collegare le istanze delle differenti classi ontologiche, mentre trentadue tratti semantici codificano informazioni tipiche di una classe semantica nella sua interezza o di una specifica istanza. La semantica lessicale di ciascuna delle istanze di una classe ontologica è rappresentata in una entrata lessicale, nella quale una ed una sola accezione di un termine, semplice o complesso, viene riccamente definita attraverso un vasto insieme di informazioni formalizzate ed altamente strutturate, che coprono un ampio ventaglio di aspetti semantici. Il senso analizzato è anzitutto associato alla definizione data da Saussure stesso, e laddove non disponibile, a quelle di R. Godel e R. Engler. Per ogni lemma vengono specificati anche il periodo di attestazione, le fonti nelle quali occorre, la sua frequenza di occorrenza e le collocazioni nelle quali appare. La classificazione ontologica del termine rappresenta un dato essenziale al quale si aggiungono l'informazione concernente il dominio d'uso, il tipo di evento denotato (qualora si tratti di un evento), dei tratti semantici distintivi e una vasta rete di relazioni semantico-lessicali. Il modello lessicale adottato, infatti, conferisce una attenzione particolare ai legami che esistono tra i differenti termini. 
La multidimensionalità intrinseca al senso di ogni lemma è colta e formalizzata attraverso un insieme di relazioni semantiche specifiche del modello SIMPLE e ispirate alla Struttura Qualia della teoria del Lessico Generativo. Esse offrono un quadro preciso della natura dei legami (intra ed extra categoriali) che sussistono tra le unità lessicali contenute nella base di dati sia sull'asse paradigmatico (iperonimia, iponimia, meronimia ed olonimia) sia sull'asse sintagmatico (fornendo in particolare informazioni sull'origine e la funzione dell'entità denotata). Inoltre, accanto alle classiche relazioni di sinonimia, antonimia e di derivazione morfologica, sono state create delle relazioni specifiche, al fine di formalizzare nel modo più preciso possibile i legami particolari esistenti tra i termini del dominio della conoscenza e più generalmente la sua organizzazione concettuale. Dei termini predicativi contenuti nel lessico viene descritta anche la struttura argomentale con indicazioni sul ruolo semantico e sulle restrizioni semantiche degli argomenti introdotti. Allo stato attuale, la popolazione del lessico è costituita da 500 entrate lessicali (379 nomi, 113 aggettivi e 8 verbi): si tratta principalmente dei termini proposti da Godel e Engler e di alcune parole-chiave estratte dagli Écrits de linguistique générale. In una fase successiva verrà integrata la nuova terminologia dei manoscritti attualmente studiati. In una prima fase i dati lessicali sono stati gestiti in una piattaforma MS ACCESS. Più recentemente, per esigenze di standardizzazione ed interoperabilità, è stata effettuata una migrazione sulla piattaforma Protégé-OWL. OWL è, infatti, il linguaggio standard del W3C per la rappresentazione e la condivisione di ontologie sul Web. Il sistema di gestione Access, tuttavia, non è stato abbandonato: il lessico, attualmente, è ospitato in entrambe le piattaforme grazie ad un software che consente la perfetta sincronizzazione dei dati. 
Questa provvisoria "doppia ubicazione" permette, intanto, di sfruttare in modo ottimale le potenzialità dei due sistemi di gestione. Una tale strutturazione informatizzata dei dati lessicali offre numerosi vantaggi. In fase di creazione del lessico, essa permette uno sviluppo collaborativo rigoroso, anche a distanza, e lo stoccaggio di una grande quantità di dati; favorisce una rappresentazione sistematica dei fenomeni linguistici ed assicura la coerenza e la completezza dell'informazione codificata. Inoltre, consente di operare costanti controlli di coerenza formale dell'informazione e di effettuare delle modifiche o delle correzioni sull'insieme dei dati. La strutturazione multidimensionale dei concetti del dominio di conoscenza e la rappresentazione semantica altamente strutturata, ricca, diversificata ed espressiva ne fanno uno strumento di ricerca lessicale particolarmente performante. Varie tipologie di ricerca possono essere effettuate molto semplicemente e rapidamente su qualsiasi dato memorizzato, sia esso una relazione, un tratto o una unità semantica e questi dati possono essere interrogati sia singolarmente sia in combinazione. Si ha quindi la possibilità di estrarre gruppi di unità lessicali che condividono una data proprietà o una combinazione di proprietà, secondo dei criteri stabiliti dallo studioso in relazione alle esigenze della sua ricerca. A titolo di esempio, verranno presentate alcune delle numerose ricerche che possono essere effettuate sui dati lessicali all'interno della base di dati. A nostro parere, il thesaurus-lessico semantico della terminologia saussuriana costituisce, per i motivi esposti, uno strumento di grande utilità per gli esperti del settore. Inoltre, l'organizzazione strutturata della conoscenza lessicale, favorendo la ricerca semantica, dovrebbe contribuire in modo significativo ad una più approfondita conoscenza del vocabolario del maestro e pertanto degli aspetti più complessi ed originali del suo pensiero},
KEYWORDS = {Saussure, SIMPLE, lessici computazionali},
URL = {https://iris.cnr.it/handle/20.500.14243/264633},
CONFERENCE_NAME = {XXXVII Convegno della Società Italiana di Glottologia, "Il lessico nella teoria e nella storia linguistica"},
}
% LREC 2014 was held in Reykjavik; Paris is only the seat of the publisher (ELRA).
@INPROCEEDINGS{PIPERIDIS_2014_INPROCEEDINGS_PPSRCHCDMG_222250,
AUTHOR = {Piperidis, S. and Papageorgiou, H. and Spurk, C. and Rehm, G. and Choukri, K. and Hamon, O. and Calzolari, N. and Del Gratta, R. and Magnini, B. and Girardi, C.},
TITLE = {META-SHARE: One year after},
YEAR = {2014},
ABSTRACT = {This paper presents META-SHARE (www.meta-share.eu), an open language resource infrastructure, and its usage since its Europe-wide deployment in early 2013. META-SHARE is a network of repositories that store language resources (data, tools and processing services) documented with high-quality metadata, aggregated in central inventories allowing for uniform search and access. META-SHARE was developed by META-NET (www.meta-net.eu) and aims to serve as an important component of a language technology marketplace for researchers, developers, professionals and industrial players, catering for the full development cycle of language technology, from research through to innovative products and services. The observed usage in its initial steps, the steadily increasing number of network nodes, resources, users, queries, views and downloads are all encouraging and considered as supportive of the choices made so far. In tandem, take-up activities like direct linking and processing of datasets by language processing services as well as metadata transformation to RDF are expected to open new avenues for data and resources linking and boost the organic growth of the infrastructure while facilitating language technology deployment by much wider research communities and industrial sectors},
KEYWORDS = {Infrastructures, language resources identification, language resources documentation, metadata, language resources sharing, language resources licensing},
PAGES = {1532--1538},
URL = {http://www.lrec-conf.org/proceedings/lrec2014/index.html},
PUBLISHER = {European Language Resources Association ELRA (Paris, FRA)},
ISBN = {978-2-9517408-8-4},
CONFERENCE_NAME = {LREC'14},
CONFERENCE_PLACE = {Reykjavik, Iceland},
BOOKTITLE = {Proceedings of the Ninth International Conference on Language Resources and Evaluation},
EDITOR = {Calzolari, N. and Choukri, K. and Declerck, T. and Loftsson, H. and Maegaard, B. and Mariani, J. and Moreno, A. and Odijk, J. and Piperidis, S.},
}
@INPROCEEDINGS{PIRRELLI_2014_INPROCEEDINGS_PMF_231380,
AUTHOR = {Pirrelli, V. and Marzi, C. and Ferro, M.},
TITLE = {Two-dimensional Wordlikeness Effects in Lexical Organisation},
YEAR = {2014},
ABSTRACT = {The main focus of research on wordlikeness has been on how serial processing strategies affect perception of similarity and, ultimately, the global network of associative relations among words in the mental lexicon. Comparatively little effort has been put so far, however, into an analysis of the reverse relationship: namely, how global organisation effects influence the speakers' perception of word similarity and of words' internal structure. In this paper, we explore the relationship between the two dimensions of wordlikeness (the "syntagmatic" and the "paradigmatic" one), to suggest that the same set of principles of memory organisation can account for both dimensions},
KEYWORDS = {wordlikeness, lexical access, word processing, frequency, memory},
PAGES = {301--305},
URL = {http://clic.humnet.unipi.it/it/atti.html},
VOLUME = {1},
DOI = {10.12871/CLICIT2014158},
ISBN = {978-88-6741-472-7},
CONFERENCE_NAME = {First Italian Conference on Computational Linguistics CLiC-it 2014 \& Fourth International Workshop EVALITA 2014},
BOOKTITLE = {The First Italian Conference on Computational Linguistics-Proceedings},
EDITOR = {Basili, R. and Lenci, A. and Magnini, B.},
}
% LREC 2014 was held in Reykjavik; Paris is only the seat of the publisher (ELRA).
@INPROCEEDINGS{SIMI_2014_INPROCEEDINGS_SBM_294411,
AUTHOR = {Simi, M. and Bosco, C. and Montemagni, S.},
TITLE = {Less is More? Towards a Reduced Inventory of Categories for Training a Parser for the Italian Stanford Dependencies},
YEAR = {2014},
ABSTRACT = {Stanford Dependencies (SD) represent nowadays a de facto standard as far as dependency annotation is concerned. The goal of this paper is to explore pros and cons of different strategies for generating SD annotated Italian texts to enrich the existing Italian Stanford Dependency Treebank (ISDT). This is done by comparing the performance of a statistical parser (DeSR) trained on a simpler resource (the augmented version of the Merged Italian Dependency Treebank or MIDT) and whose output was automatically converted to SD, with the results of the parser directly trained on ISDT. Experiments carried out to test reliability and effectiveness of the two strategies show that the performance of a parser trained on the reduced dependencies repertoire, whose output can be easily converted to SD, is slightly higher than the performance of a parser directly trained on ISDT. A non-negligible advantage of the first strategy for generating SD annotated texts is that semi-automatic extensions of the training resource are more easily and consistently carried out with respect to a reduced dependency tagset. Preliminary experiments carried out for generating the collapsed and propagated SD representation are also reported},
KEYWORDS = {Italian Treebank, Harmonization and Merging of Resources, Stanford Dependencies},
URL = {http://www.lrec-conf.org/proceedings/lrec2014/pdf/818_Paper.pdf},
PUBLISHER = {European Language Resources Association ELRA (Paris, FRA)},
ISBN = {978-2-9517408-8-4},
CONFERENCE_NAME = {Ninth International Conference on Language Resources and Evaluation (LREC'14)},
CONFERENCE_PLACE = {Reykjavik, Iceland},
BOOKTITLE = {Proceedings of the Ninth International Conference on Language Resources and Evaluation (LREC'14)},
EDITOR = {Calzolari, N. and Choukri, K. and Declerck, T. and Loftsson, H. and Maegaard, B. and Mariani, J. and Moreno, A. and Odijk, J. and Piperidis, S.},
}
% First author is Yuri Bizzoni: the export had given name and surname swapped.
% The citation key is intentionally left unchanged so existing citations keep resolving.
% LREC 2014 was held in Reykjavik; Paris is only the seat of the publisher (ELRA).
@INPROCEEDINGS{YURI_2014_INPROCEEDINGS_YBDDMC_228466,
AUTHOR = {Bizzoni, Y. and Boschetti, F. and Diakoff, H. and Del Gratta, R. and Monachini, M. and Crane, G.},
TITLE = {The Making of Ancient Greek WordNet},
YEAR = {2014},
ABSTRACT = {This paper describes the process of creation and review of a new lexico-semantic resource for the classical studies: Ancient Greek WordNet. The candidate sets of synonyms (synsets) are extracted from Greek-English dictionaries, on the assumption that Greek words translated by the same English word or phrase have a high probability of being synonyms or at least semantically closely related. The process of validation and the web interface developed to edit and query the resource are described in detail. The lexical coverage of Ancient Greek WordNet is illustrated and the accuracy is evaluated. Finally, scenarios for exploiting the resource are discussed},
KEYWORDS = {Ancient Greek, Multilingualism, Classical Philology},
PAGES = {1140--1147},
URL = {http://www.lrec-conf.org/proceedings/lrec2014/index.html},
PUBLISHER = {European Language Resources Association ELRA (Paris, FRA)},
CONFERENCE_NAME = {Ninth International Conference on Language Resources and Evaluation (LREC'14)},
CONFERENCE_PLACE = {Reykjavik, Iceland},
BOOKTITLE = {Proceedings of the Ninth International Conference on Language Resources and Evaluation (LREC'14)},
EDITOR = {Calzolari, N. and Choukri, K. and Declerck, T. and Loftsson, H. and Maegaard, B. and Mariani, J. and Moreno, A. and Odijk, J. and Piperidis, S.},
}
@INPROCEEDINGS{ABRATE_2014_INPROCEEDINGS_ADGLMMPP_264614,
  AUTHOR          = {Abrate, M. and Del Grosso, A. M. and Giovannetti, E. and Lo Duca, A. and Marchetti, A. and Mancini, L. and Pedretti, I. and Piccini, S.},
  TITLE           = {Il Progetto Clavius on the Web: tecnologie linguistico-semantiche al servizio del patrimonio documentale e degli archivi storici},
  BOOKTITLE       = {AIUCD2014-La metodologia della ricerca umanistica nell'ecosistema digitale-Abstracts 3rd annual conference, 18-19 settembre 2014},
  EDITOR          = {Rossi, F. and Tomasi, F.},
  CONFERENCE_NAME = {AIUCD 2014-Terzo convegno annuale: La metodologia della ricerca umanistica nell'ecosistema digitale},
  YEAR            = {2014},
  URL             = {https://iris.cnr.it/handle/20.500.14243/264614},
  ABSTRACT        = {L'obiettivo del progetto Clavius on the Web è quello di valorizzare una parte dei manoscritti conservati dall'Archivio storico della Pontificia Università Gregoriana (APUG). Il progetto prende in esame alcuni manoscritti relativi a Christophorus Clavius (1538-1612), matematico e astronomo gesuita. I manoscritti sono digitalizzati, trascritti, tradotti e analizzati dal punto di vista linguistico, lessicale e semantico. La terminologia e le entità di dominio individuate nel testo sono strutturate in un lessico e una ontologia, e collegate a risorse già disponibili sulla Rete secondo i principi dei Linked Data. La loro visualizzazione sul Web è implementata mediante tecniche di Data Visualization: la prima si basa sulla corrispondenza tra testo, traduzione e immagine mentre la seconda ha lo scopo di mostrare i contenuti delle analisi, con particolare enfasi alla navigazione delle risorse lessicali e ontologiche prodotte durante le varie fasi},
}
@INPROCEEDINGS{BOSCHETTI_2014_INPROCEEDINGS_BDMNP_230690,
  AUTHOR          = {Boschetti, F. and Del Gratta, R. and Marzi, C. and Nahli, O. and Pirrelli, V.},
  TITLE           = {Modelli, metodi e strumenti per il trattamento automatico della lingua araba e per l'editing in ambienti collaborativi},
  BOOKTITLE       = {La metodologia della ricerca umanistica nell'ecosistema digitale-AIUCD 2014 Terzo convegno annuale},
  EDITOR          = {Rossi, F. and Tomasi, F.},
  CONFERENCE_NAME = {AIUCD 3rd annual conference},
  YEAR            = {2014},
  URL             = {http://aiucd2014.unibo.it/book-of-abstracts.pdf},
  KEYWORDS        = {linguistica computazionale, uso linguistico, lessico arabo},
  ABSTRACT        = {La linguistica computazionale ha portato negli ultimi vent'anni a un profondo mutamento nello studio delle lingue e delle loro testimonianze scritte, spostando l'accento della ricerca da aspetti linguistico-formali all'uso linguistico in contesti comunicativi reali. Il presente contributo illustra l'impatto di questo cambio di prospettiva sullo studio della lingua araba, attraverso una rassegna di alcune attività di ricerca in corso presso l'Istituto di Linguistica Computazionale del CNR di Pisa: (i) acquisizione dei testi arabi tramite Optical Character Recognition (OCR) e sviluppo di strumenti per la correzione manuale del testo in ambienti collaborativi; (ii) sviluppo di algoritmi e strumenti per l'analisi morfologica della lingua araba; (iii) analisi delle dinamiche di acquisizione del lessico arabo mediante architetture bio-computazionali; (iv) sviluppo della WordNet dell'Arabo collegata a Princeton WordNet, ItalWordNet, LatinWordNet e alla nascente AncientGreek WordNet. Queste attività sono rivolte sia all'analisi delle caratteristiche linguistiche dell'arabo che allo studio della produzione letteraria araba e dei suoi rapporti storico-culturali con altre lingue. In particolare, il contributo intende illustrare la fertilità di un approccio metodologico che metta in relazione le dinamiche di acquisizione del lessico arabo, con la messa a punto di procedure di analisi ed edizione critica del testo e con i principi di organizzazione ontologica di una lingua ad alta produttività derivazionale},
}
@INPROCEEDINGS{BOSCHETTI_2014_INPROCEEDINGS_BDFLN_228548,
  AUTHOR          = {Boschetti, F. and Del Grosso, A. M. and Fahad Khan, A. and Lamé, M. and Nahli, O.},
  TITLE           = {A top-down approach to the design of components for the philological domain},
  BOOKTITLE       = {Digital Humanities 2014-Book of Abstracts},
  CONFERENCE_NAME = {DH2014},
  YEAR            = {2014},
  URL             = {https://iris.cnr.it/handle/20.500.14243/228548},
  ABSTRACT        = {This paper focuses on the methodology applied to the development of components in the domain of collaborative philology in the Memorata Poetis Project. This initiative, led by the University of Venice, coordinates eight units sharing the same cyber-infrastructure and is co-funded by the Italian Ministry of Instruction, University and Research (PRIN 2010/11). The project aims to study the multilingual intertextuality between epigraphic texts and literary epigrams, the transmission of themes, motives, etc. between different communicative situations (epigraphic versus literary) and different civilisations (Greek, Latin and Italian). As a control group, we analyse a corpus of epigraphic and literary texts in Arabic which do not belong to the same tradition as the others. The study of intertextuality affects both the reconstruction of the text (constitutio textus), by providing variants from the indirect tradition, and its interpretation (interpretatio), by widening the contexts in which the text has been reused},
}
@INPROCEEDINGS{CHIARELLA_2014_INPROCEEDINGS_CCMM_268813,
AUTHOR = {Chiarella, D. and Cutugno, P. and Marconi, L. and Morgavi, G.},
TITLE = {Trame narrative nel social publishing},
YEAR = {2014},
PAGES = {13},
URL = {https://iris.cnr.it/handle/20.500.14243/268813},
CONFERENCE_NAME = {IV Congresso Nazionale CKBG "Tecnologia e Leggerezza" ovvero come rimuovere 'peso' dagli individui, organizzazioni, comunità, città},
}
@INPROCEEDINGS{CUTUGNO_2014_INPROCEEDINGS_CCLMN_276417,
  AUTHOR          = {Cutugno, P. and Chiarella, D. and Lucentini, R. and Marconi, L. and Noberini, S.},
  TITLE           = {EMOCHA: an everlasting temporary exhibition},
  CONFERENCE_NAME = {RENEWAL, INNOVATION AND CHANGE: HERITAGE AND EUROPEAN SOCIETY (RICHES) First International Conference},
  YEAR            = {2014},
  URL             = {https://iris.cnr.it/handle/20.500.14243/276417},
}
@INPROCEEDINGS{DELGROSSO_2014_INPROCEEDINGS_DN_228544,
AUTHOR = {Del Grosso, A. M. and Nahli, O.},
TITLE = {Towards a flexible open-source software library for multi-layered scholarly textual studies -- An Arabic use-case dealing with semi-automatic language processing},
YEAR = {2014},
ABSTRACT = {This paper presents both the general model and a case study of the Computational and Collaborative Philology Library (CoPhiLib), an ongoing initiative underway at the Institute for Computational Linguistics (ILC) of the National Research Council (CNR), Pisa, Italy. The library, designed and organized as a reusable, abstract and open-source software component, aims at solving the needs of multi-lingual and cross-lingual analysis by exposing common Application Programming Interfaces (APIs). The core modules, coded by the Java programming language, constitute the groundwork of a Web platform designed to deal with textual scholarly needs. The Web application, implemented according to the Java Enterprise specifications, focuses on multi-layered analysis for the study of literary documents and related multimedia sources. This ambitious challenge seeks to obtain the management of textual resources, on the one hand by abstracting from current language, on the other hand by decoupling from the specific requirements of single projects. This goal is achieved thanks to methodologies declared by the "agile process", and by putting into effect suitable use case modeling, design patterns, and component-based architectures. The reusability and flexibility of the system have been tested on an Arabic case study: the system allows users to choose the morphological engine (such as AraMorph or Al-Khalil), along with linguistic granularity (i.e. with or without declension). Finally, the application enables the construction of annotated resources for further statistical engines (training set)},
KEYWORDS = {Computational and collaborative philology, API},
URL = {https://iris.cnr.it/handle/20.500.14243/228544},
CONFERENCE_NAME = {ANLP IEEE CIST14},
}
@INPROCEEDINGS{DOTTO_2014_INPROCEEDINGS_DGL_265027,
AUTHOR = {Dotto, D. and Guadagnini, E. and Lorenzi, C.},
TITLE = {Presentazione del progetto DiVo},
YEAR = {2014},
ABSTRACT = {Sintetica presentazione del progetto DiVo nell'ambito della sezione "Presentazione di progetti di ricerca in corso" del convegno SIFR Verona 2014, i cui atti sono pubblicati on line (http://www.sifr.it/storico/ricerca/)},
URL = {http://www.sifr.it/storico/ricerca/divo.pdf},
CONFERENCE_NAME = {Francofonie medievali. Lingue e letterature gallo-romanze fuori di Francia (sec. XII-XV)-Convegno di studio (Verona, 11-13 settembre 2014)},
}
@INPROCEEDINGS{GIANNINI_2014_INPROCEEDINGS_GBGP_259115,
AUTHOR = {Giannini, S. and Biagioni, S. and Goggi, S. and Pardelli, G.},
TITLE = {Mapping Italian Grey Communities: What is There Beyond the Academy?},
YEAR = {2014},
ABSTRACT = {The following title was published on an influential Italian newspaper, La Stampa, on November 7, 2013. "Tra i tesori della 'Letteratura Grigia' un'Eneide in napoletano del '600". The article is about the presentation of the "Fondo De Mauro" on the Italian Network of Popular Culture: this fund originates from a private collection built up in several decades and donated to the Network by Tullio De Mauro and his wife Silvana Ferreri in 2011; it is made up of thousands of books, brochures, pamphlets relating to Italian dialects and minority languages. In the field of healthcare, while browsing on the web, we found the title of a PhD thesis of last year: "Letteratura Grigia nelle meta-analisi delle prove ripartite con scelta casuale degli interventi di sanità". In the legal environment, the title of a Seminar at the University of Siena emerges from the web: "La "centralità" della legge e la letteratura grigia. Profili di politica del diritto in Italia tra Otto e Novecento". From these findings, the idea of a survey on the wide variety of grey material available on Italian web portals arises. A first analysis shows that this material is available in different forms and dissemination is carried out through various means such as thematic bibliographies, newspapers articles, various types of documents published in pdf format or simple descriptions on web sites. The following are a few examples excerpted from some home pages belonging to our corpus: • Collection of grey literature. The Historical Archive of Women candidates for becoming the repository where the memories about these themes will be stored. • Grey literature. Master copies · Reprints · Unreleased copies · Grey Literature. Archives for the history of Education. • Grey literature. The high quality brand of parks. • International grey literature; national and international legislative data on the topic of drug addiction and related themes; documentary archive. • Besides literature in German, there is literature in other languages and grey literature as well-in particular catalogues of museums and exhibitions. • It is about a few thousand of books, brochures and documents of grey literature concerning two topics, Italian dialects and minority languages. Given this scenario, the research aims at verifying whether-and eventually how much-the grey literature available on the web is actually structured, accessible or even managed by systems dealing with its organization and aiming at its retrieval and storing. The utmost goal is to build up a map of non-academic communities and their mechanisms for managing, presenting and disseminating this type of material: a sort of journey among the streams of the web which channel meeting minutes, invites, manifests, fliers, pictures, newspapers articles, journalistic services and audio/video material on various topics. These "grey" products-by conveying basic information about social and popular culture-store, represent and spread knowledge. Significant examples could be identified in the web sites presenting the following matters: history of women's culture and of their movement in some specific Italian regions; projects dealing with the sustainability of urban environment with respect to childhood and adolescence; parks and other natural protected environments; archaeological documentation such as draft reports, diaries from the site, letters and miscellaneous documentation; nursing and health-related disciplines which produce guidelines, diagnostic and therapeutic courses, informative material for patients and their families. Also the theatrical culture is nourished by "grey products" as video archives, collections of music LPs and CDs, brochures, scripts, autograph manuscripts (i.e. letters, correspondences, fliers, musical scores). In substance, a heterogeneous set of material which could reveal especially interesting to both researchers, scientists, professionals and simple fans and lovers of the various subjects if ever made available and usable. Focus Analysis of the documentation and production of taxonomies finalized at the creation of a map of non-academic communities and stakeholders involved in the management of grey material. Material and methods The survey examines the several disciplines, the typology, the institutional nature and the fields to which these grey communities belong, noticing as well the variety of documentation provided, the structure of information and the presentation and access modalities through the following steps: 1) Selection of the web portals as resulted from the query "letteratura grigia" OR "letteratura non convenzionale" OR "documentazione grigia" OR "materiale grigio". 2) Creation of a corpus made up of 28,000 occurrences. 3) Analysis of the various communities and of the grey material retrieved. 4) Statistical elaboration of the data. Conclusions: reflections on the communities and stakeholders involved in the management of grey literature and on the various ways of presenting the documentation provided by the web sites selected for this survey},
KEYWORDS = {Italian Grey Literature},
PAGES = {21--25},
URL = {http://greyguide.isti.cnr.it/linkdoc.php?idcode=2014-G01-019\&authority=GLConference\&collection=GL16\&langver=en},
ISBN = {978-90-77484-24-1},
CONFERENCE_NAME = {Sixteenth International Conference on Grey Literature Grey Literature Lobby: Engines and Requesters for Change},
EDITOR = {Farace, D. and Frantzen, J.},
}
% Editor initials normalised to "Farace, D.": the exported "C. B. D." looks like
% residue of "compiled by D." (NOTE(review): confirm against the GL16 proceedings).
@INPROCEEDINGS{GOGGI_2014_INPROCEEDINGS_GMFBPDBM_265502,
AUTHOR = {Goggi, S. and Monachini, M. and Frontini, F. and Bartolini, R. and Pardelli, G. and De Mattei, M. and Bustaffa, F. and Manzella, G.},
TITLE = {Marine Planning and Service Platform (MAPS): An Advanced Research Engine for Grey Literature in Marine Science},
YEAR = {2014},
ABSTRACT = {The MAPS (Marine Planning and Service Platform) project is a development of the Marine project (Ricerca Industriale e Sviluppo Sperimentale Regione Liguria 2007-2013) aiming at building a computer platform for supporting Operative Oceanography in its activities. One of the main objectives of the project is to develop a repository that should gather, classify and structure marine scientific literature and data thus guaranteeing their accessibility to researchers and institutions by means of standard protocols. Community and Requirements. Operative Oceanography is the branch of marine research which deals with the development of integrated systems for examining and modeling the ocean monitoring and forecast. Experts need access to real-time data on the state of the sea such as forecasts on temperatures, streams, tides and the relevant scientific literature. This finds application in many areas, ranging from civilian and military safety to protection of off-shore and coastal infrastructures. The metadata. The set of metadata associated with marine data is defined in the CDI (Common Data Index) documented standard. They encode: the types of sizes which have been measured; the measurement tools the platform which has been employed; the geographic area where measures have been taken; the environmental matrix; the descriptive documentation. As concerns the scientific documentation, at the current stage of the CDI standard, a document is shaped around the following metadata: Title, Authors, Version, ISBN/DOI, Topic, Date of publication, Body/Institution, Abstract. The search engine. The query system (which is actually under development) has been designed for operating with structured data-the metadata-and raw data-the associated technical and scientific documentation. Full-text technologies are often unsuccessful when applied to this type of queries since they assume the presence of specific keywords in the text; in order to fix this problem, the MAPS project suggests to use different semantic technologies for retrieving the text and data and thus getting much more complying results. In the Poster we will present the scenario of the Operative Oceanography together with the technologies used to develop an advanced search engine which aims at providing rapid and efficient access to a Digital Library of oceanographic data. The case-study is also highlighting how the retrieval of grey literature from this specific marine community could be reproduced for similar communities as well, thus revealing the great impact that the processing, re-use as well as application of grey data have on societal needs/problems and their answers},
KEYWORDS = {Marine Science, Search Engine, Source Data, Oceanography},
PAGES = {93--94},
URL = {http://greyguide.isti.cnr.it/dfdownloadnew.php?ident=GLConference/GL16/2014-G01-015\&langver=en\&scelta=Metadata},
ISBN = {978-90-77484-24-1},
CONFERENCE_NAME = {Sixteenth International Conference on Grey Literature Grey Literature Lobby: Engines and Requesters for Change},
EDITOR = {Farace, D. and Frantzen, J.},
}
@INPROCEEDINGS{GUADAGNINI_2014_INPROCEEDINGS_G_265572,
  AUTHOR          = {Guadagnini, E.},
  TITLE           = {La lexicographie de l'italien médiéval et les corpora de l'Opera del Vocabolario Italiano: un bilan provisoire et quelques nouvelles perspectives},
  CONFERENCE_NAME = {Les états anciens de langues à l'heure du numérique},
  YEAR            = {2014},
  URL             = {http://www.crealscience.fr/Colloque/index.php?article5/resume-elisa-guadagnini},
  KEYWORDS        = {Lessico, Lessicografia, Lingua Italiana, Lessicologia, Filologia},
}
@INPROCEEDINGS{GUADAGNINI_2014_INPROCEEDINGS_G_265631,
  AUTHOR          = {Guadagnini, E.},
  TITLE           = {The OVI Textual Databases: New Web Resources for Old Italian Studies},
  CONFERENCE_NAME = {Aspecten van corpusonderzoek},
  YEAR            = {2014},
  URL             = {https://www.arts.kuleuven.be/ling/dag_van_het_onderzoek/posters_en_demos/guadagnini_ovi},
}
@INPROCEEDINGS{LAM_2014_INPROCEEDINGS_LBDRPSBB_281930,
AUTHOR = {Lamé, M. and Boschetti, F. and Dellepiane, M. and Rosmorduc, S. and Polis, S. and Sarullo, G. and Barmpoutis, A. and Bozia, E.},
TITLE = {Technology \& Tradition: a Synergic Approach to Deciphering, Analyzing and Annotating Epigraphic Writings (abridgement/condensed presentation)},
YEAR = {2014},
ABSTRACT = {This panel intends to discuss the advantages of computer-assisted study of writings as well as the exigency for collaboration between digital and traditional epigraphists. The advances in computing in the past few decades have resulted in the development of several digital tools meant to assist scholars decipher and analyze inscribed symbols. Some of the techniques involve 2D or 3D digitization of the inscriptions and various post-processing methods that help scholars recognize the inscribed characters or symbols, analyze their structure, and study writing techniques. This interdisciplinary panel that consists of computer scientists, computational linguists, heterogeneous writings experts (archaic Latin, cursive Latin, Egyptian writings), and epigraphists will address the following issues: the use of traditional and digital methodologies for deciphering and analyzing inscriptions, the accuracy and efficacy of a computer algorithm that tries to solve the same problem, text representation problems when iconicity is involved, optimal ways to train digital tools, and to what extent 2D, 3D representations, and text encodings follow, imitate, and enhance traditional methodologies},
URL = {https://iris.cnr.it/handle/20.500.14243/281930},
DOI = {10.13133/978-88-98533-42-8},
ISBN = {978-88-98533-42-8},
}
@INPROCEEDINGS{LUCENTINI_2014_INPROCEEDINGS_LCCMNC_276435,
  AUTHOR          = {Lucentini, R. and Chiarella, D. and Cutugno, P. and Marconi, L. and Noberini, S. and Castelletti, S.},
  TITLE           = {A digital archive for cultural heritage: the case of the Luzzati Museum},
  CONFERENCE_NAME = {RENEWAL, INNOVATION AND CHANGE: HERITAGE AND EUROPEAN SOCIETY (RICHES) First International Conference},
  YEAR            = {2014},
  URL             = {https://iris.cnr.it/handle/20.500.14243/276435},
}
@INPROCEEDINGS{SAGRI_2014_INPROCEEDINGS_STMV_289336,
  AUTHOR          = {Sagri, M. T. and Tiscornia, D. and Montemagni, S. and Venturi, G.},
  TITLE           = {Investigating the relationship between neuroscience and law: a case study on a corpus of Italian case law texts},
  CONFERENCE_NAME = {Language and Law in Social Practice 3rd International Conference},
  YEAR            = {2014},
  URL             = {https://iris.cnr.it/handle/20.500.14243/289336},
  KEYWORDS        = {Neuroscience, linguistic and lexico-semantic analysis},
}
@INPROCEEDINGS{SASSOLINI_2014_INPROCEEDINGS_SSCCS_248752,
AUTHOR = {Sassolini, E. and Sassi, M. and Cucurullo, S. and Cinini, A. and Sbrulli, S.},
TITLE = {Industrial Philology: Problems and techniques of data and archives preservation for future generations},
YEAR = {2014},
ABSTRACT = {The main objective of digital archiving of texts is their re-use and preservation. The concept that guides these initiatives is linked to structural and organizational needs which heavily influence the definition of the format specifications that describe the organisation of the archives at various levels and consists of a more or less complex document. A format specification provides the details needed to build a file from a text, establishes the admitted encodings and software applications that can decode the file and make its content accessible. These structural specifications can have an extremely variable size and they depend on the complexity of the format. Although some format specifications are, for the most part, independent of the specific software (for example, ASCII and Unicode codes), many of them are related to the historical period in which the texts were acquired and also by dated software technologies. The file format specification should evolve hand in hand with the related software, and the fate of one is in fact often linked to that of the other. It is therefore appropriate to face the issue of obsolescence of software together with the obsolescence of file formats and of storage medium},
KEYWORDS = {text management, text analysis},
PAGES = {168--172},
URL = {https://iris.cnr.it/handle/20.500.14243/248752},
ISSN = {1386-2316},
ISBN = {978-90-77484-22-7},
CONFERENCE_NAME = {GL15: Fifteenth International Conference on Grey Literature},
}
% INSTITUTION is required for this entry type; the value is taken from the issuing body named in the abstract.
@TECHREPORT{ALBANESI_2014_TECHREPORT_ABBG_350478,
AUTHOR = {Albanesi, D. and Bellandi, A. and Bellusci, A. and Giovannetti, E.},
TITLE = {Applicazione Web Linguistico-Computazionale per il Progetto di Traduzione del Talmud Babilonese -- Rapporto tecnico 3},
YEAR = {2014},
INSTITUTION = {Istituto di Linguistica Computazionale "A. Zampolli" del CNR (ILC-CNR)},
ABSTRACT = {Il presente documento descrive lo stato di avanzamento del lavoro condotto dall'Istituto di Linguistica Computazionale "A. Zampolli" del CNR (ILC-CNR) nel contesto del progetto "Traduzione del Talmud Babilonese" in italiano. Quanto qui descritto costituisce un "Rapporto sullo Stato di Avanzamento dei Lavori (SAL) dell'applicazione Web" unicamente da parte dell'ILC-CNR e si configura come il terzo dei fascicoli previsti a cadenza quadrimestrale},
URL = {https://iris.cnr.it/handle/20.500.14243/350478},
}
% INSTITUTION is required for this entry type; the value is taken from the issuing body named in the abstract.
@TECHREPORT{ALBANESI_2014_TECHREPORT_ABBG_350479,
AUTHOR = {Albanesi, D. and Bellandi, A. and Benotto, G. and Giovannetti, E.},
TITLE = {Applicazione Web Linguistico-Computazionale per il Progetto di Traduzione del Talmud Babilonese -- Rapporto tecnico 4},
YEAR = {2014},
INSTITUTION = {Istituto di Linguistica Computazionale "A. Zampolli" del CNR (ILC-CNR)},
ABSTRACT = {Il presente documento descrive lo stato di avanzamento del lavoro condotto dall'Istituto di Linguistica Computazionale "A. Zampolli" del CNR (ILC-CNR) nel contesto del progetto "Traduzione del Talmud Babilonese" in italiano. Quanto qui descritto costituisce un "Rapporto sullo Stato di Avanzamento dei Lavori (SAL) dell'applicazione Web" unicamente da parte dell'ILC-CNR e si configura come il quarto dei fascicoli previsti a cadenza quadrimestrale},
URL = {https://iris.cnr.it/handle/20.500.14243/350479},
}
@TECHREPORT{ALBANESI_2014_TECHREPORT_ABBCG_350477,
AUTHOR = {Albanesi, D. and Bellandi, A. and Bulleri, F. and Carniani, E. and Giovannetti, E.},
TITLE = {Applicazione Web Linguistico-Computazionale per il Progetto di Traduzione del Talmud Babilonese-Rapporto tecnico 2},
YEAR = {2014},
ABSTRACT = {Il presente documento descrive lo stato di avanzamento del lavoro condotto dall'Istituto di Linguistica Computazionale "A. Zampolli" del CNR (ILC-CNR) nel contesto del progetto "Traduzione del Talmud Babilonese" in italiano. Quanto qui descritto costituisce un "Rapporto sullo stato di avanzamento dei lavori dell'applicazione Web" unicamente da parte dell'ILC-CNR e si configura come il secondo dei fascicoli previsti a cadenza quadrimestrale. Il rilascio del presente rapporto, previsto per febbraio, è stato ritardato di un mese per consentire di incorporarvi anche la documentazione relativa allo sviluppo di componenti che sono stati richiesti all'ILC-CNR per rispondere ad esigenze editoriali e di composizione del layout di stampa (cfr. sez. 2.4). In seguito, le parole, le frasi o una intera sezione che riteniamo degne di nota saranno sottolineate},
URL = {https://iris.cnr.it/handle/20.500.14243/350477},
}
@TECHREPORT{BENOTTO_2014_TECHREPORT_B_221643,
AUTHOR = {Benotto, G.},
TITLE = {Tecnologie linguistiche per la costruzione automatica o semi-automatica di ontologie di dominio},
YEAR = {2014},
ABSTRACT = {La necessità di accedere a grandi quantità di conoscenza disponibile in forma non strutturata, presente come testo libero in basi documentali vaste e variegate per stile e argomento, ha dato impulso allo sviluppo di tecnologie per l'acquisizione, la classificazione, la strutturazione e la gestione automatica dell'informazione testuale. Tali applicazioni hanno guadagnato, con gli anni, un'importante diffusione in molteplici contesti applicativi. Questo lavoro si propone di fornire una breve rassegna relativa alle principali tecnologie linguistiche per la costruzione automatica o semi-automatica di ontologie di dominio. Si descriveranno quindi le diverse fasi del processo di acquisizione e strutturazione dei dati, focalizzandosi in particolare sulla fase di estrazione terminologica relativa a lessici di dominio, con particolare attenzione al problema della difficoltà riscontrata nel riconoscimento del lessico relativo a particolari linguaggi specialistici e sulla fase di estrazione delle relazioni semantiche},
KEYWORDS = {Computational linguistics},
URL = {https://iris.cnr.it/handle/20.500.14243/221643},
}
@TECHREPORT{BENOTTO_2014_TECHREPORT_B_221551,
AUTHOR = {Benotto, G.},
TITLE = {Modelli distribuzionali delle relazioni semantiche: il caso dell'iponimia e dell'antonimia},
YEAR = {2014},
ABSTRACT = {Questo lavoro si propone di esplorare le potenzialità e i limiti dell'approccio distribuzionale come modello del lessico semantico. Ci si propone quindi di effettuare uno studio riguardo le misure distribuzionali attualmente proposte per il riconoscimento delle relazioni semantiche paradigmatiche, in modo da valutarne il grado di successo. Si vuole infatti capire se i metodi distribuzionali possono rivelarsi efficaci nello svolgimento di compiti di riconoscimento di relazioni semantiche paradigmatiche. Si vuole inoltre stabilire se esiste un margine di miglioramento nelle tecniche attualmente in uso per il riconoscimento di questo tipo di relazioni},
KEYWORDS = {Computational linguistics, distributional semantics},
URL = {https://iris.cnr.it/handle/20.500.14243/221551},
}
@TECHREPORT{CHIARELLA_2014_TECHREPORT_CCM_267802,
AUTHOR = {Chiarella, D. and Cutugno, P. and Marconi, L.},
TITLE = {D3.1 Initial list of gestures and syntax},
YEAR = {2014},
PAGES = {1-17},
URL = {https://iris.cnr.it/handle/20.500.14243/267802},
}
@TECHREPORT{CIGNONI_2014_TECHREPORT_C_228525,
AUTHOR = {Cignoni, L.},
TITLE = {Il mondo delle "Nursery rhymes" inglesi},
YEAR = {2014},
PAGES = {1-11},
URL = {https://iris.cnr.it/handle/20.500.14243/228525},
}
@TECHREPORT{DEMATTEI_2014_TECHREPORT_DMDMBF_276258,
AUTHOR = {De Mattei, M. and Medone, D. and D'Angelo, P. and Monachini, M. and Bartolini, R. and Frontini, F.},
TITLE = {MAPS: Architettura del Sistema},
YEAR = {2014},
ABSTRACT = {PROGRAMMA OPERATIVO REGIONALE POR-FESR (2007-2013) Asse 1 Innovazione e Competitività Bando DLTM Azione 1.2.2 "Ricerca industriale e sviluppo sperimentale a favore delle imprese del Distretto Ligure per le Tecnologie Marine (DLTM)" anno 2012. Il presente documento è il deliverable "D3.1-Architettura del Sistema" del progetto MAPS (Marine Planning and Service Platform). Il progetto MAPS è un'evoluzione del progetto precedente Marine. Tale evoluzione si articola su tre aspetti diversi: - Un meccanismo di federazione dei dati, che consenta di rendere disponibili ai propri utenti non soltanto i dati prodotti internamente da sistema Marine ma anche quelli resi disponibili da altri sistemi similari, soddisfacendo così un più ampio ambito di esigenze informative. Il deliverable D2.2, Modello della Soluzione specifica in dettaglio queste nuove funzionalità. - Un Catalogo dei Documenti che, conservando la documentazione tecnica e scientifica dei prodotti offerti, possa documentare in modo accurato le modalità di misurazione, elaborazione e controllo dei prodotti forniti e quindi i relativi ambiti di applicabilità. - Un sistema di ricerca capace di selezionare i dati necessari ad uno scopo determinato non soltanto sulla base della loro tipologia, della loro dislocazione territoriale o di altre informazioni simili contenute nei metadati associati come avviene oggi nella maggior parte dei sistemi esistenti, ma anche sulla base delle informazioni contenute nella documentazione tecnica e scientifica. Tali funzionalità sono specificate nel deliverable D1.3-Modello della Soluzione},
KEYWORDS = {Marine Science, Search Engine, Source Data, Oceanography},
PAGES = {1-35},
URL = {https://iris.cnr.it/handle/20.500.14243/276258},
}
@TECHREPORT{DEMATTEI_2014_TECHREPORT_DMMFBM_276262,
AUTHOR = {De Mattei, M. and Medone, D. and Maltese, M. and Frontini, F. and Bartolini, R. and Monachini, M.},
TITLE = {META: Report di progettazione degli algoritmi individuati},
YEAR = {2014},
ABSTRACT = {PROGRAMMA OPERATIVO REGIONALE POR-FESR (2007-2013) Asse 1 Innovazione e Competitività Bando DLTM Azione 1.2.2 "Ricerca industriale e sviluppo sperimentale a favore delle imprese del Distretto Ligure per le Tecnologie Marine (DLTM)" anno 2012. Il deliverable definisce l'architettura del Sistema di Estrazione Eventi Meteo realizzato dagli autori nell'ambito del progetto META. Il sistema estrae da contenuti online informazione su eventi meteo critici verificatisi in Liguria e nel nord della Toscana},
KEYWORDS = {Ontology, Information Extraction, Taxonomy},
PAGES = {1-19},
URL = {https://iris.cnr.it/handle/20.500.14243/276262},
}
@TECHREPORT{DELGROSSO_2014_TECHREPORT_D_315843,
AUTHOR = {Del Grosso, A. M.},
TITLE = {Processo di analisi e indicizzazione dei testi digitalizzati di Cristoforo Clavio},
YEAR = {2014},
ABSTRACT = {Il contributo descrive il rilascio del componente di analisi linguistica sviluppato dall'Istituto di Linguistica Computazionale in seno al progetto Clavius on the Web (CoW). Contestualmente vengono presentate le risorse utilizzate nonché i dati e i vincoli di input e quelli di output},
KEYWORDS = {Clavius on the Web, Lemmatizzazione, Latino},
URL = {http://www.claviusontheweb.it},
}
@TECHREPORT{FRONTINI_2014_TECHREPORT_FBM_276261,
AUTHOR = {Frontini, F. and Bartolini, R. and Monachini, M.},
TITLE = {META: Report sui modelli e tecniche linguistiche},
YEAR = {2014},
ABSTRACT = {PROGRAMMA OPERATIVO REGIONALE POR-FESR (2007-2013) Asse 1 Innovazione e Competitività Bando DLTM Azione 1.2.2 "Ricerca industriale e sviluppo sperimentale a favore delle imprese del Distretto Ligure per le Tecnologie Marine (DLTM)" anno 2012. Il deliverable riassume lo stato dell'arte delle tecnologie semantiche che possono essere impiegate nella realizzazione del progetto META. Il progetto META è un progetto di ricerca e sviluppo tecnologico finanziato dalla Regione Liguria con i fondi POR-FESR 2007-2013 della Comunità Europea che mira alla realizzazione di un sistema per l'allerta di eventi meteo critici in Liguria e nel nord della Toscana. Nell'ambito del progetto META le tecnologie semantiche sono utilizzate per estrarre eventi meteo di interesse da articoli pubblicati in rete o sui social network},
KEYWORDS = {Ontology, Information Extraction, Semantic Web, Search Engine},
PAGES = {1-20},
URL = {https://iris.cnr.it/handle/20.500.14243/276261},
}
@TECHREPORT{FRONTINI_2014_TECHREPORT_FBM_276259,
AUTHOR = {Frontini, F. and Bartolini, R. and Monachini, M.},
TITLE = {MAPS: Stato dell'Arte},
YEAR = {2014},
ABSTRACT = {PROGRAMMA OPERATIVO REGIONALE POR-FESR (2007-2013) Asse 1 Innovazione e Competitività Bando DLTM Azione 1.2.2 "Ricerca industriale e sviluppo sperimentale a favore delle imprese del Distretto Ligure per le Tecnologie Marine (DLTM)" anno 2012. Il documento descrive lo stato dell'arte delle tecnologie linguistiche applicate ai sistemi di ricerca semantica},
KEYWORDS = {Marine Science, Search Engine, Source Data, Oceanography},
PAGES = {1-21},
URL = {https://iris.cnr.it/handle/20.500.14243/276259},
}
@TECHREPORT{FRONTINI_2014_TECHREPORT_FBMPG_222835,
AUTHOR = {Frontini, F. and Bartolini, R. and Monachini, M. and Pardelli, G. and Goggi, S.},
TITLE = {Stato dell'arte dei motori semantici. Progetto MAPS, programma operativo regionale POR-FESR (2007-2013)},
YEAR = {2014},
ABSTRACT = {Il presente documento è il deliverable "D1.1-Stato dell'Arte dei motori semantici" del progetto MAPS (Marine Planning and Service Platform). Il progetto MAPS è una evoluzione del progetto precedente Marine. Tramite il progetto Marine (Bando Ricerca Industriale e Sviluppo Sperimentale Regione Liguria 2007-2013-pos n. 1) è stata realizzata una piattaforma informatica di supporto all'Oceanografia Operativa capace di raccogliere dati marini per renderli poi disponibili ai ricercatori e alle organizzazioni interessate tramite protocolli standard. Lo scopo del progetto MAPS è quello di realizzare un Catalogo di Documenti contenente informazioni per la piattaforma Marine. Caratteristica di MAPS è di fornire accesso ai dati oceanografici sia attraverso la ricerca per metadati, sia attraverso la ricerca semantica contenuta nella manualistica tecnico scientifica di riferimento},
PAGES = {1-22},
URL = {https://iris.cnr.it/handle/20.500.14243/222835},
}
@TECHREPORT{MARZI_2014_TECHREPORT_M_225698,
AUTHOR = {Marzi, C.},
TITLE = {Lexical acquisition in bilingual contexts: aspects of (extra)linguistic and psycholinguistic modeling},
YEAR = {2014},
ABSTRACT = {The overall research goals of this bilateral action have been to focus on cognitive and extra-linguistic factors involved in bilingual word recognition, with a view to exploring implications, requirements and constraints on computational models of bilingual acquisition. In particular, the cross visits intended to investigate linguistic, extra-linguistic and psycholinguistic issues which are generally assumed to have a bearing on aspects of bilingual lexicon acquisition and word processing, with a view to better understanding their role and dynamic relationship with aspects more closely related to the language-specific input},
KEYWORDS = {Cognitive factors, monolingual and bilingual word},
URL = {http://www.esf.org/coordinating-research/research-networking-programmes/humanities-hu},
}
@TECHREPORT{MARZI_2014_TECHREPORT_MPV_225700,
AUTHOR = {Marzi, C. and Plag, I. and Vulchanova, M.},
TITLE = {Words: structure, meaning, acquisition, processing},
YEAR = {2014},
ABSTRACT = {By bringing together experts of various scientific domains and different theoretical inclinations, the second NetWordS Summer school contributed to advance the current awareness of theoretical, typological, psycholinguistic, computational and neurophysiological evidence on the structure and processing of words, with a view to fostering novel methods of research and assessment for grammar architecture and language physiology},
KEYWORDS = {Mental lexicon, Lexical processing and acquisition, Interdisciplinary approach},
URL = {http://www.networds-esf.eu/uploads/NetWordS/2nd_SummerSchool_Trondheim_scientificr},
}
@MISC{BARONI_2014_MISC_B_312489,
AUTHOR = {Baroni, P.},
TITLE = {Sito Web dell'Istituto di Linguistica Computazionale «A. Zampolli»},
YEAR = {2014},
ABSTRACT = {New Web site of the Institute for Computational Linguistics of the Italian National Research Council (ILC-CNR), powered by Drupal, developed in Italian and English},
KEYWORDS = {Sito web},
URL = {http://www.ilc.cnr.it},
}
@MISC{BELEFFI_2014_MISC_BS_286648,
AUTHOR = {Beleffi, E. and Sassi, M.},
TITLE = {La sicurezza del paziente sui quotidiani in Italia: indagine preliminare sui termini e l'andamento degli eventi},
YEAR = {2014},
URL = {https://iris.cnr.it/handle/20.500.14243/286648},
CONFERENCE_NAME = {FORUM RISK MANAGEMENT IN SANITÀ 2014},
}
@MISC{BELLANDI_2014_MISC_BM_370095,
AUTHOR = {Bellandi, A. and Marchi, S.},
TITLE = {Computational Lexicon Interface: Greek into Arabic},
YEAR = {2014},
ABSTRACT = {Interfaccia di interrogazione analitica e grafica, al lessico di Plotino, integrata nella piattaforma web Greek into Arabic},
URL = {https://iris.cnr.it/handle/20.500.14243/370095},
}
@MISC{BELLANDI_2014_MISC_BSBT_228485,
AUTHOR = {Bellandi, T. and Sassi, M. and Beleffi, E. and Tartaglia, R.},
TITLE = {Patient safety on the press in Italy, a preliminary investigation of the terms and trend},
YEAR = {2014},
ABSTRACT = {Introduction: Patient safety is a public concern. In Italy, the wide majority of the citizens (97%) reported that medical errors are an important problem (Eurobarometer 241, 2006), but the proportion of those who reported to have suffered an adverse event (15%) is much below the EU average of 26% (Eurobarometer 327, 2010). Then we decided to systematically analyse the terms used on the press to report patient safety incidents and to look at eventual correlations between the trend of terms, catastrophic events occurred, regulations and practices to reduce risks. Methods: We used a dedicated software developed for collecting, storing and analyzing all health news. Quantitative and qualitative analysis were conducted on the DB of articles published from 1999 to 2012 in the three main Italian newspapers, applying a set of 6 terms of common and technical language to refer to patient safety incidents. Also, we reviewed the national regulations and the database of adverse events collected since 2006. Results: On a total of 38.265 articles on health topics, 0,5% refer to patient safety incidents. The most frequent word used is "malpractice" (59,4%), followed by "adverse reaction" (17,5%) and "adverse event" (10,5%). Peaks are in 2007 (17,1%), 2010 (14,6%) and 2008 (12,2%), with no clear trend neither for the aggregated data nor for the individual terms used. Peaks seem to be attributable to the media coverage of individual catastrophic events, such as the transplantation of three organs from an HIV-positive donor and the death of a woman following an unnecessary surgery due to a mis-identification of the CT-scan (2007), the death of three babies during delivery within three weeks at the same hospital (2008). In 2010 the peak corresponds to the publication of the national enquiry on malpractice at the Parliament. Discussion: Patient safety incidents are not very popular on health news.
Despite the effort made to develop regulations and practices for patient safety and for public disclosure of incidents, the peaks seem to be related to individual catastrophic events and malpractice issues. Further investigation is needed to understand the influence of the press on clinical risk perception and improve the information on patient safety},
URL = {https://iris.cnr.it/handle/20.500.14243/228485},
}
@MISC{BIAGIONI_2014_MISC_BDGP_263921,
AUTHOR = {Biagioni, S. and De Luca, R. and Giannini, S. and Pardelli, G.},
TITLE = {I sistemi informativi della Biblioteca dell'Area della Ricerca di Pisa},
YEAR = {2014},
ABSTRACT = {Description of the CNR Library, (Pisa, Italy) and its services},
KEYWORDS = {Sistemi informativi per biblioteche, Servizi bibliotecari},
URL = {https://iris.cnr.it/handle/20.500.14243/263921},
CONFERENCE_NAME = {Seminario rivolto agli alunni dell'Istituto Tecnico Economico "F. Carrara" di Lucca, organizzato dall'Istituto di Linguistica Computazionale "A. Zampolli" del CNR di Pisa},
}
@MISC{BOSCHETTI_2014_MISC_B_228554,
AUTHOR = {Boschetti, F.},
TITLE = {OCR: instruments linguistiques pour améliorer la précision de la reconnaissance optique des caractères dans le cas du grec ancien et de l'arabe},
YEAR = {2014},
URL = {https://iris.cnr.it/handle/20.500.14243/228554},
CONFERENCE_NAME = {Workshop International en Traitement Automatique de la Langue Arabe},
}
@MISC{BOSCHETTI_2014_MISC_B_228561,
AUTHOR = {Boschetti, F.},
TITLE = {Extracting Information Related To Writings From Traditional Paper Corpora},
YEAR = {2014},
URL = {http://bit.ly/11ps2tD},
CONFERENCE_NAME = {EAGLE 2014 International Conference},
}
@MISC{BOSCHETTI_2014_MISC_B_228559,
AUTHOR = {Boschetti, F.},
TITLE = {L'edizione scientifica digitale del testo letterario e del testo epigrafico: convergenze e divergenze-Parte I},
YEAR = {2014},
URL = {https://iris.cnr.it/handle/20.500.14243/228559},
CONFERENCE_NAME = {Risorse digitali e strumenti collaborativi per le Scienze dell'Antichità},
}
@MISC{BOSCHETTI_2014_MISC_B_228536,
AUTHOR = {Boschetti, F.},
TITLE = {Corpus Linguistics and Greek},
YEAR = {2014},
PAGES = {391-394},
URL = {https://iris.cnr.it/handle/20.500.14243/228536},
ISBN = {9789004225978},
EDITOR = {Giannakis, G. K.},
}
@MISC{BOSCHETTI_2014_MISC_BCD_228551,
AUTHOR = {Boschetti, F. and Caruso, L. and Del Grosso, A. M.},
TITLE = {Euporia: Un'esperienza di Filologia Collaborativa a scuola, per promuovere il circolo virtuoso fra ricerca e didattica},
YEAR = {2014},
URL = {https://iris.cnr.it/handle/20.500.14243/228551},
CONFERENCE_NAME = {Internet Festival},
}
@MISC{BOSCHETTI_2014_MISC_BD_228552,
AUTHOR = {Boschetti, F. and Del Grosso, A. M.},
TITLE = {Progetto Euporia: Gli studenti incontrano la Filologia Collaborativa},
YEAR = {2014},
URL = {https://iris.cnr.it/handle/20.500.14243/228552},
CONFERENCE_NAME = {Annotazione Linguistica e Retorica di Testi Greci con Traduzione a Fronte},
}
@MISC{BOSCHETTI_2014_MISC_BD_228549,
AUTHOR = {Boschetti, F. and Del Grosso, A. M.},
TITLE = {La filologia computazionale e collaborativa al liceo},
YEAR = {2014},
URL = {https://iris.cnr.it/handle/20.500.14243/228549},
}
@MISC{BOSCHETTI_2014_MISC_BF_228556,
AUTHOR = {Boschetti, F. and Fortunato, L.},
TITLE = {Correcting Multiple Editions of Aeschylus},
YEAR = {2014},
URL = {https://iris.cnr.it/handle/20.500.14243/228556},
CONFERENCE_NAME = {Open Philology Meeting},
}
@MISC{BOSCHETTI_2014_MISC_BL_293554,
AUTHOR = {Boschetti, F. and Lamé, M.},
TITLE = {L'edizione scientifica digitale del testo letterario e del testo epigrafico: convergenze e divergenze},
YEAR = {2014},
URL = {https://iris.cnr.it/handle/20.500.14243/293554},
}
@MISC{BOZZI_2014_MISC_BM_247999,
AUTHOR = {Bozzi, A. and Marchi, S.},
TITLE = {"Greek into Arabic Web App" as a Research Infrastructure for the History of Philosophy and Science},
YEAR = {2014},
URL = {https://iris.cnr.it/handle/20.500.14243/247999},
CONFERENCE_NAME = {Plotinus, East and West-The Enneads in Arabic and Latin},
}
@MISC{BURGASSI_2014_MISC_B_269646,
AUTHOR = {Burgassi, C.},
TITLE = {The History of Italian Vocabulary},
YEAR = {2014},
URL = {https://iris.cnr.it/handle/20.500.14243/269646},
CONFERENCE_NAME = {Heritage Lexicography as Supporting Tool for International Council on Monuments and Sites},
}
@MISC{BURGASSI_2014_MISC_BDGLBNVZ_256341,
AUTHOR = {Burgassi, C. and Dotto, D. and Guadagnini, E. and Lorenzi, C. and Biondi, C. L. and Nieri, V. and Vaccaro, G. and Zago, A.},
TITLE = {DiVo-Bibliografia filologica (2014)},
YEAR = {2014},
ABSTRACT = {DiVo DB è la bibliografia filologica dei volgarizzamenti medievali dei testi classici e tardo-antichi. Sono compilate delle schede brevi per le opere latine, con informazioni sull'autore, sulla compilazione e sul genere dell'opera, nonché l'identificazione dell'edizione di riferimento (quella inclusa nel corpus DiVo). Le schede dei testi volgari contengono cenni biografici sull'autore del volgarizzamento, la datazione dell'opera, l'identificazione della coloritura linguistica del testo, l'indicazione della tipologia testuale e del genere dell'opera, la catalogazione della tradizione diretta mediante l'elencazione dei testimoni manoscritti e delle stampe antiche, una trattazione filologica della storia della tradizione, l'identificazione dell'edizione di riferimento, un panorama bibliografico sull'opera articolato per punti. A ciascun manoscritto è dedicata una scheda in cui si indicano gli incipit e gli explicit di ciascun manoscritto, le carte in cui l'opera è contenuta, eventuali note e l'informazione sulla visione diretta del manufatto. Si indicano i casi in cui lo studio della tradizione ha mostrato la necessità di controlli più approfonditi della lezione dei manoscritti: gli esiti di tali controlli costituiscono il sistema di note filologiche associato al corpus DiVo},
URL = {https://iris.cnr.it/handle/20.500.14243/256341},
}
@MISC{BURGASSI_2014_MISC_BDGV_256339,
AUTHOR = {Burgassi, C. and Dotto, D. and Guadagnini, E. and Vaccaro, G.},
TITLE = {Corpus del Dizionario dei Volgarizzamenti (Corpus DiVo) (2014)},
YEAR = {2014},
ABSTRACT = {Il Corpus DiVo è parte del progetto di ricerca DiVo-Dizionario dei Volgarizzamenti diretto da Elisa Guadagnini e Giulio Vaccaro, ospitato dall'Istituto Opera del Vocabolario Italiano (CNR) e dalla Scuola Normale Superiore di Pisa, finanziato dal MIUR all'interno del programma FIRB-Futuro in Ricerca 2010. Il Corpus DiVo, interrogabile con GattoWeb, è curato da Cosimo Burgassi, Diego Dotto, Elisa Guadagnini e Giulio Vaccaro. Comprende attualmente 165 testi volgari, per complessive 6.374.624 occorrenze di 177.340 forme grafiche distinte. Sono presenti 86 testi latini associati. Sono presenti nel corpus due distinti specimina di lemmatizzazione e iperlemmatizzazione, entrambi a cura di Diego Dotto: il primo, fondato su un sottocorpus, segue i criteri descritti in D. Dotto, Note per la lemmatizzazione del corpus DiVo, in «Bollettino dell'Opera del Vocabolario Italiano», XVII (2012), pp. 336-364; il secondo, fondato sull'intero corpus, seleziona alcuni lemmi significativi con riferimento agli iperlemmi «Cariche e uffici» e «Vestiario» (per questi lemmi un sistema di etichettatura isola le dittologie sinonimiche, marcate «] Ditt.», e gli esempi con valore di glossa, marcati «] Gl»). Per la consultazione, occorre accedere alla «Ricerca di contesti per iperlemmi», in cui si potranno interrogare i 13 iperlemmi individuati che mettono in relazione i lemmi per area semantica, o alla «Ricerca di contesti per disambiguatori», dove ricercando le stringhe «] Ditt.» e «] Gl» si potranno recuperare tutti i contesti che presentano la suddetta marcatura. Sono presenti 2.427 lemmi, per un totale di 51.274 occorrenze lemmatizzate},
KEYWORDS = {Volgarizzamenti, Corpus testuale, Dizionario dei Volgarizzamenti, Italiano antico},
URL = {http://divoweb.ovi.cnr.it},
}
@MISC{BURGASSI_2014_MISC_BDGVZ_256340,
AUTHOR = {Burgassi, C. and Dotto, D. and Guadagnini, E. and Vaccaro, G. and Zago, A.},
TITLE = {Corpus dei classici latini volgarizzati (Corpus CLaVo) (2014)},
YEAR = {2014},
ABSTRACT = {Il Corpus CLaVo è parte del progetto di ricerca DiVo-Dizionario dei Volgarizzamenti, diretto da Elisa Guadagnini e Giulio Vaccaro, ospitato dall'Istituto Opera del Vocabolario Italiano (CNR) e dalla Scuola Normale Superiore di Pisa, finanziato dal MIUR all'interno del programma FIRB-Futuro in Ricerca 2010. Il Corpus CLaVo, interrogabile con GattoWeb, è curato da Cosimo Burgassi, Diego Dotto, Elisa Guadagnini e Giulio Vaccaro. Esso raccoglie le opere latine tradotte dai volgarizzamenti compresi nel corpus DiVo: per alcune sommarie informazioni su queste opere e sulla loro tradizione si rinvia alle relative schede, compilate per la maggior parte da Anna Zago, comprese nella bibliografia filologica del DiVo. Il Corpus CLaVo comprende attualmente 87 testi corrispondenti a 42 opere latine, associate a 86 volgarizzamenti, per complessive 2.205.143 occorrenze di 122.364 forme grafiche distinte. Al Corpus CLaVo è associato un dizionario macchina, curato da Anna Zago, che contiene 3263 lemmi e 45.086 coppie forma-lemma},
KEYWORDS = {Classici latini, Corpus testuale, Dizionario dei Volgarizzamenti, Lingua latina},
URL = {http://clavoweb.ovi.cnr.it/},
}
@MISC{CIGNONI_2014_MISC_C_228531,
AUTHOR = {Cignoni, L.},
TITLE = {English Grammar Slides},
YEAR = {2014},
URL = {http://www.paleopatologia.it},
}
@MISC{CIGNONI_2014_MISC_CF_228524,
AUTHOR = {Cignoni, L. and Fornaciari, G.},
TITLE = {Basics of English Grammar},
YEAR = {2014},
ABSTRACT = {This ongoing basic reference grammar was created to support the Italian students of the funerary archaeology courses held at the University of Pisa in the years 2011-2014 in the study of the English language. The courses conducted by a University Professor specialized in the discipline and by an expert English language teacher were delivered according to the CLIL (content and language integrated learning) methodology, which combines the teaching of a particular subject with the study of a vehicular language of instruction. In this online grammar resource the different parts of speech (nouns, pronouns, adjectives, etc.) and elements of the sentence or clause are explained in a simple and concise manner, so as to help the students develop their grammar skills. On the model of the same English grammar (2010), written in Italian and accompanied by short reading passages extracted from Henry Duday's The Archaeology of the Dead, this grammar written in English will be constantly enriched with contextualized examples illustrating the different grammar items. The subject teacher and the native language teacher will select the most appropriate examples extracted by the students from a number of acknowledged funerary archaeology texts used during the courses and dealing with the subjects of funerary archaeology and of other related research areas, in particular with the funerary customs and practices of specific historical periods (Anglo-Saxon, Roman, Medieval). The examples illustrating a particular grammar rule will not only show the use of the word in context, but will at the same time be rich in content, providing some useful notions about the discipline, so that the grammar can be studied not in isolation but in meaningful contexts and real-life situations. 
The CLIL classes fall within the framework of a wider project carried out at the Division of Palaeopathology-Department of Oncology, Transplants and Modern Technologies in Medicine of the University of Pisa, which is aimed to develop specific training for those (master and specialist level graduate students, post-doctoral scholars, etc.) specializing in funerary archaeology},
URL = {http://www.paleopatologia.it},
}
@MISC{DELGRATTA_2014_MISC_DZNDB_344113,
AUTHOR = {Del Gratta, R. and Zarghili, A. and Nahli, O. and Del Grosso, A. and Boschetti, F.},
TITLE = {From text to cloud},
YEAR = {2014},
ABSTRACT = {We describe a model to integrate tools for searching and editing texts with lexical-semantic resources. We also suggest that this integration is necessary for students and researchers. Finally, we indicate (L)LOD as a formalism and strategy both for data organization and distribution},
KEYWORDS = {computational linguistics, linguistic linked open data, computational philology},
URL = {http://www.dh.uni-leipzig.de/wo/workshop-december-2014/greek-and-latin-in-an-age-of-open-data-schedule/riccardo-del-gratta-et-al-from-text-to-cloud},
CONFERENCE_NAME = {Greek and Latin in an Age of Open Data},
}
@MISC{DELGROSSO_2014_MISC_DB_370143,
AUTHOR = {Del Grosso, A. M. and Boschetti, F.},
TITLE = {Progetto pilota EUPORIA. Annotazione linguistica e retorica di testi greci con traduzione a fronte dell'Elena di Euripide},
YEAR = {2014},
ABSTRACT = {Il contributo illustra i risultati del progetto Euporia},
KEYWORDS = {digital philology, computational philology, digital humanities},
URL = {https://iris.cnr.it/handle/20.500.14243/370143},
}
@MISC{DIDONATO_2014_MISC_D_407994,
AUTHOR = {Di Donato, F.},
TITLE = {Archivi e linked data},
YEAR = {2014},
ABSTRACT = {open science e linked data: un'introduzione},
URL = {https://iris.cnr.it/handle/20.500.14243/407994},
}
@MISC{DIDONATO_2014_MISC_D_407993,
AUTHOR = {Di Donato, F.},
TITLE = {Semantic annotation with Pundit: Enriching the Web of Science},
YEAR = {2014},
ABSTRACT = {presentazione di Pundit all'Agorà Final Conference: Digitizing Philosophy. Towards new paradigms and methods in editing, publishing and querying philosophical texts},
URL = {https://iris.cnr.it/handle/20.500.14243/407993},
}
@MISC{FRONTINI_2014_MISC_F_286128,
AUTHOR = {Frontini, F.},
TITLE = {La mappa delle opinioni e dei sentimenti estratte dai social media},
YEAR = {2014},
URL = {https://iris.cnr.it/handle/20.500.14243/286128},
CONFERENCE_NAME = {Seminario rivolto agli alunni dell'Istituto Tecnico Economico "F. Carrara" di Lucca, organizzato dall'Istituto di Linguistica Computazionale "A. Zampolli" del CNR di Pisa},
}
@MISC{GUADAGNINI_2014_MISC_G_256343,
AUTHOR = {Guadagnini, E.},
TITLE = {recensione: Rosa Piro, L'Almansore. Volgarizzamento fiorentino del XIV secolo. Edizione critica, Firenze, SISMEL-Edizioni del Galluzzo (Micrologus' Library) 2011},
YEAR = {2014},
PAGES = {212-220},
URL = {https://iris.cnr.it/handle/20.500.14243/256343},
VOLUME = {78 (309)},
ISSN = {0035-1458},
}
@MISC{KHAN_2014_MISC_KFM_262584,
AUTHOR = {Khan, F. and Frontini, F. and Monachini, M.},
TITLE = {A Model for Representing Diachronic Semantic Information in Lexico-Semantic Resources on the Semantic Web},
YEAR = {2014},
ABSTRACT = {The Semantic Web offers a way of publishing structured data online that facilitates the interlinking of different datasets stored at different online locations; indeed one of the main aims of the Semantic Web movement is to actively encourage this enrichment of online datasets with information from other resources, in order to avoid the problem of so called 'data islands'. In contrast to conventional hyperlinks however the links between different resources on the Semantic Web can be given semantic types and classified hierarchically. Data published on the Semantic Web is referred to as Linked Data; if, in addition, this data is available with an open license then it can be referred to as Linked Open Data (Heath 2011)},
KEYWORDS = {Cultural resources, Heritage resources},
PAGES = {1-3},
URL = {http://www.dh.uni-leipzig.de/wo/wp-content/uploads/2014/11/Fahad-Khan-Francesca-Frontini-and-Monica-Monachini-A-Model-for-Representing.pdf},
CONFERENCE_NAME = {Greek and Latin in an age of Open Data. Open Philology Project},
}
@MISC{LAM_2014_MISC_LBDRPSBB_300674,
AUTHOR = {Lamé, M. and Boschetti, F. and Dellepiane, M. and Rosmorduc, S. and Polis, S. and Sarullo, G. and Barmpoutis, A. and Bozia, E.},
TITLE = {First Standpoints of the Panel 'Technology & Tradition: a Synergic Approach to Deciphering, Analyzing and Annotating Epigraphic Writings'},
YEAR = {2014},
ABSTRACT = {This panel intends to discuss the advantages of computer-assisted study of writings as well as the exigency for collaboration between digital and traditional epigraphists. The advances in computing in the past few decades have resulted in the development of several digital tools meant to assist scholars decipher and analyze inscribed symbols. Some of the techniques involve 2D or 3D digitization of the inscriptions and various post-processing methods that help scholars recognize the inscribed characters or symbols, analyze their structure, and study writing techniques. This interdisciplinary panel that consists of computer scientists, computational linguists, heterogeneous writings experts (archaic Latin, cursive Latin, Egyptian writings), and epigraphists will address the following issues: the use of traditional and digital methodologies for deciphering and analyzing inscriptions, the accuracy and efficacy of a computer algorithm that tries to solve the same problem, text representation problems when iconicity is involved, optimal ways to train digital tools, and to what extent 2D, 3D representations, and text encodings follow, imitate, and enhance traditional methodologies},
URL = {https://iris.cnr.it/handle/20.500.14243/300674},
}
@MISC{LAME_2014_MISC_L_297484,
AUTHOR = {Lamé, M.},
TITLE = {Writings In Contexts: some Echoes of Epigraphic Dispositive},
YEAR = {2014},
ABSTRACT = {repeat details that are similar to, and make you think of, something else},
KEYWORDS = {Epigraphic transmission (echoes), Epigraphic dispositive, Digital Epigraphy, Writings in contexts, Deciphering, Digital Autoptic Process, Archaic and iconographic writings, Encoding epigraphic writings, 3D reconstruction and analysis},
URL = {http://eer.hypotheses.org/technology-tradition-a-synergic-approach-to-deciphering-analyzing-and-annotating-epigraphic-writings/unit-1-computer-graphics-digital-epigraphy-and-computational-linguistics-from-cnr-pisa/marion-lame-writings-in-contexts},
}
@MISC{MARINELLI_2014_MISC_M_254625,
AUTHOR = {Marinelli, R.},
TITLE = {Database semantico-lessicali come strumento per l'apprendimento della lingua Inglese (crocieristica e turismo)},
YEAR = {2014},
ABSTRACT = {Partiamo dalla descrizione di Mariterm, database semantico lessicale di dominio marittimo. Mariterm dopo le fasi iniziali della sua costruzione è stato ampliato e arricchito con immagini che permettono di visualizzare il termine preso in considerazione e successivamente con l'inserimento di espressioni idiomatiche e modi di dire che appartengono al dominio marittimo con l'inserimento di termini che riguardano più specificatamente il settore della crocieristica e dell'attività turistica ad essa legata. Vogliamo qui parlare dell'uso di db semantico lessicali per l'insegnamento della lingua Inglese, per lo scopo specifico dell'Inglese Marittimo e, in particolare della terminologia di pertinenza del settore della crocieristica e dell'attività turistica ad essa legata},
KEYWORDS = {database semantico-lessicali, terminologia, turismo, crocieristica},
URL = {https://iris.cnr.it/handle/20.500.14243/254625},
CONFERENCE_NAME = {Meeting annuale del Gruppo Web Semantico},
}
@MISC{MARZI_2014_MISC_M_261269,
AUTHOR = {Marzi, C.},
TITLE = {Models and dynamics of the morphological lexicon in mono-and bilingual acquisition},
YEAR = {2014},
ABSTRACT = {Aim of this work is to define an explanatory model of the morphological lexicon as a dynamic system of word acquisition and storage in both mono-and multi-lingual contexts. The main focus is on exploring some aspects of the paradigmatic organisation of the mental lexicon in language acquisition, based on a dynamic analysis of mono-and bilingual contexts. An interdisciplinary approach to the lexical acquisition combines theoretical-motivated accounts, psycho-cognitive evidence and methodologies, and machine learning technologies. In particular, the thesis deals with those basic psychological and cognitive mechanisms considered as crucial in language acquisition: (i) the ability to perceive recurrent morphological structures (invariances) in varying temporal contexts, (ii) the capability to access/activate time series of symbols in the short term memory and to selectively integrate them with long term memory expectations, (iii) the attitude towards building novel forms through analogical extension of intra-and inter-paradigmatic relations (generalisation). This investigation is pursued through a computational model based on Self-Organising Maps with Hebbian connections defined over a temporal layer (Temporal Self-Organising Maps-TSOMs), providing a principled algorithmic account of effects of lexical acquisition, processing and access. Computational simulation of biologically inspired neural architecture of the mental lexicon offers the possibility to reproduce a wide range of conditions of mono-and multi-lingual input exposure, and to illustrate the dynamic of word acquisition and the emergence of morphological organisation. The proposed model provides an adaptive multifactorial account of morphology acquisition affected by input factors, such as word frequency distributions, paradigm regularity and wordlikeness, whereby lexical perception and organisation are grounded on memory-based processing strategies},
KEYWORDS = {word acquisition, morphological lexicon, bio-computational model},
URL = {https://iris.cnr.it/handle/20.500.14243/261269},
}
@MISC{PICCINI_2014_MISC_PRB_370149,
AUTHOR = {Piccini, S. and Ruimy, N. and Bellandi, A.},
TITLE = {Plotino's Ontology},
YEAR = {2014},
ABSTRACT = {Plotino's Ontology},
URL = {https://iris.cnr.it/handle/20.500.14243/370149},
}
@MISC{PIRRELLI_2014_MISC_P_228535,
AUTHOR = {Pirrelli, V.},
TITLE = {Modèles psycho-computationnels du lexique mentale},
YEAR = {2014},
ABSTRACT = {Over the last decades, a growing body of evidence on the mechanisms governing lexical storage, access, acquisition and processing has raised a considerable challenge to traditional models of language architecture and word usage. By pulling together cognitive, neurofunctional and psycho-computational implications of these mechanisms, a new view of the lexicon-grammar architecture emerges, based on the dynamic interaction between storage and processing. We call this an "integrative" view of the mental lexicon},
KEYWORDS = {Mental Lexicon, Language Acquisition, Memory},
URL = {https://iris.cnr.it/handle/20.500.14243/228535},
CONFERENCE_NAME = {Workshop International en Traitement Automatique de la Langue Arabe},
}
@MISC{PIRRELLI_2014_MISC_P_228534,
AUTHOR = {Pirrelli, V.},
TITLE = {Review of "Computational Paralinguistics: Emotion, Affect and Personality in Speech and Language Processing" (by Schuller \& Batliner, Wiley Publishing 2013)},
YEAR = {2014},
KEYWORDS = {Paralinguistics, Pragmatics, Language usage},
URL = {http://www.computingreviews.com/review/review_review.cfm?review_id=142608},
}
@MISC{PIRRELLI_2014_MISC_P_228504,
AUTHOR = {Pirrelli, V.},
TITLE = {Psycho-computational modelling of lexical access and organisation: what can we learn from Arabic?},
YEAR = {2014},
ABSTRACT = {Arabic morphology raises a formidable challenge to Markovian computational models of word processing, based on fixed-order memory chaining. Computational models of human short-term and long-term memory can help us considerably to shed light on the issues involved at the level of peripheral word processing (access lexical representations). According to this view, word processing (short-term activation) and lexical representations (entrenchment of habitual activation chains) are two sides of the same coin, as they involve the same levels of brain circuitry on a different time scale. Such an "integrative" view of the lexicon as a dynamic system will be possible only if we are able to foster an increasing synergy of perspectives and scientific domains of inquiry: neurosciences, (psycho)linguistics and computing. Conventions of Arabic script are no accident (maliciously intended to trip up computer algorithms)! They rather reflect some fundamental dynamics of the way the human brain processes language},
URL = {https://iris.cnr.it/handle/20.500.14243/228504},
CONFERENCE_NAME = {IEEE CIST'14-Innovative Systems and Technologies for the Future},
}
@MISC{PROIETTI_2014_MISC_PC_411318,
AUTHOR = {Proietti, C. and Ciuni, R.},
TITLE = {Arthur Prior},
YEAR = {2014},
ABSTRACT = {Arthur Prior (1914-1969) si è occupato di temi che spaziano dalla logica formale all'etica, ed ha fornito contributi di grandissima importanza soprattutto nell'ambito della logica modale, della metafisica, e della filosofia del tempo. E' considerato il padre della logica temporale e il precursore della contemporanea logica ibrida, è stato un precursore della semantica a mondi possibili di Saul Kripke, e il sostenitore di una forma raffinata e davvero audace di attualismo, a sua volta fondata su una precisa concezione dei rapporti fra esistenza, fatti e verità. Il suo approccio alla filosofia è stato molto attento alle grandi questioni tradizionali di metafisica e ontologia, ma allo stesso tempo ha gettato le basi di nuovi ambiti d'investigazione in logica modale. Il presente profilo si propone di presentare e discutere alcuni fra i suoi contributi più importanti e la loro rilevanza filosofica. In particolare, presenta e discute le semantiche per il branching time e la loro relazione con il problema del determinismo, le logiche ibride e la riduzione degli istanti a proposizioni, la logica Q e il problema della predicazione su individui contingentemente non esistenti},
KEYWORDS = {Arthur Prior, Logic},
PAGES = {499-515},
URL = {http://www.aphex.it/public/file/Content20141031_APhEx10,2014ProfiliPriorCiuniProietti.pdf},
VOLUME = {10 (10)},
ISSN = {2036-9972},
}
@MISC{RANDACCIO_2014_MISC_RSZ_257898,
AUTHOR = {Randaccio, S. and Soria, C. and Zoli, C.},
TITLE = {Standardized orthography: a shoe for barefoot},
YEAR = {2014},
URL = {https://iris.cnr.it/handle/20.500.14243/257898},
CONFERENCE_NAME = {Language Endangerment: Orthography Development for Language Maintenance and Revitalisation},
}
@MISC{SORIA_2014_MISC_S_257894,
AUTHOR = {Soria, C.},
TITLE = {Towards a notion of "Digital Language Diversity": the role of technologies for preserving multilingualism},
YEAR = {2014},
KEYWORDS = {digital language diversity, NLP, less-resourced languages, regional languages, minority languages, digital rights},
URL = {https://iris.cnr.it/handle/20.500.14243/257894},
CONFERENCE_NAME = {Seminario tenuto presso Department of English and Linguistics, University of Mainz},
}
@MISC{SORIA_2014_MISC_S_257897,
AUTHOR = {Soria, C.},
TITLE = {Towards a notion of Digital Language Diversity},
YEAR = {2014},
KEYWORDS = {digital language diversity, NLP, less-resourced languages, regional languages, minority languages, digital rights},
URL = {https://iris.cnr.it/handle/20.500.14243/257897},
CONFERENCE_NAME = {International Conference Linguistic Diversity in Cyberspace},
}
@MISC{SORIA_2014_MISC_S_257893,
AUTHOR = {Soria, C.},
TITLE = {Regional and Minority Languages of Italy, and the importance of terminology},
YEAR = {2014},
URL = {https://iris.cnr.it/handle/20.500.14243/257893},
CONFERENCE_NAME = {ELEN General Assembly},
}
@ARTICLE{BOSCHETTI_2013_ARTICLE_B_262429,
AUTHOR = {Boschetti, F.},
TITLE = {Annotations in collaborative environments},
YEAR = {2013},
ABSTRACT = {This article discusses methodological aspects of the Greek into Arabic Web Application related to the annotation system. Collaborative environments for the philological studies manage multiple versions both of the reference edition with digital variants and of linguistic and exegetical annotations. The system must verify and maintain the consistency of interrelated information, which can change asynchronously. Strategies to align different versions of texts and annotations, in order to update the internal references and notify the users to verify the content consistency, are illustrated. Structural aspects that involve the granularity and overlapping of annotations are discussed, taking into account also that linguistic annotations automatically generated by morphological parsers can be the basis for extended comments in natural language. Finally, the article illustrates which features related to the annotation system are yet implemented in the G2A Web Application},
KEYWORDS = {collaborative philology},
PAGES = {185-194},
URL = {http://www.greekintoarabic.eu/index.php?id=20},
VOLUME = {3},
ISSN = {2239-012X},
JOURNAL = {STUDIA GRAECO-ARABICA},
}
@ARTICLE{BOZZI_2013_ARTICLE_B_228612,
AUTHOR = {Bozzi, A.},
TITLE = {G2A: a Web application to study, annotate and scholarly edit ancient texts and their aligned translations. Part I. General model of the computational philology application},
YEAR = {2013},
ABSTRACT = {This paper presents the general model of a Web application for computational philology and describes the modules implemented by ILC-CNR in Pisa for the ERC project Ideas "Greek into Arabic. Philosophical Concepts and Linguistic Bridges" ADG 249431 (acronym: Greek into Arabic). The main principles on which the model is based are modularity, flexibility and development of the software according to open source criteria. These elements make it possible to include additional components in the modular structure, as well as components essential to the Greek into Arabic project (modularity), thus allowing the application to extend its functions to many other philological fields, from classical and medieval philology to genetic criticism and philology of ancient printed texts (flexibility). Dissemination of this application, especially in the research and academic fields, is guaranteed by the fact that its development is performed using internationally acknowledged systems of standard mark-up language and tools with no copyright restrictions (open source). In Part II a preliminary version of the user manual of G2A Web application is provided},
KEYWORDS = {History of Philosophy, Computational philology},
PAGES = {159-171},
URL = {http://www.greekintoarabic.eu/index.php?id=101},
VOLUME = {3},
ISSN = {2239-012X},
JOURNAL = {STUDIA GRAECO-ARABICA},
}
@ARTICLE{BURGASSI_2013_ARTICLE_B_265640,
AUTHOR = {Burgassi, C.},
TITLE = {Per Baldus XXII, 168},
YEAR = {2013},
ABSTRACT = {Si propongono alcune ipotesi di restauro testuale per un passo del "Baldus" di Folengo, di particolare rilievo nell'economia di tutta l'opera. A questo proposito sono messe in luce le implicazioni culturali e dottrinarie sottese al passo e che presiedono all'opera intera di Folengo},
KEYWORDS = {Filologia Italiana, Folengo},
PAGES = {74-94},
URL = {https://iris.cnr.it/handle/20.500.14243/265640},
VOLUME = {8},
ISSN = {1722-5434},
JOURNAL = {QUADERNI FOLENGHIANI},
}
@ARTICLE{BURGASSI_2013_ARTICLE_B_258927,
AUTHOR = {Burgassi, C.},
TITLE = {LIVIO IN ACCADEMIA. NOTE SULLA RICEZIONE, SULLA LINGUA E LA TRADIZIONE DEL VOLGARIZZAMENTO DI TITO LIVIO},
YEAR = {2013},
ABSTRACT = {Il contributo prende in esame alcuni aspetti relativi al lessico e alla ricezione del volgarizzamento della terza e della quarta Deca di Tito Livio. Tradizionalmente attribuite a Giovanni Boccaccio, le traduzioni liviane sono qui analizzate attraverso il filtro della speculazione teorica e della pratica lessicografica con il quale gli Accademici della Crusca, e segnatamente Lionardo Salviati, lessero, interpretarono e setacciarono queste fonti preziose del loro primo Vocabolario (1612). La parte iniziale del contributo, pertanto, illustra il sistema di valutazione linguistica dei testi antichi elaborato dal Salviati, con speciale riferimento ai volgarizzamenti in generale e a quelli di Livio in particolare. Nella seconda parte, poi, sono selezionate alcune voci estratte dalla Deca terza volgare, che, dapprima annotate nel cosiddetto «quaderno riccardiano» di Salviati e successivamente confluite nel Vocabolario, risultano notevoli per rarità lessicale o semantica, per singolare affinità con gli istituti linguistici di Boccaccio, e infine perché esemplificano in maniera paradigmatica le modalità di traduzione del modello classico (secondo la dialettica che vede alternarsi i prestiti diretti dal latino alle riformulazioni prettamente volgari)},
KEYWORDS = {Lessicologia, Volgarizzamenti},
PAGES = {5-25},
URL = {https://iris.cnr.it/handle/20.500.14243/258927},
VOLUME = {30},
ISSN = {0392-5218},
JOURNAL = {STUDI DI LESSICOGRAFIA ITALIANA},
}
@ARTICLE{BURGASSI_2013_ARTICLE_B_269670,
AUTHOR = {Burgassi, C.},
TITLE = {Scelta di voci del Tesoro della Lingua Italiana delle Origini (diciassettesima serie)},
YEAR = {2013},
ABSTRACT = {Voci INDOLE s. f., QUERELA s. f., QUERELANTE s. m., SEDARE v., SEDATIVO s. m., SEDAZIONE s. f. del Tesoro della Lingua Italiana delle Origini (pp. 56, 113-15, 125-26)},
KEYWORDS = {Lessico, Lessicografia, Lingua Italiana},
PAGES = {17-158},
URL = {https://iris.cnr.it/handle/20.500.14243/269670},
VOLUME = {18},
ISSN = {1591-8254},
JOURNAL = {BOLLETTINO-OPERA DEL VOCABOLARIO ITALIANO},
}
@ARTICLE{CALZOLARI_2013_ARTICLE_C_222944,
AUTHOR = {Calzolari, N.},
TITLE = {Il Trattamento Automatico della Lingua per la sopravvivenza dell'Italiano nel mondo digitale},
YEAR = {2013},
ABSTRACT = {Il TAL nelle sue dimensioni rilevanti},
URL = {https://iris.cnr.it/handle/20.500.14243/222944},
}
@ARTICLE{CIUNI_2013_ARTICLE_CP_405499,
AUTHOR = {Ciuni, R. and Proietti, C.},
TITLE = {THE ABUNDANCE OF THE FUTURE A Paraconsistent Approach to Future Contingents},
YEAR = {2013},
ABSTRACT = {Supervaluationism holds that the future is undetermined, and as a consequence of this, statements about the future may be neither true nor false. In the present paper, we explore the novel and quite different view that the future is abundant: statements about the future do not lack truth-value, but may instead be glutty, that is both true and false. We will show that (1) the logic resulting from this "abundance of the future" is a non-adjunctive paraconsistent formalism based on subvaluations, which has the virtue that all classical laws are valid in it, while no formula like $\phi \wedge \neg\phi$ is satisfiable (though both $\phi$ and $\neg\phi$ may be true in a model); (2) The peculiar behaviour of abundant logical consequence has an illuminating analogy in probability logic; (3) abundance preserves some important features of classical logic (not preserved in supervaluationism) when it comes to express those important retrogradations of truth which are presupposed by the argument de praesenti ad praeteritum},
KEYWORDS = {Future contingents, supervaluationism, gluts, subvaluations, retrogradation of truth},
PAGES = {21-43},
URL = {https://iris.cnr.it/handle/20.500.14243/405499},
VOLUME = {22 (1)},
DOI = {10.12775/LLP.2013.002},
ISSN = {1425-3305},
JOURNAL = {LOGIC AND LOGICAL PHILOSOPHY},
}
@ARTICLE{DEFELICE_2013_ARTICLE_D_257262,
AUTHOR = {De Felice, I.},
TITLE = {Affordances: una chiave per il word sense disambiguation},
YEAR = {2013},
PAGES = {105-110},
VOLUME = {1 (2)},
JOURNAL = {NEA SCIENCE},
}
@ARTICLE{DELGROSSO_2013_ARTICLE_D_228540,
AUTHOR = {Del Grosso, A. M.},
TITLE = {Indexing techniques and variant readings management},
YEAR = {2013},
ABSTRACT = {This paper illustrates indexing routines developed for the G2A Web Application, a philological system totally open source designed by the Team of the ILC-CNR of Pisa within the context of the ERC project Greek into Arabic. Philosophical Concepts and Linguistic Bridges (Ideas AdG 249431). Section 1 introduces the concept of 'index' in this peculiar field. The indexing process implemented by the ILC-CNR Team for the G2A Web Application is illustrated in Section 2. Section 3 discusses the component of textual criticism},
KEYWORDS = {Computational and collaborative philology},
PAGES = {211-230},
URL = {http://www.greekintoarabic.eu/index.php?id=101\&reset=1},
VOLUME = {3},
ISSN = {2239-012X},
JOURNAL = {STUDIA GRAECO-ARABICA},
}
@ARTICLE{DELLORLETTA_2013_ARTICLE_DVM_280032,
AUTHOR = {Dell'Orletta, F. and Venturi, G. and Montemagni, S.},
TITLE = {Linguistically-driven selection of correct arcs for dependency parsing},
YEAR = {2013},
ABSTRACT = {LISCA is an unsupervised algorithm aimed at assigning a quality score to each arc generated by a dependency parser in order to produce a decreasing ranking of arcs from correct to incorrect ones. LISCA exploits statistics about a set of linguistically-motivated and dependency-based features extracted from a large corpus of automatically parsed sentences and uses them to assign a quality score to each arc of a parsed sentence belonging to the same domain of the automatically parsed corpus. LISCA has been successfully tested on two datasets belonging to two different domains and in all experiments it turned out to outperform different baselines, thus showing to be able to reliably detect correct arcs also representing domain-specific peculiarities},
KEYWORDS = {Correct arcs, Dependency parsing},
PAGES = {125-136},
URL = {http://cys.cic.ipn.mx/ojs/index.php/CyS/article/view/1517},
VOLUME = {17 (2)},
ISSN = {1405-5546},
JOURNAL = {COMPUTACIÓN Y SISTEMAS},
}
@ARTICLE{DIDONATO_2013_ARTICLE_DM_382005,
AUTHOR = {Di Donato, F. and Müller, S.},
TITLE = {Biblioteche digitali semantiche. Il progetto Burckhardtsource.org},
YEAR = {2013},
ABSTRACT = {This article describes Burckhardtsource.org. The platform is developed within the project ERC-Advanced Grant 'The European Correspondence to Jacob Burckhardt', as the result of an interdisciplinary work that involves art historians, philologists, and science communication and computer scientists. The first part focuses on the platform and describes its content and the methodology followed in the editing of the correspondence to Burckhardt. The second part is devoted to a brief explanation of the software (Muruca) through which the platform is built. The last part, finally, considers a tool for the semantic annotation of web pages (Pundit) integrated into the platform, which allows the enrichment of texts through the use of Linked Data technologies},
URL = {https://iris.cnr.it/handle/20.500.14243/382005},
ISSN = {1128-3564},
JOURNAL = {BIBLIOTIME},
}
@ARTICLE{FANTONI_2013_ARTICLE_FADM_226945,
AUTHOR = {Fantoni, G. and Apreda, R. and Dell'Orletta, F. and Monge, M.},
TITLE = {Automatic extraction of function-behaviour-state information from patents},
YEAR = {2013},
ABSTRACT = {Patents contain a large quantity of technical information not available elsewhere and therefore very interesting for both academia and industry. The purpose of the research is to try to detect and extract information about the functions, the physical behaviours and the states of the system directly from the text of a patent in an automatic way. The above three categories constitute a well-known set of relevant entities in the theory of engineering design, and their study allows powerful analysis of individual artefacts as well as that of groups of products or technologies. The focus is in providing a handy tool that could speed up and facilitate human analysis and allow tackling also large corpora of documents. A second goal is to develop a protocol based on free software and database resources, so that it could be replicable with limited effort by everyone without having to rely on commercial databases. Extracting technical and design information from a document whose aim is more legal than technical, and that is written using a specific jargon, is not a trivial task. The approach chosen to overcome the various issues is to support state-of-the-art Computational Linguistic tools with a large Knowledge Base. The latter has been constructed both manually and automatically and comprises not only keywords but also concepts, relationships and regular expressions. A case study about a very recent patent describing a mechanical device has been included to show the functioning and output of the entire system. © 2013 Elsevier Ltd. All rights reserved},
KEYWORDS = {Function-Behaviour-Structure, Pa, Product development, Semantic elaboration},
PAGES = {317-334},
URL = {http://www.sciencedirect.com/science/article/pii/S1474034613000487},
VOLUME = {27 (3)},
DOI = {10.1016/j.aei.2013.04.004},
ISSN = {1474-0346},
JOURNAL = {ADVANCED ENGINEERING INFORMATICS},
}
@ARTICLE{GUADAGNINI_2013_ARTICLE_G_272429,
AUTHOR = {Guadagnini, E.},
TITLE = {Voce MANTELLO s. m. del Tesoro della Lingua Italiana delle Origini},
YEAR = {2013},
ABSTRACT = {1 Indumento maschile e femminile costituito da un ampio pezzo di tessuto o di pellame stretto al collo, di lunghezza e ampiezza variabile, da portare appoggiato sulle spalle sopra i vestiti. 1.1 Coperta (del cavallo). 1.2 Ciò che costituisce la superficie esterna di qsa: corpo (dell'uomo), pelliccia (di un animale), livrea (di una pianta), ecc. 1.3 Fig. Apparenza esteriore di qno o qsa (spesso contrapposta alla realtà o alla verità, con valore neg.)},
KEYWORDS = {Lessico, Lessicografia, Lingua Italiana},
URL = {http://tlio.ovi.cnr.it/voci/030457.htm},
VOLUME = {17},
ISSN = {2240-5216},
JOURNAL = {TESORO DELLA LINGUA ITALIANA DELLE ORIGINI},
}
@ARTICLE{GUADAGNINI_2013_ARTICLE_G_272435,
AUTHOR = {Guadagnini, E.},
TITLE = {Voce MATTEZZA s. f. del Tesoro della Lingua Italiana delle Origini},
YEAR = {2013},
ABSTRACT = {Completa la famiglia di "matto", uscita parzialmente a stampa sul Boll.-Opera vocab. ital. 17},
KEYWORDS = {Lessico, Lessicografia, Lingua Italiana},
URL = {http://tlio.ovi.cnr.it/voci/029993.htm},
VOLUME = {17},
ISSN = {2240-5216},
JOURNAL = {TESORO DELLA LINGUA ITALIANA DELLE ORIGINI},
}
@ARTICLE{GUADAGNINI_2013_ARTICLE_G_265584,
AUTHOR = {Guadagnini, E.},
TITLE = {Scelta di voci del Tesoro della Lingua Italiana delle Origini (diciassettesima serie)},
YEAR = {2013},
ABSTRACT = {Voci architenente agg., architettura s. f., rugidore s. m. del Tesoro della Lingua Italiana delle Origini (pp. 17-18, 118)},
KEYWORDS = {Lessico, Lessicografia, Lingua Italiana},
PAGES = {17-158},
URL = {https://iris.cnr.it/handle/20.500.14243/265584},
VOLUME = {18},
ISSN = {1591-8254},
JOURNAL = {BOLLETTINO-OPERA DEL VOCABOLARIO ITALIANO},
}
@ARTICLE{GUADAGNINI_2013_ARTICLE_G_272439,
AUTHOR = {Guadagnini, E.},
TITLE = {Voce TORPORE s. m. del Tesoro della Lingua Italiana delle Origini},
YEAR = {2013},
ABSTRACT = {Latinismo. 1 Rallentamento dei movimenti o stato di immobilità o di paralisi che colpisce in modo transitorio un corpo, una sua parte, det. arti. 1.1 Fig. [Rif. all'animo o alle sue facoltà:] allontanamento o astensione dall'attività critico-intellettuale che deve giudicare e informare di sé il corretto comportamento umano},
KEYWORDS = {Lessico, Lessicografia, Lingua Italiana, Progetto DiVo},
URL = {http://tlio.ovi.cnr.it/voci/030790.htm},
VOLUME = {17},
ISSN = {2240-5216},
JOURNAL = {TESORO DELLA LINGUA ITALIANA DELLE ORIGINI},
}
@ARTICLE{MARCHI_2013_ARTICLE_M_229212,
AUTHOR = {Marchi, S.},
TITLE = {G2A: a Web application to study, annotate and scholarly edit ancient texts and their aligned translations. Part II. Towards a user manual},
YEAR = {2013},
ABSTRACT = {The present contribution describes the current operating procedures of the G2A application. The system is still under development at the Institute of Computational Linguistics (ILC/CNR, Area della ricerca di Pisa); therefore, all the functions described in this provisional user manual should be considered as an exemplification of the general model described by Andrea Bozzi in Part I},
KEYWORDS = {Literary computing, XML, Web Application, Java, exist-db},
PAGES = {173-183},
URL = {https://learningroads.cfs.unipi.it/wp-content/uploads/2015/10/MARCHISGA3-2013.pdf},
VOLUME = {3},
ISSN = {2239-012X},
JOURNAL = {STUDIA GRAECO-ARABICA},
}
@ARTICLE{MARZI_2013_ARTICLE_M_225694,
AUTHOR = {Marzi, C.},
TITLE = {Innovation, language, and grey literature},
YEAR = {2013},
ABSTRACT = {Language and innovation are inseparable. Language conveys ideas which are essential in innovation, establishes the most immediate connections with our conceptualisation of the outside world, and provides the building blocks for communication. Every linguistic choice is necessarily meaningful, and it involves the parallel construction of form and meaning. From this perspective, language is a dynamic knowledge construction process. In this article, emphasis will be laid on investigating how words are used to describe innovation, and how innovation topics can influence word usage and collocational behaviour. Especially in grey materials, and in a context-based approach, the lexical representation of innovative knowledge is closely related to the representation of knowledge itself, and gives the opportunity to reduce the gap between knowledge representation and knowledge understanding. This will bring into focus the dynamic interplay between lexical creativity and innovative pragmatic contexts, and the necessity for a dynamic semantic shift from context-driven vagueness to domain-driven specialisation},
KEYWORDS = {Lexical productivity, Language technologies, Grey Literature, Web corpora},
PAGES = {145-151},
URL = {http://www.scopus.com/inward/record.url?eid=2-s2.0-84884695370\&partnerID=q2rCbXpz},
VOLUME = {9 (3)},
ISSN = {1574-1796},
JOURNAL = {THE GREY JOURNAL},
}
@ARTICLE{MARZI_2013_ARTICLE_MF_256850,
AUTHOR = {Marzi, C. and Ferro, M.},
TITLE = {Adaptive strategies in lexical acquisition},
YEAR = {2013},
ABSTRACT = {The emergence of morphological patterns from lexical storage in language acquisition is conditioned by language-specific factors as well as extra-linguistic cognitive capacities. With particular reference to the acquisition of plural markers in German, in a memory-based perspective highlighting interesting theoretical implications for usage-based models, the paper analyses acquisitional strategies by focussing on emergent relations between stored word forms and on dynamic expectation/competition of incoming input. In particular, we outline an adaptive multifactorial account of morphological processing that includes both frequency and formal factors. Our investigation is supported by a computational model of morphology acquisition/processing based on self-organisation memories, where word representations are dynamically recoded as time-series},
KEYWORDS = {German plurals, Morphological generalisation, Self-organising memory, Word processing},
PAGES = {307-328},
URL = {http://www.scopus.com/inward/record.url?eid=2-s2.0-84892521599\&partnerID=q2rCbXpz},
VOLUME = {XII (2)},
DOI = {10.1418/75045},
ISSN = {1720-9331},
JOURNAL = {LINGUE E LINGUAGGIO},
}
@ARTICLE{MONTEMAGNI_2013_ARTICLE_M_294413,
AUTHOR = {Montemagni, S.},
TITLE = {Tecnologie linguistico-computazionali e monitoraggio della lingua italiana},
YEAR = {2013},
ABSTRACT = {In una riflessione su dove stia andando l'italiano del terzo millennio, è legittimo chiedersi se e in che misura le tecnologie linguistico-computazionali possano essere di aiuto nel monitoraggio della lingua italiana nelle sue varietà diamesiche, diafasiche e diastratiche, nonché sull'asse diacronico. L'obiettivo del presente contributo consiste nel fornire una risposta, sebbene preliminare, a questo interrogativo, primariamente sul versante metodologico. In particolare, si vuole mostrare che mediante il ricorso a tecnologie linguistico-computazionali è oggi possibile monitorare un ampio spettro di tratti, che spaziano tra i diversi livelli di descrizione linguistica (primariamente, lessico, morfo-sintassi e sintassi), in relazione a corpora di sempre più vaste dimensioni. Questo rappresenta un cambio fondamentale nello studio della variazione linguistica, in particolare della lingua italiana, fino a oggi basato su corpora di dimensioni relativamente ridotte e tipicamente condotto mediante un'analisi (semi-)manuale del testo. Come vedremo, l'uso di vasti corpora testuali combinato con il ricorso a tecnologie linguistico-computazionali per l'analisi e il monitoraggio linguistico rendono oggi possibili analisi sempre più accurate e affidabili, che coprono aspetti della struttura linguistica rimasti fino a ora inesplorati in quanto difficilmente attingibili mediante un'analisi manuale del testo},
KEYWORDS = {Monitoraggio Linguistico, Trattamento Automatico del Linguaggio, Varietà d'Uso della Lingua},
PAGES = {145-172},
URL = {http://www.italianlp.it/wp-content/uploads/2014/04/montemagni_silta_submission_rif.pdf},
VOLUME = {XLII (1)},
ISSN = {0390-6809},
JOURNAL = {STUDI ITALIANI DI LINGUISTICA TEORICA E APPLICATA},
}
@ARTICLE{MONTEMAGNI_2013_ARTICLE_MWDN_228553,
AUTHOR = {Montemagni, S. and Wieling, M. and De Jonge, B. and Nerbonne, J.},
TITLE = {Synchronic patterns of Tuscan phonetic variation and diachronic change: Evidence from a dialectometric study},
YEAR = {2013},
ABSTRACT = {A careful investigation of synchronic patterns of linguistic variation with underlying linguistic features can lead to important insights into the comprehension of diachronic phonetic processes. In this article, we showed that the method of spectral partitioning of bipartite graphs applied to synchronic dialectal data can effectively and reliably be used to investigate diachronic processes, thus contributing to a deeper understanding of the relationship between synchronic variation and diachronic change. This was illustrated through a case study carried out on Tuscan dialects, focusing on so-called Tuscan 'gorgia', a lenition process consisting of the spirantization of stop consonants. In particular, from a quantitative analysis of the sound correspondences involving voiceless and voiced stops, we tracked the evolution of the spirantization phenomenon in several respects. First, we tracked spirantization geographically, across Tuscany from the influential center of Florence to the peripheral areas. Second, we tracked it phonologically, from voiceless to voiced stops, and within each voicing class from velars to dentals and then to bilabials. Finally, we tracked it demographically, with young speakers using the most innovative sound correspondences more than old speakers. The fact that these results are in line with the literature on the topic of Tuscan 'gorgia' demonstrates the potential of the method of spectral partitioning of bipartite graphs with respect to the reconstruction of diachronic processes starting from diatopically distributed synchronic dialectal data},
KEYWORDS = {Tuscan dialectology, dialectometry, diachronic variation},
PAGES = {157--172},
URL = {https://iris.cnr.it/handle/20.500.14243/228553},
VOLUME = {28},
NUMBER = {1},
DOI = {10.1093/llc/fqs057},
ISSN = {0268-1145},
JOURNAL = {LITERARY \& LINGUISTIC COMPUTING},
}
@ARTICLE{NAHLI_2013_ARTICLE_NG_264611,
AUTHOR = {Nahli, O. and Giovannetti, E.},
TITLE = {Computational contributions for Arabic language processing-Part II. Lisan al-'arab as a source of lexical and morphological knowledge},
YEAR = {2013},
ABSTRACT = {The following sections illustrate a part of the study on the morphology of the Arabic language which is carried on within the framework of the ERC project Greek into Arabic. Philosophical Concepts and Linguistic Bridges ADG 249431. We used the Arabic lexicographic encyclopaedia Lisan al-'arab and, thanks to the regularity of its structure, we developed a system for the extraction of morphologically labelled word sequences, to be exploited for morphological analysis purposes},
KEYWORDS = {Arabic morphology, Arabic morphological analysis, Arabic lexicography, Natural Language Processing},
PAGES = {207--210},
URL = {https://iris.cnr.it/handle/20.500.14243/264611},
VOLUME = {3},
ISSN = {2239-012X},
JOURNAL = {STUDIA GRAECO-ARABICA},
}
@ARTICLE{NAHLI_2013_ARTICLE_NO_222323,
AUTHOR = {Nahli, O.},
TITLE = {Computational contributions for Arabic language processing Part I. The automatic morphologic analysis of Arabic texts},
YEAR = {2013},
ABSTRACT = {problems of ambiguity inherent to the Arabic language. Difficulties arose in the various stages of automatic processing of the Arabic version of Plotinus, the text which lies at the core of our project. Part I highlights the needs that led us to update the morphological engine AraMorph in order to optimize its morpho-syntactic analysis. Even if the engine has been optimized, a digital lexical source for better use of the system is still lacking. Part II presents a methodology exploiting the internal structure of the Arabic lexicographic encyclopaedia Lisan al-'arab, which allows automatic extraction of the roots and derived lemmas. The outcome of this work is a useful resource for morphological analysis of Arabic, either in its own right, or to enrich already existing resources},
KEYWORDS = {Morphological engine AraMorph, Morpho-syntactic analysis, Arabic language},
PAGES = {195--206},
URL = {http://www.greekintoarabic.eu/uploads/media/NAHLI_SGA_3-2013.pdf},
VOLUME = {3},
ISSN = {2239-012X},
JOURNAL = {STUDIA GRAECO-ARABICA},
}
@ARTICLE{PARDELLI_2013_ARTICLE_PB_16331,
AUTHOR = {Pardelli, G. and Biagioni, S.},
TITLE = {Quando la linguistica incontra l'informatica: una riflessione terminologica},
YEAR = {2013},
ABSTRACT = {This paper presents a case study to the use of words in the field of Natural Language Processing. This electronic processing of linguistic data leads to the diffusion of clear and concise words for describing a complex concept that would need a circumlocution to be described instead. The aim of this article is to provide thinking over of these new lexical forms over the time. We present a tabular representation summarizing terms extracted from the titles of papers presented at international conferences COLING, International Conference on Computational Linguistics in the period (1965-2010). The system used for the data processing is available at the Istituto di Linguistica Computazionale "A. Zampolli"-CNR, Pisa, Italy},
KEYWORDS = {Computational Linguistics, Computer Science, Terminology, Information extraction, Content Analysis and Indexing},
PAGES = {67--78},
URL = {http://caspur-ciberpublishing.it},
VOLUME = {3},
NUMBER = {1},
DOI = {10.2423/i22394303v3n1p67},
ISSN = {2239-4303},
JOURNAL = {SCIRES-IT},
}
@INCOLLECTION{BASILI_2013_INCOLLECTION_BLDMV_287820,
AUTHOR = {Basili, R. and Lenci, A. and De Cao, D. and Moschitti, A. and Venturi, G.},
TITLE = {Evalita 2011: the Frame Labeling over Italian Texts Task},
YEAR = {2013},
ABSTRACT = {The Frame Labeling over Italian Texts (FLaIT) task held within the EvalIta 2011 challenge is here described. It focuses on the automatic annotation of free texts according to frame semantics. Systems were asked to label all semantic frames and their arguments, as evoked by predicate words occurring in plain text sentences. Proposed systems are based on a variety of learning techniques and achieve very good results, over 80\% of accuracy, in most subtasks},
KEYWORDS = {NLP System Evaluation, Shallow Semantic Parsing, Frame Semantics},
PAGES = {195--204},
URL = {https://iris.cnr.it/handle/20.500.14243/287820},
PUBLISHER = {Springer (Berlin Heidelberg, DEU)},
ISBN = {978-3-642-35827-2},
CONFERENCE_PLACE = {Berlin Heidelberg},
BOOKTITLE = {Evaluation of Natural Language and Speech Tools for Italian},
EDITOR = {Magnini, B. and Cutugno, F. and Falcone, M. and Pianta, E.},
}
@INCOLLECTION{BURGASSI_2013_INCOLLECTION_B_258922,
AUTHOR = {Burgassi, C.},
TITLE = {Notizie dal DiVo. Teoria e pratica dell'associazione latino-volgare},
YEAR = {2013},
ABSTRACT = {Il contributo illustra i metodi con i quali il testo volgare è stato associato al testo latino tradotto nelle banche dati allestite dal progetto DiVo ("Dizionario dei Volgarizzamenti")},
PAGES = {85--96},
URL = {https://iris.cnr.it/handle/20.500.14243/258922},
PUBLISHER = {Edizioni dell'Orso (Alessandria, ITA)},
ISBN = {978-88-6274-480-5},
CONFERENCE_PLACE = {Alessandria},
BOOKTITLE = {«Diverse voci fanno dolci note». L'Opera del Vocabolario Italiano per Pietro G. Beltrami},
EDITOR = {Larson, P. and Squillacioti, P. and Vaccaro, G.},
}
@INCOLLECTION{CALZOLARI_2013_INCOLLECTION_C_222331,
AUTHOR = {Calzolari, N.},
TITLE = {Language Resources: From Infancy to Maturity. Lessons and Next Steps for the UNL Community},
YEAR = {2013},
ABSTRACT = {In the second chapter, Professor Nicoletta Calzolari Zamorani, Research Associate and former Director of CNR-ILC, Pisa, Italy, approaches the questions by giving insight on the general framework surrounding Language Resources (LRs) today. Rather than answering the specific UNL questions directly, she emphasizes the fact that in order to define a language structure such as UNL it is pre-eminent to gather results of analyses from different communities and to define a coherent strategy},
URL = {https://iris.cnr.it/handle/20.500.14243/222331},
ISBN = {978-1-4438-5144-2},
}
@INCOLLECTION{CALZOLARI_2013_INCOLLECTION_CBLM_128519,
AUTHOR = {Calzolari, N. and Bertagna, F. and Lenci, A. and Monachini, M.},
TITLE = {Boosting Lexical Resources for the Semantic Web: Generative Lexicon and Lexicon Interoperability},
YEAR = {2013},
ABSTRACT = {To make the vision of a European Information Infrastructure and of the Semantic Web a reality, two key issues are tackled: (i) content, which must be dealt with in a multilingual environment; (ii) standards, which are critical to achieve interoperability and integration. In the Semantic Web scenario, ontologies are the key components to manage knowledge, whereas, in Human Language Technology, semantic description is committed to computational lexicons, which have to squarely address the complexity of natural language. Answers to the above issues are found within two frameworks: first, in the framework of Generative Lexicon (GL) theory and GL-based lexicons that account for the complex, multidimensional and multifaceted nature of meaning in lexicon and ontology design; second, in the context of the ISLE enterprise which, with the MILE, represents an essential interface between advanced research in the field of multilingual lexical semantics and the practical task of developing resources for HLT},
KEYWORDS = {Generative Lexicon, Computational Lexicons, Standards, Semantic Web, Human Language Technology},
PAGES = {415--431},
URL = {https://doi.org/10.1007/978-94-007-5189-7_18},
DOI = {10.1007/978-94-007-5189-7_18},
PUBLISHER = {Springer (Dordrecht, NLD)},
ISBN = {9789400751880},
CONFERENCE_PLACE = {Dordrecht},
BOOKTITLE = {Text, Speech and Language Technology},
EDITOR = {Pustejovsky, J. and Bouillon, P. and Isahara, H. and Kanzaki, K. and Lee, C.},
}
@COMMENT{NOTE(review): in the entry that follows, EDITOR "Gil, F. and Patrick, P." looks like given names parsed as surnames. Other chapters of the same Wiley volume in this file (DOI prefix 10.1002/9781118712696) list the editor as "Francopoulo, G." -- TODO confirm against the publisher record before changing the field.}
@INCOLLECTION{CALZOLARI_2013_INCOLLECTION_CMS_255564,
AUTHOR = {Calzolari, N. and Monachini, M. and Soria, C.},
TITLE = {LMF-Historical Context and Perspectives},
YEAR = {2013},
ABSTRACT = {The importance of designing standards for language resources (LR) is firmly established, starting with the Expert Advisory Group for Language Engineering (EAGLES) and International Standards for Language Engineering (ISLE) initiatives. Both EAGLES and ISLE stress the importance of reaching a consensus on (linguistic and nonlinguistic) "content", in addition to agreement on formats and encoding issues, and also address the needs of content processing and Semantic Web technologies. The recommendations for standards and best practices issued within the projects became, through the INTERA and mainly the LIRICS project, the International Organization for Standardization (ISO) within the ISO TC37/SC4 committee, where Lexical Markup Framework (LMF) was developed. Standards are fundamental to exchange, preserve, maintain and integrate data and LRs, to achieve interoperability in general, and they are an essential basis of any LR infrastructure},
KEYWORDS = {EAGLES, international standards for language engineering, interoperability, lexical markup framework (LMF)},
PAGES = {1--18},
URL = {http://dx.doi.org/10.1002/9781118712696.ch1},
DOI = {10.1002/9781118712696.ch1},
PUBLISHER = {John Wiley \& Sons, Inc (Hoboken, USA)},
ISBN = {978-1-118-71259-7},
CONFERENCE_PLACE = {Hoboken},
BOOKTITLE = {LMF Lexical Markup Framework},
EDITOR = {Gil, F. and Patrick, P.},
}
@INCOLLECTION{CUCURULLO_2013_INCOLLECTION_CS_316212,
AUTHOR = {Cucurullo, S. and Sassi, M.},
TITLE = {Aspetti Tecnico-Metodologici del Progetto LinCi},
YEAR = {2013},
KEYWORDS = {Sociolinguistica, banca-dati DBT},
PAGES = {47--50},
URL = {https://iris.cnr.it/handle/20.500.14243/316212},
PUBLISHER = {Franco Cesati Editore (Firenze, ITA)},
ISBN = {9788876674563},
CONFERENCE_PLACE = {Firenze},
BOOKTITLE = {La lingua delle città Raccolta di studi},
EDITOR = {Nesi, A.},
}
@INCOLLECTION{CUCURULLO_2013_INCOLLECTION_CS_316207,
AUTHOR = {Cucurullo, S. and Sassi, M.},
TITLE = {Il Contributo Tecnologico dell'ILC al Progetto LinCi},
YEAR = {2013},
ABSTRACT = {The project "la Lingua delle Città (LinCi)" aims to highlight some relevant phenomena-both from the lexical point of view that grammar-common Italian and informal, in the opinion of respondents using speakers. For this purpose the group of linguists who devised the project has developed a questionnaire of 200 questions related to various semantic fields. The structure of the questionnaire also allows the collector to derive grammatical information (eg on the use of certain pronominal or verbal), as well as judgments of metalinguistic character on the "dialectic tendencies" or otherwise of certain forms, the differences between formal and informal register on frequency of use},
KEYWORDS = {lingua italiana, banche dati},
PAGES = {81--99},
URL = {https://iris.cnr.it/handle/20.500.14243/316207},
PUBLISHER = {Accademia della Crusca (Firenze, ITA)},
ISBN = {978-88-89369-51-7},
CONFERENCE_PLACE = {Firenze},
BOOKTITLE = {La lingua delle città LinCi. La banca dati},
EDITOR = {Nesi, A. and Salani, T. P.},
}
@INCOLLECTION{DELGROSSO_2013_INCOLLECTION_DM_228542,
AUTHOR = {Del Grosso, A. M. and Marchi, S.},
TITLE = {Una Applicazione Web per la Filologia Computazionale. Un esperimento su alcuni scritti autografi di Ferdinand de Saussure},
YEAR = {2013},
ABSTRACT = {Nel progetto PRIN "Per un'edizione digitale dei manoscritti di Ferdinand de Saussure", il cui scopo era approntare una serie di strumenti utili all'edizione digitale degli autografi saussuriani, il gruppo di ricerca e sviluppo di filologia computazionale guidato da Andrea Bozzi e presente presso l'Istituto di Linguistica Computazionale "Antonio Zampolli" (ILC-CNR, Pisa) ha individuato i requisiti ed implementato le funzionalità rispondenti alle esigenze dichiarate degli studiosi di questi materiali},
KEYWORDS = {filologia computazionale, piattaforma web},
PAGES = {131--157},
URL = {https://iris.cnr.it/handle/20.500.14243/228542},
PUBLISHER = {Edizioni dell'Orso (Alessandria, ITA)},
ISBN = {978-88-6274-478-2},
CONFERENCE_PLACE = {Alessandria},
BOOKTITLE = {Guida per un'edizione digitale dei manoscritti di Ferdinand de Saussure},
EDITOR = {Gambarara, D. and Marchese, M. P.},
}
@INCOLLECTION{DELLORLETTA_2013_INCOLLECTION_DMMVAF_220446,
AUTHOR = {Dell'Orletta, F. and Marchi, S. and Montemagni, S. and Venturi, G. and Agnoloni, T. and Francesconi, E.},
TITLE = {Domain Adaptation for Dependency Parsing at EVALITA 2011},
YEAR = {2013},
ABSTRACT = {The domain adaptation task was aimed at investigating techniques for adapting state-of-the-art dependency parsing systems to new domains. Both the language dealt with, i.e. Italian, and the target domain, namely the legal domain, represent two main novelties of the task organised at Evalita 2011 with respect to previous domain adaptation initiatives. In this paper, we define the task and describe how the datasets were created from different resources. In addition, we characterize the different approaches of the participating systems, report the test results, and provide a first analysis of these results},
KEYWORDS = {Dependency Parsing, Domain Adaptation, Self-training, Active Learning, Legal-NLP},
PAGES = {58--69},
URL = {https://iris.cnr.it/handle/20.500.14243/220446},
PUBLISHER = {Springer (Berlin Heidelberg, DEU)},
ISBN = {978-3-642-35827-2},
CONFERENCE_PLACE = {Berlin Heidelberg},
BOOKTITLE = {Evaluation of Natural Language and Speech Tools for Italian},
EDITOR = {Magnini, B. and Cutugno, F. and Falcone, M. and Pianta, E.},
}
@INCOLLECTION{GUADAGNINI_2013_INCOLLECTION_G_265234,
AUTHOR = {Guadagnini, E.},
TITLE = {Notizie dal DiVo. Parole tradotte e lessicografia dell'italiano},
YEAR = {2013},
ABSTRACT = {Studio dell'utilizzo dei volgarizzamenti medievali come fonti lessicografiche nelle cinque impressioni del Vocabolario della Crusca, nel Tommaseo-Bellini e nel Battaglia},
KEYWORDS = {Lessico, Lessicografia, Lingua Italiana, Volgarizzamenti, Progetto DiVo},
PAGES = {59--70},
URL = {https://iris.cnr.it/handle/20.500.14243/265234},
PUBLISHER = {Edizioni dell'Orso (Alessandria, ITA)},
ISBN = {9788862744805},
CONFERENCE_PLACE = {Alessandria},
BOOKTITLE = {«Diverse voci fanno dolci note». L'Opera del Vocabolario Italiano per Pietro G. Beltrami},
EDITOR = {Larson, P. and Squillacioti, P. and Vaccaro, G.},
}
@INCOLLECTION{HAYASHI_2013_INCOLLECTION_HMSSC_257932,
AUTHOR = {Hayashi, Y. and Monachini, M. and Savas, B. and Soria, C. and Calzolari, N.},
TITLE = {LMF as a Foundation for Servicized Lexical Resources},
YEAR = {2013},
ABSTRACT = {This chapter argues that the lexical markup framework (LMF) can play a significant role in realizing servicized lexical resources on the Web. To accomplish this goal, it begins with a brief introduction of the notion of servicized resources, and then presents a technical architecture of, what is called, LMF-aware lexicon access services. It presents two implementation showcases to demonstrate the applicability of the LMF and to discuss its possible extensions. The first example deals with WordNet-type computational semantic lexicons, while the other takes up a machine-readable bilingual dictionary primarily compiled for human usage. To conclude the chapter, the final sections summarize the results while reviewing related work},
KEYWORDS = {lexical markup framework (LMF), LMF-aware lexicon access services, servicized lexical resources},
PAGES = {201--213},
URL = {http://onlinelibrary.wiley.com/doi/10.1002/9781118712696.ch14/references},
DOI = {10.1002/9781118712696.ch14},
PUBLISHER = {Wiley-ISTE (Hoboken, USA)},
ISBN = {9781118712696},
CONFERENCE_PLACE = {Hoboken},
BOOKTITLE = {LMF-Lexical Markup Framework},
EDITOR = {Francopoulo, G.},
}
@INCOLLECTION{MONTANI_2013_INCOLLECTION_MARBCMSTSBP_251955,
  AUTHOR           = {Montani, C. and Andronico, P. and Raviolo, C. and Bozzi, A. and Codenotti, B. and Meghini, C. and Sommani, M. and Tarabella, L. and Scopigno, R. and Baraglia, R. and Perego, R.},
  TITLE            = {Il CNR dopo la CEP},
  BOOKTITLE        = {La CEP prima della CEP: storia dell'informatica. Divulgazione scientifica e didattica sperimentale. Atti del Convegno, Pisa 11-12 novembre 2011},
  PUBLISHER        = {Pisa University Press (Pisa, ITA)},
  CONFERENCE_PLACE = {Pisa},
  YEAR             = {2013},
  KEYWORDS         = {divulgazione scientifica, storia dell'informatica},
  ABSTRACT         = {Una breve [e parziale] storia di alcune tematiche ICT di successo che si sono sviluppate negli Istituti CNR di Pisa a partire dagli anni '60 e che, a giudizio degli autori, rappresentano a buon diritto rami importanti di quell'albero rigoglioso che ha avuto le sue radici nella CEP},
  URL              = {https://iris.cnr.it/handle/20.500.14243/251955},
}
@INCOLLECTION{MONTEMAGNI_2013_INCOLLECTION_M_294410,
AUTHOR = {Montemagni, S.},
TITLE = {Estrazione Terminologica Automatica e Indicizzazione: Scenari Applicativi, Problemi e Possibili Soluzioni},
YEAR = {2013},
ABSTRACT = {Il ricorso a metodi e tecniche di estrazione automatica di terminologia settoriale da corpora di dominio, ovvero da insiemi di documenti relativi a uno specifico settore della conoscenza, rappresenta una sempre più diffusa pratica di supporto al processo di indicizzazione di collezioni documentali, inteso come l'operazione volta all'individuazione delle voci indice che ne costituiscono il contenuto concettuale. L'obiettivo di questo contributo è una rivisitazione critica di esperienze condotte all'interno di diversi scenari applicativi in cui i risultati del processo di estrazione automatica di terminologia sono utilizzati per la costruzione di vocabolari controllati o di thesauri sulla base dei quali è condotto il processo di indicizzazione},
KEYWORDS = {Trattamento Automatico del Linguaggio, Estrazione Terminologica, Indicizzazione},
PAGES = {241--284},
URL = {https://iris.cnr.it/handle/20.500.14243/294410},
PUBLISHER = {Iter (Milano) (Milano, ITA)},
ISBN = {978-88-903419-3-9},
CONFERENCE_PLACE = {Milano},
BOOKTITLE = {Documenti Digitali},
EDITOR = {Guarasci, R. and Folino, A.},
}
@INCOLLECTION{RUIMY_2013_INCOLLECTION_RPGB_265110,
AUTHOR = {Ruimy, N. and Piccini, S. and Giovannetti, E. and Bellandi, A.},
TITLE = {Lessicografia Computazionale e Terminologia Saussuriana},
YEAR = {2013},
PAGES = {161--179},
URL = {https://iris.cnr.it/handle/20.500.14243/265110},
PUBLISHER = {Edizioni dell'Orso (Alessandria, ITA)},
ISBN = {978-88-6274-478-2},
CONFERENCE_PLACE = {Alessandria},
BOOKTITLE = {Guida per un'edizione digitale dei manoscritti di Ferdinand de Saussure},
EDITOR = {Gambarara, D. and Marchese, M. P.},
}
@INCOLLECTION{SASSI_2013_INCOLLECTION_SG_286088,
AUTHOR = {Sassi, M. and Grava, M.},
TITLE = {Una metamorfosi chiamata GIS: dai Database ai Geo-database},
YEAR = {2013},
ABSTRACT = {In this paper we describe the development of the Project named Population and Agriculture in the Tuscan territory during the nineteenth century. This study, started by Giuliana Biagioli using traditional methods, thanks to the particular intuition of this scientist, found in the University Pisa the breeding ground for the computer adventure. Here we recall that the first Faculty of Computer Science was founded in Pisa a few years before (it was in 1969) and in years immediately after was possible to count on the first specialists of this sector. The initial part of this paper will describe the introductory stages of the work carried out with the aid of the computer, which at that time was called Mainframe, filled huge spaces and was "fed" with mechanographic cards and magnetic tapes. In the second part instead we face the issue of GIS and WebGIS},
KEYWORDS = {Storia, Banca-dati, Catasto leopoldino, Storia dell'Informatica},
PAGES = {439--458},
URL = {https://iris.cnr.it/handle/20.500.14243/286088},
PUBLISHER = {Edizioni ETS (Pisa, ITA)},
ISBN = {9788846736765},
CONFERENCE_PLACE = {Pisa},
BOOKTITLE = {Il mondo a metà-Studi storici sul territorio e l'ambiente-In onore di Giuliana Biagioli},
EDITOR = {Pazzagli, R.},
}
@INCOLLECTION{VENTURI_2013_INCOLLECTION_V_260903,
AUTHOR = {Venturi, G.},
TITLE = {Semantic annotation of Italian legal texts: a FrameNet-based approach},
YEAR = {2013},
ABSTRACT = {The FrameNet approach to text semantic annotation can be a reliable model to make explicit the linguistic information and the semantic content of legal texts. This hypothesis is discussed and empirically demonstrated through an experiment of annotation of a corpus of Italian legal texts. This study is aimed at showing how FrameNet is particularly appropriate in order to provide new perspectives for legal language studies and for legal knowledge representation tasks. Moreover, by relying on the output of an automatic dependency parser, the FrameNet-based annotation methodology presented here is meant to be successfully used in automatic semantic processing tasks of legal texts},
KEYWORDS = {Legal Language, Semantic Annotation, Legal Ontologies, Natural Language Processing},
PAGES = {51--84},
URL = {https://iris.cnr.it/handle/20.500.14243/260903},
DOI = {10.1075/bct.58},
PUBLISHER = {John Benjamins Publishing Company (Amsterdam/Philadelphia, USA)},
ISBN = {9789027202772},
CONFERENCE_PLACE = {Amsterdam/Philadelphia},
BOOKTITLE = {Advances in Frame Semantics},
EDITOR = {Fried, M. and Nikiforidou, K.},
}
@INCOLLECTION{VOSSEN_2013_INCOLLECTION_VSM_257910,
AUTHOR = {Vossen, P. and Soria, C. and Monachini, M.},
TITLE = {Wordnet-LMF: A Standard Representation for Multilingual Wordnets},
YEAR = {2013},
ABSTRACT = {Wordnet-lexical markup framework (LMF) is an instantiation of LMF for representing Wordnet-like semantic dictionaries. Wordnet is a widely accepted resource and thus provides a good case for testing the viability of a representation in LMF and the acceptance by a wide range of users. Wordnet-LMF was developed in the framework of the EU project KYOTO for the specific purpose of endowing a set of wordnets with a standardized interoperability format allowing the interchange of semantic information. This chapter explains the choices that were made to model the wordnet information in LMF. It provides a preliminary assessment of LMF, by large-scale application to real lexical resources, endowing wordnet with a format representation that allows easier integration among resources sharing the same structure and, more importantly, across resources with different theoretical and implementation approaches},
KEYWORDS = {KYOTO project, multilingual wordnets, Wordnet-lexical markup framework},
PAGES = {51--66},
URL = {http://dx.doi.org/10.1002/9781118712696.ch4},
DOI = {10.1002/9781118712696.ch4},
PUBLISHER = {Wiley-ISTE (Hoboken, USA)},
ISBN = {9781118712696},
CONFERENCE_PLACE = {Hoboken},
BOOKTITLE = {LMF-Lexical Markup Framework},
EDITOR = {Francopoulo, G.},
}
@EDITORIAL{BELTRAMI_2013_EDITORIAL_BLSABBDDGIGMMRVV_214457,
AUTHOR = {Beltrami, P. D. and Larson, P. C. and Squillacioti, P. C. and Artale, E. and Boccellari, A. and Burgassi, C. and De Dominicis, G. and Dotto, D. and Guadagnini, E. and Iorio Fili, D. and Giuliani, M. and Morlino, L. and Mosti, R. and Ravani, S. and Vaccaro, G. and Verlato, Z.},
TITLE = {TESORO DELLA LINGUA ITALIANA DELLE ORIGINI-Edizione online: www.vocabolario.org (ISSN 2240-5216)-Versione giugno 2013},
YEAR = {2013},
ABSTRACT = {A pdf copy of the Tesoro della Lingua Italiana delle Origini (TLIO), a dictionary of early Italian in progress, published online, as it was at the end of June 2013. TLIO is the first section of the Italian Historical Dictionary which is the mission of the OVI Institute},
KEYWORDS = {Lingua italiana, Lessico, Lessicografia},
URL = {http://tlio.ovi.cnr.it/TLIO},
ISSN = {2240-5216},
}
@EDITORIAL{SAUR_2013_EDITORIAL_SCRLMP_228630,
AUTHOR = {Saurí, R. and Calzolari, N. and Huang, C.-R. and Lenci, A. and Monachini, M. and Pustejovsky, J.},
TITLE = {Proceedings of the 6th International Conference on Generative Approaches to the Lexicon Generative Lexicon and Distributional Semantics},
YEAR = {2013},
ABSTRACT = {The papers in this volume represent some of the most recent and exciting work being carried out both within the framework of Generative Lexicon and related approaches to the lexicon and lexical resources. With the recent emphasis in natural language processing on the development of machine learning algorithms, it has become even more important for computational linguists to work on the development of linguistically informed lexical resources, for use in the annotation of corpora and creation of gold standard data for training, as well as the collation of larger theoretical datasets for investigating linguistic phenomena in greater detail and sophistication. These works contribute to this trend as well as to the further development of the mechanisms within GL for describing and explaining semantic and lexical phenomena in language},
KEYWORDS = {Generative Lexicon, Language Resources},
PAGES = {I--126},
URL = {https://aclweb.org/anthology/W/W13/W13-5400.pdf},
PUBLISHER = {Association for Computational Linguistics (Stroudsburg, USA)},
ISBN = {978-1-937284-98-5},
CONFERENCE_PLACE = {Stroudsburg},
}
@INPROCEEDINGS{BENOTTO_2013_INPROCEEDINGS_B_338145,
AUTHOR = {Benotto, G.},
TITLE = {Modelli distribuzionali delle relazioni semantiche: il caso dell'iperonimia},
YEAR = {2013},
ABSTRACT = {I modelli di semantica distribuzionale misurano la similarità semantica tra le parole, basandosi sul principio per il quale termini che appaiono in contesti simili sono semanticamente simili. Questa linea di ricerca è stata molto utilizzata negli ultimi decenni, in cui sono state proposte molte misure per il calcolo della similarità lessicale su base distribuzionale. Parole semanticamente simili possono differire per il tipo di relazione semantica che intercorre tra loro. La similarità distribuzionale è modellata principalmente da misure simmetriche, come il coseno, che ben si prestano al riconoscimento di relazioni semantiche simmetriche, come la sinonimia. Questo rende difficoltoso applicare tali modelli al riconoscimento di relazioni semantiche non simmetriche, quali iperonimia/iponimia (animale, cane) o meronimia/olonimia (finestra, palazzo). Questo lavoro si propone di valutare la possibilità di identificare e classificare la relazione di iperonimia utilizzando misure di similarità direzionali. A tale scopo è stata condotta una valutazione delle misure di similarità direzionali esistenti, nel riconoscere e classificare parole legate da iperonimia. Sono state inoltre individuate alcune caratteristiche peculiari di tale relazione, modellate in due nuove misure di similarità semantica direzionale, con risultati migliori rispetto allo stato dell'arte},
KEYWORDS = {Computational linguistics, distributional semantics},
PAGES = {85--98},
URL = {https://iris.cnr.it/handle/20.500.14243/338145},
ISBN = {978-88-98138-06-7},
CONFERENCE_NAME = {Atti del convegno 2012 del CODISCO},
BOOKTITLE = {Animali, Umani, Macchine Atti del convegno 2012 del CODISCO},
EDITOR = {Adornetti, I. and Cominetti, F.},
}
@INPROCEEDINGS{BOSCO_2013_INPROCEEDINGS_BMS_294412,
AUTHOR = {Bosco, C. and Montemagni, S. and Simi, M.},
TITLE = {Converting Italian Treebanks: Towards an Italian Stanford Dependency Treebank},
YEAR = {2013},
ABSTRACT = {The paper addresses the challenge of converting MIDT, an existing dependency-based Italian treebank resulting from the harmonization and merging of smaller resources, into the Stanford Dependencies annotation formalism, with the final aim of constructing a standard-compliant resource for the Italian language. Achieved results include a methodology for converting treebank annotations belonging to the same dependency-based family, the Italian Stanford Dependency Treebank (ISDT), and an Italian localization of the Stanford Dependency scheme},
KEYWORDS = {Italian Treebank, Harmonization and Merging of Resources, Stanford Dependencies},
PAGES = {61--69},
URL = {http://aclweb.org/anthology/W13-2308},
ISBN = {978-1-937284-58-9},
CONFERENCE_NAME = {7th Linguistic Annotation Workshop and Interoperability with Discourse},
BOOKTITLE = {Proceedings of the 7th Linguistic Annotation Workshop and Interoperability with Discourse},
}
@INPROCEEDINGS{CARDILLO_2013_INPROCEEDINGS_CAF_338718,
AUTHOR = {Cardillo, F. A. and Amato, G. and Falchi, F.},
TITLE = {Experimenting a visual attention model in the context of CBIR systems},
YEAR = {2013},
ABSTRACT = {Many novel applications in the field of object recognition and pose estimation have been built relying on local invariant features extracted from selected key points of the images. Such keypoints usually lie on high-contrast regions of the image, such as object edges. However, the visual saliency of the those regions is not considered by state-of-the art detection algorithms that assume the user is interested in the whole image. Moreover, the most common approaches discard all the color information by limiting their analysis to monochromatic versions of the input images. In this paper we present the experimental results of the application of a biologically-inspired visual attention model to the problem of local feature selection in landmark and object recognition tasks. The model uses color-information and restricts the matching between the images to the areas showing a strong saliency. The results show that the approach improves the accuracy of the classifier in the object recognition task and preserves a good accuracy in the landmark recognition task when a high percentage of visual features is filtered out. In both cases the reduction of the average numbers of local features result in high efficiency gains during the search phase that typically requires costly searches of candidate images for matches and geometric consistency checks},
KEYWORDS = {Behavioral research, Color matching, Image matching, Information retrieval},
PAGES = {45--56},
URL = {http://ceur-ws.org/Vol-964/paper8.pdf},
CONFERENCE_NAME = {IIR 2013-4th Italian Information Retrieval Workshop},
BOOKTITLE = {4th Italian Information Retrieval Workshop, IIR 2013},
}
@INPROCEEDINGS{CHIARELLA_2013_INPROCEEDINGS_CCCMMS_245105,
AUTHOR = {Chiarella, D. and Cutugno, P. and Cinini, A. and Marconi, L. and Morgavi, G. and Sbrulli, S.},
TITLE = {Análisis de documentos en red sobre la renuncia del Papa Ratzinger y la elección del Papa Francisco},
YEAR = {2013},
URL = {https://iris.cnr.it/handle/20.500.14243/245105},
ISBN = {9789597152194},
CONFERENCE_NAME = {VIII Conferencia Científica Internacional Lingüística},
}
@INPROCEEDINGS{CHIARELLA_2013_INPROCEEDINGS_CCMM_217023,
AUTHOR = {Chiarella, D. and Cutugno, P. and Marconi, L. and Morgavi, G.},
TITLE = {Mnemosynet: "una red para seguir los caminos de la memoria colectiva"},
YEAR = {2013},
PAGES = {390-394},
URL = {https://iris.cnr.it/handle/20.500.14243/217023},
VOLUME = {I},
PUBLISHER = {Centro de Lingüística Aplicada, Ministerio de Ciencia, Tecnología y Medio Ambiente (Santiago de Cuba, CUB)},
ISBN = {9789597174226},
CONFERENCE_NAME = {XII Simposio Internacional de Comunicación Social: Actualizaciones en Comunicación Social},
CONFERENCE_PLACE = {Santiago de Cuba},
BOOKTITLE = {Actualizaciones en Comunicación Social-Vol. I},
EDITOR = {Miyares, L. R. and Silva, M. R. A. and Alvarado, A. M.},
}
@INPROCEEDINGS{CIMINO_2013_INPROCEEDINGS_CDVM_227043,
AUTHOR = {Cimino, A. and Dell'Orletta, F. and Venturi, G. and Montemagni, S.},
TITLE = {Linguistic Profiling based on General-purpose Features and Native Language Identification},
YEAR = {2013},
ABSTRACT = {In this paper, we describe our approach to native language identification and discuss the results we submitted as participants to the First NLI Shared Task. By resorting to a wide set of general-purpose features qualifying the lexical and grammatical structure of a text, rather than to ad hoc features specifically selected for the NLI task, we achieved encouraging results, which show that the proposed approach is general-purpose and portable across different tasks, domains and languages},
KEYWORDS = {Native Language Identification, Linguistic Profiling},
PAGES = {207-215},
URL = {http://www.aclweb.org/anthology/W13-1727},
ISBN = {978-1-937284-47-3},
CONFERENCE_NAME = {8th workshop on "Innovative Use of NLP for Building Educational Applications"},
}
@INPROCEEDINGS{CIUNI_2013_INPROCEEDINGS_CP_405918,
AUTHOR = {Ciuni, R. and Proietti, C.},
TITLE = {Probabilistic Semantics for a Discussive Temporal Logic},
YEAR = {2013},
ABSTRACT = {The paper introduces a probabilistic semantics for the paraconsistent temporal logic Ab presented by the authors in a previous work on future contingents. Probabilistic concepts help frame two possible interpretations of the logic in question-a 'subjective' and an 'objective' one-and explaining the rationale behind both of them. We also sketch a proof-method for Ab and address some considerations regarding the conceptual appeal of our proposal and its possible future developments},
KEYWORDS = {probability, discussive logic, future contingents},
PAGES = {1-13},
URL = {https://iris.cnr.it/handle/20.500.14243/405918},
ISBN = {978-1-84890-110-0},
CONFERENCE_NAME = {Logica 2012},
}
@INPROCEEDINGS{CONNOR_2013_INPROCEEDINGS_CCMR_339508,
AUTHOR = {Connor, R. and Cardillo, F. and Moss, R. and Rabitti, F.},
TITLE = {Evaluation of Jensen-Shannon distance over sparse data},
YEAR = {2013},
ABSTRACT = {Jensen-Shannon divergence is a symmetrised, smoothed version of Küllback-Leibler. It has been shown to be the square of a proper distance metric, and has other properties which make it an excellent choice for many high-dimensional spaces in R*. The metric as defined is however expensive to evaluate. In sparse spaces over many dimensions the Intrinsic Dimensionality of the metric space is typically very high, making similarity-based indexing ineffectual. Exhaustive searching over large data collections may be infeasible. Using a property that allows the distance to be evaluated from only those dimensions which are non-zero in both arguments, and through the identification of a threshold function, we show that the cost of the function can be dramatically reduced. © 2013 Springer-Verlag},
URL = {https://iris.cnr.it/handle/20.500.14243/339508},
DOI = {10.1007/978-3-642-41062-8_16},
ISBN = {978-3-642-41061-1},
}
@INPROCEEDINGS{DELGROSSO_2013_INPROCEEDINGS_DB_262445,
AUTHOR = {Del Grosso, A. M. and Boschetti, F.},
TITLE = {Collaborative multimedia platform for computational philology},
YEAR = {2013},
ABSTRACT = {This paper aims at illustrating a collaborative and modular web platform in the domain of digital and computational philology. The proposed work deals with parallel multilingual and multimedia resources. Two case studies are discussed in order to show the flexibility of the designed platform. The reusability of the components in different projects is achieved by abstract modeling and through the application of effective design patterns. The platform deals with textual resources and associated multimedia content, which can be retrieved by the metadata and shown in parallel (e.g., the page image of a manuscript and the related transcription). The library of components will be distributed under GPL 3.0 license and available at https://github.com/CoPhi},
KEYWORDS = {Computational philology, Digital philology, Enterprise systems, Multilingualism, Parallel multimedia},
PAGES = {46-51},
URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-84905815787\&origin=inward},
ISBN = {9781627484770},
CONFERENCE_NAME = {MMEDIA 2013},
BOOKTITLE = {Proceedings of a meeting held at NexComm 2013, The Fifth International Conferences on Advances in Multimedia (MMEDIA 2013)},
EDITOR = {Davis, P.},
}
@INPROCEEDINGS{DELLORLETTA_2013_INPROCEEDINGS_DVM_227044,
AUTHOR = {Dell'Orletta, F. and Venturi, G. and Montemagni, S.},
TITLE = {Unsupervised Linguistically-Driven Reliable Dependency Parses Detection and Self-Training for Adaptation to the Biomedical Domain},
YEAR = {2013},
ABSTRACT = {In this paper, a new self-training method for domain adaptation is illustrated, where the selection of reliable parses is carried out by an unsupervised linguistically-driven algorithm, ULISSE. The method has been tested on biomedical texts with results showing a significant improvement with respect to considered baselines, which demonstrates its ability to capture both reliability of parses and domain-specificity of linguistic constructions},
KEYWORDS = {Self-training, Domain Adaptation, Biomedical Texts},
PAGES = {45-53},
URL = {http://www.aclweb.org/anthology/W13-1906},
ISBN = {978-1-937284-55-8},
CONFERENCE_NAME = {12th workshop on "Biomedical Natural Language Processing" (BioNLP)},
}
@INPROCEEDINGS{DIDONATO_2013_INPROCEEDINGS_DMFPGN_382009,
AUTHOR = {Di Donato, F. and Morbidoni, C. and Fonda, S. and Piccioli, A. and Grassi, M. and Nucci, M.},
TITLE = {Semantic annotation with Pundit: A case study and a practical demonstration},
YEAR = {2013},
ABSTRACT = {This paper discusses the application of Pundit, a novel semantic annotation tool, in the case study of Burckhardt's correspondence. In this context the occurrences of persons and places names as well as references to works of art in the letters are being semantically annotated and linked to the Web of Data. Such an experiment has a two fold goal. The first one is validating and iteratively improving Pundit as a tool for creating and making explicit the information "hidden" in the letters. The second is to investigate how such knowledge can be presented and visualized to be actually useful for scholars themselves. Leveraging on Semantic Web technologies and on the Open Annotation data model, scholars' collaboratively created annotations are coherently merged with the metadata already present in the DL and exposed via REST APIs to build a number of alternative ways of visualizing the knowledge graph. We claim this approach fosters a "virtuous circle" where the new knowledge produced by scholars can, in turn, become the starting point for new researches. This paper discusses the preliminary results of this ongoing project, presenting requirements and a first visualization prototype. © 2013 ACM},
URL = {https://iris.cnr.it/handle/20.500.14243/382009},
DOI = {10.1145/2517978.2517995},
}
@INPROCEEDINGS{FERRARI_2013_INPROCEEDINGS_FSD_253217,
AUTHOR = {Ferrari, A. and Spagnolo, G. and Dell'Orletta, F.},
TITLE = {Mining commonalities and variabilities from natural language documents},
YEAR = {2013},
ABSTRACT = {A company who wishes to enter an established market with a new, competitive product is required to analyse the product solutions of the competitors. Identifying and comparing the features provided by the other vendors might greatly help during the market analysis. However, mining common and variant features from the publicly available documents of the competitors is a time consuming and error-prone task. In this paper, we suggest to employ a natural language processing approach based on contrastive analysis to identify commonalities and variabilities from the brochures of a group of vendors. We present a first step towards a practical application of the approach, in the context of the market of Communications-Based Train Control (CBTC) systems},
KEYWORDS = {Software Product Lines, Variability Mining, CBTC, D.2 SOFTWARE ENGINEERING, 68N30},
PAGES = {116-120},
URL = {http://dl.acm.org/citation.cfm?id=2491634},
ISBN = {978-1-4503-1968-3},
CONFERENCE_NAME = {SPLC 2013-17th International Software Product Line Conference},
EDITOR = {Kishi, T.},
}
@INPROCEEDINGS{FRONTINI_2013_INPROCEEDINGS_FDM_226376,
AUTHOR = {Frontini, F. and Del Gratta, R. and Monachini, M.},
TITLE = {Linking the Geonames ontology to WordNet},
YEAR = {2013},
ABSTRACT = {This paper illustrates the transformation of the GeoNames ontology concepts, with their English labels and glosses, into a GeoDomain WordNet-like resource in English, its translation into Italian, and its linking to the existing generic WordNets of both languages},
KEYWORDS = {GeoNames, WordNet, lemon},
PAGES = {263-267},
URL = {http://hnk.ffzg.hr/bibl/ltc2013/book/papers/OWN-2.pdf},
PUBLISHER = {Fundacja Uniwersytetu im A. Mickiewicza (Poznan, POL)},
ISBN = {978-2-9517408-8-4},
CONFERENCE_NAME = {6th Language \& Technology Conference: Human Language Technologies as a Challenge for Computer Science and Linguistics},
CONFERENCE_PLACE = {Poznan},
BOOKTITLE = {Human Language Technologies as a Challenge for Computer Science and Linguistics. Proceedings, 6th Language \& Technology Conference, December 7-9, 2013, Poznań, Poland},
EDITOR = {Vetulani, Z. and Uszkoreit, H.},
}
@INPROCEEDINGS{GRASSI_2013_INPROCEEDINGS_GMNFD_382003,
AUTHOR = {Grassi, M. and Morbidoni, C. and Nucci, M. and Fonda, S. and Di Donato, F.},
TITLE = {Pundit: Creating, exploring and consuming semantic annotations},
YEAR = {2013},
ABSTRACT = {This paper presents Pundit, a novel semantic web annotation tool, and demonstrates its use in producing structured data out of users' annotations. Pundit allows communities of scholars to produce machine-readable annotations that can be made public and thus consumable as web data via SPARQL and ad-hoc REST APIs. Pundit is highly configurable and can be deployed in custom instances to include well-defined and agreed annotation vocabularies. Such instances can be distributed as bookmarklets to community users so they can create uniformly structured data in a certain application scenario. Basing on the provided APIs, some demonstrative applications have been developed, exploring different use scenarios, ranging from philosophy to journalism and cultural heritage. The main aim of this paper is to demonstrate how such uniformly structured annotations can be quickly re-used on the web to make information discoverable or to visualize it in interesting ways},
URL = {https://iris.cnr.it/handle/20.500.14243/382003},
}
@INPROCEEDINGS{GUADAGNINI_2013_INPROCEEDINGS_G_265236,
AUTHOR = {Guadagnini, E.},
TITLE = {Cicéron et Boèce en Orient: quelques réflexions sur la "Rectorique" de Jean d'Antioche},
YEAR = {2013},
ABSTRACT = {Il lavoro analizza le fonti (dirette e indirette) della "divisio scientiae" e del capitolo sul "metodo" del traduttore presenti nella "Rectorique" di Jean d'Antioche},
KEYWORDS = {Filologia romanza, Jean d'Antioche, Lessico tecnico, Volgarizzamenti},
PAGES = {37-46},
URL = {https://iris.cnr.it/handle/20.500.14243/265236},
VOLUME = {15},
PUBLISHER = {Brepols (Turnhout, BEL)},
ISBN = {9782503549095},
CONFERENCE_NAME = {The Medieval Translator 2010 In Principio Fuit Interpres. The Cardiff Conference on the Theory and Practice of Translation in the Middle Ages},
CONFERENCE_PLACE = {Turnhout},
BOOKTITLE = {The Medieval Translator. Traduire au Moyen Age, vol. 15, In Principio Fuit Interpres},
EDITOR = {Petrina, A.},
}
@INPROCEEDINGS{GUADAGNINI_2013_INPROCEEDINGS_G_265238,
AUTHOR = {Guadagnini, E.},
TITLE = {Per una nuova edizione della Rettorica di Brunetto Latini},
YEAR = {2013},
ABSTRACT = {Studio preparatorio per una nuova edizione della "Rettorica": descrizione dello stemma codicum e discussione di due passi (in cui occorrono rispettivamente il lessema "giuridiziale", assente nell'ed. Maggini ma a mio avviso da restituire a testo, e il lessema "managio", sic nell'ed. Maggini ma a mio avviso lezione erronea)},
KEYWORDS = {Filologia italiana, Brunetto Latini, Lessicografia},
PAGES = {211-221},
URL = {https://iris.cnr.it/handle/20.500.14243/265238},
PUBLISHER = {Walter De Gruyter \& Co (Berlin, DEU)},
ISBN = {9783110300017},
CONFERENCE_NAME = {XXVI Congreso Internacional de Lingüística y Filología Románica},
CONFERENCE_PLACE = {Berlin},
BOOKTITLE = {Actas del XXVI Congreso Internacional de Lingüística y Filología Románica},
EDITOR = {Casanova Herrero, E. and Calvo Rigual, C.},
}
@INPROCEEDINGS{KHAN_2013_INPROCEEDINGS_KFDMQ_259365,
AUTHOR = {Khan, F. and Frontini, F. and Del Gratta, R. and Monachini, M. and Quochi, V.},
TITLE = {Generative Lexicon Theory and Linguistic Linked Open Data},
YEAR = {2013},
ABSTRACT = {In this paper we look at how Generative Lexicon theory can assist in providing a more thorough definition of word senses as links between items in a RDF-based lexicon and concepts in an ontology. We focus on the definition of lexical sense in lemon and show its limitations before defining a new model based on lemon and which we term lemonGL. This new model is an initial attempt at providing a way of structuring lexico-ontological resources as linked data in such a way as to allow a rich representation of word meaning (following the GL theory) while at the same time (attempting to) remain faithful to the separation between the lexicon and the ontology as recommended by the lemon model},
URL = {https://iris.cnr.it/handle/20.500.14243/259365},
ISBN = {978-1-937284-98-5},
}
@INPROCEEDINGS{MARCHETTI_2013_INPROCEEDINGS_MTALDFM_226423,
AUTHOR = {Marchetti, A. and Tesconi, M. and Abbate, S. and Lo Duca, A. and D'Errico, A. and Frontini, F. and Monachini, M.},
TITLE = {Tour-pedia: a web application for the analysis and visualization of opinions for tourism domain},
YEAR = {2013},
ABSTRACT = {We present Tour-pedia an interactive web application that extracts opinions from reviews of accommodations from different sources available on-line. Polarity markers display on a map the different opinions. This tool is intended to help business operators to manage reputation on-line},
KEYWORDS = {Visualization tools, opinion mining, NLP on social media, tourism reviews},
PAGES = {594-595},
URL = {http://www.iit.cnr.it/sites/default/files/ltc2013_opener_demo.pdf},
PUBLISHER = {Fundacja Uniwersytetu im A. Mickiewicza (Poznan, POL)},
ISBN = {978-83-932640-4-9},
CONFERENCE_NAME = {6th Language \& Technology Conference: Human Language Technologies as a Challenge for Computer Science and Linguistics},
CONFERENCE_PLACE = {Poznan},
EDITOR = {Vetulani, Z. and Uszkoreit, H.},
}
@INPROCEEDINGS{MARCONI_2013_INPROCEEDINGS_MCCMS_245106,
AUTHOR = {Marconi, L. and Cutugno, P. and Chiarella, D. and Morgavi, G. and Sassi, M.},
TITLE = {Análisis de Blogs y Temas en "Narrarsi in rete: linguaggi a confronto"},
YEAR = {2013},
URL = {https://iris.cnr.it/handle/20.500.14243/245106},
ISBN = {9789597152194},
CONFERENCE_NAME = {VIII Conferencia Científica Internacional Lingüística},
}
@INPROCEEDINGS{MARINELLI_2013_INPROCEEDINGS_MC_254622,
AUTHOR = {Marinelli, R. and Cignoni, L.},
TITLE = {A Latin-Italian Database linked to the English language},
YEAR = {2013},
ABSTRACT = {This paper describes an ongoing research conducted at the Institute for Computational Linguistics (ILC) of the National Research Council (CNR) in Pisa, concerning the creation of a lexical semantic database for the Latin language, with its Italian and English translation. As we all know, many words of the Italian language derive from Latin, in the same way as many Latin words and expressions are used in everyday Italian language. The aim of this work is to exploit a well-known and tested conceptual model to construct a resource that can be easily consulted by the students of high school and university who wish to achieve proficiency in Latin language learning and deeper awareness of the use of Italian. The database is of a relational type, following the EuroWordNet (EWN)/ItalWordNet (IWN) model, according to the WordNet (WN) philosophy perspective. The items included in the database are clustered into approximately 250 synsets, which are sets of one or more synonyms, for example carina, navis (ship). Each Latin synset is linked to other words (or synsets) by means of semantic 'internal relations' of the hierarchical-vertical type (or 'is-a' relations) and of the horizontal type (role, means, purpose, sub-event, instance, etc. relations), on the basis of the model. One of the most important characteristics of the database is the possibility of connecting the Latin words to the equivalent English synonyms (or near synonyms), included in the Princeton database WordNet, by means of 'equivalence relations'. 'Plug-in relations connect each word of the Latin lexicon to the equivalent synset (synonym) of the Italian WordNet (IWN), as a kind of hookup point from which it is possible to see the Italian synonym with all its semantic relations. The study of all these kinds of relations can support the students in the learning of the Latin language, linked to Italian as well as to English. 
The database currently contains 200 nouns and 50 verbs, drawn from the most recent version of the Campanini-Carboni's Latin and Italian Dictionary (2011), and from William's Vocabulary for Speaking Latin (1829). A set of adjectives and adverbs will be codified in the near future, in order to represent all the grammatical categories and a small group of proper names will also be included to enrich the resource. Particular attention is paid to the Latin words that are used in everyday spoken and written Italian, for instance virus, medium, video, etc. The management tool of the database allows to visualize each Latin word inserted in the database, the Italian translation with its definition, the link with the English language, and slots showing additional information on request about its etymology, history, derivates, declension or conjugation. The Latin concept is represented as a node in the net of connections in its semantic field},
URL = {https://iris.cnr.it/handle/20.500.14243/254622},
ISBN = {978-84-616-3822-2},
}
@INPROCEEDINGS{MARINELLI_2013_INPROCEEDINGS_MC_254616,
AUTHOR = {Marinelli, R. and Cignoni, L.},
TITLE = {How to Integrate CLIL Maritime Courses in English with Idioms Derived from Specialized Lexical Semantic Databases},
YEAR = {2013},
ABSTRACT = {This paper is a proposal for better learning of idiomatic seafaring expressions to be exploited in Content and Language Learning (CLIL) maritime English courses. These courses are specifically designed for individuals with little or no prior knowledge of maritime language, wishing to undertake professional training in Naval Academies or to embark on a career as officers, engineers or crew members, or to work in import-export companies, tour operators and shipping agencies. The starting point of our research was a set of idiomatic expressions included and structured in a lexical database of maritime terminology (Mariterm), organized in semantic relations and containing around 3500 Italian lemmas, clustered into approximately 2,500 synsets (sets of one or more synonyms), e.g.: affondare, andare a fondo (to sink). Each term is linked to other terms of the specialized lexicon by means of lexical semantic relations, and the definition of each word in both languages and the translation into English is provided. A number of phraseological expressions and sayings, for instance seguire la corrente (to go with the tide) in Italian, "to hold course" in English, as well as information of a historical type, have been included in the database. As the terminology contained in Mariterm is constantly connected to the English language, we thought it was worth highlighting the English idiomatic expression with its translation into Italian, despite the fact that the Italian expressions sometimes belong to other semantic fields. The single or multiword expressions can be equivalent and idiomatic in both languages (essere sulla stessa barca/"to be in the same boat"); or can be idiomatic in one of the two languages but not in the other (essere un porto di mare/"to be like Piccadilly Circus"); or, vice versa, "sail close to the wind"/camminare sul filo del rasoio, thus highlighting similarities and differences related to concept representation in the two languages. 
In some cases, the terminological database managing tool allows for visualization of etymological or historical information related to the idiomatic expression sought for. Idioms are widely used in everyday language, and their complex constructions make them extremely difficult to understand, let alone to use, for non-native speakers. Some phrases referable to the seafaring field are clear, eg.: "to go with the flow" (continue in the same way as others), while others require background knowledge of their historical origin in order to be understood and better memorized, e. g.: "feeling blue" (to describe a feeling of sadness). Starting from the terminological database and using different and appropriate exercises, each phraseological item is provided with a definition, the Italian equivalent when it exists, and information about its origins. We present each idiom highlighting some variations, and giving when possible example sentences in context from well known and validated sources of various types (web sites, specialized maritime journals, handbooks, grey literature, newsletters and other publications), which can help the learner understand when and how a particular idiom is used and to illustrate important grammar points of the English language, making the learning process more interesting and appealing},
KEYWORDS = {CLIL, phraseology, maritime terminology, lexical semantic databases, grammar},
PAGES = {6666-6673},
URL = {https://iris.cnr.it/handle/20.500.14243/254616},
PUBLISHER = {International Association of Technology, Education and Development (IATED) (Valencia, ESP)},
ISBN = {978-84-616-2661-8},
CONFERENCE_NAME = {INTED2013. 7th International Technology, Education and Development Conference},
CONFERENCE_PLACE = {Valencia},
BOOKTITLE = {INTED2013. 7th International Technology, Education and Development Conference. Valencia (Spain), 4th-6th of March, 2013. Proceedings},
EDITOR = {Chova, L. G. and Martínez, A. L. and Torres, I. C.},
}
@INPROCEEDINGS{MARZI_2013_INPROCEEDINGS_M_225696,
AUTHOR = {Marzi, C.},
TITLE = {Innovation, language, and the web},
YEAR = {2013},
ABSTRACT = {Language and innovation are inseparable. Language conveys ideas which are essential in innovation, establishes the most immediate connections with our conceptualisation of the outside world, and provides the building blocks for communication. Every linguistic choice is necessarily meaningful, and it involves the parallel construction of form and meaning. From this perspective, language is a dynamic knowledge construction process. In this article, emphasis will be laid on investigating how words are used to describe innovation, and how innovation topics can influence word usage and collocational behaviour. The lexical representation of innovative knowledge in a context-based approach is closely related to the representation of knowledge itself, and gives the opportunity to reduce the gap between knowledge representation and knowledge understanding. This will bring into focus the dynamic interplay between lexical creativity and innovative pragmatic contexts, and the necessity for a dynamic semantic shift from context-driven vagueness to domain-driven specialisation},
KEYWORDS = {Grey literature, Language technologies, Lexical productivity, Web corpora},
PAGES = {153-159},
URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-84924135180\&origin=inward},
VOLUME = {14},
PUBLISHER = {TextRelease (Amsterdam, NLD)},
ISSN = {1386-2316},
ISBN = {9789077484203},
CONFERENCE_NAME = {Fourteenth International Conference on Grey Literature},
CONFERENCE_PLACE = {Amsterdam},
BOOKTITLE = {THE GL-CONFERENCE SERIES. CONFERENCE PROCEEDINGS},
EDITOR = {Farace, D. J. and Frantzen, J. and Greynet},
}
@INPROCEEDINGS{MONEGLIA_2013_INPROCEEDINGS_MPGMRDKF_226438,
AUTHOR = {Moneglia, M. and Panunzi, A. and Gagliardi, G. and Monachini, M. and Russo, I. and De Felice, I. and Khan, F. and Frontini, F.},
TITLE = {IMAGACT E-learning Platform for Basic Action Types},
YEAR = {2013},
ABSTRACT = {Action verbs express important information in a sentence and they are the most frequent elements in speech, but they are also one of the most difficult part of the lexicon to learn for L2 language learners, because languages segment these concepts in very different ways. The two sentences "Mary folds her shirt" and "Mary folds her arms" refer to two completely different types of action, as becomes evident when they are translated into another language (e. g., in Italian they would be translated as "Maria piega la camicia" and "Maria incrocia le braccia" respectively). IMAGACT e-learning platform aims to make these differences evident by creating a cross-linguistic ontology of action types, whose nodes consist of 3D scenes, each of which relates to one action type. In order to identify these types, contexts of use have been extracted from English and Italian spontaneous speech corpora for around 600 high frequency action verbs (for each language). All instances that refer to similar events (e. g., fold the shirt/ the blanket) are grouped under one single action type: each one of these types is then represented by a linguistic best example and a short video that represents simple actions (e. g. a man taking a glass from a table). The action types extracted for Italian and English are compared and merged into one cross-linguistic ontology of action. IMAGACT has provided an internet based annotation infrastructure to derive this information from corpora. The project is now completed for the Italian and English lexicon, data extraction for Chinese and Spanish is ongoing. Reference to prototypical imagery is crucial in order to bootstrap the learning process. By selecting the set of 3D scenes referred to by a verb in one language and viewing the type of activity represented therein learners can directly understand the range of applicability of each verb. 
Thanks to an easy interface, a user can access the English/Italian/Chinese lexicon by lemma or directly by 3D scenes. For example, searching for the verb "to turn", s/he will be presented with a number of scenes, showing the various action types associated to that verb. Clicking on a scene s/he will know how this type of action is referred to in the other languages},
KEYWORDS = {Ontology},
PAGES = {85-89},
URL = {https://iris.cnr.it/handle/20.500.14243/226438},
PUBLISHER = {libreriauniversitaria.it (Limena, ITA)},
ISBN = {978-88-6292-423-8},
CONFERENCE_NAME = {International Conference "ICT for Language Learning", 6th edition},
CONFERENCE_PLACE = {Limena},
BOOKTITLE = {Conference Proceedings. ICT for Language Learning},
EDITOR = {Pixel},
}
@INPROCEEDINGS{MONTANI_2013_INPROCEEDINGS_MARBCMSTSBP_245515,
AUTHOR = {Montani, C. and Andronico, P. and Raviolo, C. and Bozzi, A. and Codenotti, B. and Meghini, C. and Sommani, M. and Tarabella, L. and Scopigno, R. and Baraglia, R. and Perego, R.},
TITLE = {Il CNR dopo la CEP},
YEAR = {2013},
ABSTRACT = {A short history of some of the ICT issues developed in the Institutes of CNR in Pisa since the 60s and that, in the opinion of the authors, had its roots in the CEP (Pisa Electronic Computer)},
KEYWORDS = {Storia dell'Informatica, K.2 HISTORY OF COMPUTING},
PAGES = {41-66},
URL = {https://iris.cnr.it/handle/20.500.14243/245515},
ISBN = {978-88-6741-303-4},
CONFERENCE_NAME = {La CEP prima della CEP: storia dell'informatica. Atti},
EDITOR = {Cignoni, G. A. and Gadducci, F.},
}
@INPROCEEDINGS{MORGAVI_2013_INPROCEEDINGS_MMMC_181756,
AUTHOR = {Morgavi, G. and Morando, M. and Marconi, L. and Cutugno, P.},
TITLE = {Turn Taking: A Tool for Dialog Processes},
YEAR = {2013},
ABSTRACT = {Turn-taking is the process by which participants in a conversation alternate speech and silence, it is an essential component of spoken interaction. In order to lead productive conversations, people need not only know what to say but also when to say it. Usually, we evaluate the whole communication process focusing our attention on semantic meanings of exchanged words, but actually this analysis cannot be automatically performed. In this paper we propose a method to extract information on the dynamics of the dialog processes through simple turn-taking quantitative measurements. Over 1000 research interviews made from students during their psychology university course have been analyzed. Each whole interview process has been considered as a complex system evolving in the time. Our approach founds on analogies between interviews and mathematical chaotic processes. The proposed procedure allows the extraction of information on the dialog evolution: phase portraits with anomalous paths indicate situations where the communication has been troubled from external references},
URL = {https://iris.cnr.it/handle/20.500.14243/181756},
ISBN = {978-1-61804-155-5},
}
@INPROCEEDINGS{MLLER_2013_INPROCEEDINGS_MD_382011,
AUTHOR = {Müller, S. and Di Donato, F.},
TITLE = {Burckhardtsource.org. A semantic digital edition of the correspondence to Jacob Burckhardt},
YEAR = {2013},
ABSTRACT = {A description of the Digital Library Burckhardtsource.org},
URL = {https://iris.cnr.it/handle/20.500.14243/382011},
}
@INPROCEEDINGS{PARDELLI_2013_INPROCEEDINGS_PGS_184947,
AUTHOR = {Pardelli, G. and Goggi, S. and Sassi, M.},
TITLE = {Open Grey for Language Technology: a ride on the network},
YEAR = {2013},
ABSTRACT = {The aim of this paper is to introduce the Open Access movement for Natural Language Processing (NLP) by means of a wide range of open access Grey Literature documentation available on the web. In 2008 Robert Dale, in the last issue of volume 35 of Computational Linguistics said: "There are a number of definitions of the term 'open access' in circulation, but almost all share the key principle that scientific literature should be freely available for all to read, download, copy, distribute, and use (with appropriate attribution) without restriction". At first glance it might seem that the Open Access movement has gradually become more influential in the field of language technology by building repositories accessible through the network. Today's digital archives are niches of intellectual production spread by means of a wide range of documents (such as journal articles and proceedings) which, paradoxically, the search engines do not always reach. The use of inappropriate terms in the formulation of queries and the fragmentation of repositories in this area of investigation does not allow to retrieve information on a large scale. The full paper, after a first introductory section, will be organized in two sections: 1) the first dedicated to the methodology for searching and tracing open access resources and to the criteria for analyzing and selecting the online documentation; 2) the second devoted to a description of the state-of-the-art of Open Access Grey Literature material in a statistical and thematic scenario. As things stand, standardization of computational systems interconnected by links and tools of various nature allowing Internet users to easily retrieve the information that the web naturally makes available would then be essential. Topics: Sustainability, Public Accessible Resources, Product and Service enhancements, Open Access, Curation and Preservation},
KEYWORDS = {Open Access Movement, Natural Language Processing},
PAGES = {161--165},
URL = {https://iris.cnr.it/handle/20.500.14243/184947},
PUBLISHER = {TEXTRELEASE, GL PROGRAM \& CONFERENCE BUREAU (Amsterdam, NLD)},
ISSN = {1386-2316},
ISBN = {978-90-77484-20-3},
CONFERENCE_NAME = {GL14 Fourteenth International Conference on Grey Literature. Tracking Innovation Through Grey Literature},
CONFERENCE_PLACE = {Amsterdam},
BOOKTITLE = {THE GL-CONFERENCE SERIES. CONFERENCE PROCEEDINGS},
EDITOR = {Farace, D. J. and Frantzen, J. and Greynet},
}
@INPROCEEDINGS{RUSSO_2013_INPROCEEDINGS_RC_228499,
AUTHOR = {Russo, I. and Caselli, T.},
TITLE = {Changeable Polarity of Verbs through Emotions' Attribution in Crowdsourcing Experiments},
YEAR = {2013},
ABSTRACT = {Sentiment analysis and emotion detection are tasks with common features but rarely related because they tend to categorize the objects of their studies according to different categories, i.e. positive, negative and neutral values in SA, and emotion labels such as "joy", "anger" etc. in emotion detection. In this paper we try to bridge this gap, reporting on three crowdsourcing experiments to collect speakers' intuitions on emotion(s) associated with events denoted by verbs and propose to set contextual polarity values on the basis of the selected emotions. In this way we suggest a methodology to handle connotational meanings of verbs that can help to refine automatic sentiment analysis on social media, where shared contents are often short reports on pleasant or unpleasant events and activities},
KEYWORDS = {emotion attribution, connotations of verbs, empathy},
PAGES = {131--139},
URL = {http://ceur-ws.org/Vol-1096/paper9.pdf},
CONFERENCE_NAME = {First International Workshop on Emotion and Sentiment in Social and Expressive Media: approaches and perspectives from AI (ESSEM 2013) A workshop of the XIII International Conference of the Italian Association for Artificial Intelligence (AI*IA 2013)},
BOOKTITLE = {Proceedings of the First International Workshop on Emotion and Sentiment in Social and Expressive Media: approaches and perspectives from AI (ESSEM 2013) A workshop of the XIII International Conference of the Italian Association for Artificial Intelligence (AI*IA 2013)},
EDITOR = {Battaglino, C. and Bosco, C. and Cambria, E. and Damiano, R. and Patti, V. and Rosso, P.},
}
@INPROCEEDINGS{RUSSO_2013_INPROCEEDINGS_RDFKM_257360,
AUTHOR = {Russo, I. and De Felice, I. and Frontini, F. and Khan, F. and Monachini, M.},
TITLE = {(Fore)seeing actions in objects. Acquiring distinctive affordances from language},
YEAR = {2013},
ABSTRACT = {In this paper we investigate if conceptual information concerning objects' affordances as possibilities for actions anchored to an object can be at least partially acquired through language. Considering verb-noun pairs as the linguistic realizations of relations between actions performed by an agent and objects we collect this information from the ImagAct dataset, a linguistic resource obtained from manual annotation of basic action verbs, and from a web corpus (itTenTen). The notion of affordance verb as the most distinctive verb in ImagAct enables a comparison with distributional data that reveal how lemmas ranking based on a semantic association measure that mirror that of affordances as the most distinctive actions an object can be involved in},
PAGES = {151--161},
URL = {https://docs.google.com/viewer?a=v&pid=sites&srcid=ZGVmYXVsdGRvbWFpbnxubHBjczIwMTN8Z3g6MTI0ZGMzYWYwYmMxNjY1Mg},
CONFERENCE_NAME = {NLPCS 2013 -- 10th International Workshop on Natural Language Processing and Cognitive Science},
BOOKTITLE = {Proceedings of NLPCS 2013 -- 10th International Workshop on Natural Language Processing and Cognitive Science},
EDITOR = {Sharp, B. and Zock, M.},
}
@INPROCEEDINGS{RUSSO_2013_INPROCEEDINGS_RFDKM_227078,
AUTHOR = {Russo, I. and Frontini, F. and De Felice, I. and Khan, F. and Monachini, M.},
TITLE = {Disambiguation of Basic Action Types through Nouns' Telic Qualia},
YEAR = {2013},
ABSTRACT = {Knowledge about semantic associations between words is effective to disambiguate word senses. The aim of this paper is to investigate the role and the relevance of telic information from SIMPLE in the disambiguation of basic action types of Italian HOLD verbs (prendere, 'to take', raccogliere, 'to pick up', pigliare 'to grab' etc.). We propose an experiment to compare the results obtained with telic information from SIMPLE with basic co-occurrence information extracted from corpora (most salient verbs modifying nouns) classified in terms of general semantic classes to avoid data sparseness},
PAGES = {70--75},
URL = {http://www.aclweb.org/anthology/W13-5410},
PUBLISHER = {Association for Computational Linguistics (Stroudsburg, USA)},
ISBN = {978-1-937284-98-5},
CONFERENCE_NAME = {6th International Conference on Generative Approaches to the Lexicon Generative Lexicon and Distributional Semantics},
CONFERENCE_PLACE = {Stroudsburg},
BOOKTITLE = {Proceedings of the 6th International Conference on Generative Approaches to the Lexicon. Generative Lexicon and Distributional Semantics},
EDITOR = {Saurí, R. and Calzolari, N. and Huang, C. R. and Lenci, A. and Monachini, M. and Pustejovsky, J.},
}
% NOTE(review): EDITOR was exported as "Miyares, L. R. and Alvarado, M. R. A. S. Y. A. M." (Spanish "y" folded into
% the initials, two editors merged). The second and third names below are a reconstruction; confirm against the proceedings.
@INPROCEEDINGS{SASSI_2013_INPROCEEDINGS_SBP_183628,
AUTHOR = {Sassi, M. and Biagioni, S. and Pardelli, G.},
TITLE = {A linguistic and gender approach to 1841 Tuscany population Census},
YEAR = {2013},
ABSTRACT = {The Census of 1841 in Tuscany was first official data registry which tried to describe Tuscan population as a whole on granducal basis. With the use of special ad hoc created forms all demographic and socioeconomic characteristics of families and single persons in "Granducato di Toscana" were described. These data of Census, now kept by the State Archive of Florence, supply a precious source for studies of all different aspects of the population and include following information: name, surname, age, gender, marital status, employment, religion, schoolarity, "social status". In the registers for each community and parish a full account is given of homes, resident families, and composition of families including family servants. Each of those entities had a proper incremental code number. [Registers were generated and updated by priests, who at that time were only surely scholarised officers widespread on territory, that is why they are divided by parish, which is an administrative unit typical of canonic right, instead of quarters or "rioni" or "contrade" which instead had been long practiced in civil right. ] During early 80: s the research group of prof. Biagioli of Department of Modern History of Pisa University, charged the computational linguistic Institute of CNR with digitalization and the electronic processing of these data as well as of data from "Catasto" [public registry of buildings and land ownership] to enable statistical, demographical, historical, sociological and economic analysis. In this work the authors have used the only partially usable subset of data left of that work, concerning four communities in the province of Pisa i.e. actual Bièntina, Càscina, Pontedera and San Giuliano Terme (at that time named "Baths of San Giuliano") and is more concerned with terminological and lexical issues a gender related analysis of work and craftmanships. Each of the four communities has its own peculiar profile.
Work is developed in 5 points: a) Informatics retrieval of linguistic information from Tuscany of 1800 focused by the arts and craftmanships more in use in families of that time, b) gender division of works and craftmanships, c) observation of lexical disparity in the four communities and terminological curiosities of that historical period, d) actually no longer existing craftmanships, e) diacronic analysis of communities, where possible. In this scenery the authors will introduce the methodology they employed for data analysis. Tables and graphs will be used to better focus different moments and results of work. The authors give the English translation of the terms extracted from the Corpus (see Appendix Glossary)},
KEYWORDS = {1841 Tuscany Population Census, Terminology},
PAGES = {200--205},
URL = {https://iris.cnr.it/handle/20.500.14243/183628},
PUBLISHER = {Centro de Lingüística Aplicada, Ministero de Ciencia, Tecnología y Medio Ambiente (Santiago de Cuba, CUB)},
ISBN = {978-959-7174-22-6},
CONFERENCE_NAME = {XIII Simposio Internacional de Comunicación Social -- Actualizaciones en Comunicación Social},
CONFERENCE_PLACE = {Santiago de Cuba},
EDITOR = {Miyares, L. R. and Álvarez Silva, M. R. and Muñoz Alvarado, A.},
}
% NOTE(review): ISSN and BOOKTITLE copied from the other entries in this file that carry the same ISBN
% (978-90-77484-20-3, GL14 proceedings); confirm this paper belongs to that volume.
@INPROCEEDINGS{SASSOLINI_2013_INPROCEEDINGS_SCP_227909,
AUTHOR = {Sassolini, E. and Cucurullo, S. and Picchi, E.},
TITLE = {Semantic networks for improved access to biomedical databases},
YEAR = {2013},
URL = {https://iris.cnr.it/handle/20.500.14243/227909},
ISSN = {1386-2316},
ISBN = {978-90-77484-20-3},
BOOKTITLE = {THE GL-CONFERENCE SERIES. CONFERENCE PROCEEDINGS},
}
@INPROCEEDINGS{SASSOLINI_2013_INPROCEEDINGS_SSCCSS_227915,
AUTHOR = {Sassolini, E. and Sassi, M. and Cucurullo, S. and Cinini, A. and Sbrulli, S.},
TITLE = {I testi antichi: un patrimonio culturale da conservare e riutilizzare DIDAMATICA 2013, tecnologie e metodi per la didattica del futuro},
YEAR = {2013},
URL = {https://iris.cnr.it/handle/20.500.14243/227915},
ISBN = {978-88-98091-10-2},
}
@INPROCEEDINGS{SASSOLINI_2013_INPROCEEDINGS_SECSP_227907,
AUTHOR = {Sassolini, E. and Cinini, A. and Sbrulli, S. and Picchi, E.},
TITLE = {Tools and Resources Supporting the Cultural Tourism},
YEAR = {2013},
ABSTRACT = {The diffusion of internet and the information technologies are creating continuous information flows. There is a widespread awareness of the added value and of the role that the Web has in dissemination, exploitation and promotion of the cultural tourism, especially in a country like Italy, where the cultural heritage is very important. Moreover, an open philosophy causes problems of authoritativeness in the production of contents because it is characterized by a strong interaction among users thus creating a distance between knowledge and communication. The spread of internet has brought the significant changes of communication paradigm. Nowadays the competition decreases among contents, even among from sources published in potential competition with them. In network logic, all nodes are interdependent and represent a single large hypertext. The proliferation of paths boosts a free circulation of ideas and can bring out most interesting contents},
URL = {https://iris.cnr.it/handle/20.500.14243/227907},
ISSN = {1386-2316},
ISBN = {978-90-77484-20-3},
BOOKTITLE = {THE GL-CONFERENCE SERIES. CONFERENCE PROCEEDINGS},
}
@INPROCEEDINGS{SORIA_2013_INPROCEEDINGS_SM_119264,
AUTHOR = {Soria, C. and Mariani, J.},
TITLE = {Searching LTs for minority languages},
YEAR = {2013},
ABSTRACT = {Les Technologies de la Langue (TL) sont un instrument nécessaire pour toutes les langues, en particulier celles qui aspirent à conquérir un espace dans les dispositifs numériques. Les langues qui ne sont pas équipées de technologies sont sérieusement menacées d'extinction numérique dans le long terme. Le projet META-NET a évalué l'état actuel des TL pour 30 langues européennes. Mais qu'en est-il des langues régionales et minoritaires ? Très peu d'informations sont disponibles pour elles. Dans cet article, nous présentons d'abord les données disponibles dans la LRE Map. Nous plaidons ensuite en faveur d'une campagne donnant une image complète des TL existant pour les langues minoritaires et régionales d'Europe. Cela aidera les décideurs, les chercheurs et les développeurs à planifier une feuille de route pour doter toutes les langues des instruments nécessaires pour fonctionner comme des langues correctement équipées dans l'ère numérique. Un recensement des TL disponibles et nécessaires est ainsi proposé},
KEYWORDS = {Lingue regionali e minoritarie, risorse linguistiche, tecnologie linguistiche},
PAGES = {235--247},
URL = {http://www.taln2013.org/actes/www/TALARE-2013/actes/talare-2013-long-005.pdf},
CONFERENCE_NAME = {TALARE 2013: Traitement Automatique des Langues Régionales de France et d'Europe},
BOOKTITLE = {Actes de TALARE 2013: Traitement Automatique des Langues Régionales de France et d'Europe},
EDITOR = {Morin, E. and Estève, Y.},
}
@INPROCEEDINGS{SORIA_2013_INPROCEEDINGS_SMZ_257950,
AUTHOR = {Soria, C. and Mariani, J. and Zoli, C.},
TITLE = {Dwarfs sitting on the giants' shoulders -- how LTs for regional and minority languages can benefit from piggybacking major languages},
YEAR = {2013},
ABSTRACT = {LTs are a necessary instrument for all languages, especially for those aiming at conquering a space over digital devices. Languages that are not equipped with LT seriously face digital extinction in the long run. Many challenges are to be faced to equip minority languages with LTs (from basic to advanced): the almost complete lack of knowledge about available resources and technologies, the substantial delay in development of basic technologies, the lack of cooperation among minority languages communities, the chronic shortage of funding (in particular for minority languages not officially recognized, yet often the most vital ones over the Internet) and the limited economic value placed over LTs for minority languages by the digital market rules. In this paper we suggest how these challenges can be overcome, and how coordinated and standardized cooperation among all interested stakeholders can lead to better knowledge and awareness of the breadth and depth of available technologies},
PAGES = {73--79},
URL = {https://iris.cnr.it/handle/20.500.14243/257950},
ISBN = {978-0-9560210-5-2},
CONFERENCE_NAME = {XVII FEL Conference},
BOOKTITLE = {Proceedings of the XVII FEL Conference},
EDITOR = {Norris, M. J. and Anonby, E. and Junker, M. O. and Ostler, N. and Patrick, D.},
}
@INPROCEEDINGS{VENTURI_2013_INPROCEEDINGS_V_304637,
AUTHOR = {Venturi, G.},
TITLE = {Investigating legal language peculiarities across different types of Italian legal texts: an NLP-based approach},
YEAR = {2013},
ABSTRACT = {In this paper, the author carried out the linguistic profiling of a corpus of different types of Italian legal texts exemplifying different sub-varieties of Italian legal language by relying on a wide range of different linguistic features (lexical, morpho-syntactic and syntactic) automatically extracted from the output of a multi-level automatic linguistic analysis of texts. The devised comparative approach allowed investigating the linguistic variation i) between the considered corpus of legal texts and a corpus of newspaper articles representative of Italian ordinary language and ii) among the considered types of legal texts (legislative acts, administrative acts, the Italian Constitution and legal cases). Achieved results can provide the starting point to identify areas of lexical, morpho-syntactic and/or syntactic complexity within a legal text in order to assess its readability as well to perform a number of different computational forensic linguistics tasks},
KEYWORDS = {Legal language analysis, linguistic profiling, legal genres},
PAGES = {1--19},
URL = {http://ler.letras.up.pt/uploads/ficheiros/13624.pdf},
ISBN = {978-989-8648-14-3},
CONFERENCE_NAME = {3rd European Conference of the International Association of Forensic Linguists},
}
@INPROCEEDINGS{ZOLI_2013_INPROCEEDINGS_ZSR_257946,
AUTHOR = {Zoli, C. and Soria, C. and Randaccio, S.},
TITLE = {The status, corpus planning and speakers' attitudes on Romagnol (ISO 639-3: rgn)},
YEAR = {2013},
ABSTRACT = {Even if recognized by Ethnologue with a clear ISO code, Romagnol is still underestimated and often considered an Italian dialect. One of the variants of Gallo-Italic languages, it has a strong linguistic identity and is well determined as Abstandsprache with regards to Veneto and Marchigiano; less clear the boundaries towards west, where there is a dialectal continuum with Emilian (egl). With respect to Emilian, Romagnol is developing as Ausbausprache, being strong and clear the perception the community has of a Romagnol history, territory, ethnicity, separated from that of Emilia. However, it lacks of a relevant factor for its status: a written standard. Institute "Friedrich Schürr" is one of the most active associations in the field of language support, but it has to do a crucial step: from an amateurish and folkloric activism to a real effort for a shared recognition of the language. The creation of a standard spelling is the path to follow for public presence, but there is still big tension between the old and the new vision. The fragmentation of oral varieties of Romagnol has never been a communication barrier, but nowadays it is perceived as a problem in terms of a written standardization. The Italian equation that "the language is written as it is spoken" causes the misleading belief that every difference in pronunciation must be registered in writing. It is actually the opposite: after six years of age we do not read letter by letter but we register the entire word "photo-graphing" it. Therefore, it is not obviously necessary that the phonetics matches the spelling. But minority speakers often get confused between speaking and writing, and fear that the standardization of the language may harm their local dialect. A standardized spelling only makes sense for a written language.
If there were, for example, a talk show in Romagna, the titles and explanatory signs would be in standard Romagnol, but the presenter and the guests would talk in their own dialects (as it happens in German Switzerland or in Norway). At the same time, the speakers who fear standardization, also reject the use of tools such as electronic instruments for spellchecking (according to the belief that everyone writes in his or her own way) and do not accept the creation of neologisms because they are alien to the traditional language these speakers learned as children. These attitudes contribute to relegate minority languages such as Romagnol to the status of dialects and prevent them to evolve and flourish. In our presentation we will briefly sketch the dialectal situation of Romagnol, the main standardization problems and the issues arisen in the last years among activists. We will try to demonstrate that standardization is not only necessary but also fundamental if we want to give minority languages such as Romagnol the same status and dignity of national languages},
KEYWORDS = {orthography, standardization, minority language, regional language},
PAGES = {124--125},
URL = {http://icml14.uni-graz.at/etc/upload/ICML_XIV_programme.pdf},
CONFERENCE_NAME = {14th International Conference on Minority Languages (ICML XIV)},
BOOKTITLE = {International Conference on Minority Languages XIV (ICML XIV)},
}
@INPROCEEDINGS{BOSCHETTI_2013_INPROCEEDINGS_BBD_262449,
AUTHOR = {Boschetti, F. and Bozzi, A. and Del Grosso, A. M.},
TITLE = {Library of components for the Computational Philological Domain dealing with TEI markup guidelines: CoPhiLib},
YEAR = {2013},
KEYWORDS = {collaborative philology},
PAGES = {160--162},
URL = {http://digilab2.let.uniroma1.it/teiconf2013/program/posters/abstracts-posters#C162},
CONFERENCE_NAME = {The Linked TEI: Text Encoding in the Web},
BOOKTITLE = {The Linked TEI: Text Encoding in the Web Book of Abstracts, Abstracts of the TEI Conference and Members Meeting 2013},
EDITOR = {Ciotti, F. and Ciula, A.},
}
% NOTE(review): same authors, title and year as BOSCHETTI_2013_INPROCEEDINGS_BBD_262449 -- presumably a second
% repository record of the same work; confirm before merging or removing, since either key may be cited.
@INPROCEEDINGS{BOSCHETTI_2013_INPROCEEDINGS_BBD_262451,
AUTHOR = {Boschetti, F. and Bozzi, A. and Del Grosso, A. M.},
TITLE = {Library of components for the Computational Philological Domain dealing with TEI markup guidelines: CoPhiLib},
YEAR = {2013},
URL = {https://iris.cnr.it/handle/20.500.14243/262451},
}
@INPROCEEDINGS{GOGGI_2013_INPROCEEDINGS_GPGB_249724,
AUTHOR = {Goggi, S. and Pardelli, G. and Giannini, S. and Biagioni, S.},
TITLE = {Grey literature in European Commission projects},
YEAR = {2013},
ABSTRACT = {The latest recommendations issued by the European Commission go towards the revision of their policy on dissemination and preservation of scientific information in order to promote the access to the results of the community funded research by especially implementing the open access policy within 'Horizon 2020', the EU Framework Programme for Research and Innovation (2014-2020). The aim of the survey is to identify, measure and evaluate the usability and availability of grey literature provided by the European Commission projects web sites in order to verify whether this type of literature is compliant with EU recommendations},
KEYWORDS = {Grey literature, EU Projects, A.1 INTRODUCTORY AND SURVEY},
PAGES = {154--159},
URL = {https://iris.cnr.it/handle/20.500.14243/249724},
ISBN = {978-90-77484-21-0},
CONFERENCE_NAME = {Fifteenth International Conference on Grey Literature. The Grey Audit: a field assessment in grey literature},
BOOKTITLE = {GL Program Books},
}
@INPROCEEDINGS{MARZI_2013_INPROCEEDINGS_MFP_227175,
AUTHOR = {Marzi, C. and Ferro, M. and Pirrelli, V.},
TITLE = {Lexical parsability and morphological structure},
YEAR = {2013},
ABSTRACT = {A classical tenet in the psycholinguistic literature on the mental lexicon is that a parsed affix presents high activation levels (and thus contributes to activation spreading to other words with the same affix), and that such levels are tightly correlated with the affix productivity. In a number of influential papers, it has been suggested that parsability criteria interact with frequency to define morphological productivity in the lexicon. For example, the frequency of a derivative (e.g. government) relative to its base (govern) is shown to be a good predictor for parsability/productivity. The higher the frequency ratio, the more likely the morphological structure to be perceived, and the associated affix to be used productively. The present contribution intends to offer a computational explanatory basis for this correlational evidence, and assess its applicability to the acquisition of complex inflectional paradigms. In those languages, like Italian and German, whose inflection is stem-based rather than word-based, there is often no single paradigmatic form which can act as a base by being properly contained in all other inflected variants. Yet, it seems intuitive to suggest that verbs that are inflected for one paradigm cell only (e.g. neighbouring), are learned earlier and more easily but exhibit lower levels of perceived inflectional structure than verbs with richer paradigms. This appears to be in good accord with experimental evidence of time latencies in lexical decision, which are shown to correlate negatively with token frequency, paradigm size and paradigm entropy. Our simulations, based on Temporal Self-Organizing Maps (TSOMs) allow us to establish an interesting connection between inflectional parsability, frequency-based paradigm structure, and acquisitional constraints on the interaction between the human processor and working memory.
Self-organising topological models of the mental lexicon can mimic the spatial and temporal organization of memory structures supporting the processing of symbolic sequences [8-10], and can provide an interesting framework for testing integrative accounts of lexical processing/acquisition as the complex result of general-purpose operations on word stimuli (e.g. working memory, long-term storage, sensory-motor mapping, rehearsal, unit integration, unit analysis, executive control, time-series processing), in line with recent acquisitions on the neuro-functional architecture of the perisylvian language network in the left hemisphere of human brain. Simulations of the incremental acquisition of "mini-paradigms" (small islands of morphological contrast encompassing up to three different forms for the same verb) support the hypothesis that perception of structure (parsability) and morphological productivity strongly correlate in the inflectional lexica of German and Italian. In particular, by monitoring longitudinal progress in storage and generalisation of differently distributed inflectional paradigms in the two languages, we show that: i) high-frequency forms are stored and accessed significantly earlier than low-frequency forms; ii) deeply entrenched but paradigmatically isolated forms tend to block usage of other forms in the same paradigm; iii) low-frequency evenly distributed (highly entropic) intra-paradigmatic forms are acquired later but are easily extended. Our investigation credits the proposed computational framework with psycholinguistic plausibility, and grounds parsability-based models of morphological productivity on a specific, explicit proposal of lexical architecture. This provides an explanatory basis for both psycholinguistic and linguistic accounts of morphological structure, and offers an intermediate framework for scientific inquiry bridging the gap between linguistic units and functional units in neurosciences.
Finally, it makes the interesting suggestion that principles of morpheme-based organisation of the mental lexicon are compatible with a learning strategy requiring memorisation of full forms},
KEYWORDS = {morphological structure, word paradigms, frequency, human processor},
PAGES = {33--34},
URL = {http://mmm9.ffzg.unizg.hr/wp-content/uploads/2012/10/MMM_PROGRAM4.pdf},
CONFERENCE_NAME = {9th Mediterranean Morphology Meeting on "Morphology and Semantics" (9th MMM)},
BOOKTITLE = {Morphology and Semantics -- Books of Abstracts},
}
@INPROCEEDINGS{RUTA_2013_INPROCEEDINGS_RSTBCCBTFNMP_260126,
AUTHOR = {Ruta, L. and Siracusano, R. and Tortorella, G. and Boncoddo, M. and Colombi, C. and Crifaci, G. and Billeci, L. and Tartarisco, G. and Ferro, M. and Narzisi, A. and Muratori, F. and Pioggia, G.},
TITLE = {The PRIMA-PIETRA Project: A Web-Based Platform for Early Autism Risk Assessment},
YEAR = {2013},
ABSTRACT = {It is well recognized that the best outcomes in autism spectrum disorders (ASD) are achieved through early diagnosis and early intervention. ASD symptoms may occur as early as 12-18 months and different instruments have been developed for early autism risk assessment under the age of 2 years. The Modified Checklist for Autism in Children (M-CHAT) is a developmental surveillance-screening instrument administered during 18- to 36-month well-child visits that was demonstrated to improve early identification of autism. Novel technologies can substantially contribute to improve early diagnosis in ASD, providing early screening risk assessment platforms, unobtrusive measurements of behaviors and physiological responses, as well as brain structure and connectivity, or other measurable stimulus-event experimental paradigms. The Prima Pietra Project based at the Pervasive Healthcare Center of the Institute of Clinical Physiology of the National Research Council of Italy (Consiglio Nazionale delle Ricerche, C.N.R.) and the AOU Polyclinic "G. Martino" in Messina developed and provided an early autism risk assessment web-based platform for pediatricians and physicians available on the internet},
KEYWORDS = {early autism risk assessment},
URL = {https://imfar.confex.com/imfar/2013/webprogram/Paper14488.html},
CONFERENCE_NAME = {International Meeting for Autism Research 2013},
BOOKTITLE = {International Meeting for Autism Research},
}
@TECHREPORT{ALBANESI_2013_TECHREPORT_ABBCG_350475,
AUTHOR = {Albanesi, D. and Bellandi, A. and Bulleri, F. and Carniani, E. and Giovannetti, E.},
TITLE = {Applicazione Web Linguistico-Computazionale per il Progetto di Traduzione del Talmud Babilonese -- Rapporto tecnico 1},
YEAR = {2013},
ABSTRACT = {Il presente documento descrive lo stato di avanzamento del lavoro condotto dall'Istituto di Linguistica Computazionale "A. Zampolli" del CNR (ILC-CNR) nel contesto del progetto "Traduzione del Talmud Babilonese" in italiano. In particolare, vi sono illustrate le varie fasi che hanno portato allo sviluppo del sistema Talmud, nelle sue due attuali versioni, "alfa" e "beta", durante il primo anno di progetto. Quanto qui descritto costituisce un "Rapporto sullo stato di avanzamento dei lavori dell'applicazione Web" unicamente da parte dell'ILC-CNR e si configura come un primo fascicolo di una serie che avrà cadenza quadrimestrale. Gli altri fascicoli, pertanto, usciranno a febbraio, giugno e ottobre 2014. Quanto al numero di pagine, mentre questo documento ne occupa 10 perché si riferisce al lavoro di un intero anno svolto da parte di 6 persone (quelle indicate nel frontespizio), i successivi presumibilmente ne occuperanno un numero minore, a meno che non venga richiesto dal Comitato di Coordinamento del PTTB di descrivere particolari tecnici e metodologie informatico-ingegneristiche adottate da parte dell'équipe di sviluppatori. Infine, in tutti i fascicoli, le parole, le frasi o una intera sezione che riteniamo degne di nota saranno sottolineate},
URL = {https://iris.cnr.it/handle/20.500.14243/350475},
}
@TECHREPORT{BOSCHETTI_2013_TECHREPORT_B_262443,
AUTHOR = {Boschetti, F.},
TITLE = {Acquisition of texts and development of linguistic tools for Greek, Latin and Italian corpora},
YEAR = {2013},
ABSTRACT = {This report illustrates the activities of Federico Boschetti, researcher at the ILC-CNR of Pisa, Italy, during the visit at the Perseus Project (Dec. 2012 -- Jun. 2013), aimed at the development of methods and tools for the localization in Italian of digital resources for the study of classics. After a short introduction that contextualizes the visit, the lines of investigation and development are described: a) the collaborative multilingual proofreader, b) the Ancient Greek WordNet linked to the Italian WordNets and c) the alignment of original texts to the Italian translations. The conclusion discusses the relations among the products of these activities},
URL = {https://iris.cnr.it/handle/20.500.14243/262443},
}
@TECHREPORT{CININI_2013_TECHREPORT_CPSS_333476,
AUTHOR = {Cinini, A. and Picchi, P. and Sassi, M. and Sassolini, E.},
TITLE = {Digesto 3.0: il nuovo sistema di navigazione delle traduzioni del Digesto},
YEAR = {2013},
ABSTRACT = {La sincronizzazione del testo latino e greco con la traduzione in italiano del Digesto si svolge nell'ambito del programma di ricerca PRIN 2008: Traduzione dei Digesta di Giustiniano: "Lessico giuridico storia e dogmatica", settore disciplinare IUS/18. Nell'ambito del progetto sono stati implementati negli anni alcuni software, sviluppati dal Dr. Eugenio Picchi e dal suo gruppo di ricerca, dell'Istituto di Linguistica Computazionale del CNR di Pisa, per l'allineamento dei testi paralleli bilingui, in latino e italiano. Il progetto ha una lunga storia, caratterizzata da 3 fasi di sviluppo diverse. Con il titolo Digesto 3.0 abbiamo cercato di ricordare quest'ultima evoluzione del progetto, caratterizzata da un nuovo sistema di navigazione on-line},
URL = {https://iris.cnr.it/handle/20.500.14243/333476},
}
@TECHREPORT{DELGROSSO_2013_TECHREPORT_DGP_315841,
AUTHOR = {Del Grosso, A. M. and Giovannetti, E. and Piccini, S.},
TITLE = {Definizione del modello di filologia computazionale},
YEAR = {2013},
ABSTRACT = {Il documento illustra il lavoro di analisi condotto durante la prima fase del progetto Clavius on the Web. Nelle sezioni del documento si descrivono le modalità secondo le quali il modello generale della piattaforma di gestione dei testi verrà implementato partendo dalle esigenze degli studiosi dei manoscritti originali di Clavius digitalizzati e messi a raffronto con i file di trascrizione},
KEYWORDS = {Clavius, Clavius on the web, Literary Computing, Computational Philology, Lexica, Latin, Semantic Web},
URL = {http://claviusontheweb.it/},
}
@TECHREPORT{MARZI_2013_TECHREPORT_MG_227818,
AUTHOR = {Marzi, C. and Giraudo, H.},
TITLE = {Perspectives on Synergy},
YEAR = {2013},
ABSTRACT = {The 2nd NetWordS Workshop, held on the 3rd and 4th of December 2012 in the Toulouse Research Area (Maison de la Recherche) of the French National Research Council (CNRS), brought together 27 participants (scholars, Post-Docs, PhD students) from various European countries. Ten speakers, experts of various scientific domains and with different theoretical inclinations, discussed cross-disciplinary Perspectives on Synergy, reflecting the interdisciplinarity and synergy fostered by NetWordS, the European Research Networking Programme on Word Structure. With these objectives in mind, the workshop gathered PhD students and junior research fellows who carried out interdisciplinary research under the NetWordS granting scheme for 2012 and more senior scholars who are currently involved in European or national initiatives geared towards scientific goals of interest to the NetWordS programme. A Round Table followed to concretely discuss project proposals of common interest to be submitted in the years 2013-2014, and to encourage the sharing of interdisciplinary cooperation efforts among NetWordS partners and other research teams},
KEYWORDS = {Mental lexicon, Interdisciplinary approach},
URL = {http://www.networds-esf.eu/index.php?page=2nd-networds-workshop},
}
@TECHREPORT{MARZI_2013_TECHREPORT_MP_225093,
AUTHOR = {Marzi, C. and Pirrelli, V.},
TITLE = {NetWordS: the European Network on Word Structure (2011-2015) ESF RNP Mid-Term Report (2011-2013)},
YEAR = {2013},
ABSTRACT = {By networking experts of various research fields (including but not limited to Theoretical Linguistics, Cognition, Brain Sciences and Computing) and of different theoretical inclinations, NetWordS has set itself the fundamental goal of advancing the current awareness of theoretical, typological, psycholinguistic, computational and neurophysiological evidence on the structure and processing of words, with a view to promoting novel methods of research and assessment for grammar architecture and language physiology. The programme is pursued through knowledge sharing, dissemination and transfer, organised over a four year period, from May 2011 to April 2015. Thanks to its highly interdisciplinary profile, the programme promotes training of young scientists through short visits, exchange grants and Summer Schools. It encourages the novel integration of existing methodologies, sets common research priorities, and fosters virtual cross-disciplinary laboratories, partnerships and research infrastructures},
KEYWORDS = {Mental lexicon, Interdisciplinary approach, word representation, word processing},
URL = {https://iris.cnr.it/handle/20.500.14243/225093},
}
@TECHREPORT{MARZI_2013_TECHREPORT_MR_225088,
AUTHOR = {Marzi, C. and Raffaelli, I.},
TITLE = {Variation and Adaptation in Lexical Processing and Acquisition},
YEAR = {2013},
ABSTRACT = {Recent emphasis on language knowledge as an emergent dynamic system has drawn considerable attention to the role of time in the way speakers acquire and use their own language. There are at least three levels on which time matters. At the processing level, the interaction between processing and memory constraints, and in particular between short-term and long-term memory issues, is understood to shape the way we recode and organise time-bound sequences of linguistic signals. On an ontogenetic scale, the age of acquisition of language input data, and the duration of exposure (in the case of multilingual contexts) are known to interact with issues of cognitive maturation and brain plasticity, yielding different outcomes as a function of different time intervals. In this connection, also the distribution of input data in a particular linguistic environment (both in terms of word type and token frequency) is bound to have an impact on rate and speed of acquisition and on overall knowledge organisation. Finally, all previously mentioned time-effects conspire to make the language system change through usage and acquisition in passing from one generation to the ensuing one},
KEYWORDS = {Mental lexicon, Lexical processing and acquisition, Interdisciplinary approach},
URL = {http://www.networds-esf.eu/index.php?page=3rd-networds-workshop},
}
@TECHREPORT{PARDELLI_2013_TECHREPORT_P_17321,
AUTHOR = {Pardelli, G.},
TITLE = {Un modello bibliografico saussuriano},
YEAR = {2013},
ABSTRACT = {Il modello bibliografico saussuriano, presentato il 21 settembre 2012 al Seminario Internazionale organizzato dall'Università di Firenze presso la Facoltà di Lettere a conclusione del progetto, ha le caratteristiche di un repertorio in quanto volto a una fonte primaria di conoscenza legata a uno specifico autore e a una sola tipologia documentaria. Ciascuna scheda è strutturata per contenere i formati digitali e per divenire strumento di estrazione informativa dai vari ambienti indicizzati. Nella sostanza trattasi di un database bibliografico al passo con l'era delle risorse documentarie cartacee che migrano progressivamente nei formati richiesti dalla rete telematica: una trasposizione verso il digitale resa possibile anche dai numerosi progetti di ricerca nazionali e comunitari di cui un esempio prezioso è il Progetto PRIN coordinato dal Professor Daniele Gambarara. Il Web si configura così come strumento di reference per recuperi veloci di materiale bibliografico. La descrizione dell'involucro tecnologico di questo particolare segmento della bibliografia saussuriana è il tema argomentale del presente scritto, mirato a una raccolta di informazioni da convogliare e frammentare in un centinaio di record aventi tutti eguale struttura e organizzati puntualmente in campi e sotto campi, al fine di soddisfare bisogni conoscitivi attraverso una maschera di interrogazione disponibile in Internet grazie ad un vocabolario controllato di termini in linguaggio naturale},
KEYWORDS = {Saussure Ferdinand, Bibliografia},
PAGES = {1-9},
URL = {https://iris.cnr.it/handle/20.500.14243/17321},
}
@MISC{BOSCHETTI_2013_MISC_B_262447,
AUTHOR = {Boschetti, F.},
TITLE = {Acquisition and Creation of Multilingual Resources for Classical Philology in Collaborative Environments: Three Use Cases},
YEAR = {2013},
URL = {https://iris.cnr.it/handle/20.500.14243/262447},
}
@MISC{BOSCHETTI_2013_MISC_B_262440,
AUTHOR = {Boschetti, F.},
TITLE = {An Integrated System for Generating and Correcting Polytonic Greek OCR: The Proof-reading Process},
YEAR = {2013},
URL = {http://www.digitalclassicist.org/wip/wip2013.html},
CONFERENCE_NAME = {Digital Classicist Seminars},
}
@MISC{BOSCHETTI_2013_MISC_B_262452,
AUTHOR = {Boschetti, F.},
TITLE = {The Proof-reading Process},
YEAR = {2013},
URL = {https://iris.cnr.it/handle/20.500.14243/262452},
CONFERENCE_NAME = {Open Philology Seminar},
}
@MISC{BOSCHETTI_2013_MISC_B_262450,
AUTHOR = {Boschetti, F.},
TITLE = {Acquisizione e Creazione di Risorse Plurilingui per la Filologia Classica in Ambienti Collaborativi – Tre Casi d'Uso},
YEAR = {2013},
URL = {https://iris.cnr.it/handle/20.500.14243/262450},
CONFERENCE_NAME = {II Convegno AIUCD 2013},
}
@MISC{BURGASSI_2013_MISC_B_269631,
AUTHOR = {Burgassi, C.},
TITLE = {Presentazione del progetto DiVo-Dizionario dei volgarizzamenti. Il lessico di traduzione dal latino nell'italiano delle origini: bibliografia filologica, corpus bilingue lemmatizzato, dizionario storico settoriale},
YEAR = {2013},
URL = {https://iris.cnr.it/handle/20.500.14243/269631},
}
@MISC{BURGASSI_2013_MISC_B_269641,
AUTHOR = {Burgassi, C.},
TITLE = {Le projet DiVo et ses corpus: une base de données italo-latine de traductions médiévales},
YEAR = {2013},
URL = {https://iris.cnr.it/handle/20.500.14243/269641},
}
@MISC{BURGASSI_2013_MISC_BDGV_259610,
AUTHOR = {Burgassi, C. and Dotto, D. and Guadagnini, E. and Vaccaro, G.},
TITLE = {Corpus del Dizionario dei Volgarizzamenti (Corpus DiVo) (2013)},
YEAR = {2013},
ABSTRACT = {Il Corpus DiVo è parte del progetto di ricerca DiVo-Dizionario dei Volgarizzamenti, diretto da Elisa Guadagnini e Giulio Vaccaro, ospitato dall'Istituto Opera del Vocabolario Italiano (CNR) e dalla Scuola Normale Superiore di Pisa, finanziato dal MIUR all'interno del programma FIRB-Futuro in Ricerca 2010. Il Corpus DiVo, interrogabile con GattoWeb, è curato da Cosimo Burgassi, Diego Dotto, Elisa Guadagnini e Giulio Vaccaro. Comprende 150 testi volgari, per complessive 5.941.061 occorrenze di 169.845 forme grafiche distinte; sono presenti 76 testi latini associati. È presente uno specimen di lemmatizzazione, curato da Diego Dotto, che conta 2.226 lemmi e 13 iperlemmi, per un totale di 30.367 occorrenze lemmatizzate},
KEYWORDS = {Volgarizzamenti, Corpus testuale, Dizionario dei Volgarizzamenti, Italiano antico},
URL = {https://iris.cnr.it/handle/20.500.14243/259610},
}
@MISC{BURGASSI_2013_MISC_BDGVZ_259609,
AUTHOR = {Burgassi, C. and Dotto, D. and Guadagnini, E. and Vaccaro, G. and Zago, A.},
TITLE = {Corpus dei Classici Latini volgarizzati (Corpus CLaVo) (2013)},
YEAR = {2013},
ABSTRACT = {Il Corpus CLaVo è parte del progetto di ricerca DiVo-Dizionario dei Volgarizzamenti, diretto da Elisa Guadagnini e Giulio Vaccaro, ospitato dall'Istituto Opera del Vocabolario Italiano (CNR) e dalla Scuola Normale Superiore di Pisa, finanziato dal MIUR all'interno del programma FIRB-Futuro in Ricerca 2010. Il Corpus CLaVo, interrogabile con GattoWeb, è curato da Cosimo Burgassi, Diego Dotto, Elisa Guadagnini e Giulio Vaccaro. Esso raccoglie le opere latine tradotte dai volgarizzamenti compresi nel Corpus DiVo: per alcune sommarie informazioni su queste opere e sulla loro tradizione si rinvia alle relative schede, compilate per la maggior parte da Anna Zago, comprese nella bibliografia filologica del DiVo. Il Corpus CLaVo comprende 26 opere latine, associate a 45 volgarizzamenti, per complessive 913.656 occorrenze di 78.587 forme grafiche distinte. Al Corpus CLaVo è associato un dizionario macchina, curato da Anna Zago, che contiene 3263 lemmi e 45.086 coppie forma-lemma},
KEYWORDS = {Classici latini, Corpus testuale, Dizionario dei Volgarizzamenti, Lingua latina},
URL = {http://clavoweb.ovi.cnr.it},
}
@MISC{DELGROSSO_2013_MISC_DM_348346,
AUTHOR = {Del Grosso, A. M. and Marchi, S.},
TITLE = {Saussure Philological Web Application},
YEAR = {2013},
ABSTRACT = {Web Application for Computational Philology. An Experiment on Ferdinand de Saussure original sources: images and texts},
KEYWORDS = {computational philology, digital humanities, software engineering, web application},
URL = {http://licodemo.ilc.cnr.it:8080/Saussure_Wapp/controlPanel.xhtml},
}
@MISC{DELGROSSO_2013_MISC_DMPM_228560,
AUTHOR = {Del Grosso, A. M. and Murano, F. and Pesini, L. and Marchi, S.},
TITLE = {A Web tool for philological research. An experiment on some Saussurean writings},
YEAR = {2013},
ABSTRACT = {The work describes a philological-computational tool developed by the Istituto di Linguistica Computazionale, CNR, Pisa to create a digital edition of Ferdinand de Saussure's unpublished manuscripts. Since the use of a digital edition and of the most modern computer technology allow a more in-depth research, the ILC is developing a set of digital tools to facilitate the research and to take advantage of both the documents and the related information by the scientific community},
KEYWORDS = {digital philology, digital humanities, software engineering},
URL = {https://iris.cnr.it/handle/20.500.14243/228560},
CONFERENCE_NAME = {AIUCD2013},
}
@MISC{DIDONATO_2013_MISC_D_407980,
AUTHOR = {Di Donato, F.},
TITLE = {Working on Scholarly Contents: A Semantic Vision},
YEAR = {2013},
ABSTRACT = {Presentation held at the Conference: Open Platforms for Digital Humanities, Cortona, Palazzone della Scuola Normale Superiore},
URL = {https://iris.cnr.it/handle/20.500.14243/407980},
}
@MISC{DIDONATO_2013_MISC_D_407982,
AUTHOR = {Di Donato, F.},
TITLE = {L'Open Access in pratica},
YEAR = {2013},
ABSTRACT = {presentazione sull'Open Access al Forum degli allievi della Scuola Normale Superiore di Pisa},
URL = {https://iris.cnr.it/handle/20.500.14243/407982},
}
@MISC{DIDONATO_2013_MISC_D_407987,
AUTHOR = {Di Donato, F.},
TITLE = {Building a Network of Open Correspondence Projects. A model for Open Science},
YEAR = {2013},
ABSTRACT = {presentazione di un progetto inteso a creare una rete aperta di corrispondenze},
URL = {https://iris.cnr.it/handle/20.500.14243/407987},
}
@MISC{DIDONATO_2013_MISC_D_407984,
AUTHOR = {Di Donato, F.},
TITLE = {Fare ricerca sul Web. Dalle biblioteche digitali all'annotazione semantica},
YEAR = {2013},
ABSTRACT = {Un'introduzione all'open science attraverso l'esempio del progetto ERC-AdG EUROCORR},
URL = {https://iris.cnr.it/handle/20.500.14243/407984},
}
@MISC{DIDONATO_2013_MISC_D_407990,
AUTHOR = {Di Donato, F.},
TITLE = {DH@Net7},
YEAR = {2013},
ABSTRACT = {presentazione dei progetti DH di Net7},
URL = {https://iris.cnr.it/handle/20.500.14243/407990},
}
@MISC{DIDONATO_2013_MISC_D_382013,
AUTHOR = {Di Donato, F.},
TITLE = {Guida alla pubblicazione dei dati delle pubbliche amministrazioni},
YEAR = {2013},
ABSTRACT = {Siamo nella società dell'informazione. La nostra è un'economia dell'informazione. Il digitale sta cambiando tutto. Questi mantra vengono ripetuti sino alla noia, ma prendiamoli sul serio e chiediamoci cosa ciò comporti nell'Agenda (Digitale) di un amministratore o dirigente pubblico. Cosa si potrebbe fare per adeguare i meccanismi di funzionamento della macchina pubblica a questo nuovo ambiente, cosa per massimizzare le opportunità di benessere sociale per tutti? Tra le molte possibili risposte, questo libro ne esplora una, suggerita anche dall'Agenda Digitale della Commissione Europea: "mettere a disposizione le informazioni relative al settore pubblico in modo trasparente, efficace e non discriminatorio, come fonte importante di crescita potenziale di servizi online innovativi"},
URL = {https://iris.cnr.it/handle/20.500.14243/382013},
}
@MISC{DIDONATO_2013_MISC_D_407983,
AUTHOR = {Di Donato, F.},
TITLE = {Il ruolo dei toponimi in Territori. Strumenti per la georeferenziazione automatica e prospettive in ambito web semantico},
YEAR = {2013},
ABSTRACT = {Presentazione del portale Territori all'Archivio centrale dello Stato},
URL = {https://iris.cnr.it/handle/20.500.14243/407983},
}
@MISC{DIDONATO_2013_MISC_D_407989,
AUTHOR = {Di Donato, F.},
TITLE = {Linked Open Data, Beni Culturali e integrazione. Uno sguardo sul futuro},
YEAR = {2013},
ABSTRACT = {presentazione del progetto ERC-AdG EUROCORR},
URL = {https://iris.cnr.it/handle/20.500.14243/407989},
}
@MISC{DIDONATO_2013_MISC_D_407981,
AUTHOR = {Di Donato, F.},
TITLE = {Guida alla pubblicazione dei dati delle pubbliche amministrazioni. Un'introduzione},
YEAR = {2013},
ABSTRACT = {presentazione della Guida alla pubblicazione dei dati delle pubbliche amministrazioni},
URL = {https://iris.cnr.it/handle/20.500.14243/407981},
}
@MISC{DIDONATO_2013_MISC_D_407986,
AUTHOR = {Di Donato, F.},
TITLE = {Semantic annotation of digital libraries. A model for science communication},
YEAR = {2013},
ABSTRACT = {presentazione del progetto EUROCORR (ERC-AdG) alla conferenza Knowledge Triangle},
URL = {https://iris.cnr.it/handle/20.500.14243/407986},
}
@MISC{GUADAGNINI_2013_MISC_G_265242,
AUTHOR = {Guadagnini, E.},
TITLE = {Il corpus DiVo (Dizionario dei Volgarizzamenti)},
YEAR = {2013},
URL = {https://iris.cnr.it/handle/20.500.14243/265242},
CONFERENCE_NAME = {Repertori filologici, archivi testuali e risorse lessicografiche: nuovi strumenti per l'italianistica},
}
@MISC{LAM_2013_MISC_LD_344097,
AUTHOR = {Lamé, M. and Del Grosso, A. M.},
TITLE = {WE ARE ALL DISABLED!},
YEAR = {2013},
ABSTRACT = {This is not a technical proposition. This is a very humble web user's testimony from so-called enabled and disabled people: any human being is disabled when it comes to accessing digital information, as it requires a device that is a computer to be reasonably understandable, perceivable, operable and robust, unless one wants to print the binary code of a movie, such as La Jetée by Chris Marker as the artist David Guez recently did for his art exhibition at Centre Pompidou},
KEYWORDS = {Digital Publishing, w3c, web},
URL = {https://www.w3.org/2012/12/global-publisher/statements-of-interest/21-WeAreAllDisabled.pdf},
CONFERENCE_NAME = {A W3C Workshop on Digital Publishing},
}
@MISC{LAM_2013_MISC_LSBB_284808,
AUTHOR = {Lamé, M. and Soler, V. L. E. F. and Boschetti, F. and Benedetti, L.},
TITLE = {De la transcription graphique à la reconstitution diplomatique},
YEAR = {2013},
URL = {https://iris.cnr.it/handle/20.500.14243/284808},
}
@MISC{MARINELLI_2013_MISC_M_254614,
AUTHOR = {Marinelli, R.},
TITLE = {Espressioni idiomatiche in un database di terminologia: codifica, relazioni, traduzione},
YEAR = {2013},
ABSTRACT = {In questa presentazione si parla di un database di terminologia marittima che dopo le fasi iniziali della sua costruzione è stato ampliato e arricchito con immagini che permettono di visualizzare il termine preso in considerazione e successivamente con l'inserimento di espressioni idiomatiche e modi di dire che appartengono al dominio marittimo. Viene inoltre illustrata anche la problematica della traduzione in inglese, sia dei termini, sia delle espressioni idiomatiche stesse},
KEYWORDS = {Database semantico lessicali, terminologia, espressioni idiomatiche},
URL = {https://iris.cnr.it/handle/20.500.14243/254614},
CONFERENCE_NAME = {Meeting annuale del Gruppo Web Semantico},
}
@MISC{MARZI_2013_MISC_MD_230727,
AUTHOR = {Marzi, C. and Daelemans, W.},
TITLE = {On memory and computation: a reappraisal of German noun plural inflection},
YEAR = {2013},
ABSTRACT = {The talk "On memory and computation: a reappraisal of German noun plural inflection" presented one of the main objectives on which the bilateral Italian-Belgian action is focussing, namely linguistic and extra-linguistic factors involved in mono- and bi-lingual word recognition. She suggests a multi-factorial view of morphology adaptive processing, in presenting a usage-based perspective, by investigating a few properties of the German noun plural system and focusing on the dynamic relation between regularity, productivity and competition of inflection patterns through computer simulations (Temporal Self-Organising Maps – TSOMs) of type/token-frequency effects. In detail, she highlighted a few formal properties of the -s plural class, and concluded that although relatively infrequent, -s plurals seem to pattern in fairly regular sub-classes which suffer from no competition by members of other inflectional classes},
KEYWORDS = {German, plural inflection},
URL = {http://www.networds-esf.eu/index.php?page=3rd-networds-workshop},
CONFERENCE_NAME = {Third NetWordS Workshop on "Variation and Adaptation in Lexical Processing and Acquisition"},
}
@MISC{SAGRI_2013_MISC_SV_289319,
AUTHOR = {Sagri, M. T. and Venturi, G.},
TITLE = {Exploring the use of neuroscience in the Italian courtrooms: the linguistic and lexico-semantic analysis of a corpus of Italian case law texts},
YEAR = {2013},
URL = {https://iris.cnr.it/handle/20.500.14243/289319},
}
@MISC{SORIA_2013_MISC_S_284021,
AUTHOR = {Soria, C.},
TITLE = {Salviamo l'italiano dall'estinzione digitale},
YEAR = {2013},
URL = {https://iris.cnr.it/handle/20.500.14243/284021},
CONFERENCE_NAME = {Salone del Libro di Torino, Convegno "D'Annunzio innovatore"},
}
@MISC{SORIA_2013_MISC_S_257906,
AUTHOR = {Soria, C.},
TITLE = {Preserving Digital Language Diversity},
YEAR = {2013},
URL = {https://iris.cnr.it/handle/20.500.14243/257906},
CONFERENCE_NAME = {All-Russia methodological seminar on protection of minority languages of peoples of Siberia and the Russian Far East},
}
@MISC{SORIA_2013_MISC_S_257939,
AUTHOR = {Soria, C.},
TITLE = {You can speak it now: assessing the effect of official recognition on vitality of minority languages},
YEAR = {2013},
ABSTRACT = {In 1999, an Italian controversial law granted official recognition to twelve regional and minority languages, but denied it to others such as Piedmontese, Venetan, Sicilian, Emilian, Romagnol, that nevertheless are rated as endangered by UNESCO and Ethnologue. This particular situation offers an ideal laboratory to assess the impact of language policies on protected languages and at the same time the effect of lack of official protection and recognition on languages denied of institutional support. In this research we have coupled official census data with the results of an extensive survey carried out among speakers of all endangered languages of Italy, recognised or not, to re-assess their vitality in terms of speakers' number, domains of use, intergenerational transmission and speakers' attitudes. After illustrating the methodology adopted for the survey, we will show how the law was largely ineffective in producing quantitatively significant changes, while had a sharp effect on speakers' attitudes. We will argue that official recognition generally improved self-esteem and generated a pride in the language that is severely lacking among speakers of other languages, while lack of top-down recognition can be a powerful element in reinforcing negative feelings and overestimation of the difficulties of language revitalization},
KEYWORDS = {minority language, regional language, endangered language, institutional support, speakers' attitudes},
URL = {https://iris.cnr.it/handle/20.500.14243/257939},
CONFERENCE_NAME = {Conference Language Endangerment: Language Policy and Planning},
}
@MISC{SORIA_2013_MISC_SZR_257948,
AUTHOR = {Soria, C. and Zoli, C. and Randaccio, S.},
TITLE = {Why the Internet should speak minority languages – and how. The role of Language Technologies for minority and contested languages},
YEAR = {2013},
ABSTRACT = {Many minority languages that are thriving to get a place in the digital space and are profiting of the new opportunities offered by the Internet and digital devices will seriously face digital extinction if they will not be supported by Language Technologies (Calzolari et al. 2012). LTs (spelling and grammar checkers, electronic dictionaries, localized interfaces, as well as search engines, language translators or information extraction tools) are a necessary instrument to secure usability of minority languages over the web (Soria et al. 2012, Krauwer 2003), thus ensuring those languages equal digital opportunities and raising their profile in the eyes of the younger, digitally-oriented generation. However, there are many challenges to be faced to equip minority languages with LTs (from basic to advanced): a substantial delay in development of basic technologies, a lack of cooperation among minority languages communities, a chronic shortage of funding (in particular for minority languages not officially recognized, yet often the most vital ones over the Internet) and the limited economic value placed over LTs for minority languages by the digital market rules. In this talk, on the basis of concrete examples and a survey about the digital use of minority languages of Italy, we will show how these challenges can be overcome and suggest a roadmap towards sustainable development of LTs for minority languages},
URL = {https://iris.cnr.it/handle/20.500.14243/257948},
CONFERENCE_NAME = {Conference Contested Languages in the Old World},
}
@MISC{VACCARO_2013_MISC_VGBDLBZ_259608,
AUTHOR = {Vaccaro, G. and Guadagnini, E. and Burgassi, C. and Dotto, D. and Lorenzi, C. and Biondi, C. L. and Zago, A.},
TITLE = {DiVo-Bibliografia filologica (2013)},
YEAR = {2013},
ABSTRACT = {DiVo DB è la bibliografia filologica dei volgarizzamenti medievali dei testi classici e tardo-antichi. Sono compilate delle schede brevi per le opere latine, con informazioni sull'autore, sulla compilazione e sul genere dell'opera, nonché l'identificazione dell'edizione di riferimento (quella inclusa nel corpus DiVo). Le schede dei testi volgari contengono cenni biografici sull'autore del volgarizzamento, la datazione dell'opera, l'identificazione della coloritura linguistica del testo, l'indicazione della tipologia testuale e del genere dell'opera, la catalogazione della tradizione diretta mediante l'elencazione dei testimoni manoscritti e delle stampe antiche, una trattazione filologica della storia della tradizione, l'identificazione dell'edizione di riferimento, un panorama bibliografico sull'opera articolato per punti. A ciascun manoscritto è dedicata una scheda in cui si indicano gli incipit e gli explicit di ciascun manoscritto, le carte in cui l'opera è contenuta, eventuali note e l'informazione sulla visione diretta del manufatto. Si indicano i casi in cui lo studio della tradizione ha mostrato la necessità di controlli più approfonditi della lezione dei manoscritti: gli esiti di tali controlli costituiscono il sistema di note filologiche associato al corpus DiVo},
URL = {https://iris.cnr.it/handle/20.500.14243/259608},
}
@ARTICLE{BARCA_2012_ARTICLE_BP_6234,
AUTHOR = {Barca, L. and Pezzulo, G.},
TITLE = {Unfolding visual lexical decision in time},
YEAR = {2012},
ABSTRACT = {Visual lexical decision is a classical paradigm in psycholinguistics, and numerous studies have assessed the so-called "lexicality effect" (i.e., better performance with lexical than non-lexical stimuli). Far less is known about the dynamics of choice, because many studies measured overall reaction times, which are not informative about underlying processes. To unfold visual lexical decision in (over) time, we measured participants' hand movements toward one of two item alternatives by recording the streaming x, y coordinates of the computer mouse. Participants categorized four kinds of stimuli as "lexical" or "non-lexical": high and low frequency words, pseudowords, and letter strings. Spatial attraction toward the opposite category was present for low frequency words and pseudowords. Increasing the ambiguity of the stimuli led to greater movement complexity and trajectory attraction to competitors, whereas no such effect was present for high frequency words and letter strings. Results fit well with dynamic models of perceptual decision-making, which describe the process as a competition between alternatives guided by the continuous accumulation of evidence. More broadly, our results point to a key role of statistical decision theory in studying linguistic processing in terms of dynamic and non-modular mechanisms},
KEYWORDS = {Psycholinguistics, Time Measurement},
URL = {http://www.plosone.org/article/info:doi/10.1371/journal.pone.0035932},
VOLUME = {7 (4)},
DOI = {10.1371/journal.pone.0035932},
ISSN = {1932-6203},
JOURNAL = {PLOS ONE},
}
@ARTICLE{BARCA_2012_ARTICLE_BP_2911,
AUTHOR = {Barca, L. and Pezzulo, G.},
TITLE = {Written language processing in Hearing and Deaf},
YEAR = {2012},
ABSTRACT = {Visual lexical decision is a classical paradigm in psycholinguistics, and numerous studies have assessed the so-called ''lexicality effect'' (i.e., better performance with lexical than non-lexical stimuli). Far less is known about the dynamics of choice, because many studies measured overall reaction times, which are not informative about underlying processes. To unfold visual lexical decision in (over) time, we measured participants' hand movements toward one of two item alternatives by recording the streaming x, y coordinates of the computer mouse. Participants categorized four kinds of stimuli as 'lexical' or 'non-lexical': high and low frequency words, pseudowords, and letter strings. Spatial attraction toward the opposite category was present for low frequency words and pseudowords. Increasing the ambiguity of the stimuli led to greater movement complexity and trajectory attraction to competitors, whereas no such effect was present for high frequency words and letter strings. Results fit well with dynamic models of perceptual decision-making, which describe the process as a competition between alternatives guided by the continuous accumulation of evidence. More broadly, our results point to a key role of statistical decision theory in studying linguistic processing in terms of dynamic and non-modular mechanisms},
KEYWORDS = {Visual lexical decision, Interactive Activation account, dynamic models of decision-making, kinematics},
PAGES = {e35932},
URL = {http://www.plosone.org/article/info%3Adoi%2F10.1371%2Fjournal.pone.0035932},
VOLUME = {7 (4)},
ISSN = {1932-6203},
JOURNAL = {PLOS ONE},
}
@ARTICLE{BELLANDI_2012_ARTICLE_BBCNPR_19539,
AUTHOR = {Bellandi, A. and Bellini, P. and Cappuccio, A. and Nesi, P. and Pantaleo, G. and Rauch, N.},
TITLE = {Assisted Knowledge Base Generation, Management and Competence Retrieval},
YEAR = {2012},
ABSTRACT = {Despite the presence of many systems for developing and managing structured taxonomies and/or SKOS models for a given domain for which small documents set are accessible, the production and maintenance of these domain knowledge bases is still a very expensive and time consuming process. This paper proposes a solution for assisting expert users in the development and management of knowledge base, including SKOS and ontologies modeling structures and relationships. The proposed solution accelerates the knowledge production by crawling and exploiting different kinds of sources (in multiple languages and with several inconsistencies among them). The proposed tool supports the experts in defining relationships among the most recurrent concepts, reducing the time to SKOS production and allowing assisted production. The validity of the produced knowledge base has been assessed by using SPARQL query interface and a precision and recall model. The solution has been developed for Open Space Innovative Mind project, with the aim of creating a portal to allow industries at posing semantic queries to discover potential competences in a large institution such as the University of Florence, in which several distinct domains are associated with its own departments},
URL = {https://iris.cnr.it/handle/20.500.14243/19539},
ISSN = {0218-1940},
JOURNAL = {INTERNATIONAL JOURNAL OF SOFTWARE ENGINEERING AND KNOWLEDGE ENGINEERING},
}
@article{BELLANDI_2012_ARTICLE_BT_6121,
  author   = {Bellandi, A. and Turini, F.},
  title    = {Mining Bayesian networks out of ontologies},
  year     = {2012},
  abstract = {Probabilistic reasoning is an essential feature when dealing with many application domains. Starting with the idea that ontologies are the right way to formalize domain knowledge and that Bayesian networks are the right tool for probabilistic reasoning, we propose an approach for extracting a Bayesian network from a populated ontology and for reasoning over it. The paper presents the theory behind the approach, its design and examples of its use},
  keywords = {Probabilistic reasoning, Ontology queries},
  pages    = {507-532},
  url      = {http://link.springer.com/article/10.1007%2Fs10844-011-0165-4},
  volume   = {38 (2)},
  doi      = {10.1007/s10844-011-0165-4},
  issn     = {0925-9902},
  journal  = {JOURNAL OF INTELLIGENT INFORMATION SYSTEMS},
}
@article{BURGASSI_2012_ARTICLE_B_19840,
  author   = {Burgassi, C.},
  title    = {Prove di commento ai «Due dialoghi» di Ruzante},
  year     = {2012},
  keywords = {Filologia italiana, Ruzante},
  pages    = {375-407},
  url      = {https://iris.cnr.it/handle/20.500.14243/19840},
  volume   = {59},
  issn     = {0392-5110},
  journal  = {STUDI DI FILOLOGIA ITALIANA},
}
@article{BURGASSI_2012_ARTICLE_B_269593,
  author   = {Burgassi, C.},
  title    = {Gesualdo lettore di Petrarca e la «prova degli artisti» (RVF 77)},
  year     = {2012},
  abstract = {Tra i commenti sistematici al Canzoniere di Petrarca d'età umanistico-rinascimentale, la Sposizione di Giovanni Andrea Gesualdo si distingue sia per mole sia per profondità concettuale. L'elaborazione dell'opera è infatti giustificata dalla necessità di inquadrare correttamente il fondamento filosofico che sorreggerebbe la poesia petrarchesca, troppo spesso interpretata, secondo il Gesualdo, come esperienza artistica esemplare soltanto sul piano delle pure forme, e non anche dei contenuti teoretici. Nel commento ai sonetti sul ritratto di Laura dipinto da Simone Martini (RVF 77-78), in particolare, alla robusta indagine filosofica fa seguito l'inchiesta, altrettanto dettagliata, sulle fonti che avrebbero ispirato il poeta. Così, la "prova degli artisti" con cui si apre il sonetto 77, è persuasivamente messa in relazione con fatti analoghi che videro protagonisti i più celebrati maestri scultori dell'antichità, secondo quanto racconta Plinio il Vecchio},
  keywords = {Commenti petrarcheschi, Fonti classiche in Petrarca},
  pages    = {169-181},
  url      = {https://iris.cnr.it/handle/20.500.14243/269593},
  volume   = {70},
  issn     = {0392-5110},
  journal  = {STUDI DI FILOLOGIA ITALIANA},
}
@article{BURGASSI_2012_ARTICLE_B_281686,
  author   = {Burgassi, C.},
  title    = {Scelta di voci del Tesoro della Lingua Italiana delle Origini (sedicesima serie)},
  year     = {2012},
  abstract = {Voci STIFICANZA s. f., STIFICARE v., TESTIFICANZA s. f., TESTIFICARE v., TESTIFICAZIONE s. f. del Tesoro della Lingua Italiana delle Origini (pp. 152-58)},
  keywords = {Lessico, Lessicografia, Lingua Italiana},
  pages    = {17-160},
  url      = {https://iris.cnr.it/handle/20.500.14243/281686},
  volume   = {17},
  issn     = {1591-8254},
  journal  = {BOLLETTINO-OPERA DEL VOCABOLARIO ITALIANO},
}
@ARTICLE{BURGASSI_2012_ARTICLE_B_19847,
AUTHOR = {Burgassi, C.},
TITLE = {Monaco di Montaudon, BdT 305.1, 2 e 9a},
YEAR = {2012},
KEYWORDS = {Filologia romanza, Provenzalistica, Monaco di Montaudon},
PAGES = {29-104},
URL = {https://iris.cnr.it/handle/20.500.14243/19847},
VOLUME = {10-12},
ISSN = {1593-7259},
JOURNAL = {RIVISTA DI STUDI TESTUALI},
}
@ARTICLE{CHERSI_2012_ARTICLE_CP_6255,
AUTHOR = {Chersi, F. and Pezzulo, G.},
TITLE = {Using hippocampal-striatal loops for spatial navigation and goal-directed decision-making},
YEAR = {2012},
ABSTRACT = {The hippocampus plays a central role in spatial representation, declarative and episodic memory. In this area, so-called place cells possess high spatial selectivity, firing preferentially when the individual is within a small area of the environment. Interestingly, it has been found in rats that these cells can be active also when the animal is outside the location or context of their corresponding place field producing so-called ''forward sweeps''. These typically occur at decision points during task execution and seem to be utilized, among other things, for the evaluation of potential alternative paths. Anticipatory firing is also found in the ventral striatum, a brain area that is strongly interconnected with the hippocampus and is known to encode value and reward. In this paper, we describe a biologically based computational model of the hippocampal-ventral striatum circuit that implements a goal-directed mechanism of choice, with the hippocampus primarily involved in the mental simulation of possible navigation paths and the ventral striatum involved in the evaluation of the associated reward expectancies. The model is validated in a navigation task in which a rat is placed in a complex maze with multiple rewarding sites. We show that the rat mentally activates place cells to simulate paths, estimate their value, and make decisions, implementing two essential processes of model-based reinforcement learning algorithms of choice: look-ahead prediction and the evaluation of predicted states},
KEYWORDS = {Spatial navigation, Mental simulation, Hippocampal-striatal circuit, Neural network, Computational model},
PAGES = {125-129},
URL = {http://link.springer.com/content/pdf/10.1007%2Fs10339-012-0475-7},
VOLUME = {13 (1)},
DOI = {10.1007/s10339-012-0475-7},
ISSN = {1612-4782},
JOURNAL = {COGNITIVE PROCESSING},
}
@article{DIDONATO_2012_ARTICLE_D_382024,
  author   = {Di Donato, F.},
  title    = {Open Government e Open Data},
  year     = {2012},
  abstract = {Che cosa si intende con Open Government e Open Data? Quali sono le caratteristiche dei Linked Open Data? L'articolo si propone di rispondere a queste domande ricostruendo in primo luogo il passaggio dal cosiddetto e-Government all'Open Government, nato assai di recente in ambito anglosassone, per concentrarsi in secondo luogo sulla definizione giuridica e tecnica di Open (Government) Data, per concludere, infine, con un'analisi delle conseguenze che l'adozione di un paradigma basato sui Linked Open Data (LOD) può avere, in termini di trasparenza amministrativa e di sostegno ai modelli di cittadinanza attiva},
  url      = {https://iris.cnr.it/handle/20.500.14243/382024},
  journal  = {SCIENZA E PACE},
}
@ARTICLE{GAGGIOLI_2012_ARTICLE_GPTBFCSPGMR_315984,
AUTHOR = {Gaggioli, A. and Pioggia, G. and Tartarisco, G. and Baldus, G. and Ferro, M. and Cipresso, P. and Serino, S. and Popleteev, A. and Gabrielli, S. and Maimone, R. and Riva, G.},
TITLE = {A system for automatic detection of momentary stress in naturalistic settings},
YEAR = {2012},
ABSTRACT = {Prolonged exposure to stressful environments can lead to serious health problems. Therefore, measuring stress in daily life situations through non-invasive procedures has become a significant research challenge. In this paper, we describe a system for the automatic detection of momentary stress from behavioral and physiological measures collected through wearable sensors. The system's architecture consists of two key components: a) a mobile acquisition module; b) an analysis and decision module. The mobile acquisition module is a smartphone application coupled with a newly developed sensor platform (Personal Biomonitoring System, PBS). The PBS acquires behavioral (motion activity, posture) and physiological (heart rate) variables, performs low-level, real-time signal preprocessing, and wirelessly communicates with the smartphone application, which in turn connects to a remote server for further signal processing and storage. The decision module is realized on a knowledge basis, using neural network and fuzzy logic algorithms able to combine as input the physiological and behavioral features extracted by the PBS and to classify the level of stress, after previous knowledge acquired during a training phase. The training is based on labeling of physiological and behavioral data through self-reports of stress collected via the smartphone application. After training, the smartphone application can be configured to poll the stress analysis report at fixed time steps or at the request of the user. Preliminary testing of the system is ongoing. © 2012 Interactive Media Institute and IOS Press},
KEYWORDS = {decision, knowledge models, physiological monitoring, psychological stress, wearable sensors},
PAGES = {182-186},
URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-84872015110&origin=inward},
VOLUME = {181},
DOI = {10.3233/978-1-61499-121-2-182},
ISSN = {1554-8716},
JOURNAL = {ANNUAL REVIEW OF CYBERTHERAPY AND TELEMEDICINE},
}
@ARTICLE{GUADAGNINI_2012_ARTICLE_G_269629,
AUTHOR = {Guadagnini, E.},
TITLE = {Voce NAPPA s. f. del Tesoro della Lingua Italiana delle Origini},
YEAR = {2012},
ABSTRACT = {Proposta di un'interpretazione originale di un passo di Paolo dell'Aquila (punto 1.1 della voce): 1 Telo di tessuto (usato spec. in tavola): tovaglia o tovagliolo. 1.1 Fras. Servire di nappa: imbandire, apparecchiare (la tavola). Fig. Preparare un'occasione propizia},
KEYWORDS = {Lessico, Lessicografia, Lingua Italiana, Paolo dell'Aquila},
URL = {http://tlio.ovi.cnr.it/voci/029020.htm},
VOLUME = {16},
ISSN = {2240-5216},
JOURNAL = {TESORO DELLA LINGUA ITALIANA DELLE ORIGINI},
}
@ARTICLE{GUADAGNINI_2012_ARTICLE_G_269620,
AUTHOR = {Guadagnini, E.},
TITLE = {Voce MELLÉ agg./s. m. del Tesoro della Lingua Italiana delle Origini},
YEAR = {2012},
ABSTRACT = {Francesismo. L'entrata della voce costituisce un'interpretazione critica dei dati offerti dalla documentazione: gli editori trascurano di segnare l'accento grafico, che invece è necessario dato il chiaro calco sul fr. ant. "mellé", "meslé" (per cui cfr. le voci TLIO "mellare" e "mellato")},
KEYWORDS = {Lessico, Lessicografia, Lingua Italiana, Francesismi},
URL = {http://tlio.ovi.cnr.it/voci/028258.htm},
VOLUME = {16},
ISSN = {2240-5216},
JOURNAL = {TESORO DELLA LINGUA ITALIANA DELLE ORIGINI},
}
@ARTICLE{GUADAGNINI_2012_ARTICLE_G_265585,
AUTHOR = {Guadagnini, E.},
TITLE = {Scelta di voci del Tesoro della Lingua Italiana delle Origini (sedicesima serie)},
YEAR = {2012},
ABSTRACT = {Voci matta (1) s. f., matta (2) s. f., mattamente avv., mattare (1) v., mattare (2) v., mattato agg., matteggiare v., mattire v., matto (1) agg./s. m., matto (2) agg., matto (3) agg. del Tesoro della Lingua Italiana delle Origini (pp. 83-92)},
KEYWORDS = {Lessico, Lessicografia, Lingua Italiana},
PAGES = {17-160},
URL = {https://iris.cnr.it/handle/20.500.14243/265585},
VOLUME = {17},
ISSN = {1591-8254},
JOURNAL = {BOLLETTINO-OPERA DEL VOCABOLARIO ITALIANO},
}
@ARTICLE{GUADAGNINI_2012_ARTICLE_G_269611,
AUTHOR = {Guadagnini, E.},
TITLE = {Voce MAGAGNA s. f. del Tesoro della Lingua Italiana delle Origini},
YEAR = {2012},
ABSTRACT = {1 Imperfezione o guasto, spec. non manifesto, che altera la struttura o diminuisce il pregio (specif. di un manufatto). 1.1 [Detto di un animale:] malformazione o difetto permanente, menomazione; difetto di andatura, azzoppamento (del cavallo). 1.2 [Rif. a una persona:] difetto fisico, malformazione o menomazione. Fig. Pecca morale (spec. non manifesta). 1.3 Infermità dovuta a una patologia o una ferita. 2 Nocumento agli interessi di qno, danno. 2.1 Situazione, insieme di circostanze o accadimento difficoltoso, sfavorevole, sfortunato},
KEYWORDS = {Lessico, Lessicografia, Lingua Italiana},
URL = {http://tlio.ovi.cnr.it/voci/028226.htm},
VOLUME = {16},
ISSN = {2240-5216},
JOURNAL = {TESORO DELLA LINGUA ITALIANA DELLE ORIGINI},
}
@ARTICLE{HAYASHI_2012_ARTICLE_HSMSC_4446,
AUTHOR = {Hayashi, Y. and Savas, B. and Monachini, M. and Soria, C. and Calzolari, N.},
TITLE = {LMF-aware Web services for accessing semantic lexicons},
YEAR = {2012},
ABSTRACT = {This paper demonstrates that Wordnet-LMF, a version of ISO LMF, allows us to effectively design and implement Web services for accessing WordNet-type semantic lexicons that conform to the REST Web service architecture. The implemented prototype service currently provides access to native wordnets as well as to a bilingual concept dictionary. This paper thus describes slight revisions that were made to the Wordnet-LMF specifications to model and accommodate a non-wordnet-native bilingual concept dictionary},
KEYWORDS = {Lexical markup framework, Semantic lexicon, Wordnet, Language service, RESTful Web service design},
PAGES = {253-264},
URL = {http://link.springer.com/content/pdf/10.1007%2Fs10579-012-9181-4.pdf},
VOLUME = {46 (2)},
DOI = {10.1007/s10579-012-9181-4},
ISSN = {1574-020X},
JOURNAL = {LANGUAGE RESOURCES AND EVALUATION},
}
@article{LAM_2012_ARTICLE_LVB_6202,
  author   = {Lamé, M. and Valchera, V. and Boschetti, F.},
  title    = {Epigrafia digitale. Paradigmi di rappresentazione per il trattamento digitale delle epigrafi},
  year     = {2012},
  abstract = {The article is divided into two parts: the first presents some theoretical and methodological aspects of traditional epigraphy, which can be the theoretical basis for digitization of entries. In particular, the attention is focused on the autopsy of the epigraph. The second part concerns the description of a systematic model for the digital representation of an epigraphic text, based on nine levels of independent analyses, according to the principles of the stand-off mark-up},
  keywords = {Digital Epigraphy, Digital Philology},
  pages    = {331-338},
  url      = {https://iris.cnr.it/handle/20.500.14243/6202},
  volume   = {74 (1-2)},
  issn     = {0013-9572},
  journal  = {EPIGRAPHICA},
}
@ARTICLE{MARINELLI_2012_ARTICLE_MBMCCS_6195,
AUTHOR = {Marinelli, R. and Bindi, R. and Marchi, S. and Castellani, E. and Carli, G. and Santarcangelo, E. L.},
TITLE = {Hypnotizability-related differences in written language},
YEAR = {2012},
ABSTRACT = {Hypnotizierbarkeitbedingte Unterschiede in der Geschriebenen Sprache Rita Marinelli, Remo Bindi, Simone Marchi, Eleonora Castellani, Giancarlo Carli und Enrica L. Santarcangelo Abstrakt: Die Studie analysierte Schreibproben von Probanten mit hoher und geringer Hypnotisierbarkeit. Die Versuchsteilnehmer wurden unter Normalbedingungen angeleitet kurze Texte in Reaktion zu hochimaginären Szenarien zu schreiben. Die Texte wurden mit computerbasierten und manuellen Methoden erarbeitet. Die Ergebnisse zeigten daß die Texte der Hochhypnotisierbaren stilistisch verfeinert waren mit mehr abstrakten Hauptwörtern; intensiver und vollstellungsreicher mit mehr Vergleichen, bildlichen Ausdrücken, und Tonmalereien; und weniger detailliert mit höheren Hauptwort-zu-Adjektiv-Quotienten. Diskutiert werden die Unterschiede im Gebrauch abstrakter Worte und hochvorgestellter Ausdrücke in ihrer Verbindung zu der überragenden linkshemispherischen Aktivität von Hochhypnotisierbaren im Wachzustand und einer möglicherweise andersartigen Rolle des Prekuneus, der in hypnotischen Phänomen beteiligt ist},
KEYWORDS = {Written language, text analysis, hypnosis, hypnotizability},
PAGES = {54-66},
URL = {https://iris.cnr.it/handle/20.500.14243/6195},
VOLUME = {60 (1)},
DOI = {10.1080/00207144.2011.622196},
ISSN = {0020-7144},
JOURNAL = {INTERNATIONAL JOURNAL OF CLINICAL AND EXPERIMENTAL HYPNOSIS},
}
@ARTICLE{MARZI_2012_ARTICLE_M_6179,
AUTHOR = {Marzi, C.},
TITLE = {Knowledge communities in grey},
YEAR = {2012},
ABSTRACT = {The dynamic nature of modern human social interactions, and the increasing capability of wireless and mobile devices for creating and sharing contents, open up the opportunity for a wide dissemination of information through complex knowledge sharing systems. As the shared knowledge components build cognitive ties, there is no real sharing of knowledge without a common understanding of it. In this article, particular emphasis is laid on technologies in Natural Language understanding and knowledge management for providing structured, intelligent access to the continuously evolving content, generated on-line in a pervasive collaborative environment. In detail, robust automated techniques for term extraction and knowledge acquisition are used to tap the information density and the global coherence of text excerpts sampled from both general-purpose and subject-specific social networks. We show empirically that the two sources may exhibit considerable differences in terms of content accessibility and informativeness},
KEYWORDS = {Grey Literature, Web Communities, Knowledge sharing, Concept Maps},
PAGES = {27-33},
URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-84883276602&origin=inward},
VOLUME = {8 (1)},
ISSN = {1574-1796},
JOURNAL = {THE GREY JOURNAL},
}
@ARTICLE{MARZI_2012_ARTICLE_M_6168,
AUTHOR = {Marzi, C.},
TITLE = {First 'NetWordS' Workshop on Understanding the Architecture of the Mental Lexicon: Integration of Existing Approaches},
YEAR = {2012},
ABSTRACT = {The ambitious goal of the workshop, organised within the framework of "NetWordS", the European Science Foundation Research Networking Programme on the Structure of Words in the languages of Europe, was to lay the foundations for an interdisciplinary European research agenda on the Mental Lexicon for the coming 10 years, with particular emphasis on three main challenges: Lexicon and Rules in the grammar; Word knowledge and word use; Words and meanings},
KEYWORDS = {Mental lexicon},
PAGES = {52},
URL = {http://ercim-news.ercim.eu/en89/events/first-networds-workshop},
VOLUME = {89},
ISSN = {0926-4981},
JOURNAL = {ERCIM NEWS},
}
@article{MARZI_2012_ARTICLE_MFP_6224,
  author   = {Marzi, C. and Ferro, M. and Pirrelli, V.},
  title    = {Word alignment and paradigm induction},
  year     = {2012},
  abstract = {The variety of morphological processes attested in inflectional system of average complexity calls for adaptive strategies of word alignment. Prefixation, suffixation, stem alternation and combinations thereof pose severe problems to unsupervised algorithms of morphology induction. The paper analyses morphological generalisation as a by-product of flexible memory self-organisation strategies for word recoding. Our model endorses the hypothesis that lexical forms are memorised as full units. At the same time, lexical units are paradigmatically organised. We show that the overall amount of redundant morphological structure emerging from paradigm-based self-organisation has a clear impact on generalisation. This supports the view that issues of word representation and issues of word processing are mutually implied in lexical acquisition},
  keywords = {Morphological Generalisation, Morphological Paradigm, Self-Organising Memory, Word coding and Processing},
  pages    = {251-274},
  url      = {http://www.rivisteweb.it/doi/10.1418/38789},
  volume   = {XI (2)},
  doi      = {10.1418/38789},
  issn     = {1720-9331},
  journal  = {LINGUE E LINGUAGGIO},
}
@ARTICLE{MARZI_2012_ARTICLE_MP_6217,
AUTHOR = {Marzi, C. and Pirrelli, V.},
TITLE = {Understanding the Architecture of the Mental Lexicon},
YEAR = {2012},
ABSTRACT = {The present collection stems from the 1st NetWordS Workshop "Understanding the architecture of the mental lexicon: Integration of existing approaches", held in the Pisa Research Area of the Italian National Research Council, in November 2011. "NetWordS: the European network on Word Structure in the languages of Europe" is the Research Networking Programme of the European Science Foundation launched in May 2011 with the ambitious goal of paving the way to the European interdisciplinary research agenda on the Mental Lexicon, with particular emphasis on the following three main challenges: lexicon and rules in the grammar, word knowledge and word use, words and meanings},
KEYWORDS = {Mental Lexicon, interdisciplinary approach},
PAGES = {101-105},
URL = {https://iris.cnr.it/handle/20.500.14243/6217},
VOLUME = {XI (2)},
DOI = {10.1418/38780},
ISSN = {1720-9331},
JOURNAL = {LINGUE E LINGUAGGIO},
}
@ARTICLE{PEZZULO_2012_ARTICLE_P_4436,
AUTHOR = {Pezzulo, G.},
TITLE = {The interaction engine: a common pragmatic competence across linguistic and non-linguistic interactions},
YEAR = {2012},
ABSTRACT = {Recent research in cognitive psychology, neuroscience, and robotics has widely explored the tight relations between language and action systems in primates. However, the link between the pragmatics of linguistic and nonlinguistic interactions has received less attention up to now. In this paper, we argue that cognitive agents exploit the same cognitive processes and neural substrate—a general pragmatic competence—across linguistic and nonlinguistic interactive contexts. Elaborating on Levinson's idea of an "interaction engine" that permits to convey and recognize communicative intentions in both linguistic and nonlinguistic interactions, we offer a computationally guided analysis of pragmatic competence, suggesting that the core abilities required for successful linguistic interactions could derive from more primitive architectures for action control, nonlinguistic interactions, and joint actions. Furthermore, we make the case for a novel, embodied approach to human-robot interaction and communication, in which the ability to carry on face-to-face communication develops in coordination with the pragmatic competence required for joint action},
KEYWORDS = {Computational modeling, Context, Engines, Joints, Planning},
PAGES = {105-123},
URL = {https://ieeexplore.ieee.org/document/6006515},
VOLUME = {4 (2)},
DOI = {10.1109/TAMD.2011.2166261},
ISSN = {1943-0604},
JOURNAL = {IEEE TRANSACTIONS ON AUTONOMOUS MENTAL DEVELOPMENT},
}
@ARTICLE{PEZZULO_2012_ARTICLE_PBCFMS_4401,
AUTHOR = {Pezzulo, G. and Barsalou, L. W. and Cangelosi, A. and Fischer, M. H. and McRae, K. and Spivey, M.},
TITLE = {Computational Grounded Cognition: A New Alliance between Grounded Cognition and Computational Modeling},
YEAR = {2012},
ABSTRACT = {Grounded theories assume that there is no central module for cognition. According to this view, all cognitive phenomena, including those considered the province of amodal cognition such as reasoning, numeric and language processing, are ultimately grounded in (and emerge from) a variety of bodily, affective, perceptual and motor processes. The development and expression of cognition is constrained by the embodiment of cognitive agents and various contextual factors (physical and social) in which they are immersed. The grounded framework has received numerous empirical confirmations. Still, there are very few explicit computational models that implement grounding in sensory, motor and affective processes as intrinsic to cognition, and demonstrate that grounded theories can mechanistically implement higher cognitive abilities. We propose a new alliance between grounded cognition and computational modeling towards a novel multidisciplinary enterprise: Computational Grounded Cognition. We clarify the defining features of this novel approach and emphasize the importance of using the methodology of Cognitive Robotics, which permits simultaneous consideration of multiple aspects of grounding, embodiment, and situatedness, showing how they constrain the development and expression of cognition},
KEYWORDS = {Grounding, embodiment, situatedness, Cognitive Robotics, situated simulation},
PAGES = {612-613},
URL = {http://www.frontiersin.org/Psychology/10.3389/fpsyg.2012.00612/abstract},
VOLUME = {3},
DOI = {10.3389/fpsyg.2012.00612},
ISSN = {1664-1078},
JOURNAL = {FRONTIERS IN PSYCHOLOGY},
}
@ARTICLE{PEZZULO_2012_ARTICLE_PO_6207,
AUTHOR = {Pezzulo, G. and Ognibene, D.},
TITLE = {Proactive action preparation: Seeing action preparation as a continuous and proactive process},
YEAR = {2012},
ABSTRACT = {In this paper, we aim to elucidate the processes that occur during action preparation from both a conceptual and a computational point of view. We first introduce the traditional, serial model of goal-directed action and discuss from a computational viewpoint its subprocesses occurring during the two phases of covert action preparation and overt motor control. Then, we discuss recent evidence indicating that these sub-processes are highly intertwined at representational and neural levels, which undermines the validity of the serial model and points instead to a parallel model of action specification and selection. Within the parallel view, we analyze the case of delayed choice, arguing that action preparation can be proactive, and preparatory processes can take place even before decisions are made. Specifically, we discuss how prior knowledge and prospective abilities can be used to maximize utility even before deciding what to do. To support our view, we present a computational implementation of (an approximated version of) proactive action preparation, showing its advantages in a simulated tennis-like scenario},
KEYWORDS = {action preparation, action execution, proactivity, prediction, internal model},
PAGES = {386-424},
URL = {https://iris.cnr.it/handle/20.500.14243/6207},
VOLUME = {16 (3)},
ISSN = {1087-1640},
JOURNAL = {MOTOR CONTROL},
}
@ARTICLE{PROIETTI_2012_ARTICLE_P_405484,
AUTHOR = {Proietti, C.},
TITLE = {Intuitionistic Epistemic Logic, Kripke Models and Fitch's Paradox},
YEAR = {2012},
ABSTRACT = {The present work is motivated by two questions. (1) What should an intuitionistic epistemic logic look like? (2) How should one interpret the knowledge operator in a Kripke-model for it? In what follows we outline an answer to (2) and give a model-theoretic definition of the operator K. This will shed some light also on (1), since it turns out that K, defined as we do, fulfills the properties of a necessity operator for a normal modal logic. The interest of our construction also lies in a better insight into the intuitionistic solution to Fitch's paradox, which is discussed in the third section. In particular we examine, in the light of our definition, DeVidi and Solomon's proposal of formulating the verification thesis as φ → ¬¬Kφ. We show, as our main result, that this definition escapes the paradox, though it is validated only under restrictive conditions on the models},
KEYWORDS = {Intuitionistic logic, Epistemic logic, Fitch's paradox, Kripke models},
PAGES = {877-900},
URL = {https://iris.cnr.it/handle/20.500.14243/405484},
VOLUME = {41 (5)},
DOI = {10.1007/s10992-011-9207-1},
ISSN = {0022-3611},
JOURNAL = {JOURNAL OF PHILOSOPHICAL LOGIC},
}
@ARTICLE{RIGOLI_2012_ARTICLE_RPP_4415,
AUTHOR = {Rigoli, F. and Pavone, E. F. and Pezzulo, G.},
TITLE = {Aversive pavlovian responses affect human instrumental motor performance},
YEAR = {2012},
ABSTRACT = {In neuroscience and psychology, an influential perspective distinguishes between two kinds of behavioral control: instrumental (habitual and goal-directed) and Pavlovian. Understanding the instrumental-Pavlovian interaction is fundamental for the comprehension of decision-making. Animal studies (as those using the negative auto-maintenance paradigm), have demonstrated that Pavlovian mechanisms can have maladaptive effects on instrumental performance. However, evidence for a similar effect in humans is scarce. In addition, the mechanisms modulating the impact of Pavlovian responses on instrumental performance are largely unknown, both in human and non-human animals. The present paper describes a behavioral experiment investigating the effects of Pavlovian conditioned responses on performance in humans, focusing on the aversive domain. Results showed that Pavlovian responses influenced human performance, and, similar to animal studies, could have maladaptive effects. In particular, Pavlovian responses either impaired or increased performance depending on modulator variables such as threat distance, task controllability, punishment history, amount of training, and explicit punishment expectancy. Overall, these findings help elucidating the computational mechanisms underlying the instrumental-Pavlovian interaction, which might be at the base of apparently irrational phenomena in economics, social behavior, and psychopathology},
KEYWORDS = {Controllability, goal-directed, habitual, Pavlovian, reinforcement learning},
PAGES = {134},
URL = {http://www.frontiersin.org/Decision_Neuroscience/10.3389/fnins.2012.00134/abstract},
VOLUME = {6},
DOI = {10.3389/fnins.2012.00134},
ISSN = {1662-453X},
JOURNAL = {FRONTIERS IN NEUROSCIENCE (ONLINE)},
}
@ARTICLE{RUSSO_2012_ARTICLE_RCR_4471,
AUTHOR = {Russo, I. and Caselli, T. and Rubino, F.},
TITLE = {Recognizing deverbal events in context},
YEAR = {2012},
ABSTRACT = {Event detection is a key task in order to access information through content. This paper focuses on events realized by deverbal nouns in Italian. Deverbal nouns obtained through transpositional suffixes (such as -zione, -mento, -tura and -aggio) are commonly known as nouns of action, i.e. nouns which denote the process/action described by the corresponding verbs. However, this class of nouns is also known for a specific polysemous alternation: they may denote the result of the process/action of the corresponding verb. This paper describes a statistically based analysis that helps to develop a classifier for automatic identification of deverbal nouns denoting events in context by exploiting rules obtained from syntagmatic and collocational cues identified by linguists},
KEYWORDS = {Deverbal noun, Event detection},
PAGES = {91-103},
URL = {http://www.gelbukh.com/ijcla/2011-1-2/IJCLA-2011.pdf#page=91},
VOLUME = {2 (1-2)},
ISSN = {0976-0962},
JOURNAL = {INTERNATIONAL JOURNAL OF COMPUTATIONAL LINGUISTICS AND APPLICATIONS},
}
@article{TARTARISCO_2012_ARTICLE_TBCRAFGP_226738,
  author   = {Tartarisco, G. and Baldus, G. and Corda, D. and Raso, R. and Arnao, A. and Ferro, M. and Gaggioli, A. and Pioggia, G.},
  title    = {Personal Health System architecture for stress monitoring and support to clinical decisions},
  year     = {2012},
  abstract = {Developments in computational techniques including clinical decision support systems, information processing, wireless communication and data mining hold new premises in Personal Health Systems. Pervasive Healthcare system architecture finds today an effective application and represents in perspective a real technological breakthrough promoting a paradigm shift from diagnosis and treatment of patients based on symptoms to diagnosis and treatment based on risk assessment. Such architectures must be able to collect and manage a large quantity of data supporting the physicians in their decision process through a continuous pervasive remote monitoring model aimed to enhance the understanding of the dynamic disease evolution and personal risk. In this work an automatic simple, compact, wireless, personalized and cost efficient pervasive architecture for the evaluation of the stress state of individual subjects suitable for prolonged stress monitoring during normal activity is described. A novel integrated processing approach based on an autoregressive model, artificial neural networks and fuzzy logic modeling allows stress conditions to be automatically identified with a mobile setting analysing features of the electrocardiographic signals and human motion. The performances of the reported architecture were assessed in terms of classification of stress conditions. © 2011 Elsevier B. V. All rights reserved},
  keywords = {Autonomic sympathovagal balance, Autoregressive model, Clinical decision support system, Pervasive healthcare architecture, Stress detection},
  pages    = {1296-1305},
  url      = {http://www.sciencedirect.com/science/article/pii/S0140366411003720},
  volume   = {35 (11)},
  doi      = {10.1016/j.comcom.2011.11.015},
  issn     = {0140-3664},
  journal  = {COMPUTER COMMUNICATIONS},
}
@ARTICLE{TERRANOVA_2012_ARTICLE_TFCRBSP_171910,
AUTHOR = {Terranova, G. and Ferro, M. and Carpeggiani, C. and Recchia, V. and Braga, L. and Semelka, R. C. and Picano, E.},
TITLE = {Low Quality and Lack of Clarity of Current Informed Consent Forms in Cardiology: How to Improve Them},
YEAR = {2012},
ABSTRACT = {Guidelines on informed consent for clinical practice exhort physicians to use standard plain language to enhance patient comprehension and facilitate shared decision making. The aim of this study was to assess and improve quality and readability of current informed consent forms used in cardiology. We evaluated the currently used informed consent forms, previously written in Italian and English, of 7 common imaging examinations, according to the recommendations of scientific societies. For each text, we also developed a revised informed consent form according to reference standards, including Federal Plain Language guidelines. Regarding readability scores, we analyzed each text (standard and revised) with Flesch-Kincaid (F-K) grade level (higher numbers indicating harder-to-read text) and the Italian language-tailored Gulpease level (from 0 [difficult] to 100 [easy]). Overall quality and readability was poor for both the original English and Italian versions, and readability was improved with the revised form, with higher readability evidenced by changes in both F-K grade level (standard 10.2 ± 2.37% vs. revised 6.5 ± 0.41%; p < 0.001) for English and Gulpease (standard 45.7 ± 2% vs. revised 84.09 ± 2.98%; p < 0.0001) for Italian. In conclusion, current informed consent forms are complex, incomplete, and unreadable for the average patient. Substantial quality improvement and higher readability scores can be achieved with revised forms that explicitly discuss risks and are prepared following standard recommendations of plain writing},
KEYWORDS = {bioethic, imaging risk communication, informed consent, patient rights},
PAGES = {649-655},
URL = {http://www.sciencedirect.com/science/article/pii/S1936878X1200321X},
VOLUME = {5 (6)},
DOI = {10.1016/j.jcmg.2012.03.007},
ISSN = {1936-878X},
JOURNAL = {JACC. CARDIOVASCULAR IMAGING},
}
@ARTICLE{TORAL_2012_ARTICLE_TFMM_4454,
AUTHOR = {Toral, A. and Ferrández, S. and Monachini, M. and Munoz, R.},
TITLE = {Web 2.0, Language Resources and standards to automatically build a multilingual Named Entity Lexicon},
YEAR = {2012},
ABSTRACT = {This paper proposes to advance in the current state-of-the-art of automatic Language Resource (LR) building by taking into consideration three elements: (1) the knowledge available in existing LRs, (2) the vast amount of information available from the collaborative paradigm that has emerged from the Web 2.0 and (3) the use of standards to improve interoperability. We present a case study in which a set of LRs for different languages (WordNet for English and Spanish and Parole-Simple-Clips for Italian) are extended with Named Entities (NE) by exploiting Wikipedia and the aforementioned LRs. The practical result is a multilingual NE lexicon connected to these LRs and to two ontologies: SUMO and SIMPLE. Furthermore, the paper addresses an important problem which affects the Computational Linguistics area in the present, interoperability, by making use of the ISO LMF standard to encode this lexicon. The different steps of the procedure (mapping, disambiguation, extraction, NE identification and postprocessing) are comprehensively explained and evaluated. The resulting resource contains 974,567, 137,583 and 125,806 NEs for English, Spanish and Italian respectively. Finally, in order to check the usefulness of the constructed resource, we apply it into a state-of-the-art Question Answering system and evaluate its impact; the NE lexicon improves the system's accuracy by 28.1%. Compared to previous approaches to build NE repositories, the current proposal represents a step forward in terms of automation, language independence, amount of NEs acquired and richness of the information represented},
KEYWORDS = {Language Resource, Named Entities, Web 2.0, Standards},
PAGES = {383-419},
URL = {http://link.springer.com/content/pdf/10.1007%2Fs10579-011-9148-x.pdf},
VOLUME = {46 (3)},
DOI = {10.1007/s10579-011-9148-x},
ISSN = {1574-020X},
JOURNAL = {LANGUAGE RESOURCES AND EVALUATION},
}
@BOOK{CALZOLARI_2012_BOOK_CMSS_119251,
  AUTHOR           = {Calzolari, N. and Magnini, B. and Speranza, M. and Soria, C.},
  TITLE            = {The Italian language in the digital age-La lingua italiana nell'era digitale},
  YEAR             = {2012},
  ABSTRACT         = {This white paper is part of a series that promotes knowledge about language technology and its potential. It addresses educators, journalists, politicians, language communities and others. The availability and use of language technology in Europe varies between languages. Consequently, the actions that are required to further support research and development of language technologies also differ for each language. The required actions depend on many factors, such as the complexity of a given language and the size of its community. META-NET, a Network of Excellence funded by the European Commission, has conducted an analysis of current language resources and technologies. This analysis focused on the 23 official European languages as well as other important national and regional languages in Europe. The results of this analysis suggest that there are many significant research gaps for each language. A more detailed expert analysis and assessment of the current situation will help maximise the impact of additional research and minimize any risks. META-NET consists of 54 research centres from 33 countries that are working with stakeholders from commercial businesses, government agencies, industry, research organisations, software companies, technology providers and European universities. Together, they are creating a common technology vision while developing a strategic research agenda that shows how language technology applications can address any research gaps by 2020},
  KEYWORDS         = {digital extinction, tecnologie del linguaggio, lingua italiana},
  PAGES            = {69},
  URL              = {http://www.springer.com/computer/ai/book/978-3-642-30775-1},
  DOI              = {10.1007/978-3-642-30776-8},
  PUBLISHER        = {Springer (Berlin, DEU)},
  ISBN             = {978-3-642-30775-1},
  CONFERENCE_PLACE = {Berlin},
  EDITOR           = {Rehm, G. and Uszkoreit, H.},
}
@INCOLLECTION{BURGASSI_2012_INCOLLECTION_B_19844,
  AUTHOR           = {Burgassi, C.},
  TITLE            = {Intorno al testo dei «Due dialoghi»},
  YEAR             = {2012},
  KEYWORDS         = {Filologia italiana, Ruzante},
  PAGES            = {63-79},
  URL              = {https://iris.cnr.it/handle/20.500.14243/19844},
  PUBLISHER        = {CLEUP (Padova, ITA)},
  CONFERENCE_PLACE = {Padova},
  BOOKTITLE        = {Molte cose stanno bene nella penna che ne la scena starebben male. Teatro e lingua in Ruzante (Atti del Convegno, Padova-Pernumia 26-27 ottobre 2011)},
  EDITOR           = {Cecchinato, A.},
}
@INCOLLECTION{CAVIONI_2012_INCOLLECTION_CCMRZ_216300,
  AUTHOR           = {Cavioni, V. and Cutugno, P. and Marconi, L. and Renati, R. and Zanetti, M. A.},
  TITLE            = {Essere e apparire: le identità digitali costruite in rete},
  YEAR             = {2012},
  ABSTRACT         = {Identità, apprendimento e comunità sono parole chiavi attraverso cui è possibile capire la portata innovativa che i nuovi ambienti di comunicazione on line stanno apportando alla vita sociale, culturale e privata di coloro che entrano in rete. In quest'ottica, il volume analizza i processi di interazione on line, di identità digitali, di comunità virtuali, con particolare riferimento ad ambienti e strumenti tecnologici di diverso tipo: forum, blog, Facebook. L'accesso ad Internet permette agli individui l'ingresso in uno spazio, non solo digitale, ma anche psicologico. La possibilità di comunicare senza vincoli di tempo e di spazio attraverso molteplici modalità comunicative permette alle persone di sentirsi realmente parte di una comunità all'interno della quale ogni "mente" è collegata alle altre. L'identità online non è soltanto definita dalle caratteristiche auto-attribuite da un utente a sé stesso, ma essa risulta determinata dai feedback di risposta dagli altri utenti, i quali danno ulteriori significati ai contenuti online in risposta a comportamenti agiti nel cyberspazio. Nella rete, quindi, è possibile rinegoziare la propria struttura identitaria, attraverso continui processi di differenziazione/identificazione, riflessioni e narrazioni di Sé nella comunità virtuale. Il linguaggio, come sistema di simboli volontariamente prodotti e attraverso il quale si esprime e realizza la comunicazione all'interno di una determinata comunità o gruppo sociale, costituisce indubbiamente un elemento essenziale dei processi di costruzione dell'identità. E' interessante esplorare nello specifico le modalità di scrittura, in particolare i testi online prodotti dalle giovani generazioni al fine identificarne i tratti salienti integrando gli aspetti di analisi linguistica con quelli maggiormente di tipo psicologico. 
L'obiettivo è stato quello di esplorare le modalità di scrittura dei giovani, identificandone similarità e specificità con i modi tradizionali di comunicare. Nello specifico è stata condotta un'analisi relativa agli aspetti linguistici e psicologici propri della scrittura in rete prodotta nei blog},
  KEYWORDS         = {conoscenza, linguistica, media education, didattica, formazione},
  PAGES            = {105-123},
  URL              = {https://iris.cnr.it/handle/20.500.14243/216300},
  PUBLISHER        = {Franco Angeli Edizioni (Roma-Milano, ITA)},
  ISBN             = {9788856845891},
  CONFERENCE_PLACE = {Roma-Milano},
  BOOKTITLE        = {Identità, apprendimento e comunità virtuali. Strumenti e attività on line},
  EDITOR           = {Albanese, O. and Ligorio, M. B. and Zanetti, M. A.},
}
@INCOLLECTION{DINDO_2012_INCOLLECTION_DLNPCT_4557,
AUTHOR = {Dindo, H. and La Tona, G. and Nivel, E. and Pezzulo, G. and Chella, A. and Thorisson, K. R.},
TITLE = {Simulation and anticipation as tools for coordinating with the future},
YEAR = {2012},
ABSTRACT = {A key goal in designing an artificial intelligence capable of performing complex tasks is a mechanism that allows it to efficiently choose appropriate and relevant actions in a variety of situations and contexts. Nowhere is this more obvious than in the case of building a general intelligence, where the contextual choice and application of actions must be done in the presence of large numbers of alternatives, both subtly and obviously distinct from each other. We present a framework for action selection based on the concurrent activity of multiple forward and inverse models. A key characteristic of the proposed system is the use of simulation to choose an action: the system continuously simulates the external states of the world (proximal and distal) by internally emulating the activity of its sensors, adopting the same decision process as if it were actually operating in the world, and basing subsequent choice of action on the outcome of such simulations. The work is part of our larger effort to create new observation-based machine learning techniques. We describe our approach, an early implementation, and an evaluation in a classical AI problem-solving domain: the Sokoban puzzle},
KEYWORDS = {Machine learning techniques},
PAGES = {117-125},
URL = {http://link.springer.com/content/pdf/10.1007%2F978-3-642-34274-5_24},
DOI = {10.1007/978-3-642-34274-5_24},
PUBLISHER = {Springer-Verlag (Berlin Heidelberg, DEU)},
CONFERENCE_PLACE = {Berlin Heidelberg},
BOOKTITLE = {Biologically Inspired Cognitive Architectures},
EDITOR = {Chella, A.},
}
% Key keeps the original "IOANNDIS" spelling so existing citations still resolve; only the AUTHOR value is corrected.
@INCOLLECTION{IOANNDIS_2012_INCOLLECTION_ITDFVTP_4538,
AUTHOR = {Ioannidis, D. and Tzovaras, D. and Dalle Mura, G. and Ferro, M. and Valenza, G. and Tognetti, A. and Pioggia, G.},
TITLE = {Gait and Anthropometric Profile Biometrics: A Step Forward},
YEAR = {2012},
ABSTRACT = {While a sharp debate is emerging about whether conventional biometric technology offers society any significant advantages over other forms of identification, and whether it constitutes a threat to privacy, technology is rapidly progressing. Politicians and the public are still discussing fingerprinting and iris scan, while scientists and engineers are already testing futuristic solutions. Second generation biometrics-which include multimodal biometrics, behavioural biometrics, dynamic face recognition, EEG and ECG biometrics, remote iris recognition, and other, still more astonishing, applications-is a reality which promises to overturn any current ethical standard about human identification. Robots which recognise their masters, CCTV which detects intentions, voice responders which analyse emotions: these are only a few applications in progress to be developed},
KEYWORDS = {biometric, sensing seat},
PAGES = {105-127},
URL = {http://www.springer.com/social+sciences/applied+ethics/book/978-94-007-3891-1},
DOI = {10.1007/978-94-007-3892-8_5},
PUBLISHER = {Springer Verlag (Norwell MA, USA)},
ISBN = {978-94-007-3891-1},
CONFERENCE_PLACE = {Norwell MA},
BOOKTITLE = {Second Generation Biometrics: The Ethical, Legal and Social Context},
EDITOR = {Mordini, E. and Tzovaras, D.},
}
@INCOLLECTION{MORGAVI_2012_INCOLLECTION_MMMC_230427,
AUTHOR = {Morgavi, G. and Marconi, L. and Morando, M. and Cutugno, P.},
TITLE = {From human creative cognitive processes to adaptable artificial system design},
YEAR = {2012},
ABSTRACT = {In epigenetic robotics, a new research field, interdisciplinary theory and empirical evidences are used to inform adaptive robotic models, and, vice-versa, these models can be used as tools to make experimental predictions in developmental psychology. A truly autonomous robot should be capable of evolving and `growing up' through experience. Following different psychological points of view, growing up implies a knowledge creative process called: change of functional meaning; increased complexity; enlargement of the internal knowledge map; abstraction and insight. To understand this creative process, we organized an experiment with pre-school children diving with the abstraction process. The cognitive development of children of this age do not include the ability of abstraction, but they are able to explain the process they are thinking. Forty-two metaphoric sentences have been proposed to eight working-groups, of nine to ten children each, asking for their abstracted meanings. After a preliminary "brainstorming" phase, where the free creative associations were prevalent, we addressed children's attention towards the individuation of the metaphoric meaning. The process has been recorded and then we analyzed and classified the answers. Collective speech have been analyzed to compensate the individual differences. The children disclosure was mostly driven by their value system, their motivations and their emotions. They tried many different strategies to reach the abstract meaning, starting from their concrete knowledge and experiences. Each children followed a set of thinking paths that resulted in some very interesting suggestions for the architecture of an adaptive and evolving robot: i.e. the importance of multi-sensor perception, motivation and emotional drives are underlined and, the growing up insights shows similarities to emergent self-organized behaviours},
KEYWORDS = {epigenetic robotics, growing up, abstraction},
PAGES = {133-145},
URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-84892171708\&origin=inward},
DOI = {10.4324/9780203325988},
PUBLISHER = {Psychology Press (London, GBR)},
ISBN = {9780203325988},
CONFERENCE_PLACE = {London},
BOOKTITLE = {Attention, Representation, and Human Performance: Integration of Cognition, Emotion, and Motivation},
EDITOR = {Masmoudi, S. and Dai, D. Y. and Naceur, A.},
}
@INCOLLECTION{PEZZULO_2012_INCOLLECTION_P_4589,
  AUTHOR           = {Pezzulo, G.},
  TITLE            = {Re-founding cognitivism based on the cybernetic idea of goal-directed action},
  YEAR             = {2012},
  KEYWORDS         = {goals, prediction, cognition},
  PAGES            = {13-23},
  URL              = {https://iris.cnr.it/handle/20.500.14243/4589},
  PUBLISHER        = {College Publications Ltd (London, GBR)},
  CONFERENCE_PLACE = {London},
  BOOKTITLE        = {The Goals of Cognition. Essays in honour of Cristiano Castelfranchi},
  EDITOR           = {Paglieri, F. and Tummolini, L. and Falcone, R.},
}
@INCOLLECTION{PIRRELLI_2012_INCOLLECTION_PFC_134821,
  AUTHOR           = {Pirrelli, V. and Ferro, M. and Calderone, B.},
  TITLE            = {Learning Paradigms in Time and Space: Computational Evidence from Romance Languages},
  YEAR             = {2012},
  ABSTRACT         = {In the linguistic literature, paradigms have enjoyed a hybrid status, half-way between entrenched patterns of lexical organization and processing structures enforcing global constraints on the output of traditional inflection rules. We describe here an original computational model of the mental lexicon where paradigmatic structures emerge through learning as the by-product of the endogenous dynamics of lexical memorization as competitive self-organization, based on the complementary principles of formal contrast (in space) and association biuniqueness (in time)},
  KEYWORDS         = {Computational model, Lexical memorization, Mental lexicon, Processing structures, Self-organizing maps},
  PAGES            = {135-157},
  URL              = {http://www.scopus.com/record/display.url?eid=2-s2.0-84921732430\&origin=inward},
  DOI              = {10.1093/acprof:oso/9780199589982.003.0008},
  PUBLISHER        = {Oxford University Press (Oxford, GBR)},
  ISBN             = {978-0-19-958998-2},
  CONFERENCE_PLACE = {Oxford},
  BOOKTITLE        = {Morphological Autonomy: Perspectives for Romance Inflectional Morphology},
  EDITOR           = {Maiden, M. and Smith, J. C. and Goldbach, M.},
}
% Key keeps the original "DIRETTODASEGRE" form so existing citations still resolve; the role phrases "Diretto da" / "A cura di" were removed from the AUTHOR names.
@EDITORIAL{DIRETTODASEGRE_2012_EDITORIAL_DAMS_130174,
AUTHOR = {Segre, C. and Martignoni, C. and Morini, L. and Sassi, M.},
TITLE = {Rimario diacronico dell'Orlando Furioso},
YEAR = {2012},
ABSTRACT = {Il rimario dell'Orlando Furioso qui edito è diacronico perchè rappresenta sistematicamente i numerosi cambi di rimante fra le tre redazioni dell'Orlando Furioso, tutte e tre curate personalmente dall'autore (A, 1516; B, 1521; C, 1532). Se perciò un verso ha subito cambi di rimante esso è presente sotto i rimanti successivamente impiegati nelle tre redazioni. Il confronto è immediato in questo rimario diacronico, sia che si parta da un verso di A per arrivare alla forma assunta in B e poi in C, sia che si parta da C e si risalga a B e ad A. Gli sviluppi del contesto analizzato si possono riportare anche all'insieme del macrocontesto grazie all'acclusa Tavola comparativa delle tre edizioni originali},
KEYWORDS = {Orlando Furioso, Rimario Diacronico},
PAGES = {1-1702},
URL = {https://iris.cnr.it/handle/20.500.14243/130174},
PUBLISHER = {Iuss Press (Pavia, ITA)},
ISBN = {9788861980686},
CONFERENCE_PLACE = {Pavia},
}
@EDITORIAL{FRANCESCONI_2012_EDITORIAL_FMPW_297503,
  AUTHOR           = {Francesconi, E. and Montemagni, S. and Peters, W. and Wyner, A.},
  TITLE            = {Proceedings of the Fourth Workshop on Semantic Processing of Legal Texts (SPLeT 2012)},
  YEAR             = {2012},
  KEYWORDS         = {Trattamento Automatico del Linguaggio, Linguaggio Giuridico, Estrazione di Conoscenza},
  PAGES            = {71},
  URL              = {http://www.lrec-conf.org/proceedings/lrec2012/workshops/27.LREC%202012%20Workshop%20Proceedings%20SPLeT.pdf},
  PUBLISHER        = {European Language Resources Association ELRA (Paris, FRA)},
  ISBN             = {978-2-9517408-7-7},
  CONFERENCE_PLACE = {Paris},
}
@EDITORIAL{MARZI_2012_EDITORIAL_MP_226484,
  AUTHOR           = {Marzi, C. and Pirrelli, V.},
  TITLE            = {Understanding the Architecture of the Mental Lexicon},
  YEAR             = {2012},
  ABSTRACT         = {The present collection stems from the 1st NetWordS Workshop "Understanding the architecture of the mental lexicon: Integration of existing approaches", held in the Pisa Research Area of the Italian National Research Council, in November 2011. "NetWordS: the European network on Word Structure in the languages of Europe" is the Research Networking Programme of the European Science Foundation launched in May 2011 with the ambitious goal of paving the way to the European interdisciplinary research agenda on the Mental Lexicon, with particular emphasis on the following three main challenges:-lexicon and rules in the grammar,-word knowledge and word use,-words and meanings},
  KEYWORDS         = {Mental Lexicon, interdisciplinary approach},
  PAGES            = {101-274},
  URL              = {https://iris.cnr.it/handle/20.500.14243/226484},
  PUBLISHER        = {Il Mulino (Bologna, ITA)},
  ISSN             = {1720-9331},
  ISBN             = {978-88-15-23601-2},
  CONFERENCE_PLACE = {Bologna},
}
@INPROCEEDINGS{BIANCHI_2012_INPROCEEDINGS_BTG_264623,
AUTHOR = {Bianchi, E. and Tavosanis, M. and Giovannetti, E.},
TITLE = {Creation of a bottom-up corpus-based ontology for Italian Linguistics},
YEAR = {2012},
ABSTRACT = {This paper describes the steps of construction of a shallow lexical ontology of Italian Linguistics in Italian, set to be used by a meta-search engine for query refinement. The ontology was constructed with the software Protege 4.0.2 and encoded in OWL format; its construction has been carried out following the steps described in the well-known Ontology Learning From Text (OLFT) layer cake. The starting point was the automatic term extraction from a corpus of web documents concerning the domain of interest (304,000 words); as regards corpus construction, we describe the main criteria of the web documents selection and its critical points, concerning the definition of user profile and of degrees of specialisation. We then describe the process of term validation and construction of a glossary of terms of Italian Linguistics; afterwards, we outline the identification of synonymic chains and the main criteria of ontology design: top classes of ontology are Concept (containing taxonomy of concepts) and Term (containing terms of the glossary as instances), while concepts are linked through part-whole and involved-role relation, both borrowed from Wordnet. Finally, we show some examples of the application of the ontology for query refinement},
KEYWORDS = {Ontologies, Italian Linguistics, Query refinement},
PAGES = {2641-2647},
URL = {https://iris.cnr.it/handle/20.500.14243/264623},
PUBLISHER = {European Language Resources Association ELRA (Paris, FRA)},
CONFERENCE_NAME = {LREC 2012-Eighth International Conference on Language Resources and Evaluation},
CONFERENCE_PLACE = {Paris},
BOOKTITLE = {Language Resources and Evaluation},
}
@INPROCEEDINGS{BONIN_2012_INPROCEEDINGS_BDMV_289376,
  AUTHOR           = {Bonin, F. and Dell'Orletta, F. and Montemagni, S. and Venturi, G.},
  TITLE            = {Lessico settoriale e lessico comune dell'estrazione di terminologia specialistica da corpora di dominio},
  YEAR             = {2012},
  PAGES            = {207-220},
  URL              = {https://iris.cnr.it/handle/20.500.14243/289376},
  PUBLISHER        = {Bulzoni Editore (Roma, ITA)},
  ISBN             = {978-88-7870-655-2},
  CONFERENCE_NAME  = {XLIV congresso internazionale di studi della società di linguistica italiana},
  CONFERENCE_PLACE = {Roma},
  BOOKTITLE        = {Lessico e Lessicologia. Atti del XLIV congresso internazionale di studi della società di linguistica italiana},
}
@INPROCEEDINGS{BOSCO_2012_INPROCEEDINGS_BMS_297499,
AUTHOR = {Bosco, C. and Montemagni, S. and Simi, M.},
TITLE = {Harmonization and Merging of two Italian Dependency Treebanks},
YEAR = {2012},
ABSTRACT = {The paper describes the methodology which is currently being defined for the construction of a "Merged Italian Dependency Treebank" (MIDT) starting from already existing resources. In particular, it reports the results of a case study carried out on two available dependency treebanks, i.e. TUT and ISST-TANL. The issues raised during the comparison of the annotation schemes underlying the two treebanks are discussed and investigated with a particular emphasis on the definition of a set of linguistic categories to be used as a "bridge" between the specific schemes. As an encoding format, the CoNLL de facto standard is used},
KEYWORDS = {Syntactic Annotation, Merging of Resources, Dependency Parsing},
PAGES = {23-30},
URL = {http://www.lrec-conf.org/proceedings/lrec2012/workshops/06.LREC%202012%20Merging%20Proceedings.pdf},
PUBLISHER = {European Language Resources Association ELRA (Paris, FRA)},
ISBN = {978-2-9517408-7-7},
CONFERENCE_NAME = {LREC 2012 Workshop on Language Resource Merging},
CONFERENCE_PLACE = {Paris},
BOOKTITLE = {Proceedings of the LREC 2012 Workshop on Language Resource Merging},
EDITOR = {Bel, N.},
}
@INPROCEEDINGS{BOZZI_2012_INPROCEEDINGS_B_129363,
AUTHOR = {Bozzi, A.},
TITLE = {La filologia del testo assistita dal calcolatore},
YEAR = {2012},
ABSTRACT = {Il termine filologia del testo abbraccia molte attività che uno studioso compie nel momento in cui decida di affrontare lo studio di un'opera antica, moderna o contemporanea. Tali incombenze possono riguardare sia lo sviluppo del testo e la ricerca di tutti gli elementi interni ed esterni che ne mettono in luce la storia, sia la valutazione e la collocazione di quanto il testo veicola in relazione con le conoscenze che si hanno sul suo autore, se noto, sull'ambiente in cui il testo nasce, sugli eventuali rapporti con altre fonti precedenti o contemporanee},
KEYWORDS = {Filologia computazionale},
PAGES = {219-229},
URL = {https://iris.cnr.it/handle/20.500.14243/129363},
CONFERENCE_NAME = {Il diritto romano e le scienze antichistiche nell'era digitale},
}
@INPROCEEDINGS{CALDERONE_2012_INPROCEEDINGS_CP_228503,
AUTHOR = {Calderone, B. and Pirrelli, V.},
TITLE = {Apprendimento morfologico, relazioni base-derivato e topologie paradigmatiche. Evidenze psico-computazionali a confronto},
YEAR = {2012},
ABSTRACT = {Il presente lavoro è volto a esplorare alcune dinamiche acquisizionali relative ai processi di maturazione della competenza morfologica in apprendenti bambini. In quest'ottica, sono riportate due differenti simulazioni computazionali dei processi di apprendimento della morfologia flessiva in Italiano e in Inglese. La prima simulazione, propria di un quadro connessionista classico, dà conto in modo inadeguato delle differenti scale temporali nell'apprendimento di alcune forme flesse verbali in inglese e italiano. La letteratura sull'argomento (Pizzuto \& Caselli 1992, Noccetti 2003) documenta in modo convergente una maggiore rapidità nell'apprendimento delle forme del presente indicativo da parte dei bambini italiani rispetto al ritmo di acquisizione delle forme verbali corrispondenti (la forma di base e la terza persona singolare in-s) da parte di bambini di madre lingua inglese. La seconda simulazione, basata su un modello di memorie associative "a cascata" addestrate tramite protocollo non-supervisionato, rende conto in maniera non banale del paradosso acquisizionale, confermato su base inter-linguistica da un recente studio di Dressler e colleghi (Bittner et al., 2003), secondo cui sistemi flessivi più complessi e completi sono appresi con maggiore facilità di sistemi flessivi più semplici ed estesamente sincretici},
KEYWORDS = {Lessico Mentale, apprendimento morfologico, paradigmi flessionali},
PAGES = {17},
URL = {https://iris.cnr.it/handle/20.500.14243/228503},
PUBLISHER = {Bulzoni Editore (Roma, ITA)},
CONFERENCE_NAME = {XLII Convegno della Società di Linguistica Italiana},
CONFERENCE_PLACE = {Roma},
BOOKTITLE = {Linguaggio e cervello / Semantica, Atti del XLII Convegno della Società di Linguistica Italiana (Pisa, Scuola Normale Superiore, 25-27 settembre 2008)},
EDITOR = {Bambini, V. and Ricci, I. and Bertinetto, P. M.},
}
@INPROCEEDINGS{CALZOLARI_2012_INPROCEEDINGS_CDFMRRS_119646,
AUTHOR = {Calzolari, N. and Del Gratta, R. and Francopoulo, G. and Mariani, J. and Rubino, F. and Russo, I. and Soria, C.},
TITLE = {The LRE Map. Harmonising Community Descriptions of Resources},
YEAR = {2012},
ABSTRACT = {Accurate and reliable documentation of Language Resources is an undisputable need: documentation is the gateway to discovery of Language Resources, a necessary step towards promoting the data economy. Language resources that are not documented virtually do not exist: for this reason every initiative able to collect and harmonise metadata about resources represents a valuable opportunity for the NLP community. In this paper we describe the LRE Map, reporting statistics on resources associated with LREC2012 papers and providing comparisons with LREC2010 data. The LRE Map, jointly launched by FLaReNet and ELRA in conjunction with the LREC 2010 conference, is an instrument for enhancing availability of information about resources, either new or already existing ones, reinforcing and facilitating the use of standards in the community. The LRE Map web interface provides the possibility of searching according to a fixed set of metadata and to view the details of extracted resources. The LRE Map is continuing to collect bottom-up input about resources from authors of other conferences through standard submission process. This will help broadening the notion of "language resources" and attract to the field neighboring disciplines that so far have been only marginally involved by the standard notion of language resources},
KEYWORDS = {Language resources, metadata, documentation},
PAGES = {1084-1089},
URL = {http://www.lrec-conf.org/proceedings/lrec2012/index.html},
ISBN = {978-2-9517408-7-7},
CONFERENCE_NAME = {The Eighth International Conference on Language Resources and Evaluation (LREC'12)},
BOOKTITLE = {Proceedings of LREC'12-The Eighth International Conference on Language Resources and Evaluation},
EDITOR = {Calzolari, N. and Choukri, K. and Declerck, T. and Doğan, M. U. and Maegaard, B. and Mariani, J. and Odijk, J. and Piperidis, S.},
}
@INPROCEEDINGS{CASELLI_2012_INPROCEEDINGS_CFQRR_222834,
AUTHOR = {Caselli, T. and Frontini, F. and Quochi, V. and Rubino, F. and Russo, I.},
TITLE = {Flexible Acquisition of Subcategorization Frames in Italian},
YEAR = {2012},
ABSTRACT = {Lexica of predicate-argument structures constitute a useful tool for several tasks in NLP. This paper describes a web-service system for automatic acquisition of verb subcategorization frames (SCFs) from parsed data in Italian. The system acquires SCFs in an unsupervised manner. We created two gold standards for the evaluation of the system, the first by mixing together information from two lexica (one manually created and the second automatically acquired) and manual exploration of corpus data and the other annotating data extracted from a specialized corpus (environmental domain). Data filtering is accomplished by means of the maximum likelihood estimate (MLE). The evaluation phase has allowed us to identify the best empirical MLE threshold for the creation of a lexicon (P=0.653, R=0.557, F1=0.601). In addition to this, we assigned to the extracted entries of the lexicon a confidence score based on the relative frequency and evaluated the extractor on domain specific data. The confidence score will allow the final user to easily select the entries of the lexicon in terms of their reliability: one of the most interesting feature of this work is the possibility the final users have to customize the results of the SCF extractor, obtaining different SCF lexica in terms of size and accuracy},
KEYWORDS = {lexicon, automatic acquisition, subcategorisation frames},
PAGES = {2842-2848},
URL = {http://www.lrec-conf.org/proceedings/lrec2012/summaries/390.html},
PUBLISHER = {European Language Resources Association ELRA (Paris, FRA)},
ISBN = {9782951740877},
CONFERENCE_NAME = {Eighth International Conference on Language Resources and Evaluation (LREC'12)},
CONFERENCE_PLACE = {Paris},
BOOKTITLE = {Proceedings of the Eighth International Conference on Language Resources and Evaluation (LREC'12)},
EDITOR = {Calzolari, N. and Choukri, K. and Declerck, T. and Doğan, M. U. and Maegaard, B. and Mariani, J. and Odijk, J. and Piperidis, S.},
}
@INPROCEEDINGS{CASELLI_2012_INPROCEEDINGS_CRR_122937,
AUTHOR = {Caselli, T. and Russo, I. and Rubino, F.},
TITLE = {Assigning Connotation Values to Events},
YEAR = {2012},
ABSTRACT = {Sentiment Analysis (SA) and Opinion Mining (OM) have become a popular task in recent years in NLP with the development of language resources, corpora and annotation schemes. The possibility to discriminate between objective and subjective expressions contributes to the identification of a document's semantic orientation and to the detection of the opinions and sentiments expressed by the authors or attributed to other participants in the document. Subjectivity word sense disambiguation helps in this task, automatically determining which word senses in a corpus are being used subjectively and which are being used objectively. This paper reports on a methodology to assign in a semi-automatic way connotative values to eventive nouns usually labelled as neutral through syntagmatic patterns that express cause-effect relations between emotion cause events and emotion words. We have applied our method to nouns and we have been able reduce the number of OBJ polarity values associated to event noun},
KEYWORDS = {cause emotion events, event connotative values, sentiment polarity},
PAGES = {3082-3089},
URL = {https://iris.cnr.it/handle/20.500.14243/122937},
CONFERENCE_NAME = {Eighth International Conference on Language Resources and Evaluation (LREC'12)},
BOOKTITLE = {Proceedings of the Eighth International Conference on Language Resources and Evaluation (LREC'12)},
}
@INPROCEEDINGS{CASELLI_2012_INPROCEEDINGS_CRR_351625,
AUTHOR = {Caselli, T. and Russo, I. and Rubino, F.},
TITLE = {Assigning Connotation Values to Events},
YEAR = {2012},
ABSTRACT = {Sentiment Analysis (SA) and Opinion Mining (OM) have become a popular task in recent years in NLP with the development of language resources, corpora and annotation schemes. The possibility to discriminate between objective and subjective expressions contributes to the identification of a document's semantic orientation and to the detection of the opinions and sentiments expressed by the authors or attributed to other participants in the document. Subjectivity word sense disambiguation helps in this task, automatically determining which word senses in a corpus are being used subjectively and which are being used objectively. This paper reports on a methodology to assign in a semi-automatic way connotative values to eventive nouns usually labelled as neutral through syntagmatic patterns that express cause-effect relations between emotion cause events and emotion words. We have applied our method to nouns and we have been able reduce the number of OBJ polarity values associated to event noun},
KEYWORDS = {cause emotion events, event connotative values, sentiment polarity},
PAGES = {3082-3089},
URL = {https://iris.cnr.it/handle/20.500.14243/351625},
CONFERENCE_NAME = {Eighth International Conference on Language Resources and Evaluation (LREC'12)},
BOOKTITLE = {Proceedings of the Eighth International Conference on Language Resources and Evaluation (LREC'12)},
}
@INPROCEEDINGS{CIGNONI_2012_INPROCEEDINGS_CM_5152,
AUTHOR = {Cignoni, L. and Marinelli, R.},
TITLE = {Learning the Ropes: A Software Tool for CLIL Courses in Maritime Schools and Institutions},
YEAR = {2012},
ABSTRACT = {This paper outlines a proposal for maritime English language teaching in public and private Nautical Schools and other maritime educational institutions and establishments in Italy, using a content and language integrated learning (CLIL) approach. The courses are addressed in particular to those students who would like to take up a marine career as officers, engineers or other crew members of the Merchant Navy, and thus require an adequate knowledge of seafaring terminology, but can also be interesting for those wishing to explore the origins and development of maritime language. In order to provide a more challenging environment and better opportunity for the learning of seafaring terms and expressions in English, students are supported by Mariterm, a lexical database, organized in semantic relations, available at the Institute for Computational Linguistics (ILC) of the National Research Council (CNR) in Pisa},
KEYWORDS = {maritime terminology},
PAGES = {5279-5288},
URL = {https://iris.cnr.it/handle/20.500.14243/5152},
CONFERENCE_NAME = {4th International Conference on Education and New Learning Technologies},
BOOKTITLE = {Proceedings of the 4th International Conference on Education and New Learning Technologies (EDULEARN12)},
}
@INPROCEEDINGS{DELGRATTA_2012_INPROCEEDINGS_DFMQRAL_117790,
AUTHOR = {Del Gratta, R. and Frontini, F. and Monachini, M. and Quochi, V. and Rubino, F. and Abrate, M. and Lo Duca, A.},
TITLE = {L-LEME: an Automatic Lexical Merger based on the LMF Standard},
YEAR = {2012},
ABSTRACT = {The present paper describes LMF LExical MErger (L-LEME), an architecture to combine two lexicons in order to obtain new resource(s). L-LEME relies on standards, thus exploiting the benefits of the ISO Lexical Markup Framework (LMF) to ensure interoperability. L-LEME is meant to be dynamic and heavily adaptable: it allows the users to configure it to meet their specific needs. The L-LEME architecture is composed of two main modules: the Mapper, which takes in input two lexicons A and B and a set of user-defined rules and instructions to guide the mapping process (Directives D) and gives in output all matching entries. The algorithm also calculates a cosine similarity score. The Builder takes in input the previous results, a set of Directives D1 and produces a new LMF lexicon C. The Directives allow the user to define its own building rules and different merging scenarios. L-LEME is applied to a specific concrete task within the PANACEA project, namely the merging of two Italian SubCategorization Frame (SCF) lexicons. The experiment is interesting in that A and B have different philosophies behind, being A built by human introspection and B automatically extracted. Ultimately, L-LEME has interesting repercussions in many language technology applications},
KEYWORDS = {LMF, Lexicon mapping, similarity score},
PAGES = {31-40},
URL = {https://iris.cnr.it/handle/20.500.14243/117790},
ISBN = {978-2-9517408-7-7},
CONFERENCE_NAME = {The Eighth International Conference on Language Resources and Evaluation (LREC) 2012},
BOOKTITLE = {Proceedings of the LREC 2012 Workshop on Language Resource Merging},
EDITOR = {Bel, N. and Gavrilidou, M. and Monachini, M. and Quochi, V. and Rimell, L.},
}
@INPROCEEDINGS{DELGRATTA_2012_INPROCEEDINGS_DFRRC_119634,
AUTHOR = {Del Gratta, R. and Frontini, F. and Rubino, F. and Russo, I. and Calzolari, N.},
TITLE = {The Language Library: supporting community effort for collective resource production},
YEAR = {2012},
ABSTRACT = {Relations among phenomena at different linguistic levels are at the essence of language properties but today we focus mostly on one specific linguistic layer at a time, without (having the possibility of) paying attention to the relations among the different layers. At the same time our efforts are too much scattered without much possibility of exploiting other people's achievements. To address the complexities hidden in multilayer interrelations even small amounts of processed data can be useful, improving the performance of complex systems. Exploiting the current trend towards sharing we want to initiate a collective movement that works towards creating synergies and harmonisation among different annotation efforts that are now dispersed. In this paper we present the general architecture of the Language Library, an initiative which is conceived as a facility for gathering and making available through simple functionalities the linguistic knowledge the field is able to produce, putting in place new ways of collaboration within the LRT community. In order to reach this goal, a first population round of the Language Library has started around a core of parallel/comparable texts that have been annotated by several contributors submitting a paper for LREC2012. The Language Library has also an ancillary aim related to language documentation and archiving and it is conceived as a theory-neutral space which allows for several language processing philosophies to coexist},
KEYWORDS = {annotation, metadata, scientific crowdsourcing},
PAGES = {43-49},
URL = {https://iris.cnr.it/handle/20.500.14243/119634},
CONFERENCE_NAME = {The Eighth International Conference on Language Resources and Evaluation (LREC'12)},
BOOKTITLE = {Proceedings of the Eighth International Conference on Language Resources and Evaluation (LREC'12)},
}
@INPROCEEDINGS{DELLORLETTA_2012_INPROCEEDINGS_DMMPV_5141,
AUTHOR = {Dell'Orletta, F. and Marchi, S. and Montemagni, S. and Plank, B. and Venturi, G.},
TITLE = {The SPLeT-2012 Shared Task on Dependency Parsing of Legal Texts},
YEAR = {2012},
ABSTRACT = {The 4th Workshop on "Semantic Processing of Legal Texts" (SPLeT-2012) presents the first multilingual shared task on Dependency Parsing of Legal Texts. In this paper, we define the general task and its internal organization into sub-tasks, describe the datasets and the domain-specific linguistic peculiarities characterizing them. We finally report the results achieved by the participating systems, describe the underlying approaches and provide a first analysis of the final test results},
KEYWORDS = {Dependency Parsing, Domain Adaptation, Legal Text Processing},
URL = {http://www.lrec-conf.org/proceedings/lrec2012/workshops/27.LREC%202012%20Workshop%20Proceedings%20SPLeT.pdf},
CONFERENCE_NAME = {Fourth Workshop on Semantic Processing of Legal Texts (SPLeT 2012)-First Shared Task on Dependency Parsing of Legal Texts (SPLeT 2012)},
BOOKTITLE = {Proceedings of the Fourth Workshop on Semantic Processing of Legal Texts (SPLeT 2012)},
}
@INPROCEEDINGS{DELLORLETTA_2012_INPROCEEDINGS_DMMVAF_5136,
AUTHOR = {Dell'Orletta, F. and Marchi, S. and Montemagni, S. and Venturi, G. and Agnoloni, T. and Francesconi, E.},
TITLE = {Domain Adaptation for Dependency Parsing at Evalita 2011},
YEAR = {2012},
ABSTRACT = {The domain adaptation task was aimed at investigating techniques for adapting state-of-the-art dependency parsing systems to new domains. Both the language dealt with, i.e. Italian, and the target domain, namely the legal domain, represent two main novelties of the task organised at Evalita 2011. In this paper, we define the task and describe how the datasets were created from different resources. In addition, we characterize the different approaches of the participating systems, report the test results, and provide a first analysis of these results},
KEYWORDS = {Dependency Parsing, Domain Adaptation, Legal Text Processing},
PAGES = {1-7},
URL = {http://www.evalita.it/sites/evalita.fbk.eu/files/working_notes2011/Domain_Adaptation/},
CONFERENCE_NAME = {Evaluation of NLP and Speech Tools for Italian (EVALITA 2011): Domain Adaptation track},
BOOKTITLE = {Working Notes of EVALITA 2011},
}
@INPROCEEDINGS{DELLORLETTA_2012_INPROCEEDINGS_DM_349404,
AUTHOR = {Dell'Orletta, F. and Montemagni, S.},
TITLE = {Tecnologie linguistico-computazionali per la valutazione delle competenze linguistiche in ambito scolastico},
YEAR = {2012},
ABSTRACT = {Se da un lato le tecnologie linguistico-computazionali svolgono un ruolo ormai indiscusso per l'accesso al contenuto testuale, sia esso rappresentato dalla conoscenza specifica di un dominio oppure dalla conoscenza linguistica sottostante (es. collocazioni, strutture argomentali, relazioni semantico-lessicali tra parole, ecc.), ciò non appare scontato quando si vada a considerare il loro ruolo nella valutazione della competenza linguistica di apprendenti. La presente comunicazione intende indagare questo interrogativo, in particolare se e in che misura le tecnologie linguistico-computazionali possano costituire un valido ausilio nella valutazione della competenza linguistica italiana di studenti in ambito scolastico},
KEYWORDS = {tecnologie linguistico-computazionali, competenze linguistiche in ambito scolastico},
PAGES = {343-359},
URL = {https://iris.cnr.it/handle/20.500.14243/349404},
PUBLISHER = {Bulzoni Editore (Roma, ITA)},
CONFERENCE_NAME = {XLIV congresso internazionale di studi della società di linguistica italiana},
CONFERENCE_PLACE = {Viterbo},
BOOKTITLE = {Linguistica Educativa. Atti del XLIV congresso internazionale di studi della società di linguistica italiana},
}
@INPROCEEDINGS{DELLORLETTA_2012_INPROCEEDINGS_DMV_266008,
AUTHOR = {Dell'Orletta, F. and Montemagni, S. and Venturi, G.},
TITLE = {Genre-oriented Readability Assessment: a Case Study},
YEAR = {2012},
URL = {https://iris.cnr.it/handle/20.500.14243/266008},
ISBN = {978-1-62748-389-6},
BOOKTITLE = {Proceedings of the Workshop on Speech and Language Processing Tools in Education (SLP-TED 2012)},
}
@INPROCEEDINGS{FRONTINI_2012_INPROCEEDINGS_FABBMPPS_251924,
AUTHOR = {Frontini, F. and Aliprandi, C. and Bacciu, C. and Bartolini, R. and Marchetti, A. and Parenti, E. and Piccinonno, F. and Soru, T.},
TITLE = {GLOSS, an infrastructure for the semantic annotation and mining of documents in the public security domain},
YEAR = {2012},
ABSTRACT = {Efficient access to information is crucial in the work of organizations that require decision taking in emergency situations. This paper gives an outline of GLOSS, an integrated system for the analysis and retrieval of data in the environmental and public security domain. We shall briefly present the GLOSS infrastructure and its use, and how semantic information of various kinds is integrated, annotated and made available to the final users},
KEYWORDS = {semantic annotation, text mining, geographic data},
PAGES = {21-25},
URL = {https://iris.cnr.it/handle/20.500.14243/251924},
PUBLISHER = {European language resources association (ELRA) (Paris, FRA)},
ISBN = {978-2-9517408-7-7},
CONFERENCE_NAME = {Eighth International Conference on Language Resources and Evaluation (LREC'12)},
CONFERENCE_PLACE = {Istanbul},
}
@INPROCEEDINGS{FRONTINI_2012_INPROCEEDINGS_FQR_128272,
AUTHOR = {Frontini, F. and Quochi, V. and Rubino, F.},
TITLE = {Automatic Creation of Quality Multi-Word Lexica from Noisy Text Data},
YEAR = {2012},
ABSTRACT = {This paper describes the design of a tool for the automatic creation of multi-word lexica that is deployed as a web service and runs on automatically web-crawled data within the framework of the PANACEA platform. The main purpose of our task is to provide a (computationally "light") tool that creates a full high quality lexical resource of multi-word items. Within the platform, this tool is typically inserted in a work flow whose first step is automatic web-crawling. Therefore, the input data of our lexical extractor is intrinsically noisy. The paper evaluates the capacity of the tool to deal with noisy data, and in particular with texts containing a significant amount of duplicated paragraphs. The accuracy of the extraction of multi-word expressions from the original crawled corpus is compared to the accuracy of the extraction from a later "de-duplicated" version of the corpus. The paper shows how our method can extract with sufficiently good precision also from the original, noisy crawled data. The output of our tool is a multi-word lexicon formatted and encoded in XML according to the Lexical Mark-up Framework},
KEYWORDS = {Lexical induction, multi-word extraction, web-based distributed platform, noisy data},
URL = {http://www.kde.cs.tut.ac.jp/~aono/pdf/COLING2012/AND/pdf/AND04.pdf},
PUBLISHER = {ACM, Association for computing machinery (New York, USA)},
ISBN = {978-1-4503-1919-5},
CONFERENCE_NAME = {AND 2012},
CONFERENCE_PLACE = {Mumbai},
BOOKTITLE = {Proceedings of the Sixth Workshop on Analytics for Noisy Unstructured Text Data},
}
@INPROCEEDINGS{GAVRILIDOU_2012_INPROCEEDINGS_GLDPPMFDFAM_5349,
AUTHOR = {Gavrilidou, M. and Labropoulou, P. and Desipri, E. and Piperidis, S. and Papageorgiou, H. and Monachini, M. and Frontini, F. and Declerck, T. and Francopoulo, G. and Arranz, V. and Mapelli, V.},
TITLE = {The META-SHARE Metadata Schema for the Description of Language Resources},
YEAR = {2012},
ABSTRACT = {This paper presents a metadata model for the description of language resources proposed in the framework of the META-SHARE infrastructure, aiming to cover both datasets and tools/technologies used for their processing. It places the model in the overall framework of metadata models, describes the basic principles and features of the model, elaborates on the distinction between minimal and maximal versions thereof, briefly presents the integrated environment supporting the LRs description and search and retrieval processes and concludes with work to be done in the future for the improvement of the model},
KEYWORDS = {metadata, META-SHARE, LRs description},
PAGES = {1090-1097},
URL = {http://www.lrec-conf.org/proceedings/lrec2012/index.html},
ISBN = {978-2-9517408-7-7},
CONFERENCE_NAME = {The Eighth International Conference on Language Resources and Evaluation (LREC'12)},
BOOKTITLE = {Proceedings of the Eighth International Conference on Language Resources and Evaluation (LREC'12)},
}
@INPROCEEDINGS{GIRAUDO_2012_INPROCEEDINGS_GMP_65173,
AUTHOR = {Giraudo, H. and Montermini, F. and Pirrelli, V.},
TITLE = {Processi cognitivi nell'analisi delle classi verbali dell'italiano: un approccio sperimentale},
YEAR = {2012},
ABSTRACT = {L'analisi della flessione, soprattutto verbale, nelle lingue romanze ha ricevuto un notevole impulso negli ultimi anni, in particolare dall'apporto alla ricerca in linguistica teorica di discipline come la psicolinguistica o le scienze cognitive. In questo articolo intendiamo riesaminare la ripartizione dei verbi italiani in classi, e osservare come la teoria morfologica e l'analisi sperimentale possano dare risultati convergenti e contribuire a mettere in luce i processi mentali che costituiscono la base della competenza morfologica dei parlanti (cf. Pirrelli 2007a; 2007b e, per un'illustrazione Bonami et al. 2008)},
KEYWORDS = {Morphology, Word Processing, Word Learning, Mental Lexicon, L1},
URL = {https://iris.cnr.it/handle/20.500.14243/65173},
PUBLISHER = {Bulzoni Editore (Roma, ITA)},
ISBN = {978-88-7870-652-1},
CONFERENCE_NAME = {Linguaggio e cervello / Semantica, Atti del XLII Convegno della Società di Linguistica Italiana (Pisa, Scuola Normale Superiore, 25-27 settembre 2008)},
CONFERENCE_PLACE = {Pisa},
BOOKTITLE = {Linguaggio e cervello / Semantica, Atti del XLII Convegno della Società di Linguistica Italiana (Pisa, Scuola Normale Superiore, 25-27 settembre 2008)},
EDITOR = {Bambini, V. and Ricci, I. and Bertinetto, P. M.},
}
@INPROCEEDINGS{GUADAGNINI_2012_INPROCEEDINGS_GV_21158,
AUTHOR = {Guadagnini, E. and Vaccaro, G.},
TITLE = {Il marziobarbulo e il laticlavio. Il lessico dei volgarizzamenti dei classici dal cantiere del DiVo (Dizionario dei volgarizzamenti)},
YEAR = {2012},
ABSTRACT = {Dopo aver presentato il Dizionario dei Volgarizzamenti vero e proprio, mette in luce gli aspetti metodologici della raccolta, della scelta e della presentazione dei materiali. L'esigenza prima è, infatti, "mappare" le zone semantiche distinguendo quelle che hanno subito un pacifico trapasso in volgare a fronte di quelle che si presentano a un qualche livello come "problematiche": rientrano nel primo tipo tutti i casi in cui c'è una diretta continuità con l'antico, per cui il termine latino ha una corrispondenza "immediata" e "spontanea" con quello volgare, ma anche i casi in cui si osserva una riproposizione del latino (compiuta mediante calco o prestito formale) già "archeologica", come parrebbe essere il caso per molte armi e tecniche militari. In altri casi si avverte una frizione o un'alterità inconciliabile fra il piano latino e quello volgare, e si tratta qui di valutare se c'è soltanto una difficoltà di resa o un fraintendimento del dettato originale, o una difficoltà di comprensione, se essa è cosciente, come è compiuto il tentativo di traduzione e per quali vie è operato l'adattamento (consapevole aggiornamento, anacronismo, calco pedissequo, trasposizione del sostantivo in verbi.)},
KEYWORDS = {Volgarizzamenti, Lessicografia italiana, Dizionario dei Volgarizzamenti},
PAGES = {435-447},
URL = {https://iris.cnr.it/handle/20.500.14243/21158},
PUBLISHER = {Bulzoni (Roma, ITA)},
ISBN = {9788878706552},
CONFERENCE_NAME = {XLIV congresso internazionale di studi della società di linguistica italiana},
CONFERENCE_PLACE = {Viterbo},
BOOKTITLE = {Lessico e lessicologia. Atti del XLIV congresso internazionale di studi della società di linguistica italiana},
EDITOR = {Ferreri, S.},
}
@INPROCEEDINGS{GUADAGNINI_2012_INPROCEEDINGS_GV_260378,
AUTHOR = {Guadagnini, E. and Vaccaro, G.},
TITLE = {La base de datos del DiVo: traducciones antiguas en red},
YEAR = {2012},
ABSTRACT = {El Corpus DiVo (Dizionario dei Volgarizzamenti 'Diccionario de las vulgarizaciones') forma parte de un proyecto de investigación del léxico iniciado en 2008 en el instituto de la Opera del Vocabolario Italiano por Elisa Guadagnini y Giulio Vaccaro. Él incluye todas las traducciones al italiano antiguo de los textos clásicos latinos, compuestas entre los años finales del siglo XIV en una variedad del sistema lingüístico ítalo románico. El corpus que está consultable al sitio http://divoweb.ovi.cnr.it/ se compone de 113 textos de más de 6.250.000 ocurrencias total},
KEYWORDS = {Volgarizzamenti, Lessicografia italiana, Dizionario dei Volgarizzamenti},
PAGES = {181-187},
URL = {https://iris.cnr.it/handle/20.500.14243/260378},
PUBLISHER = {Universidad de Salamanca (Salamanca, ESP)},
ISBN = {978-84-9012-154-2},
CONFERENCE_NAME = {Empiricism and analytical tools for 21 century applied linguistics},
CONFERENCE_PLACE = {Salamanca},
BOOKTITLE = {Empiricism and analytical tools for 21 century applied linguistics. Selected papers from the XXIX international conference of the Spanish association of applied linguistics (AESLA)},
EDITOR = {Elorza, I. and Cortés, O. C. I. and Riaza, B. G. and Pérez Veneros, M.},
}
@INPROCEEDINGS{GUADAGNINI_2012_INPROCEEDINGS_GV_241054,
AUTHOR = {Guadagnini, E. and Vaccaro, G.},
TITLE = {«Selonc ce que Tulles dit en son livre». Il lessico retorico volgare nei volgarizzamenti ciceroniani},
YEAR = {2012},
ABSTRACT = {Il contributo analizza la resa nei volgarizzamenti, e in particolare in quelli ciceroniani o ritenuti nel Medioevo ciceroniani, del lessico retorico},
URL = {https://iris.cnr.it/handle/20.500.14243/241054},
PUBLISHER = {Aracne (Roma, ITA)},
ISBN = {9788854849310},
CONFERENCE_NAME = {VII Convegno triennale della Società Italiana di Filologia Romanza (S.I.F.R.)},
CONFERENCE_PLACE = {Bologna},
BOOKTITLE = {Culture, livelli di cultura e ambienti nel Medioevo occidentale},
EDITOR = {Fassò, A. and Giannini, G. and Formisano, L. and Caraffi, P. and Brunetti, G. and Benozzo, F. and Mancini, M.},
}
@INPROCEEDINGS{LENCI_2012_INPROCEEDINGS_LB_513705,
  AUTHOR    = {Lenci, A. and Benotto, G.},
  TITLE     = {Identifying hypernyms in distributional semantic spaces},
  YEAR      = {2012},
  ABSTRACT  = {In this paper we apply existing directional similarity measures to identify hypernyms with a state-of-the-art distributional semantic model. We also propose a new directional measure that achieves the best performance in hypernym identification},
  KEYWORDS  = {distributional semantics, semantics, computational linguistics},
  BOOKTITLE = {*SEM 2012: The First Joint Conference on Lexical and Computational Semantics – Volume 1: Proceedings of the main conference and the shared task, and Volume 2: Proceedings of the Sixth International Workshop on Semantic Evaluation (SemEval 2012)},
}
@INPROCEEDINGS{LENCI_2012_INPROCEEDINGS_LMVC_260805,
AUTHOR = {Lenci, A. and Montemagni, S. and Venturi, G. and Cutrullà, M. G.},
TITLE = {Enriching the ISST-TANL Corpus with Semantic Frames},
YEAR = {2012},
ABSTRACT = {The paper describes the design and the results of a manual annotation methodology devoted to enrich the ISST-TANL Corpus with Semantic Frames information. The main issues encountered in applying the English FrameNet annotation criteria to a corpus of Italian language are discussed together with the choice of anchoring the semantic annotation layer to the underlying dependency syntactic structure. We also describe an experiment to measure inter-annotator agreement and a first case study to extend and specialise FrameNet annotation to a corpus of legislative texts},
KEYWORDS = {Semantic annotation, FrameNet, Multi-layer annotated corpus},
PAGES = {3719-3726},
URL = {http://www.lrec-conf.org/proceedings/lrec2012/pdf/986_Paper.pdf},
PUBLISHER = {European language resources association (ELRA) (Paris, FRA)},
ISBN = {978-2-9517408-7-7},
CONFERENCE_NAME = {Eighth International Conference on Language Resources and Evaluation (LREC'12)},
CONFERENCE_PLACE = {Istanbul},
BOOKTITLE = {Proceedings of the Eighth International Conference on Language Resources and Evaluation (LREC'12)},
EDITOR = {Calzolari, N. and Choukri, K. and Declerck, T. and Doğan, M. U. and Maegaard, B. and Mariani, J. and Moreno, A. and Odijk, J. and Piperidis, S.},
}
@INPROCEEDINGS{MANCA_2012_INPROCEEDINGS_MSMTB_5261,
  AUTHOR          = {Manca, M. and Spinazzè, L. and Mastandrea, P. and Tessarolo, L. and Boschetti, F.},
  TITLE           = {Musisque Deoque: Text Retrieval on Critical Editions},
  YEAR            = {2012},
  ABSTRACT        = {This paper aims at illustrating the main features of the Musisque Deoque Project, which provides a fully freely searchable archive of Latin poetry equipped with critical apparatus. The first part explains how variants are mapped on the reference edition and the second part illustrates the web interface to retrieve sequences of words taking into account possible variants},
  KEYWORDS        = {Computational Philology},
  PAGES           = {127-138},
  URL             = {https://iris.cnr.it/handle/20.500.14243/5261},
  VOLUME          = {26},
  ISSN            = {0175-1336},
  CONFERENCE_NAME = {Workshop on Annotation of Corpora for Research in the Humanities (ACRH)},
  BOOKTITLE       = {LDV-FORUM},
}
@INPROCEEDINGS{MARINELLI_2012_INPROCEEDINGS_MBMSCCC_134828,
AUTHOR = {Marinelli, R. and Bindi, R. and Marchi, S. and Santarcangelo, E. L. and Cavallaro, F. and Castellani, E. and Carli, G.},
TITLE = {Suscettibilità ipnotica e linguaggio},
YEAR = {2012},
KEYWORDS = {ipnosi, linguaggio, nlp},
PAGES = {1-10},
URL = {https://iris.cnr.it/handle/20.500.14243/134828},
VOLUME = {2},
PUBLISHER = {Bulzoni (Roma, ITA)},
ISBN = {978-88-7870-652-1},
CONFERENCE_NAME = {XLII congresso internazionale di Studi della Società di Linguistica Italiana (SLI)},
CONFERENCE_PLACE = {Pisa},
BOOKTITLE = {Linguaggio e cervello-Semantica / Language and brain-Semantics},
}
@INPROCEEDINGS{MARINELLI_2012_INPROCEEDINGS_MC_122240,
AUTHOR = {Marinelli, R. and Cignoni, L.},
TITLE = {In the same boat and other idiomatic seafaring expressions},
YEAR = {2012},
ABSTRACT = {This paper reports on a research carried out at the Institute for Computational Linguistics (ILC) on a set of idiomatic nautical expressions in Italian and English. A total of 200 Italian expressions were first selected and examined, using both monolingual and bilingual dictionaries, as well as specific lexicographical works dealing with the subject of idiomaticity, especially of the maritime type, and a similar undertaking was then conducted for the English expressions. We discuss the possibility of including both the Italian and English idiomatic expressions in the semantic database Mariterm, which contains terms belonging to the maritime domain. We describe the terminological database and the way in which the idiomatic expressions can be organised within the system, so that, similarly to the other synsets, they are connected to other concepts represented in the database, but at the same time continue to belong to a group of particular linguistic expressions. Furthermore, we study similarities and differences in meaning and usage of some idiomatic expressions in the two languages},
KEYWORDS = {Terminology, Semantic databases, Idiomatic expressions},
PAGES = {627-631},
URL = {http://www.lrec-conf.org/proceedings/lrec2012/index.html},
CONFERENCE_NAME = {Eighth International Conference on Language Resources and Evaluation (LREC 2012)},
BOOKTITLE = {Proceedings of the Eighth International Conference on Language Resources and Evaluation (LREC'12)},
}
@INPROCEEDINGS{MARINELLI_2012_INPROCEEDINGS_MC_450677,
AUTHOR = {Marinelli, R. and Cignoni, L.},
TITLE = {Enriching a Terminological Database with a Set of Idiomatic Expressions},
YEAR = {2012},
ABSTRACT = {The research described here is aimed at enriching the terminological database Mariterm with a set of idiomatic expressions related to the nautical field. The database is available at the Institute for Computational Linguistics (ILC) of the National Research Council (CNR) in Pisa (Italy), and contains semantic information for around 3500 Italian terms belonging to the maritime domain. Each Italian term is linked to other terms by means of semantic "internal relations" and is also connected to the equivalent synonyms in English. We relate on the methodology designed to expand the database, increase the lexical resource with explanations on the origins of the most common expressions, and study the similarities and differences in meaning and usage of some idiomatic expressions in the two languages. The possibility of using this linguistic resource also for didactic purposes in public and private schools is considered},
KEYWORDS = {Lexical semantic databases, terminology, idiomatic expressions},
PAGES = {690-696},
URL = {https://iris.cnr.it/handle/20.500.14243/450677},
CONFERENCE_NAME = {4th International Conference on Education and New Learning Technologies},
BOOKTITLE = {Proceedings of the 4th International Conference on Education and New Learning Technologies (EDULEARN12)},
}
@INPROCEEDINGS{MARZI_2012_INPROCEEDINGS_M_4615,
AUTHOR = {Marzi, C.},
TITLE = {Knowledge communities in grey},
YEAR = {2012},
ABSTRACT = {The dynamic nature of modern human social interactions, and the increasing capability of wireless and mobile devices for creating and sharing contents, open up the opportunity for a wide dissemination of information through complex knowledge sharing systems. As the shared knowledge components build cognitive ties, there is no real sharing of knowledge without a common understanding of it. In this article, particular emphasis is laid on technologies in Natural Language understanding and knowledge management for providing structured, intelligent access to the continuously evolving content, generated on-line in a pervasive collaborative environment. In detail, robust automated techniques for term extraction and knowledge acquisition are used to tap the information density and the global coherence of text excerpts sampled from both general-purpose and subject-specific social networks. We show empirically that the two sources may exhibit considerable differences in terms of content accessibility and informativeness. Topics: Subject based Communities; Social Networking},
KEYWORDS = {Concept maps, Grey literature, Knowledge sharing, Web communities},
PAGES = {34-40},
URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-84924107682&origin=inward},
VOLUME = {13},
PUBLISHER = {TextRelease (Amsterdam, NLD)},
ISSN = {1386-2316},
ISBN = {9789077484173},
CONFERENCE_NAME = {Thirteenth International Conference on Grey Literature: The Grey Circuit-From Social Networking to Wealth Creation (GL13)},
CONFERENCE_PLACE = {Washington, D.C.},
BOOKTITLE = {THE GL-CONFERENCE SERIES. CONFERENCE PROCEEDINGS},
EDITOR = {Farace, D. J. and Frantzen, J.},
}
@INPROCEEDINGS{MARZI_2012_INPROCEEDINGS_MFCP_225692,
AUTHOR = {Marzi, C. and Ferro, M. and Caudai, C. and Pirrelli, V.},
TITLE = {Evaluating Hebbian self-organizing memories for lexical representation and access},
YEAR = {2012},
ABSTRACT = {The lexicon is the store of words in long-term memory. Any attempt at modelling lexical competence must take issues of string storage seriously. In the present contribution, we discuss a few desiderata that any biologically-inspired computational model of the mental lexicon has to meet, and detail a multi-task evaluation protocol for their assessment. The proposed protocol is applied to a novel computational architecture for lexical storage and acquisition, the "Topological Temporal Hebbian SOMs" (T2HSOMs), which are grids of topologically organised memory nodes with dedicated sensitivity to time-bound sequences of letters. These maps can provide a rigorous and testable conceptual framework within which to provide a comprehensive, multi-task protocol for testing the performance of Hebbian self-organising memories, and a comprehensive picture of the complex dynamics between lexical processing and the acquisition of morphological structure},
KEYWORDS = {Mental Lexicon, Morphology Acquisition, Self-Organizing Maps},
PAGES = {886-893},
URL = {http://www.lrec-conf.org/proceedings/lrec2012/index.html},
ISBN = {978-2-9517408-7-7},
CONFERENCE_NAME = {LREC'12-8th International Conference on Language Resources and Evaluation},
BOOKTITLE = {Language Resources and Evaluation},
EDITOR = {Calzolari, N. and Choukri, K. and Declerck, T. and Doğan, M. U. and Maegaard, B. and Mariani, J. and Odijk, J. and Piperidis, S.},
}
@INPROCEEDINGS{MARZI_2012_INPROCEEDINGS_MFP_5201,
AUTHOR = {Marzi, C. and Ferro, M. and Pirrelli, V.},
TITLE = {Prediction and Generalisation in Word Processing and Storage},
YEAR = {2012},
ABSTRACT = {Word storage and processing have traditionally been modelled according to different computational paradigms, in line with the classical corner-stone of "dual-route" models of word structure assuming a sharp dissociation between memory and computation (Clahsen 1999, Di Sciullo \& Williams 1987, Pinker \& Prince 1988, Prasada \& Pinker 1993). Even the most radical alternative to dual-route thinking, connectionist one-route models, challenged the lexicon-grammar dualism only by providing a neurally-inspired mirror image of classical base-to-inflection rules, while largely neglecting issues of lexical storage (Rumelhart \& McClelland 1986, McClelland \& Patterson 2002, Seidenberg \& McClelland 1989). Recent psycho- and neuro-linguistic evidence, however, supports a less deterministic and modular view of the interaction between stored word knowledge and on-line processing (Baayen et al. 1997, Hay 2001, Maratsos 2000, Stemberger \& Middleton 2003, Tabak et al. 2005, Ford et al. 2003, Post et al. 2008). The view entails simultaneous activation of distributed patterns of cortical connectivity encoding redundant distributional regularities in language data. Furthermore, recent developments in morphological theorising question the primacy of grammar rules over lexical storage, arguing that word regularities emerge from independent principles of lexical organisation, whereby lexical units and constructions are redundantly stored and mutually related through entailment relations (Matthews 1991, Corbett \& Fraser 1993, Pirrelli 2000, Burzio 2004, Booij 2010). We endorse here such a non modular view on Morphology to investigate two basic behavioural aspects of human word processing: morphological prediction and generalisation. The investigation is based on a computer model of morphology acquisition supporting the hypothesis that they both derive from a common pool of principles of lexical organisation},
KEYWORDS = {Morphological generalisation, Word processing, Self-organising memory},
PAGES = {114-131},
URL = {http://mmm.lingue.unibo.it/},
CONFERENCE_NAME = {Eighth Mediterranean Morphology Meeting on "Morphology and the architecture of the grammar" (MMM8)},
BOOKTITLE = {Proceedings of the 8th Mediterranean Morphology Meeting on "Morphology and the architecture of the grammar"},
EDITOR = {Ralli, A. and Booij, G. and Scalise, S.},
}
@INPROCEEDINGS{MONACHINI_2012_INPROCEEDINGS_MFDRKGP_119663,
AUTHOR = {Monachini, M. and Frontini, F. and De Felice, I. and Russo, I. and Khan, F. and Gagliardi, G. and Panunzi, A.},
TITLE = {Verb interpretation for basic action types: annotation, ontology induction and creation of prototypical scenes},
YEAR = {2012},
ABSTRACT = {In the last 20 years dictionaries and lexicographic resources such as WordNet have started to be enriched with multimodal content. Short videos depicting basic actions support the user's need (especially in second language acquisition) to fully understand the range of applicability of verbs. The IMAGACT project has among its results a repository of action verbs ontologically organised around prototypical action scenes in the form of both video recordings and 3D animations. The creation of the IMAGACT ontology, which consists in deriving action types from corpus instances of action verbs, intra and cross linguistically validating them and producing the prototypical scenes thereof, is the preliminary step for the creation of a resource that users can browse by verb, learning how to match different action prototypes with the correct verbs in the target language. The mapping of IMAGACT types onto WordNet synsets allows for a mutual enrichment of both resources},
KEYWORDS = {ontology of actions, lexical resource, 3D animations},
PAGES = {69-80},
URL = {https://iris.cnr.it/handle/20.500.14243/119663},
CONFERENCE_NAME = {COLING 2012-3rd Workshop on Cognitive Aspects of the Lexicon (CogALex-III)},
}
@INPROCEEDINGS{MONEGLIA_2012_INPROCEEDINGS_MGPFRM_122911,
AUTHOR = {Moneglia, M. and Gagliardi, G. and Panunzi, A. and Frontini, F. and Russo, I. and Monachini, M.},
TITLE = {IMAGACT: Deriving an Action Ontology from Spoken Corpora},
YEAR = {2012},
ABSTRACT = {This paper presents the IMAGACT annotation infrastructure which uses both corpus-based and competence-based methods for the simultaneous extraction of a language independent Action ontology from English and Italian spontaneous speech corpora. The infrastructure relies on an innovative methodology based on images of prototypical scenes and will identify high frequency action concepts in everyday life, suitable for the implementation of an open set of languages},
KEYWORDS = {Action verb, Ontology, imagery},
PAGES = {42-47},
URL = {https://iris.cnr.it/handle/20.500.14243/122911},
ISBN = {978-90-74029-00-1},
CONFERENCE_NAME = {Eighth Joint ISO-ACL SIGSEM Workshop on Interoperable Semantic Annotation (ISA-8)},
BOOKTITLE = {Proceedings of the Eighth Joint ISO-ACL SIGSEM Workshop on Interoperable Semantic Annotation ISA-8},
EDITOR = {Bunt, H.},
}
@INPROCEEDINGS{MONEGLIA_2012_INPROCEEDINGS_MMCPFGR_5301,
AUTHOR = {Moneglia, M. and Monachini, M. and Calabrese, O. and Panunzi, A. and Frontini, F. and Gagliardi, G. and Russo, I.},
TITLE = {The IMAGACT Cross-linguistic Ontology of Action. A new infrastructure for natural language disambiguation},
YEAR = {2012},
ABSTRACT = {Action verbs, which are highly frequent in speech, cause disambiguation problems that are relevant to Language Technologies. This is a consequence of the peculiar way each natural language categorizes Action i. e. it is a consequence of semantic factors. Action verbs are frequently "general", since they extend productively to actions belonging to different ontological types. Moreover, each language categorizes action in its own way and therefore the cross-linguistic reference to everyday activities is puzzling. This paper briefly sketches the IMAGACT project, which aims at setting up a cross-linguistic Ontology of Action for grounding disambiguation tasks in this crucial area of the lexicon. The project derives information on the actual variation of action verbs in English and Italian from spontaneous speech corpora, where references to action are high in frequency. Crucially it makes use of the universal language of images to identify action types, avoiding the underdeterminacy of semantic definitions. Action concept entries are implemented as prototypic scenes; this will make it easier to extend the Ontology to other languages},
KEYWORDS = {Action verbs, Ontology, Imagery},
PAGES = {2606-2613},
URL = {http://www.lrec-conf.org/proceedings/lrec2012/pdf/428_Paper.pdf},
ISBN = {978-2-9517408-7-7},
CONFERENCE_NAME = {The Eighth International Conference on Language Resources and Evaluation (LREC'12)},
}
@INPROCEEDINGS{MONEGLIA_2012_INPROCEEDINGS_MMPFGR_122919,
AUTHOR = {Moneglia, M. and Monachini, M. and Panunzi, A. and Frontini, F. and Gagliardi, G. and Russo, I.},
TITLE = {Mapping a corpus-induced ontology of action verbs on ItalWordNet},
YEAR = {2012},
ABSTRACT = {Action verbs are the least predictable linguistic type for bilingual dictionaries and they cause major problems for NLP technologies. This is not only because of language specific phraseology, but it is rather a consequence of the peculiar way each language categorizes events. In ordinary languages the most frequent action verbs are "general", since they extend productively to actions belonging to different ontological types. Moreover, each language categorizes actions in its own way and therefore the cross-linguistic reference to everyday activities is puzzling. A cross-linguistic stable ontology of actions is difficult to achieve because our knowledge on the actual variation of verbs across types of actions is largely unknown. This paper briefly presents the problems and the building strategies of the IMAGACT Ontology, which aims at filling this gap, and compares some early results on a set of Italian verbs with the information contained in ItalWordNet},
KEYWORDS = {action verb, ontology, image},
PAGES = {219-226},
URL = {https://iris.cnr.it/handle/20.500.14243/122919},
ISBN = {978-80-263-0244-5},
CONFERENCE_NAME = {Global Wordnet Conference (GWC2012)},
BOOKTITLE = {Proceedings of the 6th Global WordNet Conference (GWC2012)},
EDITOR = {Fellbaum, C. and Vossen, P.},
}
@INPROCEEDINGS{MONTEMAGNI_2012_INPROCEEDINGS_MWDN_297504,
AUTHOR = {Montemagni, S. and Wieling, M. and De Jonge, B. and Nerbonne, J.},
TITLE = {Patterns of Language Variation and Underlying Linguistic Features: A New Dialectometric Approach},
YEAR = {2012},
PAGES = {879-889},
URL = {https://iris.cnr.it/handle/20.500.14243/297504},
VOLUME = {II},
PUBLISHER = {Franco Cesati Editore (Firenze, ITA)},
ISBN = {978-88-7667-433-4},
CONFERENCE_NAME = {XI Congresso SILFI (Società Internazionale di Linguistica e Filologia Italiana)},
CONFERENCE_PLACE = {Firenze},
BOOKTITLE = {La variazione nell'italiano e nella sua storia. Varietà e varianti linguistiche e testuali. Atti dell'XI Congresso SILFI (Società Internazionale di Linguistica e Filologia Italiana)},
EDITOR = {Bianchi, P. and De Blasi, N. and De Caprio, C. and Montuori, F.},
}
@INPROCEEDINGS{PARDELLI_2012_INPROCEEDINGS_PGS_4605,
AUTHOR = {Pardelli, G. and Goggi, S. and Sassi, M.},
TITLE = {Grey Literature Between Tradition and Innovation: Is There a Continuum?},
YEAR = {2012},
ABSTRACT = {This study wants to explore ways of social media communication for Grey Literature. In particular it describes the role of social media in relation with traditional channels and how social media applications can be used for Grey},
KEYWORDS = {Grey Literature, Communication Networks, Knowledge Networking, Knowledge Exchange},
PAGES = {165-169},
URL = {https://iris.cnr.it/handle/20.500.14243/4605},
ISSN = {1386-2316},
CONFERENCE_NAME = {Thirteenth International Conference on Grey Literature: The Grey Circuit, From Social Networking to Wealth Creation (GL 13)},
BOOKTITLE = {THE GL-CONFERENCE SERIES. CONFERENCE PROCEEDINGS},
}
@INPROCEEDINGS{PARDELLI_2012_INPROCEEDINGS_PSGB_6009,
AUTHOR = {Pardelli, G. and Sassi, M. and Goggi, S. and Biagioni, S.},
TITLE = {From medical language processing to BioNLP domain},
YEAR = {2012},
ABSTRACT = {This paper presents the results of a terminological work on a reference corpus in the domain of Biomedicine. In particular, the research tends to analyse the use of certain terms in Biomedicine in order to verify their change over the time with the aim of retrieving from the net the very essence of documentation. The terminological sample contains words used in BioNLP and biomedicine and identifies which terms are passing from scientific publications to the daily press and which are rather reserved to scientific production. The final scope of this work is to determine how scientific dissemination to an ever larger part of the society enables a public of common citizens to approach communication on biomedical research and development; and its main source is a reference corpus made up of three main repositories from which information related to BioNLP and Biomedicine is extracted. The paper is divided in three sections: 1) an introduction dedicated to data extracted from scientific documentation; 2) the second section devoted to methodology and data description; 3) the third part containing a statistical representation of terms extracted from the archive: indexes and concordances allow to reflect on the use of certain terms in this field and give possible keys for having access to the extraction of knowledge in the digital era},
KEYWORDS = {Information Extraction, Information Retrieval, Text mining, Digital Libraries},
PAGES = {2049-2055},
URL = {http://www.lrec-conf.org/proceedings/lrec2012/pdf/687_Paper.pdf},
PUBLISHER = {European Language Resources Association (ELRA)-Evaluations and Language resources Distribution Agency (ELDA) (Paris, FRA)},
ISBN = {978-2-9517408-7-7},
CONFERENCE_NAME = {Eighth International Conference on Language Resources and Evaluation. LREC'12},
CONFERENCE_PLACE = {Paris},
BOOKTITLE = {Proceedings of the Eighth International Conference on Language Resources and Evaluation (LREC'12)},
EDITOR = {Calzolari, N. and Choukri, K. and Declerck, T. and Doğan, M. U. and Maegaard, B. and Mariani, J. and Odijk, J. and Piperidis, S.},
}
@INPROCEEDINGS{PIRRELLI_2012_INPROCEEDINGS_PG_65152,
AUTHOR = {Pirrelli, V. and Guevara, E.},
TITLE = {Understanding NN Compounds},
YEAR = {2012},
ABSTRACT = {In this paper we intend to pursue two basic objectives: i) point out a substantial convergence between classification criteria for compounding that have developed independently from largely complementary perspectives and methodological stances, and ii) assess the important empirical consequences of this convergence and their potential impact on recent linguistic analyses of lexical compounds as either lexical (and specifically morphological) or syntactic phenomena. These two points are brought home by focusing on a particular class of Italian compounds, namely endocentric NN compounds such as ufficio reclami ('complaint office') or pesce palla ('ball fish') that prove to be increasingly productive in contemporary Italian (cf. Dardano 1978, Bisetto 2004)},
KEYWORDS = {Morphological composition, Word Processing, Word Learning, Mental Lexicon},
PAGES = {17},
URL = {https://iris.cnr.it/handle/20.500.14243/65152},
PUBLISHER = {Bulzoni Editore (Roma, ITA)},
ISBN = {978-88-7870-652-1},
CONFERENCE_NAME = {Linguaggio e cervello / Semantica, Atti del XLII Convegno della Società di Linguistica Italiana (Pisa, Scuola Normale Superiore, 25-27 settembre 2008)},
CONFERENCE_PLACE = {Roma},
BOOKTITLE = {Linguaggio e cervello / Semantica, Atti del XLII Convegno della Società di Linguistica Italiana (Pisa, Scuola Normale Superiore, 25-27 settembre 2008)},
EDITOR = {Bambini, V. and Ricci, I. and Bertinetto, P. M.},
}
@INPROCEEDINGS{POCH_2012_INPROCEEDINGS_PTHQB_259420,
AUTHOR = {Poch, M. and Toral, A. and Hamon, O. and Quochi, V. and Bel, N.},
TITLE = {Towards a User-Friendly Platform for Building Language Resources based on Web Services},
YEAR = {2012},
ABSTRACT = {This paper presents the platform developed in the PANACEA project, a distributed factory that automates the stages involved in the acquisition, production, updating and maintenance of Language Resources required by Machine Translation and other Language Technologies. We adopt a set of tools that have been successfully used in the Bioinformatics field, they are adapted to the needs of our field and used to deploy web services, which can be combined to build more complex processing chains (workflows). This paper describes the platform and its different components (web services, registry, workflows, social network and interoperability). We demonstrate the scalability of the platform by carrying out a set of massive data experiments. Finally, a validation of the platform across a set of required criteria proves its usability for different types of users (non-technical users and providers)},
KEYWORDS = {service platform, workflow, interoperability},
PAGES = {1156-1163},
URL = {http://www.lrec-conf.org/proceedings/lrec2012/pdf/543_Paper.pdf},
PUBLISHER = {European Language Resources Association ELRA (Paris, FRA)},
ISBN = {978-2-9517408-7-7},
CONFERENCE_NAME = {Eighth International Conference on Language Resources and Evaluation},
CONFERENCE_PLACE = {Paris},
BOOKTITLE = {Proceedings of the Eighth International Conference on Language Resources and Evaluation, LREC 2012},
EDITOR = {Calzolari, N. and Choukri, K. and Declerck, T. and Doğan, M. U. and Maegaard, B. and Mariani, J. and Moreno, A. and Odijk, J. and Piperidis, S.},
}
@INPROCEEDINGS{QUOCHI_2012_INPROCEEDINGS_QFR_128266,
AUTHOR = {Quochi, V. and Frontini, F. and Rubino, F.},
TITLE = {A MWE Acquisition and Lexicon Builder Web Service},
YEAR = {2012},
ABSTRACT = {This paper describes the development of a web-service tool for the automatic extraction of Multi-word expressions lexicons, which has been integrated in a distributed platform for the automatic creation of linguistic resources. The main purpose of the work described is thus to provide a (computationally "light") tool that produces a full lexical resource: multi-word terms/items with relevant and useful attached information that can be used for more complex processing tasks and applications (e. g. parsing, MT, IE, query expansion, etc.). The output of our tool is a MW lexicon formatted and encoded in XML according to the Lexical Mark-up Framework. The tool is already functional and available as a service. Evaluation experiments show that the tool precision is of about 80%},
KEYWORDS = {Multiword extraction, lexical resources, LMF, web services},
PAGES = {2291-2306},
URL = {http://aclweb.org/anthology/C/C12/C12-1140.pdf},
PUBLISHER = {Curran Associates (Red Hook, NY 12571, USA)},
ISBN = {9781627483896},
CONFERENCE_NAME = {International Conference on Computational Linguistics (COLING)},
CONFERENCE_PLACE = {Red Hook, NY 12571},
BOOKTITLE = {Proceedings of COLING 2012: Technical Papers},
EDITOR = {Kay, M. and Boitet, C.},
}
@INPROCEEDINGS{RUBINO_2012_INPROCEEDINGS_RFQ_128261,
AUTHOR = {Rubino, F. and Frontini, F. and Quochi, V.},
TITLE = {Integrating NLP Tools in a Distributed Environment: A Case Study Chaining a Tagger with a Dependency Parser},
YEAR = {2012},
ABSTRACT = {The present paper tackles the issue of PoS tag conversion within the framework of a distributed web service platform for the automatic creation of language resources. PoS tagging is now considered a "solved problem"; yet, because of the differences in the tagsets, interchange of the various PoS taggers available is still hampered. In this paper we describe the implementation of a PoS-tagged-corpus converter, which is needed for chaining together in a workflow the FreeLing PoS tagger for Italian and the DESR dependency parser, given that these two tools have been developed independently. The conversion problems experienced during the implementation, related to the properties of the different tagsets and of tagset conversion in general, are discussed together with the solutions adopted. Finally, the converter is evaluated by assessing the impact of conversion on the performance of the dependency parser by comparing with the outcome of the native pipeline. From this we learn that in most cases parsing errors are due to actual tagging errors, and not to conversion itself. Besides, information on accuracy loss is an important feature in a distributed environment of (NLP) services, where users need to decide which services best suit their needs},
KEYWORDS = {PoS tag conversion, interoperability, NLP pipelines},
PAGES = {2125-2131},
URL = {http://www.lrec-conf.org/proceedings/lrec2012/summaries/726.html},
PUBLISHER = {European language resources association (ELRA) (Paris, FRA)},
ISBN = {9782951740877},
CONFERENCE_NAME = {Language Resources and Evaluation Conference 2012},
CONFERENCE_PLACE = {Paris},
BOOKTITLE = {Proceedings of the Eighth International Conference on Language Resources and Evaluation (LREC'12)},
EDITOR = {Calzolari, N. and Choukri, K. and Declerck, T. and Doğan, M. U. and Maegaard, B. and Mariani, J. and Odijk, J. and Piperidis, S.},
}
@INPROCEEDINGS{RUIMY_2012_INPROCEEDINGS_RPG_122943,
AUTHOR = {Ruimy, N. and Piccini, S. and Giovannetti, E.},
TITLE = {Defining and Structuring Saussure's Terminology},
YEAR = {2012},
ABSTRACT = {In the framework of the Italian project 'For a digital edition of Ferdinand de Saussure's manuscripts', an electronic thesaurus of Saussure's terminology is being built, which includes new terms extracted from recently found manuscripts. The lexical model on which it is grounded is a customized version of the SIMPLE model. In this paper, an overview of the customization process is provided, with a special focus on the steps taken for designing a domain-specific ontology as well as on the creation of additional semantic relations and features. Lexical entries are illustrated and the potential of a structured organization of semantic knowledge for gaining a wider understanding of the overall domain terminology is highlighted},
KEYWORDS = {Computational Lexicon},
PAGES = {828-833},
URL = {http://www.euralex.org/elx_proceedings/Euralex2012/pp828-833%20Ruimy,%20Piccini%20and},
CONFERENCE_NAME = {15th EURALEX International Congress (EURALEX2012)},
}
@INPROCEEDINGS{RUIMY_2012_INPROCEEDINGS_RPG_122956,
AUTHOR = {Ruimy, N. and Piccini, S. and Giovannetti, E.},
TITLE = {Les Outils Informatiques au Service de la Terminologie Saussurienne},
YEAR = {2012},
ABSTRACT = {Bien que l'oeuvre de Ferdinand de Saussure ait été diffusée à travers le monde, sa pensée a été en grande partie reconstruite et interprétée par ses étudiants et disciples. Ses écrits authentiques revêtent pourtant, de notre point de vue, une importance fondamentale: ils mettent en lumière l'attention que Saussure accorde à la terminologie linguistique. Lui-même utilise souvent un vocabulaire particulier. Il forge des néologismes ou confère un sens nouveau à des mots existants, il emploie quelques termes de façon éphémère, change la dénotation de certains concepts au fil du temps, créant ainsi une terminologie qui lui est propre. Dans cet article, nous présentons le premier thésaurus-lexique électronique de la terminologie linguistique saussurienne, en cours de création. La population de ce lexique est constituée par une nomenclature mise à jour, comprenant non seulement la terminologie répertoriée par Godel et Engler mais également de nouveaux termes extraits de manuscrits actuellement à l'étude. À travers ce lexique, nous nous proposons de fournir une représentation structurée de la terminologie saussurienne, de définir le contenu sémantique de chacun des termes ainsi que la nature des relations qui les unissent. À cet effet, nous avons choisi de customiser le modèle lexical SIMPLE qui, dans le panorama de la Lexicographie Computationnelle, s'est imposé comme standard de facto et offre une représentation sémantique hautement structurée des unités lexicales. Le processus de customisation du modèle de base s'est tout d'abord focalisé sur la conception d'une ontologie lexicale de domaine (ontologie SIMPLE_FdS), et sa traduction dans le langage de représentation d'ontologie Web OWL. Puis, les deux autres composants du modèle de base, i. e. un réseau de relations sémantiques et un ensemble de traits sémantiques, ont été également adaptés aux exigences du domaine traité. 
Les moyens expressifs jugés appropriés pour rendre compte de la terminologie saussurienne ont été retenus tandis que des traits et relations spécifiques ont été créés afin d'exprimer des propriétés et des liens qui caractérisent l'organisation conceptuelle de ce domaine de la connaissance. Le lexique est ici illustré par des exemples d'entrées lexicales et le potentiel de la base de connaissance par des requêtes sur les données mémorisées. L'organisation structurée de la connaissance lexicale et la richesse de la représentation sémantique font de ce lexique un outil de recherche sémantique particulièrement performant et qui devrait contribuer de manière significative à mieux maîtriser le vocabulaire saussurien et à éclairer certains aspects originaux de la pensée du maître genevois},
KEYWORDS = {Computational Lexicon},
PAGES = {1043-1056},
URL = {http://www.shs-conferences.org/articles/shsconf/abs/2012/01/shsconf_cmlf12_000294/shs},
DOI = {10.1051/shsconf/20120100294},
PUBLISHER = {EDP Sciences (Les Ulis Cedex, FRA)},
ISBN = {978-2-7598-0783-3},
CONFERENCE_NAME = {3e Congrès Mondial de Linguistique Française (CMLF 2012)},
CONFERENCE_PLACE = {Les Ulis Cedex},
BOOKTITLE = {3e Congrès Mondial de Linguistique Française},
}
@INPROCEEDINGS{RUSSO_2012_INPROCEEDINGS_R_228526,
AUTHOR = {Russo, I.},
TITLE = {Alternanze sintattiche, classi semantiche, funzioni comunicative. La posizione dell'aggettivo nel sintagma nominale},
YEAR = {2012},
PAGES = {2 B-9-2 B-10},
URL = {https://iris.cnr.it/handle/20.500.14243/228526},
ISBN = {978-88-7870-652-1},
CONFERENCE_NAME = {Linguaggio e cervello-Semantica / Language and the brain-Semantics},
BOOKTITLE = {Linguaggio e cervello-Semantica / Language and the brain-Semantics, Atti del XLII Convegno della Società di Linguistica Italiana (Pisa, Scuola Normale Superiore, 25-27 settembre 2008)},
EDITOR = {Bambini, V. and Ricci, I. and Bertinetto, P. M.},
}
@INPROCEEDINGS{SORIA_2012_INPROCEEDINGS_SBCMMOPQC_5324,
AUTHOR = {Soria, C. and Bel, N. and Choukri, K. and Mariani, J. and Monachini, M. and Odijk, J. and Piperidis, S. and Quochi, V. and Calzolari, N.},
TITLE = {The FLaReNet Strategic Language Resource Agenda},
YEAR = {2012},
ABSTRACT = {The FLaReNet Strategic Agenda highlights the most pressing needs for the sector of Language Resources and Technologies and presents a set of recommendations for its development and progress in Europe, as issued from a three-year consultation of the FLaReNet European project. The FLaReNet recommendations are organised around nine dimensions: a) documentation b) interoperability c) availability, sharing and distribution d) coverage, quality and adequacy e) sustainability f) recognition g) development h) infrastructure and i) international cooperation. As such, they cover a broad range of topics and activities, spanning over production and use of language resources, licensing, maintenance and preservation issues, infrastructures for language resources, resource identification and sharing, evaluation and validation, interoperability and policy issues. The intended recipients belong to a large set of players and stakeholders in Language Resources and Technology, ranging from individuals to research and education institutions, to policy-makers, funding agencies, SMEs and large companies, service and media providers. The main goal of these recommendations is to serve as an instrument to support stakeholders in planning for and addressing the urgencies of the Language Resources and Technologies of the future},
KEYWORDS = {strategic agenda, language resources planning, recommended priority actions},
PAGES = {1379-1386},
URL = {http://www.lrec-conf.org/proceedings/lrec2012/index.html},
ISBN = {978-2-9517408-7-7},
CONFERENCE_NAME = {The Eighth International Conference on Language Resources and Evaluation (LREC'12)},
BOOKTITLE = {Proceedings of the 8th international conference on Language Resources and Evaluation (LREC2012)},
EDITOR = {Calzolari, N. and Choukri, K. and Declerck, T. and Dogan, M. U. and Maegaard, B. and Mariani, J. and Odijk, J. and Piperidis, S.},
}
@INPROCEEDINGS{SPADONI_2012_INPROCEEDINGS_STLRTSO_5167,
AUTHOR = {Spadoni, F. and Tartarelli, A. and Loparco, L. and Rossi, R. and Tariffi, F. and Sassolini, E. and Ongaro, P.},
TITLE = {SMARTCITY: Customized and Dynamic Multimedia Content Production for Tourism Applications},
YEAR = {2012},
ABSTRACT = {This paper presents the SMARTCITY project experience: customized and dynamic multimedia content production for professional tourism applications},
KEYWORDS = {Corpus Annotation, Cultural Heritage, Access To The Culture Information},
PAGES = {132-137},
URL = {http://digital.casalini.it/9788866551300},
CONFERENCE_NAME = {Electronic Imaging \& the Visual Arts EVA 2012 Florence (EVA 2012 Florence)},
}
@INPROCEEDINGS{BARCA_2012_INPROCEEDINGS_BP_124521,
AUTHOR = {Barca, L. and Pezzulo, G.},
TITLE = {Is visual lexical decision a dynamic and competitive process? No, if we look at reaction times. Yes, if we study how it unfolds in time},
YEAR = {2012},
ABSTRACT = {Visual lexical decision is a classical paradigm in Psycholinguistics, and numerous studies have assessed a so-called "lexicality effect" (i. e., better performance with lexical over non-lexical stimuli). Far less is known relative to the dynamics of choice, as many studies measure overall reaction times which are not informative of the underlying processes. To unfold visual lexical decision in time, we measured participants' hand movements toward one of two items alternatives by recording the streaming x, y coordinates of the computer mouse. Participants categorized as 'lexical' or 'non-lexical' four kinds of stimuli: high and low frequency words, pseudowords, and letter strings. Spatial attraction toward the opposite category was present for low frequency words and pseudowords. Increasing stimuli ambiguity led to enhanced movements' complexity and trajectories' attraction to competitors, as no such effect was present for high frequency words and letter strings},
KEYWORDS = {Visual lexical decision, kinematics, dynamic models of decision-making, written language processes},
PAGES = {1},
URL = {https://iris.cnr.it/handle/20.500.14243/124521},
DOI = {10.3389/conf.fnins.2012.86.00001},
CONFERENCE_NAME = {Neural Coding, Decision-Making \& Integration in Time, 2012},
}
@INPROCEEDINGS{DELGROSSO_2012_INPROCEEDINGS_D_350519,
AUTHOR = {Del Grosso, A. M.},
TITLE = {A Web-based Infrastructure for the philological domain},
YEAR = {2012},
ABSTRACT = {The preservation and transmission of ancient texts in the digital era require an infrastructure able to afford philological issues, such as the management of multiple editions of the same text, in a collaborative environment. The research activities necessary to develop the proposed infrastructure can be grouped into three blocks: Optical Character Recognition of printed editions and tools for collaborative editing of new editions, with particular attention to versioning. Term indexing, information retrieval, information extraction and knowledge representation using ontologies. Enterprise object oriented methodologies and design devoted to deal with resources in a distributed and collaborative Web-based environment (architectural modeling and formalization)},
KEYWORDS = {software engineering, digital humanities, computational philology},
URL = {https://iris.cnr.it/handle/20.500.14243/350519},
ISBN = {978-88-6741-042-2},
CONFERENCE_NAME = {Advances in Computer Systems and Networks},
}
@INPROCEEDINGS{FRONTINI_2012_INPROCEEDINGS_FMNMAB_314751,
AUTHOR = {Frontini, F. and Monachini, M. and N Lapolla, M. and Marchetti, A. and Abrate, M. and Bacciu, C.},
TITLE = {Web Language Identification Testing Tool},
YEAR = {2012},
ABSTRACT = {Nowadays a variety of tools for automatic language identification are available. Regardless of the approach used, at least two features can be identified as crucial to evaluate the performances of such tools: the precision of the presented results and the range of languages that can be detected. In this work we shall focus on a subtask of written language identification that is important to preserve and enhance multilinguality in the Web, i. e. detecting the language of a Web page given its URL. Most specifically, the final aim is to verify to which extent under-represented languages are recognized by available tools. The main specificity of Web Language Identification (WLI) lies in the fact that often an HTML page can provide interesting extralinguistic clues (URL domain name, metadata, encoding, etc) that can enhance accuracy. We shall first provide some data and statistics on the presence of languages on the web, secondly discuss existing practices and tools for language identification according to different metrics-for instance the approaches used and the number of supported languages-and finally make some proposals on how to improve current Web Language Identifiers. We shall also present a preliminary WLI service that builds on the Google Chromium Compact Language Detector; the WLI tool allows us to test the Google n-gram based algorithm against an ad-hoc gold standard of pages in various languages. The gold standard, based on a selection of Wikipedia projects, contains samples in languages for which no automatic recognition has been attempted; it can thus be used by specialists to develop and evaluate WLI systems},
KEYWORDS = {Language Identification Tools, Multilingual Web},
PAGES = {1-1},
URL = {https://iris.cnr.it/handle/20.500.14243/314751},
CONFERENCE_NAME = {W3C Workshop, Call for Participation: The Multilingual Web-The Way Ahead},
}
@INPROCEEDINGS{MARZI_2012_INPROCEEDINGS_M_128304,
AUTHOR = {Marzi, C.},
TITLE = {Innovation, Language, and the Web},
YEAR = {2012},
ABSTRACT = {Language and innovation are inseparable. Language conveys ideas which are essential in corporate innovation; innovation would be nearly impossible if we did not have language. Language establishes the most immediate connections with our conceptualisation of the outside world, and it provides the building blocks for communication. The structure of language itself reflects its functional and communicative use. Communication takes place when there is a real information exchange process. Every linguistic choice is necessarily meaningful, and absolute variables involve the parallel construction of form and meaning. From this perspective, language is not only structure, but a dynamic knowledge construction process as well. Knowledge transfer and innovation transfer are ubiquitous processes: knowledge extraction requires heterogeneous tasks related to the acquisition, from unstructured textual data in digital format, of structured and classified information relating to research topics. In the full version of this approach, emphasis will be laid on the mechanisms underlying language processing and communicative interaction, outlining knowledge retention and retrieval processes. The spread of Internet has enabled development of better bibliographic scientific databases with significantly improved capacity for storage and retrieval. In recent years, web searching has become the default mode of highly innovative information retrieval, though the main sources of digital information are unstructured or semi-structured documents. Information relating to developments in scientific research is collected in the form of abstracts or full publications, in large and growing bibliographic repositories. Considering the web as a corpus makes it possible to investigate how words are used to describe innovation, and how innovation topics can influence word usage and collocational behaviour. 
Investigation of corpora is concerned with the description of use and structure of language, by inquiring linguistic phenomena such as co-occurrence distributions, collocational variability, derivational productivity, neologism coinage. This will bring into focus the dynamic interplay between lexical creativity and innovative pragmatic contexts, thus blurring the traditional dichotomy between knowledge of language and its use. In particular, the work will focus on how words and language structures become vehicle for knowledge generation and innovation transfer, and how research data, research results and widely-distributed dissemination papers can support and enhance future research},
KEYWORDS = {Lexical productivity, Language Technologies, Web corpora, Grey Literature},
PAGES = {85-88},
URL = {https://iris.cnr.it/handle/20.500.14243/128304},
VOLUME = {14},
ISBN = {978-90-77484-19-7},
CONFERENCE_NAME = {Fourteenth international Conference on Grey Literature (GL14)},
BOOKTITLE = {Tracking Innovation through Grey Literature},
EDITOR = {Farace, D. J. and Frantzen, J. and Greynet},
}
@INPROCEEDINGS{PARDELLI_2012_INPROCEEDINGS_PSG_128291,
AUTHOR = {Pardelli, G. and Sassi, M. and Goggi, S.},
TITLE = {Open Grey for Language Technology: a ride on the network},
YEAR = {2012},
ABSTRACT = {The aim of this paper is to introduce the Open Access movement for Natural Language Processing (NLP) by means of a wide range of open access Grey Literature documentation available on the web. In 2008 Robert Dale, in the last issue of volume 35 of Computational Linguistics said: "There are a number of definitions of the term 'open access' in circulation, but almost all share the key principle that scientific literature should be freely available for all to read, download, copy, distribute, and use (with appropriate attribution) without restriction". At first glance it might seem that the Open Access movement has gradually become more influential in the field of language technology by building repositories accessible through the network. Today's digital archives are niches of intellectual production spread by means of a wide range of documents (such as journal articles and proceedings) which, paradoxically, the search engines do not always reach. The use of inappropriate terms in the formulation of queries and the fragmentation of repositories in this area of investigation does not allow to retrieve information on a large scale. The full paper, after a first introductory section, will be organized in two sections: 1) the first dedicated to the methodology for searching and tracing open access resources and to the criteria for analyzing and selecting the online documentation; 2) the second devoted to a description of the state-of-the-art of Open Access Grey Literature material in a statistical and thematic scenario. As things stand, standardization of computational systems interconnected by links and tools of various nature allowing Internet users to easily retrieve the information that the web naturally makes available would then be essential. Topics: Sustainability, Public Accessible Resources, Product and Service enhancements, Open Access, Curation and Preservation},
KEYWORDS = {Open Access Movement, Natural Language Processing},
PAGES = {89-94},
URL = {https://iris.cnr.it/handle/20.500.14243/128291},
CONFERENCE_NAME = {GL14 Fourteenth International Conference on Grey Literature (GL14)},
}
@INPROCEEDINGS{PICCINI_2012_INPROCEEDINGS_PRG_264634,
AUTHOR = {Piccini, S. and Ruimy, N. and Giovannetti, E.},
TITLE = {Structuring a specific domain: an electronic thesaurus of Ferdinand de Saussure's terminology},
YEAR = {2012},
ABSTRACT = {Although Ferdinand de Saussure's work has been disseminated all over the world, his thought was mainly reconstructed and interpreted by his students and disciples. His authentic writings are however of paramount importance as they highlight the complexity of the philosophical and semiological system Saussure developed and the attention he paid to linguistic terminology. The great Genevan linguist himself often used a peculiar vocabulary. He forged neologisms or conferred a new meaning to existing words, used a few terms ephemerally, changed the denotation of some concepts over the years, so to create his own idiosyncratic terminology, which is now at the base of modern linguistics. In this paper, we present the first electronic thesaurus-lexicon of the Saussurean linguistic terminology that is being developed in the framework of the ongoing Italian project 'For a digital edition of Ferdinand de Saussure's manuscripts'. The lexicon population consists of an updated nomenclature, encompassing not only the terminology gathered by two famous Saussurean scholars, Robert Godel and Rudolf Engler, but also new terms extracted from recently found manuscripts under study. In the lexicon, the overall structure of Saussure's terminology is made explicit and the semantic import of its component terms as well as the nature and relevance of their relationships are defined. The lexical model, on which the thesaurus is grounded, is a customized version of the SIMPLE model, a de facto standard in the domain of Computational Lexicography that enables a highly structured representation of lexical knowledge. The first stage of the customization process consisted in designing and translating into the Web Ontology Language OWL the central component of the SIMPLE_FdS model, i. e. a domain-specific lexical ontology that would structure Saussure's terminology. The two other building blocks of the root model, i. e. 
a network of semantic relations and a set of semantic features, were adapted in order to meet the requirements of the domain of interest. The expressive means deemed suitable for our domain were maintained whereas additional specific features and relations were created to account for term properties and relationships peculiar to the conceptual organization of this domain of knowledge. So far, 375 terms were endowed with a rich semantic description. In the extended paper, examples of lexical entries will be provided and many interesting possibilities of lexical investigation will be pointed out. Information retrieval queries may in fact be formulated using any single piece of information encoded, be it a semantic relation, a feature or a lexical unit. Such an electronic thesaurus-lexicon, based on a multidimensional structuring of concepts and a large network of semantic relations among terms, is therefore, in our opinion, a most valuable lexical research tool. It is our deep conviction that it will contribute to better master some of Saussure's reflections and to gain a wider understanding of the overall domain terminology. It might therefore help shed light on original aspects of the author's thought},
KEYWORDS = {Saussure, terminologia, lessici computazionali},
PAGES = {1},
URL = {https://iris.cnr.it/handle/20.500.14243/264634},
CONFERENCE_NAME = {45th Annual Meeting of the Societas Linguistica Europaea (SLE)},
BOOKTITLE = {45th Annual Meeting of the Societas Linguistica Europaea, Book of Abstracts},
EDITOR = {Cornillie, B. and Pascual, M. S. S.},
}
@INPROCEEDINGS{PIOGGIA_2012_INPROCEEDINGS_PBNFATFSGDTM_260119,
AUTHOR = {Pioggia, G. and Billeci, L. and Narzisi, A. and Farruggio, V. and Arnao, A. and Tartarisco, G. and Ferro, M. and Siracusano, R. and Germanò, E. and Deodato, M. and Tortorella, G. and Muratori, F.},
TITLE = {PRIMA PIETRA: Research, Integration, Enhancement, Assistance and Education Program for Autism Services and Rehabilitation Technologies},
YEAR = {2012},
ABSTRACT = {It is commonly recognized that autism spectrum disorder (ASD) symptoms are as early as 12 months of age and that the best outcomes are often achieved through early diagnosis and early intervention. However, there are many challenges to delivering health care to parents with a child with ASD. Difficulties to service delivery and utilization are more intensified for families living in suburban or remote areas, often resulting in limited access to preventative mental health services in general and parenting ASD interventions in particular. As Vismara and Rogers suggested (Vismara, 2010), the use of technology could support long-distance clinical health care. PRIMA PIETRA Italian project is focused on early diagnosis and intervention providing Early Start Denver Model (Dawson et al., 2009) using tele-rehabilitation. PRIMA PIETRA is a collaborative project supported by the Minister of Health of the Sicilian Region, in collaboration with Basilicata and Tuscany Regions},
KEYWORDS = {autism spectrum disorder, pervasive healthcare, early diagnosis},
PAGES = {4},
URL = {https://imfar.confex.com/imfar/2012/webprogram/Paper10070.html},
CONFERENCE_NAME = {International Meeting for Autism Research},
}
@INPROCEEDINGS{PIRRELLI_2012_INPROCEEDINGS_P_228577,
AUTHOR = {Pirrelli, V.},
TITLE = {Computational Complexity in Neurally-inspired Morphology processing},
YEAR = {2012},
ABSTRACT = {Pre-compilation of memory "chunks" in the mental lexicon is beneficial for on-line processing because it enhances the capacity to predict the completion of an upcoming input word and to maintain longer and more complex word sequences in the STM store: the more we memorize, the less material we need to integrate on-line. Morpheme-based representations are like memory chunks that come into the picture when memory of whole words fails, due to either novel, degenerate and noisy input, or to limitations in perception/memory spans. Due to the combinatorial nature of language and our memory limitations, less "chunking" and more on-line integration is expected at processing levels beyond morphology},
URL = {https://iris.cnr.it/handle/20.500.14243/228577},
}
@INPROCEEDINGS{QUOCHI_2012_INPROCEEDINGS_Q_128313,
AUTHOR = {Quochi, V.},
TITLE = {How predictive are grammatical constructions in Italian? The case of the caused-motion construction},
YEAR = {2012},
ABSTRACT = {Differently from English, Italian has a rich morphological system and a relatively free word-order. For these reasons, the suitability of a "full-scope" constructional approach to Italian is not given. Although Goldberg's (1995, 2006) version of Construction grammar language is constructions all the way down (or up), one could still argue that in Italian, i. e. a language rich in morphology, abstract, grammatical constructions do not play a role, thus weakening the constructionist view. One of the strong points in favour of Goldberg's approach is that argument structure constructions in English have been found to be highly predictive of sentence meaning (Goldberg et al. 2005), which provides a motivation for their early acquisition by children. Many of such studies and evidences are still missing for Italian. This contribution will therefore attempt to start filling this gap by testing the predictive power of the Italian Caused Motion Construction. Data is taken from the CHILDES database (MacWhinney 2000) and annotated according to constructional properties and verb meaning. The annotation is then used to calculate the Cue and Category Validity (Murphy 2002) of both the Construction and the main verbs, which measures their predictive power (i. e. respectively their reliability and availability) in relation to the overall sentence meaning. Results show that the Italian Caused Motion Construction is not only more reliable than verbs as a predictor of overall sentence meaning, but it is also more available},
KEYWORDS = {Construction Grammar, Psicolinguistica, Linguistica del corpus},
PAGES = {265-265},
URL = {http://www.sle2012.eu/downloads/Book_abstracts_SLE2012_23aug_final.pdf},
CONFERENCE_NAME = {45th Annual Meeting of the Societas Linguistica Europaea (SLE2012)},
}
@INPROCEEDINGS{SORIA_2012_INPROCEEDINGS_S_117863,
AUTHOR = {Soria, C.},
TITLE = {Voices of Italy: a project for the preservation of Italian language diversity},
YEAR = {2012},
ABSTRACT = {This submission will bring to discussion a project idea that addresses documentation and preservation of regional languages of Italy. Italy holds a unique position in Europe, with around 40 languages spoken and 31 of them in danger. Yet, little is being done for fostering their preservation, and little (if any) is the perception by the general public of the proportions of the phenomenon of language endangerment. The result of the project should be an audiovisual digital archive for storing samples of regional languages. Users will interact with the archive through a range of so called new technologies: not only a web portal for accessing, browsing and searching information, but also mobile devices Apps, a YouTube channel, social networking platforms, etc. for contributing language material. Since these new media are widespread among the Italian population, the youngest one in particular (36 million people in Italy have a connection to the Internet, and 9, 3 millions from a mobile device, with an increase of 74% in a year) it seems feasible to crowdsource the linguistic material to populate the archive, thereby offering an engaging experience that would boost involvement of speakers' communities into the documentation and preservation endeavour. It would be interesting to discuss the feasibility of this project under the current technological and cultural constraints},
PAGES = {17-17},
URL = {https://iris.cnr.it/handle/20.500.14243/117863},
CONFERENCE_NAME = {Language Endangerment: Methodologies and New Challenges},
BOOKTITLE = {Language Endangerment: Methodologies and New Challenges},
}
@TECHREPORT{ALIPRANDI_2012_TECHREPORT_ABBFLMPS_130245,
AUTHOR = {Aliprandi, C. and Bacciu, C. and Bartolini, R. and Frontini, F. and Lapolla, N. and Marchetti, A. and Piccinonno, F. and Soru, T.},
TITLE = {Specifiche architetturali e funzionali},
YEAR = {2012},
ABSTRACT = {Questo documento contiene le specifiche funzionali ed architetturali del sistema GLOSS elaborate come risultato dell'obiettivo operativo 1. Tali specifiche debbono essere di riferimento per tutte le fasi di sviluppo dei vari componenti del sistema stesso e della loro integrazione in un prototipo dimostrativo. Ad una breve introduzione che richiama gli obiettivi generali del progetto, seguono: 1. La descrizione delle funzionalità suddivisa nelle varie fasi che compongono il flusso operativo di GLOSS. 2. La descrizione dell'architettura del sistema da realizzare nella quale si fornisce lo schema dell'integrazione dei vari componenti, il protocollo di comunicazione e memorizzazione dei dati che viene trattato più nel dettaglio nel documento D1. 2 GAF-Gloss Annotation Format, e la descrizione di ciascun componente del sistema. Per sua natura, questo documento sarà soggetto a revisione durante tutto il periodo di sviluppo del sistema. Questa prima versione deve intendersi come guida per l'implementazione ed ha lo scopo di fornire a chi partecipa a questo progetto una visione generale delle funzionalità di GLOSS e come queste dovranno essere integrate nel prototipo dimostratore},
KEYWORDS = {GLOSS, specifiche funzionali},
URL = {https://iris.cnr.it/handle/20.500.14243/130245},
}
@TECHREPORT{BOZZI_2012_TECHREPORT_BGBNMPN_370139,
AUTHOR = {Bozzi, A. and Giovannetti, E. and Boschetti, F. and Nahli, O. and Marchi, S. and Piccini, S. and Ruimy, N. and Del Grosso, A. M.},
TITLE = {Greek into Arabic: contents, technologies and (humanistic and scientific) applications of a new software},
YEAR = {2012},
ABSTRACT = {This contribution aims to describe the methodological approach to Digital Philology by means of the G\&A Web Application. It also shows running examples for the: 1) Visualization and ordering of parallel texts subdivided in pericopes; 2) Linguistic annotations; 3) Scholarly comments; and 4) Search functions},
KEYWORDS = {digital philology, computational philology, software engineering, Greek into Arabic, Computational linguistics},
URL = {https://iris.cnr.it/handle/20.500.14243/370139},
}
@TECHREPORT{DELGRATTA_2012_TECHREPORT_DMTALRBP_455959,
AUTHOR = {Del Gratta, R. and Monachini, M. and Tesconi, M. and Abrate, M. and Lo Duca, A. and Rimell, L. and Bel, N. and Padró, M.},
TITLE = {D6. 4 Lexical Merger},
YEAR = {2012},
ABSTRACT = {This document describes the experiments on the merging of lexical resources performed during the project and the development of two merging components for LMF lexicons},
KEYWORDS = {LMF, Lexical Merger},
PAGES = {1-39},
URL = {http://www.panacea-lr.eu/system/deliverables/PANACEA_D6.4.pdf},
}
@TECHREPORT{DELGROSSO_2012_TECHREPORT_DB_130182,
AUTHOR = {Del Grosso, A. M. and Boschetti, F.},
TITLE = {Parallel OCR for Ancient Greek Critical Editions},
YEAR = {2012},
ABSTRACT = {This project is focused on the parallelization of OCR processes applied to Ancient Greek critical editions. Two experiments have been performed. The first experiment is related to parameters differently tuned on the nodes of the grid, in order to identify the best combination that improves the accuracy of the recognition. The second experiment concerns the application of OCR with the best parameters on sample pages by a divide et impera strategy. Results related to the performances of the parallelization are discussed},
KEYWORDS = {OCR Ancient Greek Parallelization},
URL = {http://www.hpc-europa.eu/files/2012/Hum_1263_DEL%20GROSSO%20Angelo%20Mario.pdf},
}
@TECHREPORT{DELGROSSO_2012_TECHREPORT_DM_369067,
AUTHOR = {Del Grosso, A. M. and Marchi, S.},
TITLE = {Il trattamento digitale dei manoscritti di F. de Saussure},
YEAR = {2012},
ABSTRACT = {Il contributo presenta i risultati del progetto PRIN2008 "Per un'edizione digitale dei manoscritti di Ferdinand de Saussure", finanziato dal Ministero dell'Istruzione, dell'Università e della Ricerca italiano per il biennio 2009-2011},
KEYWORDS = {prin, saussure, digital humanities, computational philology, digital philology},
URL = {https://iris.cnr.it/handle/20.500.14243/369067},
}
@TECHREPORT{FEDERMANN_2012_TECHREPORT_FGDMMPS_409053,
AUTHOR = {Federmann, C. and Georgantopoulos, B. and Del Gratta, R. and Magnini, B. and Mavroeidis, D. and Piperidis, S. and Speranza, M.},
TITLE = {META-SHARE Functional and Technical Specification (Deliverable D7. 1)META-SHARE Functional and Technical Specification (Deliverable D7. 1. 1)},
YEAR = {2012},
ABSTRACT = {META-SHARE Functional and Technical Specification. Deliverable finale},
URL = {https://iris.cnr.it/handle/20.500.14243/409053},
}
@TECHREPORT{MARZI_2012_TECHREPORT_M_130253,
AUTHOR = {Marzi, C.},
TITLE = {Neuroimaging: mania, revolution, or technological evolution?-A critical review},
YEAR = {2012},
ABSTRACT = {Imaging has become an increasingly important tool in both research and clinical care. A range of neuroimaging technologies provide unprecedented sensitivity to visualisation of brain structure (i. e. anatomy) and function (i. e. physiology) from the level of individual molecules to the whole brain. Many imaging methods are non-invasive and allow dynamic processes to be monitored over time. Imaging is enabling researchers to identify neural networks involved in cognitive processes; understand disease pathways; recognise and diagnose diseases early, when they are most effectively treated; and determine how therapies work. The cognitive neuroscience of higher order auditory processing has advanced enormously in a brief time, in large part benefiting from neuroimaging approaches. A significant amount of progress has been made, and much of it can be attributed to the possibilities for crossing boundaries afforded by neuroimaging tools. More sophisticated experiments combined with fMRI and EEG are helping to know what the brain is doing as people perform cognitive, emotional, and behavioural actions. MEG technology will allow linguists to explore how social interaction and sensorimotor experience affects the cortical processing of language in children; and the combination of behavioural and brain measures may enhance the certainty with which dyslexia can be predicted for a child and promote the possibility of preventive intervention},
KEYWORDS = {Neuroimaging technologies, Cognitive neuroscience, Language studies},
URL = {https://iris.cnr.it/handle/20.500.14243/130253},
}
@TECHREPORT{POCH_2012_TECHREPORT_PHQDTTPB_129399,
AUTHOR = {Poch, M. and Hamon, O. and Quochi, V. and Del Gratta, R. and Toral, A. and Thurmair, G. and Prokopidis, P. and Bel, N.},
TITLE = {D3. 4 Third version (v4) of the integrated platform and documentation},
YEAR = {2012},
ABSTRACT = {The deliverable describes the third and final version of the PANACEA platform},
KEYWORDS = {infrastrutture, Trattamento del linguaggio naturale},
URL = {https://iris.cnr.it/handle/20.500.14243/129399},
}
@TECHREPORT{PROKOPIDIS_2012_TECHREPORT_PPTPFRT_129408,
AUTHOR = {Prokopidis, P. and Papavassiliou, V. and Toral, A. and Poch Riera, M. and Frontini, F. and Rubino, F. and Thurmair, G.},
TITLE = {D4. 5 Final Report on the Corpus Acquisition \& Annotation subsystem and its components},
YEAR = {2012},
ABSTRACT = {PANACEA WP4 targets the creation of a Corpus Acquisition and Annotation (CAA) subsystem for the acquisition and processing of monolingual and bilingual language resources (LRs). The CAA subsystem consists of tools that have been integrated as web services in the PANACEA platform of LR production. D4. 2 Initial functional prototype and documentation in T13 and D4. 4 Report on the revised Corpus Acquisition \& Annotation subsystem and its components in T23 provided initial and updated documentation on this subsystem, while this deliverable presents the final documentation of the subsystem as it evolved after the third development cycle of the project. The deliverable is structured as follows. The Corpus Acquisition Component (i. e. the Focused Monolingual and Bilingual Crawlers (FMC/FBC)) is described in section 2. The final list of tools for corpus normalization (cleaning and de-duplication) is detailed in section 3. Section 4 provides documentation on all NLP tools included in the subsystem. Due to its nature, this deliverable aggregates considerable parts of all previous WP4 deliverables. The main new additions include a) new functionalities for, among others, crawling strategy, de-duplication, and detection of parallel document pairs; and b) new NLP tools for syntactic analysis, named entity recognition, tweet processing and anonymization},
KEYWORDS = {Corpus Acquisition},
URL = {http://www.jotform.com/uploads/fabioaffeilc/30222975566357/225350067351490116/PANACEA},
}
@TECHREPORT{QUOCHI_2012_TECHREPORT_QFBHPPBTTK_130130,
AUTHOR = {Quochi, V. and Frontini, F. and Bartolini, R. and Hamon, O. and Poch Riera, M. and Padro, M. and Bel, N. and Thurmair, G. and Toral, A. and Kamran, A.},
TITLE = {D7. 4 Third evaluation report. Evaluation of PANACEA v3 and produced resources},
YEAR = {2012},
ABSTRACT = {D7. 4 reports on the evaluation of the different components integrated in the PANACEA third cycle of development as well as the final validation of the platform itself. All validation and evaluation experiments follow the evaluation criteria already described in D7. 1. The main goal of WP7 tasks was to test the (technical) functionalities and capabilities of the middleware that allows the integration of the various resource-creation components into an interoperable distributed environment (WP3) and to evaluate the quality of the components developed in WP5 and WP6. The content of this deliverable is thus complementary to D8. 2 and D8. 3 that tackle advantages and usability in industrial scenarios. It has to be noted that the PANACEA third cycle of development addressed many components that are still under research. The main goal for this evaluation cycle thus is to assess the methods experimented with and their potentials for becoming actual production tools to be exploited outside research labs. For most of the technologies, an attempt was made to re-interpret standard evaluation measures, usually in terms of accuracy, precision and recall, as measures related to a reduction of costs (time and human resources) in the current practices based on the manual production of resources. In order to do so, the different tools had to be tuned and adapted to maximize precision and for some tools the possibility to offer confidence measures that could allow a separation of the resources that still needed manual revision has been attempted. Furthermore, the extension to other languages in addition to English, also a PANACEA objective, has been evaluated. The main facts about the evaluation results are now summarized},
KEYWORDS = {PANACEA, evaluation, machine translation},
URL = {https://iris.cnr.it/handle/20.500.14243/130130},
}
@TECHREPORT{RIMELL_2012_TECHREPORT_RBPFMQ_130143,
AUTHOR = {Rimell, L. and Bel, N. and Padró, M. and Frontini, F. and Monachini, M. and Quochi, V.},
TITLE = {D6. 2 Integrated Final Version of the Components for Lexical Acquisition},
YEAR = {2012},
ABSTRACT = {The PANACEA project has addressed one of the most critical bottlenecks that threaten the development of technologies to support multilingualism in Europe, and to process the huge quantity of multilingual data produced annually. Any attempt at automated language processing, particularly Machine Translation (MT), depends on the availability of language-specific resources. Such Language Resources (LR) contain information about the language's lexicon, i. e. the words of the language and the characteristics of their use. In Natural Language Processing (NLP), LRs contribute information about the syntactic and semantic behaviour of words-i. e. their grammar and their meaning-which inform downstream applications such as MT. To date, many LRs have been generated by hand, requiring significant manual labour from linguistic experts. However, proceeding manually, it is impossible to supply LRs for every possible pair of European languages, textual domain, and genre, which are needed by MT developers. Moreover, an LR for a given language can never be considered complete nor final because of the characteristics of natural language, which continually undergoes changes, especially spurred on by the emergence of new knowledge domains and new technologies. PANACEA has addressed this challenge by building a factory of LRs that progressively automates the stages involved in the acquisition, production, updating and maintenance of LRs required by MT systems. The existence of such a factory will significantly cut down the cost, time and human effort required to build LRs. WP6 has addressed the lexical acquisition component of the LR factory, that is, the techniques for automated extraction of key lexical information from texts, and the automatic collation of lexical information into LRs in a standardized format. 
The goal of WP6 has been to take existing techniques capable of acquiring syntactic and semantic information from corpus data, improving upon them, adapting and applying them to multiple languages, and turning them into powerful and flexible techniques capable of supporting massive applications. One focus for improving the scalability and portability of lexical acquisition techniques has been to extend existing techniques with more powerful, less "supervised" methods. In NLP, the amount of supervision refers to the amount of manual annotation which must be applied to a text corpus before machine learning or other techniques are applied to the data to compile a lexicon. More manual annotation means more accurate training data, and thus a more accurate LR. However, given that it is impractical from a cost and time perspective to manually annotate the vast amounts of data required for multilingual MT across domains, it is important to develop techniques which can learn from corpora with less supervision. Less supervised methods are capable of supporting both large-scale acquisition and efficient domain adaptation, even in the domains where data is scarce. Another focus of lexical acquisition in PANACEA has been the need of LR users to tune the accuracy level of LRs. Some applications may require increased precision, or accuracy, where the application requires a high degree of confidence in the lexical information used. At other times a greater level of coverage may be required, with information about more words at the expense of some degree of accuracy. Lexical acquisition in PANACEA has investigated confidence thresholds for lexical acquisition to ensure that the ultimate users of LRs can generate lexical data from the PANACEA factory at the desired level of accuracy},
KEYWORDS = {Lexical Acquisition},
URL = {http://www.panacea-lr.eu/system/deliverables/PANACEA_D6.2.pdf},
}
@TECHREPORT{RIMELL_2012_TECHREPORT_RBPFMQD_130161,
AUTHOR = {Rimell, L. and Bel, N. and Padró, M. and Frontini, F. and Monachini, M. and Quochi, V. and Del Gratta, R.},
TITLE = {D6.5 Merged dictionaries},
YEAR = {2012},
ABSTRACT = {This document presents the merged dictionaries delivered in PANACEA. Those dictionaries result from merging already existing lexica, generally for general domain, with domain specific lexica acquired using PANACEA platform. The domain specific lexica are presented and delivered in D6.3 and the merging repository that allowed the multilevel merging in D6.4},
KEYWORDS = {merged dictionaries, computational lexicon},
URL = {http://www.panacea-lr.eu//en/deliverables/list},
}
@TECHREPORT{RIMELL_2012_TECHREPORT_RBPFMQD_130256,
AUTHOR = {Rimell, L. and Bel, N. and Padró, M. and Frontini, F. and Monachini, M. and Quochi, V. and Del Gratta, R.},
TITLE = {D6.3 Monolingual lexica for English, Spanish and Italian tuned for a particular domain (LAB and ENV)},
YEAR = {2012},
ABSTRACT = {This document presents the lexica acquired using PANACEA platform for Labour and Environment domains. The languages of the lexica are English, Spanish and Italian. The lexical information acquired depends on the language, according to the available tools in the platform},
KEYWORDS = {Lexicon Acquisition},
URL = {http://www.panacea-lr.eu/system/deliverables/PANACEA_D6.3.pdf},
}
@TECHREPORT{TARTARISCO_2012_TECHREPORT_TBCFP_130239,
AUTHOR = {Tartarisco, G. and Baldus, G. and Corda, D. and Ferro, M. and Pioggia, G.},
TITLE = {Decision Support Processing Architecture},
YEAR = {2012},
ABSTRACT = {This report presents the design and implementation of the INTERSTRESS Decision Support System (DSS). The goal of the DSS is to assess the psychological state of each patient by analyzing the previously acquired knowledge, such as patient's physiological and behavioural profile, and current sensory data. Starting from such information, the DSS then infers physiological and behavioural markers of stress},
KEYWORDS = {decision support system, multimodal analysis, artificial neural network, Bayesian model, machine learning},
URL = {https://iris.cnr.it/handle/20.500.14243/130239},
}
@TECHREPORT{TARTARISCO_2012_TECHREPORT_TTBCFP_348232,
AUTHOR = {Tartarisco, G. and Tonacci, A. and Baldus, G. and Corda, D. and Ferro, M. and Pioggia, G.},
TITLE = {D5.2 Decision Support Processing Architecture. INTERSTRESS Project},
YEAR = {2012},
ABSTRACT = {Deliverable describing the architecture of a clinical Decision Support System helping the clinician in the assessment of stress. The document was written within the INTERSTRESS Project},
KEYWORDS = {stress, decision support system, clinica, DSS},
URL = {https://iris.cnr.it/handle/20.500.14243/348232},
}
@TECHREPORT{VISINTAINER_2012_TECHREPORT_VMCKCPTF_130194,
AUTHOR = {Visintainer, F. and Muro, M. and Carlino, A. and Kalogirou, K. and Contreras, J. and Pioggia, G. and Tartarisco, G. and Ferro, M.},
TITLE = {Two vehicle demonstrators for elderly drivers support},
YEAR = {2012},
KEYWORDS = {elderly support, biometric, sensing seat},
URL = {https://iris.cnr.it/handle/20.500.14243/130194},
}
@MISC{ABRATE_2012_MISC_ABFLMM_128221,
AUTHOR = {Abrate, M. and Bacciu, C. and Frontini, F. and Lapolla Mariantonietta, N. and Marchetti, A. and Monachini, M.},
TITLE = {Web Language Identification Testing Tool},
YEAR = {2012},
ABSTRACT = {Nowadays a variety of tools for automatic language identification are available. Regardless of the approach used, at least two features can be identified as crucial to evaluate the performances of such tools: the precision of the presented results and the range of languages that can be detected. In this work we shall focus on a subtask of written language identification that is important to preserve and enhance multilinguality in the Web, i. e. detecting the language of a Web page given its URL. Most specifically, the final aim is to verify to which extent under-represented languages are recognized by available tools. The main specificity of Web Language Identification (WLI) lies in the fact that often an HTML page can provide interesting extralinguistic clues (URL domain name, metadata, encoding, etc) that can enhance accuracy. We shall first provide some data and statistics on the presence of languages on the web, secondly discuss existing practices and tools for language identification according to different metrics-for instance the approaches used and the number of supported languages-and finally make some proposals on how to improve current Web Language Identifiers. We shall also present a preliminary WLI service that builds on the Google Chromium Compact Language Detector; the WLI tool allows us to test the Google n-gram based algorithm against an adhoc gold standard of pages in various languages. The gold standard, based on a selection of Wikipedia projects, contains samples in languages for which no automatic recognition has been attempted; it can thus be used by specialists to develop and evaluate WLI systems},
KEYWORDS = {Multilingual Web},
URL = {https://iris.cnr.it/handle/20.500.14243/128221},
CONFERENCE_NAME = {The Multilingual Web-the Way Ahead},
}
@MISC{BARCA_2012_MISC_BP_140780,
AUTHOR = {Barca, L. and Pezzulo, G.},
TITLE = {Is visual lexical decision a dynamic and competitive process? no, if we look at reaction times. yes, if we study how it unfolds in time},
YEAR = {2012},
ABSTRACT = {Visual lexical decision is a classical paradigm in Psycholinguistics, and numerous studies have assessed a so-called "lexicality effect" (i.e., better performance with lexical over non-lexical stimuli). Far less is known relative to the dynamics of choice, as many studies measure overall reaction times which are not informative of the underlying processes. To unfold visual lexical decision in time, we measured participants' hand movements toward one of two items alternatives by recording the streaming x, y coordinates of the computer mouse. Participants categorized as 'lexical' or 'non-lexical' four kinds of stimuli: high and low frequency words, pseudowords, and letter strings. Spatial attraction toward the opposite category was present for low frequency words and pseudowords. Increasing stimuli ambiguity led to enhanced movements' complexity and trajectories' attraction to competitors, as no such effect was present for high frequency words and letter strings. Results fit well with dynamic models of perceptual decision-making describing the process as a competition between alternatives guided by the continuous accumulation of evidence, as well as with a recent neural model of visual word recognition that highlights the role of top-down influences and predictions on perceptual processes. More broadly, our results point to a key role of statistical decision theory to study linguistic processing in terms of dynamic and non-modular mechanisms. Finally, we discuss two aspects that make our set-up challenging for current dynamical models of decision-making: 1) not all information (e.g. orthographic, phonological and semantic) is available at the same time, therefore the accumulation process is nonstationary; 2) the choice is not completed at the action onset, but can be revised at any time during the movement},
KEYWORDS = {Computational neuroscience, psycholinguistic, statistical decision theory},
URL = {http://www.frontiersin.org/10.3389/conf.fnins.2012.86.00001/event_abstract},
DOI = {10.3389/conf.fnins.2012.86.00001},
ISSN = {1662-453X},
}
@MISC{BELTRAMI_2012_MISC_BLSABDFGIGMMRVV_241005,
AUTHOR = {Beltrami, P. D. and Larson, P. C. and Squillacioti, P. C. and Artale, E. and Boccellari, A. and Dotto, D. and Fortunato, M. and Guadagnini, E. and Iorio Fili, D. and Giuliani, M. and Morlino, L. and Mosti, R. and Ravani, S. and Vaccaro, G. and Verlato, Z.},
TITLE = {TESORO DELLA LINGUA ITALIANA DELLE ORIGINI-Edizione online: www.vocabolario.org (ISSN 2240-5216)-Versione 2012},
YEAR = {2012},
ABSTRACT = {A pdf copy of the Tesoro della Lingua Italiana delle Origini (TLIO), a dictionary of early Italian in progress, published online, as it was at the end of 2011. TLIO is the first section of the Italian Historical Dictionary which is the mission of the OVI Institute},
KEYWORDS = {Lessicografia italiana, italiano antico},
URL = {http://www.ovi.cnr.it},
}
@MISC{BOSCHETTI_2012_MISC_B_129381,
AUTHOR = {Boschetti, F.},
TITLE = {La localizzazione in lingua italiana dell'infrastruttura per lo studio dei classici greci e latini costituita dal Perseus Project},
YEAR = {2012},
ABSTRACT = {The parallelization of Greek and Latin texts with translations in Italian is discussed},
KEYWORDS = {localization cyberinfrastructure},
URL = {https://iris.cnr.it/handle/20.500.14243/129381},
CONFERENCE_NAME = {Convegno annuale dell'Associazione di Informatica Umanistica e Culture Digitali},
}
@MISC{BOSCHETTI_2012_MISC_B_128227,
AUTHOR = {Boschetti, F.},
TITLE = {A Language Independent Pedagogical Model for Greek, Latin and Arabic},
YEAR = {2012},
ABSTRACT = {Pedagogical tools in a collaborative environment for ancient languages learning are illustrated},
URL = {https://iris.cnr.it/handle/20.500.14243/128227},
CONFERENCE_NAME = {New Approaches to Historical Languages-Tufts University Workshop},
}
@MISC{BOSCHETTI_2012_MISC_BDL_129386,
AUTHOR = {Boschetti, F. and Del Grosso, A. M. and Lamé, M.},
TITLE = {Strumenti per l'analisi di testi bilingui al servizio dell'epigrafia digitale},
YEAR = {2012},
ABSTRACT = {Model for visualization and retrieval of bilingual epigraphic texts in parallel},
KEYWORDS = {allineamento bilinguismo},
URL = {https://iris.cnr.it/handle/20.500.14243/129386},
CONFERENCE_NAME = {Incontro di studi sulla versificazione epigrafica dall'antichità all'umanesimo},
}
@MISC{BOSCHETTI_2012_MISC_BF_128259,
AUTHOR = {Boschetti, F.},
TITLE = {OCR Evaluation and Parallelization},
YEAR = {2012},
ABSTRACT = {The scalability of the OCR applied to a large amount of documents is discussed. In particular, unsupervised methods to evaluate the accuracy of the OCR and parallelization of the processes, in order to reduce the time to perform the recognition, are illustrated},
KEYWORDS = {OCR parallelization evaluation},
URL = {https://iris.cnr.it/handle/20.500.14243/128259},
CONFERENCE_NAME = {Digital Humanities Seminars},
}
@MISC{BOSCHETTI_2012_MISC_BF_129394,
AUTHOR = {Boschetti, F.},
TITLE = {Iperspazi del mondo mediterraneo},
YEAR = {2012},
ABSTRACT = {Investigation in parallel of multilingual semantic spaces},
KEYWORDS = {semantic spaces},
URL = {https://iris.cnr.it/handle/20.500.14243/129394},
}
@MISC{BOSCHETTI_2012_MISC_BF_128238,
AUTHOR = {Boschetti, F.},
TITLE = {Data Sets and Software Components: Adjustment and Reuse},
YEAR = {2012},
ABSTRACT = {Building (or extending) a digital environment to study ancient authors requires the management of digital resources that must be adjusted asynchronously and the development of software components highly decoupled},
KEYWORDS = {reuse digital humanities infrastructure components},
URL = {https://iris.cnr.it/handle/20.500.14243/128238},
CONFERENCE_NAME = {The Papyrus and the Hypertext. Athenaeus in the Scholarly Kitchen},
}
@MISC{BURGASSI_2012_MISC_B_269621,
AUTHOR = {Burgassi, C.},
TITLE = {Vecchie questioni, nuovi strumenti: le traduzioni dei classici attribuite a Boccaccio alla luce del Dizionario dei Volgarizzamenti (DiVo)},
YEAR = {2012},
URL = {https://iris.cnr.it/handle/20.500.14243/269621},
CONFERENCE_NAME = {Seminario internazionale Boccaccio 2013},
}
@MISC{DELGROSSO_2012_MISC_D_344117,
AUTHOR = {Del Grosso, A. M.},
TITLE = {Overview, Activities and Groups at the Institute for Computational linguistics Antonio Zampolli (ILC-CNR)},
YEAR = {2012},
ABSTRACT = {This presentation aims at illustrating the ILC-CNR activities},
KEYWORDS = {computational linguistics, digital philology},
URL = {https://iris.cnr.it/handle/20.500.14243/344117},
}
@MISC{DELGROSSO_2012_MISC_D_344608,
AUTHOR = {Del Grosso, A. M.},
TITLE = {Evaluation and parallelization of large-scale polytonic Greek OCR},
YEAR = {2012},
ABSTRACT = {This work aims to face the rapid digitization of Greek texts not yet in digital libraries, illustrating 1) what is an OCR engine; 2) what makes Greek OCR hard; 3) the work provided by Robertson and Boschetti; 4) future challenges on parallel architectures and proof reading system},
KEYWORDS = {digital philology, computational philology, digital humanities, computer engineering},
URL = {https://iris.cnr.it/handle/20.500.14243/344608},
CONFERENCE_NAME = {Digitizing Greek Literature},
}
@MISC{DELGROSSO_2012_MISC_DMMP_344187,
AUTHOR = {Del Grosso, A. M. and Marchi, S. and Murano, F. and Pesini, L.},
TITLE = {Banca dati testuale Codifica Théorie des sonantes},
YEAR = {2012},
ABSTRACT = {Banca dati testuale XML della Théorie des sonantes edito dalla Marchese nel 2002},
KEYWORDS = {PRIN, Saussure, Digital philology, Computational philology, Digital Humanities},
URL = {http://licodemo.ilc.cnr.it:8080/Saussure_Wapp/controlPanelView.xhtml},
}
@MISC{DIDONATO_2012_MISC_D_407976,
AUTHOR = {Di Donato, F.},
TITLE = {Linked Open data. Verso una scienza aperta},
YEAR = {2012},
ABSTRACT = {presentazione al Convegno Opening the Past. Archaeological Open Data, Università di Pisa, 9 giugno 2012},
URL = {https://iris.cnr.it/handle/20.500.14243/407976},
}
@MISC{DIDONATO_2012_MISC_D_407979,
AUTHOR = {Di Donato, F.},
TITLE = {L'uso pubblico della ragione e la rete. Definizioni, problemi prospettive},
YEAR = {2012},
ABSTRACT = {presentazione all'evento Prospettive e opportunità della società digitale, nel rispetto della legalità, dell'etica e della tutela della persona, organizzato dal DIRPOLIS della Scuola Sant'Anna, Internet Festival, Pisa, 5 ottobre 2012},
URL = {https://iris.cnr.it/handle/20.500.14243/407979},
}
@MISC{GUADAGNINI_2012_MISC_GVBD_21182,
AUTHOR = {Guadagnini, E. and Vaccaro, G. and Burgassi, C. and Dotto, D.},
TITLE = {Corpus dei Classici Latini volgarizzati (Corpus CLaVo)},
YEAR = {2012},
ABSTRACT = {Il Corpus CLaVo è parte del progetto di ricerca DiVo-Dizionario dei Volgarizzamenti. Il lessico di traduzione dal latino nell'italiano delle origini: bibliografia filologica, corpus bilingue lemmatizzato, dizionario storico settoriale, di Elisa Guadagnini e Giulio Vaccaro, ospitato dall'Istituto Opera del Vocabolario Italiano (CNR) e dalla Scuola Normale Superiore di Pisa, finanziato dal MIUR all'interno del programma FIRB-Futuro in Ricerca 2010. Il Corpus CLaVo, interrogabile con GattoWeb, raccoglie le opere latine tradotte dai volgarizzamenti compresi nel corpus DiVo. Comprende 33 testi latini},
URL = {http://clavoweb.ovi.cnr.it},
}
@MISC{GUADAGNINI_2012_MISC_GVBD_21180,
AUTHOR = {Guadagnini, E. and Vaccaro, G. and Burgassi, C. and Dotto, D.},
TITLE = {Corpus del Dizionario dei Volgarizzamenti (Corpus DiVo)},
YEAR = {2012},
ABSTRACT = {Il Corpus DiVo è parte del progetto di ricerca DiVo-Dizionario dei Volgarizzamenti. Il lessico di traduzione dal latino nell'italiano delle origini: bibliografia filologica, corpus bilingue lemmatizzato, dizionario storico settoriale, di Elisa Guadagnini e Giulio Vaccaro, ospitato dall'Istituto Opera del Vocabolario Italiano (CNR) e dalla Scuola Normale Superiore di Pisa, finanziato dal MIUR all'interno del programma FIRB-Futuro in Ricerca 2010. Il Corpus DiVo, interrogabile con GattoWeb, è curato da Cosimo Burgassi, Diego Dotto, Elisa Guadagnini e Giulio Vaccaro. Comprende 103 testi volgari, per complessive 4.361.450 occorrenze di 143.274 forme grafiche distinte. Sono presenti 40 testi latini associati. I testi sono stati preparati per l'acquisizione in GATTO da Cosimo Burgassi, Diego Dotto, Elisa Guadagnini, Chiara Missana, Francesca Panontin e Giulio Vaccaro},
URL = {http://divoweb.ovi.cnr.it},
}
@MISC{IDE_2012_MISC_IC_227380,
AUTHOR = {Ide, N. and Calzolari, N.},
TITLE = {Editors' Note},
YEAR = {2012},
URL = {https://iris.cnr.it/handle/20.500.14243/227380},
DOI = {10.1007/s10579-012-9190-3},
ISSN = {1574-020X},
}
@MISC{LAM_2012_MISC_LBDB_284816,
AUTHOR = {Lamé, M. and Boschetti, F. and Del Grosso, A. M. and Benedetti, L.},
TITLE = {La matière épigraphique dans un espace numérique: l'importance du support archéologique},
YEAR = {2012},
URL = {https://iris.cnr.it/handle/20.500.14243/284816},
}
@MISC{LAM_2012_MISC_LVBML_290169,
AUTHOR = {Lamé, M. and Valchera, V. and Boschetti, F. and Masset, C. and Lemaire, P.},
TITLE = {Exploitation de la matière épigraphique dans un espace numérique},
YEAR = {2012},
URL = {https://iris.cnr.it/handle/20.500.14243/290169},
}
@MISC{LAM_2012_MISC_LVBML_284828,
AUTHOR = {Lamé, M. and Valchera, V. and Boschetti, F. and Masset, C. and Lemaire, P.},
TITLE = {Asking Text-Bearing Objects: Contribution of Epigraphical theories to Digital Representation of Texts},
YEAR = {2012},
ABSTRACT = {This methodological framework tries to combine the epigraphical theories and methods with the digital representation of text. The first section describes the methodological aspects of epigraphy, in particular the autopsy. The key concept concerns that epigraphy deals with text-bearing objects characterized by the genuineness and the uniqueness of the text. The second section discusses the nine levels of analysis proposed for the digital representation of inscriptions: 1. Metadata; 2. Matrix of the artefact; 3. Images of the artefact; 4. Decorations or figurative elements; 5. Transcription of the text: diplomatic edition; 6. Related epigraphs; 7. Text: critical edition with apparatus; 8. Bibliography; 9. Commentaries. At each level, the epigraphical evidence relates to the Res Gestae Divi Augusti (RGDA). The last section is dedicated to comparison between digital epigraphy and digital papyrology in order to consider their paths in the Digital Humanities. Now the papyrological world has a single platform, whereas epigraphers use databases more localized (based on geographic origin of inscriptions) and specialized, with, for only some of them, a basic common interface. Furthermore, these reflections would encourage interoperable tools and cooperation between communities},
URL = {https://iris.cnr.it/handle/20.500.14243/284828},
}
@MISC{MARZI_2012_MISC_M_129391,
AUTHOR = {Marzi, C.},
TITLE = {Seminario sulla rete europea della struttura della parola (NetWordS)-Dottorato in Linguistica, UniPV},
YEAR = {2012},
ABSTRACT = {Words are the basic building blocks of language productivity, establishing the most immediate connections between language and our conceptualisation of the world, and they represent complex interface units, which are not only part of larger constructions but are themselves made up of simpler sublexical constituents. A better understanding of the human strategies involved in learning and processing word structures lies at the heart of our comprehension of the basic mechanism serving language and cognition},
KEYWORDS = {Word Structure},
URL = {http://studiumanistici.unipv.it/?pagina=p\&titolo=ling-Marzihomepage},
}
@MISC{PARDELLI_2012_MISC_P_129368,
AUTHOR = {Pardelli, G.},
TITLE = {Lineamenti di Linguistica Computazionale per il recupero informativo},
YEAR = {2012},
ABSTRACT = {Le ricerche linguistiche a partire dal secondo dopoguerra hanno avuto un ritmo di evoluzione e di espansione molto rapido grazie anche ai metodi di analisi introdotti, come l'uso dei metodi statistici o quantitativi nello studio delle lingue e delle opere letterarie. Nacquero nuovi settori di applicazione, la linguistica incontrò altre scienze e l'interdisciplinarità venne sempre più praticata fino a diventare indispensabile. L'introduzione di sistemi di automazione delle ricerche nelle analisi linguistiche vide la nascita della Linguistica Computazionale LC che mise in connessione lo studio della lingua e l'elaboratore elettronico. Dalla fine degli anni '40 all'inizio degli anni '60 gli utilizzi del calcolo elettronico per l'elaborazione di dati linguistici si articolarono in due filoni principali: - Gli spogli elettronici dei testi che diedero impulso alla lessicografia computazionale, avviata da Padre Roberto Busa nel 1951 con la compilazione delle concordanze dell'opera omnia di Tommaso d'Aquino; - I tentativi di traduzione automatica TA, in inglese machine translation MT, avviati da Weaver nel 1949 con la pubblicazione del memorandum "Translation". La TA divenne da subito nucleo e centro di spinta della LC utilizzando il calcolatore per trasportare un testo da una lingua naturale all'altra. Il contenuto argomentale dei testi della Biblioteca dell'Istituto di Linguistica Computazionale si sviluppa per lo più sulle tematiche sopra descritte. L'articolo darà enfasi alla terminologia della LC, nella prima parte, quella introduttiva; nella seconda parte saranno fornite informazioni inerenti il patrimonio bibliografico, il software di gestione usato e indicazioni per il recupero informativo; la terza parte andrà a presentare il "Fondo Antonio Zampolli", preziosa collezione di testi, alcuni unici in Italia, nel settore del trattamento automatico della lingua, che va ad arricchire e completare la Biblioteca ILC. 
In appendice sarà fornita una tabella riassuntiva dei termini estratti dai titoli degli articoli presentati alle conferenze di Linguistica Computazionale COLING, dal 1965-anno della prima conferenza tenuta a New York-al 2010, conferenza tenuta a Pechino. Trattasi di 23 conferenze internazionali di Linguistica Computazionale, fondamentali nella storia della disciplina. L'estrazione terminologica del corpus COLING è stata operata con gli strumenti di analisi testuale del laboratorio DylanLab dell'Istituto di Linguistica Computazionale},
KEYWORDS = {Linguistica Computazionale, Terminologia, Repository},
URL = {https://iris.cnr.it/handle/20.500.14243/129368},
CONFERENCE_NAME = {Seminario di Studi-Benvenuti in Biblioteca! Umanesimo e società nelle collezioni librarie del CNR},
}
@MISC{PARDELLI_2012_MISC_PE_129374,
AUTHOR = {Pardelli, G. and Enea, A.},
TITLE = {Per un'edizione digitale dei manoscritti di Ferdinand de Saussure: Verso la Costruzione del prototipo bibliografico},
YEAR = {2012},
ABSTRACT = {Per un'edizione digitale dei manoscritti di Ferdinand de Saussure-PRIN 2008 Unità operativa CNR-ILC Responsabile dott. Nilda Ruimy Relazione attività svolta da Gabriella Pardelli Obiettivo: costruzione del prototipo bibliografico saussurriano compatibile con le applicazioni sviluppate per il progetto e volte alla rete telematica. In particolare il prototipo si integra con l' ontologia di dominio sviluppata per la creazione del lessico saussurriano (ILC) e con l'applicazione di Natural Language Processing nata per il recupero della terminologia multilingue da immagini digitali (ILC). Metodologia: 1) scelta del software; 2) recupero delle informazioni bibliografiche; 3) digitalizzazione 4) collegamento testo/immagine. 1) Il prototipo bibliografico degli scritti di Ferdinand de Saussure si avvale del software CDS/ISIS Computerised Documentation Service / Integrated Set of Information Systems. Il software è sviluppato, mantenuto e distribuito dall'UNESCO. L'applicazione permette l'associazione di file esterni (immagini e testi) oltre alla creazione di link tra record e archivi diversi. L'esportazione dei dati segue lo standard internazionale ISO2709. 2) La ricca bibliografia è stata elaborata dal coordinatore nazionale del progetto. Il recupero delle fonti saussurriane è stato svolto nella Biblioteca della Scuola Normale Superiore di Pisa e nella Biblioteca del Dipartimento di Linguistica di Pisa. 3) Le immagini sono state acquisite con la collaborazione di un fotografo professionista-fonti di prima generazione-. Invece per le fonti non recuperabili sul territorio italiano, l'acquisizione è frutto di portali europei dedicati a Saussure (Gallica)-fonti di seconda generazione-Con l'abbinamento della descrizione bibliografica alla rispettiva fonte digitalizzata il prototipo è stato ultimato. 
L'applicazione è stata presentata il 21 settembre 2012 al seminario internazionale organizzato dall'Università di Firenze, presso la Facoltà di Lettere, a conclusione del progetto. Consistenza: Il database contiene 150 record corredati dalla rispettiva immagine. Ogni record, diviso in campi e in ulteriori sotto campi, è stato pensato per organizzare e frammentare l'informazione e consentire indicizzazioni puntuali per recuperi informativi sui titoli, sulle lingue indagate da Saussure e oggetto di argomentazione linguistica (latino, greco, tedesco.), sulla tipologia della fonte documentaria, sulla data della comunicazione, sulla data della pubblicazione, sui commenti, sulle note, sulle riedizioni},
KEYWORDS = {Ferdinand de Saussure, Banca dati bibliografica},
URL = {https://iris.cnr.it/handle/20.500.14243/129374},
CONFERENCE_NAME = {Seminario internazionale Per un'edizione digitale dei manoscritti di Ferdinand de Saussure-Conclusione},
}
@MISC{PIRRELLI_2012_MISC_PV_228594,
AUTHOR = {Pirrelli, V.},
TITLE = {Hebbian Self-Organizing Memories for Lexical Recoding and Processing},
YEAR = {2012},
ABSTRACT = {Hebbian self-organizing memories (Pirrelli et al. 2010, Ferro et al. 2011, Koutnik 2007) can provide a rigorous and testable conceptual framework within which to unify diverse functional hypotheses for lexical acquisition and processing, and to clarify how these hypotheses may be explained computationally. I discuss a few desiderata that any biologically-inspired computational model of the mental lexicon has to meet, and report on how well such desiderata are met by different types of Hebbian self-organizing memories, exhibiting empirically different maturational trends in lexical acquisition},
KEYWORDS = {Self-organising Maps, Memory, Word Processing},
URL = {https://iris.cnr.it/handle/20.500.14243/228594},
CONFERENCE_NAME = {Workshop on Exo-lexical variables in monolingual and bilingual morphological processing, IMM15},
}
@MISC{PIRRELLI_2012_MISC_PV_228538,
AUTHOR = {Pirrelli, V.},
TITLE = {At the core of lexical processing: computational and neurocognitive issues},
YEAR = {2012},
ABSTRACT = {The lexicon lies at the root of our linguistic competence and represents a fundamental interface domain between language and our conceptualisation of the outside world. In traditional conceptions of the language architecture, the lexicon has been generally characterised as a declarative memory store of static building blocks, with rules providing the basic principles and constraints on their on-line procedural combination. The talk deals with some recent computational models of self-organising memories and neuroimaging evidence of the connectivity of the perisylvian network for language processing and working memory located in the left hemisphere of the human brain, to suggest a different conception of the mental lexicon and its role in the architecture of language},
KEYWORDS = {Memory, Mental Lexicon, Neurocognitive correlates},
URL = {http://hnk.ffzg.hr/fassbl2012/},
CONFERENCE_NAME = {8th International Conference Formal Approaches to South Slavic and Balkan Languages (FASSBL-8)},
}
@MISC{PROIETTI_2012_MISC_P_411319,
AUTHOR = {Proietti, C.},
TITLE = {Review of C. Gratton, Infinite regress arguments},
YEAR = {2012},
KEYWORDS = {Infinite regress arguments},
PAGES = {213-217},
URL = {https://iris.cnr.it/handle/20.500.14243/411319},
VOLUME = {4 (1)},
ISSN = {0718-8285},
}
@MISC{SORIA_2012_MISC_S_117855,
AUTHOR = {Soria, C.},
TITLE = {Voices of Italy: a project for the preservation of Italian language diversity},
YEAR = {2012},
URL = {https://iris.cnr.it/handle/20.500.14243/117855},
CONFERENCE_NAME = {Language Endangerment: Methodologies and New Challenges},
}
@MISC{SORIA_2012_MISC_SZ_284000,
AUTHOR = {Soria, C. and Zoli, C.},
TITLE = {New markets for Language Technology for minority languages},
YEAR = {2012},
ABSTRACT = {Language Technology offers significant opportunities for minority languages and can be a major force in addressing and alleviating some of the difficulties they face. For minority languages in particular, speech and language technology are a powerful means to bring together speakers' communities, to have a major impact on language learning support, to promote inclusion of elderly or impaired people and to foster widespread use of a language through digital means. In this talk, we will be presenting first the main outcomes of the research carried out by the META-NET project, resulting in the publication of the White Paper Series "Europe's Languages in the Digital Age". The series, that reports on the state of each European language with respect to Language Technology, offers an updated synthesis of the most urgent risks and chances faced, in particular, by less-serviced languages. The presentation will then provide concrete examples of LT solutions for minority languages, discussing their potential impact on those languages, in particular with regard to their role for language maintenance and preservation in the eyes of the younger, digitally-oriented generation},
KEYWORDS = {Language technology, NLP, minority languages},
URL = {https://iris.cnr.it/handle/20.500.14243/284000},
CONFERENCE_NAME = {3e Symposium sur le Multilinguisme dans le Cyberespace},
}
@MISC{SPADONI_2012_MISC_STLRTSO_122972,
AUTHOR = {Spadoni, F. and Tartarelli, A. and Loparco, L. and Rossi, R. and Tariffi, F. and Sassolini, E. and Ongaro, P.},
TITLE = {SMARTCITY: CUSTOMIZED AND DYNAMIC MULTIMEDIA CONTENT PRODUCTION FOR TOURISM APPLICATIONS},
YEAR = {2012},
ABSTRACT = {This paper presents the final results of the SMARTCITY project, co-funded by the Tuscany Region under the POR CREO 1. d program. The project proposes an innovative methodology as well as advanced technologies enabling professional services for cultural tourism applications in urban areas as well as larger archaeological sites},
KEYWORDS = {Tourism application, Dynamic Multimedia Content Production, Semantic Annotation},
URL = {https://iris.cnr.it/handle/20.500.14243/122972},
}
@MISC{VACCARO_2012_MISC_VGBDLBZ_259607,
AUTHOR = {Vaccaro, G. and Guadagnini, E. and Burgassi, C. and Dotto, D. and Lorenzi, C. and Biondi, C. L. and Zago, A.},
TITLE = {DiVo-Bibliografia filologica (2012)},
YEAR = {2012},
ABSTRACT = {DiVo DB è la bibliografia filologica dei volgarizzamenti medievali dei testi classici e tardo-antichi. Sono compilate delle schede brevi per le opere latine, con informazioni sull'autore, sulla compilazione e sul genere dell'opera, nonché l'identificazione dell'edizione di riferimento (quella inclusa nel corpus DiVo). Le schede dei testi volgari contengono cenni biografici sull'autore del volgarizzamento, la datazione dell'opera, l'identificazione della coloritura linguistica del testo, l'indicazione della tipologia testuale e del genere dell'opera, la catalogazione della tradizione diretta mediante l'elencazione dei testimoni manoscritti e delle stampe antiche, una trattazione filologica della storia della tradizione, l'identificazione dell'edizione di riferimento, un panorama bibliografico sull'opera articolato per punti. A ciascun manoscritto è dedicata una scheda in cui si indicano gli incipit e gli explicit di ciascun manoscritto, le carte in cui l'opera è contenuta, eventuali note e l'informazione sulla visione diretta del manufatto. Si indicano i casi in cui lo studio della tradizione ha mostrato la necessità di controlli più approfonditi della lezione dei manoscritti: gli esiti di tali controlli costituiscono il sistema di note filologiche associato al corpus DiVo},
URL = {https://iris.cnr.it/handle/20.500.14243/259607},
}
@ARTICLE{BARCA_2011_ARTICLE_BFP_180100,
AUTHOR = {Barca, L. and Frascarelli, F. and Pezzulo, G.},
TITLE = {Working memory and Mental Imagery in Cerebral Palsy: A single case investigation},
YEAR = {2011},
ABSTRACT = {In this study we describe visuospatial working memory and visual mental imagery of a child with Cerebral Palsy. Beyond a moderate impairment of visuomotor integration skills, cognitive level and memory span, poor performance emerged in figures reconstruction, in memorizing matrix patterns and movements along a path. No such deficits were observed in recalling figures and their positions on a grid and learning groups of words using a visual imagery strategy. This case highlights that impaired action execution impairs performance in imagery tasks as well, but not when alternative strategies (e.g., verbal encoding) can be adopted. Results are discussed considering recent evidence on working memory and visual imagery links, and their role in motor rehabilitation training},
KEYWORDS = {Cerebral palsy, Visuospatial Working Memory, Visual Imagery, Motor rehabilitation training, Dorsal stream vulnerability},
PAGES = {1-7},
URL = {https://iris.cnr.it/handle/20.500.14243/180100},
NOTE = {iFirst (advance online publication)},
DOI = {10.1080/13554794.2011.588183},
ISSN = {1355-4794},
JOURNAL = {NEUROCASE},
}
@ARTICLE{CARDUCCI_2011_ARTICLE_CASCC_436879,
AUTHOR = {Carducci, A. and Alfani, S. and Sassi, M. and Cinini, A. and Calamusa, A.},
TITLE = {Mass media health information: Quantitative and qualitative analysis of daily press coverage and its relation with public perceptions},
YEAR = {2011},
ABSTRACT = {Objective: This paper describes the methods followed by the Pisa University OCS for collecting, storing and analyzing all health-related articles and database contents. Moreover, an example population survey on the topic of food safety based on such analysis is shown. Methods: Articles published each day since 1999 in Italy's three most popular newspapers are collected and stored in a Data Base Text; on these articles quantitative and qualitative analyses were conducted. On the basis of these results as well as of epidemiological data, a questionnaire survey was carried out about sources of information, knowledge and risk perception of citizens regarding food safety. Results: On a total of 24,434 articles on all health topics, 18% regarded food related hazards: their evolution over time showed peaks on BSE, avian flu and dioxin. A large proportion of the people surveyed declared having changed their food habits, at least temporarily, as a consequence of media information. Most get their information on food safety mainly from television. Most respondents remembered having previously heard news on BSE, avian flu and dioxin, but did not recall having heard of listeriosis, brucellosis or typhoid fever. Conclusions: Newspapers articles facing food related hazards tend to be alarming thus affecting the citizens risk perception. On the other hand people often ignore how to manage their own food safety in a practical way. Practice implications: Analysis of media messages can help to evaluate and correct the negative effects that may result in wrong information},
KEYWORDS = {Risk perception, Food safety, Mass media Communication, Population survey},
PAGES = {475-478},
URL = {http://www.sciencedirect.com/science/article/pii/S0738399111000061},
VOLUME = {82},
NUMBER = {3},
DOI = {10.1016/j.pec.2010.12.025},
ISSN = {0738-3991},
JOURNAL = {PATIENT EDUCATION AND COUNSELING},
}
@ARTICLE{CHERSI_2011_ARTICLE_CFPP_179864,
AUTHOR = {Chersi, F. and Ferro, M. and Pezzulo, G. and Pirrelli, V.},
TITLE = {Time, Language and Action -- A Unified Long-Term Memory Model for Sensory-Motor Chains and Word Schemata},
YEAR = {2011},
ABSTRACT = {Action and language are known to be organized as closely-related brain subsystems. An Italian CNR project implemented a computational neural model where the ability to form chains of goal-directed actions and chains of linguistic units relies on a unified memory architecture obeying the same organizing principles},
PAGES = {27-28},
URL = {http://ercim-news.ercim.eu/images/stories/EN84/EN84-web.pdf},
VOLUME = {84},
ISSN = {0926-4981},
JOURNAL = {ERCIM NEWS},
}
@article{DIDONATO_2011_ARTICLE_D_383741,
  author   = {Di Donato, F.},
  title    = {Les enjeux politiques de l'open access et le système de pouvoir scientifique},
  journal  = {BOLLETTINO TELEMATICO DI FILOSOFIA POLITICA},
  year     = {2011},
  issn     = {1591-4305},
  url      = {https://iris.cnr.it/handle/20.500.14243/383741},
  abstract = {Le sfide politiche dell'open access al sistema tradizionale di comunicazione della ricerca},
}
@article{DIDONATO_2011_ARTICLE_D_383742,
  author   = {Di Donato, F.},
  title    = {Comunicare la cultura: il dibattito sulla repubblica delle lettere nell'illuminismo tedesco},
  journal  = {BOLLETTINO TELEMATICO DI FILOSOFIA POLITICA},
  year     = {2011},
  issn     = {1591-4305},
  url      = {https://iris.cnr.it/handle/20.500.14243/383742},
  abstract = {L'articolo ricostruisce le origini dell'espressione respublica literaria concentrandosi sul dibattito settecentesco sulla repubblica delle lettere in ambito germanico. In particolare, vengono prese in esame e messe a confronto le posizioni di Friedrich Gottlieb Klopstock e di alcune figure di spicco dell'illuminismo tedesco},
}
@ARTICLE{FERRO_2011_ARTICLE_FMP_179921,
AUTHOR = {Ferro, M. and Marzi, C. and Pirrelli, V.},
TITLE = {A Self-Organizing Model of Word Storage and Processing: Implications for Morphology Learning},
YEAR = {2011},
ABSTRACT = {In line with the classical cornerstone of "dual-route" models of word structure, assuming a sharp dissociation between memory and computation, word storage and processing have traditionally been modelled according to different computational paradigms. Even the most popular alternative to dual-route thinking -- connectionist one-route models -- challenged the lexicon-grammar dualism only by providing a neurally-inspired mirror image of classical base-to-inflection rules, while largely neglecting issues of lexical storage. Recent psycho- and neuro-linguistic evidence, however, supports a less deterministic and modular view of the interaction between stored word knowledge and on-line processing. We endorse here such a non modular view on morphology to offer a computer model supporting the hypothesis that they are both derivative of a common pool of principles for memory self-organization},
KEYWORDS = {Lexical Processing, Self Organizing Maps, Morphological Structure, Serial Memory},
PAGES = {209-226},
URL = {http://www.rivisteweb.it/doi/10.1418/35840},
VOLUME = {2},
DOI = {10.1418/35840},
ISSN = {1720-9331},
JOURNAL = {LINGUE E LINGUAGGIO},
}
@article{GUADAGNINI_2011_ARTICLE_G_269014,
  author   = {Guadagnini, E.},
  title    = {Voce MACIGNO s. m. /agg. del Tesoro della Lingua Italiana delle Origini},
  journal  = {TESORO DELLA LINGUA ITALIANA DELLE ORIGINI},
  year     = {2011},
  volume   = {15},
  issn     = {2240-5216},
  url      = {http://tlio.ovi.cnr.it/voci/026385.htm},
  keywords = {Lessico, Lessicografia, Lingua Italiana, Bonvesin da la Riva},
  abstract = {Proposta di un'interpretazione originale di un passo di Bonvesin de la Riva (punto 1. 2. 1 della voce): 1 Tipo di pietra (gen. roccia arenaria) di particolare durezza e resistenza (impiegato come materiale da costruzione e, in partic., per fare macine). 1. 1 [Con rif. alla durezza]. 1. 2 Meton. Blocco di pietra, masso (grezzo o lavorato, impiegato come materiale da costruzione). 2 Agg. Pietra, coperta macigna: di pietra arenaria (dotata di particolare durezza e resistenza). 2. 1 Fig. Caratterizzato da estrema durezza},
}
@article{GUADAGNINI_2011_ARTICLE_G_272423,
  author   = {Guadagnini, E.},
  title    = {Voce FORTE (1) agg. /avv. /s. m. del Tesoro della Lingua Italiana delle Origini},
  journal  = {TESORO DELLA LINGUA ITALIANA DELLE ORIGINI},
  year     = {2011},
  volume   = {15},
  issn     = {2240-5216},
  url      = {http://tlio.ovi.cnr.it/voci/025721.htm},
  keywords = {Lessico, Lessicografia, Lingua Italiana},
  abstract = {Voce fondata su una vasta documentazione (oltre 11. 000 occorrenze nel corpus OVI) e di grande complessità semantica: 1 [Rif. alla prestanza o alla potenza fisica (di una persona, di un animale): ] dotato di un corpo vigoroso; che è in grado di sostenere prove fisiche impegnative, di fornire un notevole sforzo muscolare (puntuale o prolungato nel tempo); che ha doti fisiche superiori alla media. 1. 1 [Rif. esplicitamente alla costituzione fisica: ] di corpo forte; di forte natura; forte del corpo, di natura, della persona: di tempra robusta, di costituzione solida. 1. 2 Sost. Uomo dotato di grande prestanza o potenza fisica. 1. 3 [Rif. alla condizione fisica (potenzialmente mutevole o transitoria) di una persona o di un animale: ] che sta bene, che è in salute, che presenta condizioni fisiche ottimali, non debilitato. 1. 4 Avv. Impiegando (risolutamente) il proprio vigore o le proprie possibilità fisiche. 1. 5 Sost. [Per fraintendimento del lat. o guasto testuale: ] forza fisica, prestanza? 2 [Detto di un oggetto, di un materiale: ] capace di resistere ad uno sforzo, una pressione, una violenza; robusto, solido. 2. 1 [Detto di una costruzione o di un'opera in muratura: ] capace di resistere all'urto o all'attacco (spec. del nemico); fortificato. 2. 2 [Detto di un tessuto o di un oggetto in tessuto: ] resistente, non cedevole, di trama serrata. 2. 3 [Rif. ad oggetti sottoposti a pressioni o forti movimenti: ] che mantiene saldamente la sua posizione, che non è soggetto a cedimenti, cadute o rotture. Stare (bene e) forte, tenersi forte (anche con valore avv.). 3 [Rif. specif. alla capacità, alla possibilità o alla qualità di azione: ] che è in grado di influire o intervenire sensibilmente sul mondo esterno, sugli altri o sul corso degli eventi (modificandoli in virtù delle proprie facoltà, competenze, energie, o della propria posizione ed importanza); dotato di potere o di efficacia. 3. 1 [Come attributo di Dio, Cristo, Maria, di un santo (o rif. 
al loro potere)]. 3. 2 Avv. [Con valore pos., rif. specif. al giovare (fisicamente), al dare conforto (morale): ] efficacemente. 3. 3 Sost. Chi è in grado di imporsi sugli altri (per potere, posizione, caratteristiche fisiche o morali). 3. 4 Forte a qsa: che ha i requisiti, le qualità o le competenze necessarie per adempiere un det. compito, affrontare una det. situazione o reagire correttamente ad un det. stimolo; idoneo, atto o capace (fisicamente o moralmente) a qsa. 3. 5 [Detto di un farmaco: ] che agisce vigorosamente, influendo sensibilmente sul fisico (risultando efficace, ma anche gravoso da sopportare). 3. 6 [Detto di una tentazione: ] che ha il potere (quasi irresistibile) di indurre ad un det. comportamento. 3. 7 [Detto di un argomento: ] che è stabilito su basi solide e certe, che si sviluppa in modo convincente, che raggiunge o induce a conclusioni sicure; fondato, valido. 3. 8 [Con rif. ad una situazione di opposizione o di scontro (spec. militare), detto di un contendente o del suo intervento: ] dotato di vigore ed efficacia (spec. offensiva), atto e pronto a combattere validamente. 3. 9 [Detto di una legge, un processo o un provvedimento giudiziario: ] che esprime una posizione rigorosa e prevede una sanzione o una punizione severa. 3. 10 Sost. Abilità (di poeta), maestria. 4 [Detto specif. di un elemento o un fenomeno naturale: ] che ha caratteristiche o assume un'intensità tale da influire sensibilmente sulle condizioni ambientali (modificandole e spec. rendendole difficili per le persone; anche in contesti fig.). 4. 1 Avv. 5 [Detto di una persona, con rif. alla sua qualità morale: ] che agisce governando e forgiando la sua natura, il suo temperamento, la sua volontà e il suo comportamento in conformità alla norma morale; che non cede all'avversità, agli ostacoli, al dolore, alla tentazione, alla provocazione o al vizio e si mantiene saldo nei suoi principi e coerente nei suoi comportamenti; che ha e dimostra grandezza d'animo. 5. 1 [Rif. specif. 
all'animo]. 5. 2 Sost. Chi non cede alle avversità, agli ostacoli, alle tentazioni e mantiene il controllo di sé e un comportamento retto. 6 Che esige sforzo, impegno (fisico o morale) o abilità per essere affrontato, sopportato o superato; difficile, duro. 6. 1 Forte a, forte cosa a (una det. azione, espressa dall'inf. verbale): che richiede sforzo e impegno per un fine det. e esplicito. 6. 2 [Con valore neg.: ] avverso e ostile; crudele. 6. 3 [Detto di una prova fisica (spec. una pena, un martirio): ] che risulta debilitante e doloroso per il fisico. 6. 4 [Detto di un luogo fisico: ] che è difficilmente raggiungibile, accessibile o transitabile; impervio, malagevole. 6. 5 [Rif. ad un discorso, un modo di parlare, un concetto: ] che richiede un particolare impegno per essere compreso o interpretato. 6. 6 Sost. Difficoltà. 7 Che si distingue (e richiama l'attenzione) per l'eccezionalità delle sue caratteristiche; che non è usuale, ordinario, normale (per il suo aspetto, per le sue proprietà o la modalità con cui si manifestano). 7. 1 Parere forte (a qno): risultare esagerato o improprio (nella valutazione di qno), provocando sorpresa o sconcerto. 7. 2 Che si verifica raramente e con difficoltà; che ha scarse possibilità di attuazione o di successo. 8 [Con valore generic. intensivo, definisce la consistenza dell'oggetto a cui si riferisce: ] che costituisce o manifesta un grado pieno, intenso, abbondante, compiuto, notevole (in pos. o in neg.). 8. 1 Avv. In modo pieno, intenso, notevole; grandemente, tanto, molto. 8. 2 [Detto di una malattia o di un malore: ] che si manifesta in grado acuto, grave. 8. 3 [Detto di una ferita: ] profonda. 8. 4 [Detto del sonno, del dormire: ] pesante, profondo (tanto da non interrompersi facilmente). 8. 5 [Rif. specif. all'intensità di un suono: ] ad alto volume, rumoroso. 8. 6 [Detto dell'età: ] pienamente matura. 8. 7 [Detto di un odore: ] penetrante (spec. in senso neg.). 8. 
8 [Detto del pensare o dell'immaginare: ] che si applica intensamente a qsa (senza occuparsi d'altro, senza distrarsi) producendone una rappresentazione vivida, profonda, che rimane ben presente alla mente o alla memoria. 9 [Rif. specif. ad unità di misura (spec. in relazione a metalli): ] pesante, di peso elevato (o maggiore di qsa altro). 9. 1 [Numism. ] [Detto di una moneta: ] pesante (e dunque di maggior valore). 10 [Detto di una spezia o di una pietanza: ] particolarmente saporito, piccante. 10. 1 [Detto del vino: ] ad alta gradazione alcolica. 10. 2 [Detto specif. dell'olio (in opp. a dolce): ] robusto. 11 [Rif. ad un movimento o alla capacità di movimento: ] che procede a velocità elevata (o ne ha la possibilità), rapido. 11. 1 [Detto del polso, del battito del cuore: ] accelerato, che batte velocemente (più del normale). 12 [Detto di un terreno: ] che si presenta compatto e resistente (specif. per la sua natura argillosa)},
}
@article{GUADAGNINI_2011_ARTICLE_G_275400,
  author   = {Guadagnini, E.},
  title    = {Scelta di voci del Tesoro della Lingua Italiana delle Origini (quindicesima serie)},
  journal  = {BOLLETTINO-OPERA DEL VOCABOLARIO ITALIANO},
  year     = {2011},
  volume   = {16},
  pages    = {15-265},
  issn     = {1591-8254},
  url      = {https://iris.cnr.it/handle/20.500.14243/275400},
  keywords = {Lessico, Lessicografia, Lingua Italiana},
  abstract = {Voci image s. f. /s. m., imago s. f., incantamento s. m., incantante s. m., incantare (1) v., incantare (2) v., incantato (1) agg. /s. m., incantato (2) agg., incantatore s. m. /agg., incantatrice s. f., incantatura s. f., incantazione (1) s. f., incantazione (2) s. f., incanteressa s. f., incantésimo s. m., incantévole agg., incanto (1) s. m., incanto (2) s. m., maceramento s. m., macerare v., macerato agg., macerazione s. f., maceria s. f., màcero (1) agg., màcero (2) s. m., macrocosmo s. m., megacosmo s. m., microcosmo s. m., romanzare v., romanziere s. m., romanzo s. m., sofisma s. m. /s. f., sofismàtico s. m., sofismosamente avv., sofista agg. /s. m., sofistica (1) s. f., sofisticamente avv., sofisticare v., sofisticatamente avv., sofisticato agg., sofisticazione s. f., sofìstico agg. /s. m. del Tesoro della Lingua Italiana delle Origini (pp. 175-193, 200-208, 235-237, 249-256)},
}
@article{GUADAGNINI_2011_ARTICLE_G_273021,
  author   = {Guadagnini, E.},
  title    = {«Magi» in italiano antico. Note lessicografiche e qualche considerazione su un'occorrenza petrarchesca (RVF 213, 14)},
  journal  = {MEDIOEVO LETTERARIO D'ITALIA},
  year     = {2011},
  volume   = {8},
  pages    = {109-121},
  issn     = {1724-9090},
  url      = {https://iris.cnr.it/handle/20.500.14243/273021},
  keywords = {Lessico, Lessicografia, Lingua Italiana, Petrarca},
  abstract = {Il lavoro propone un censimento delle occorrenze del termine image 'immagine' nei testi italiani antichi. In particolare, si riconduce a tale lemma la forma aferetica del plurale "magi", mai identificata in precedenza ma attestata nel trattato metrico di Gidino da Sommacampagna, in un sonetto di Niccolò de' Rossi e probabilmente in un anonimo poemetto lombardo. Si discute inoltre la possibilità che un'attestazione petrarchesca della forma "magi" (RVF 213, 14) sia anch'essa da interpretarsi come occorrenza di "image"},
}
@article{GUADAGNINI_2011_ARTICLE_G_272222,
  author   = {Guadagnini, E.},
  title    = {Voce RITMO s. m. del Tesoro della Lingua Italiana delle Origini},
  journal  = {TESORO DELLA LINGUA ITALIANA DELLE ORIGINI},
  year     = {2011},
  volume   = {15},
  issn     = {2240-5216},
  url      = {http://tlio.ovi.cnr.it/voci/026403.htm},
  keywords = {Lessico, Lessicografia, Lingua Italiana, Cavalcanti},
  abstract = {Tecnicismo metrico (con una nota linguistica in 0. 5). Assieme alle voci "arismo" e "orismo" fornisce un quadro delle diverse soluzioni filologiche proposte per un passo controverso di Guido Cavalcanti. 1 [Metr. ] Segmento testuale che si costituisce come unità (all'interno di un testo) e si fonda su una struttura che regola il numero delle sillabe, la posizione degli accenti (e specif. dell'ultimo accento tonico) ed eventualmente la sequenza fonica successiva all'ultimo accento tonico; lo stesso che verso. Unità composta da una det. sequenza di versi (gen. la terzina). 1. 1 [Come unità di composizione specif. volgare (in opp. al cursus o ai "versi" del lat.)]. 1. 2 [Metr. ] Meton. Testo in versi. 2 [Metr. ] Lo stesso che rima? 3 [Titolo di un'opera di Avicenna]},
}
@article{GUADAGNINI_2011_ARTICLE_G_272216,
  author   = {Guadagnini, E.},
  title    = {Voce ORISMO s. m. del Tesoro della Lingua Italiana delle Origini},
  journal  = {TESORO DELLA LINGUA ITALIANA DELLE ORIGINI},
  year     = {2011},
  volume   = {15},
  issn     = {2240-5216},
  url      = {http://tlio.ovi.cnr.it/voci/026393.htm},
  keywords = {Lessico, Lessicografia, Lingua Italiana, Cavalcanti},
  abstract = {Assieme alle voci "arismo" e "ritmo" fornisce un quadro delle diverse soluzioni filologiche proposte per un passo controverso di Guido Cavalcanti},
}
@article{GUADAGNINI_2011_ARTICLE_G_272238,
  author   = {Guadagnini, E.},
  title    = {Voce MAGO s. m. /agg. del Tesoro della Lingua Italiana delle Origini},
  journal  = {TESORO DELLA LINGUA ITALIANA DELLE ORIGINI},
  year     = {2011},
  volume   = {15},
  issn     = {2240-5216},
  url      = {http://tlio.ovi.cnr.it/voci/027442.htm},
  keywords = {Lessico, Lessicografia, Lingua Italiana},
  abstract = {Voce interessante dal punto di vista storico-culturale (con un approfondimento sulla caratterizzazione dei "re magi"); punto di partenza per la preparazione dell'articolo in rivista "Magi in italiano antico" (Medioevo lett. Ital. 8). 1 Persona capace di produrre, mediante speciali formule e rituali (gen. di natura esoterica), effetti straordinari, apparentemente in contrasto con le leggi naturali e non giustificabili razionalmente; persona in grado di esercitare particolari poteri partecipando delle forze occulte immanenti alla natura (segnatamente le forze demoniache). 1. 1 [Appellativo del Simone che tentò di acquistare da Pietro il potere di amministrare lo Spirito Santo (Atti degli Apostoli)]. 2 Aristocratico persiano appartenente alla casta dei sacerdoti del culto di Zoroastro. Estens. Regnante persiano. 2. 1 Plur. I tre sapienti orientali che seguendo la stella cometa si recarono a Betlemme per adorare Gesù Cristo appena nato. 3 Agg. Lo stesso che magico. Arte maga, arti maghe: magia},
}
@article{GUADAGNINI_2011_ARTICLE_G_269021,
  author   = {Guadagnini, E.},
  title    = {Voce SEME (1) s. m. /s. f. /avv. del Tesoro della Lingua Italiana delle Origini},
  journal  = {TESORO DELLA LINGUA ITALIANA DELLE ORIGINI},
  year     = {2011},
  volume   = {15},
  issn     = {2240-5216},
  url      = {http://tlio.ovi.cnr.it/voci/026094.htm},
  keywords = {Lessico, Lessicografia, Lingua Italiana},
  abstract = {Ampio ventaglio semantico. 1 Parte della pianta (gen. di forma tondeggiante e poco cedevole al tatto) che, germogliata, ne assicura la riproduzione. 1. 1 Fras. A seme di papaveri, di papavero: in grande quantità. 1. 2 [Con valore collettivo: ] l'insieme dei semi da seminare o seminati. 1. 3 [Per indicare collettivamente i cereali coltivati a fine alimentare]. 1. 4 [Rif. a semi usati per scopi diversi dalla coltivazione, specif. in ambito gastronomico o farmaceutico]. 1. 5 [Rif. estens. a ciò che fa nascere qsa altro: ] uovo (fecondato). 1. 6 [In contesto o con valore fig., per indicare ciò che è causa o origine (di qsa)]. 1. 7 [Considerato come il prodotto della pianta (anche fig.)]. 2 Liquido organico maschile (dell'uomo, di animali o di entità antropomorfe) responsabile della fecondazione, sperma. 2. 1 Meton. Figlio. Estens. Stirpe, discendenza. 2. 2 [Detto degli ovuli femm., equiparati tipologicamente al liquido seminale masch. ]. 3 [Generic., per opporre gli organismi viventi (vegetali e animali) agli oggetti inanimati: ] corpo riproduttivo. Produrre con seme, senza seme. 4 [Agr. ] Operazione di semina. Estens. Coltivazione (della terra); anche fig. 4. 1 [Detto di det. quantità di cereali o ortaggi, di cui si esplicita l'utilizzo per coltura: ] per seme. 4. 2 [Detto di det. varietà di cereale o di ortaggio: ] locuz. agg. Da seme: che si coltiva specif. per raccoglierne il seme. Grano da seme. 5 [Associato ad una misura di superficie: ] quantità di semi necessaria a seminare una det. porzione di terreno. 6 Avv. Poco. [Spec. in frasi neg.: ] per niente, niente affatto},
}
@article{GUADAGNINI_2011_ARTICLE_G_272209,
  author   = {Guadagnini, E.},
  title    = {Voce ARISMO s. m. del Tesoro della Lingua Italiana delle Origini},
  journal  = {TESORO DELLA LINGUA ITALIANA DELLE ORIGINI},
  year     = {2011},
  volume   = {15},
  issn     = {2240-5216},
  url      = {http://tlio.ovi.cnr.it/voci/026312.htm},
  keywords = {Lessico, Lessicografia, Lingua Italiana, Cavalcanti},
  abstract = {Assieme alle voci "orismo" e "ritmo" fornisce un quadro delle diverse soluzioni filologiche proposte per un passo controverso di Guido Cavalcanti},
}
@ARTICLE{GUADAGNINI_2011_ARTICLE_GV_241057,
AUTHOR = {Guadagnini, E. and Vaccaro, G.},
TITLE = {Qui dice Tullio, qui parla lo sponitore. Il lessico retorico nei volgarizzamenti ciceroniani},
YEAR = {2011},
ABSTRACT = {This work examines the rhetorical terminology that derives from Cicero, that is to say the one that is found in the medieval treatises of the XIII and XIV centuries, directly based on De inventione and -- because of the traditional attribution -- on the Rhetorica ad Herennium. From a general point of view, we register a tendency of freeing from Latin, put into effect through fully vulgar reformulations of the verbs, while the loans for nouns are more common. Also in the case of nouns, however, we observe sometimes interesting attempts of reformulation and resorting to serial linguistic elements, like the suffix -mento, significant clue of linguistic technicization},
PAGES = {5-21},
URL = {https://iris.cnr.it/handle/20.500.14243/241057},
VOLUME = {28},
ISSN = {0392-5218},
JOURNAL = {STUDI DI LESSICOGRAFIA ITALIANA},
}
@ARTICLE{MARZI_2011_ARTICLE_MPS_224009,
AUTHOR = {Marzi, C. and Pardelli, G. and Sassi, M.},
TITLE = {A terminology based re-definition of Grey Literature},
YEAR = {2011},
ABSTRACT = {The conventionally accepted definition of Grey Literature, as Information produced and distributed by non-commercial publishing, does not take into consideration either the increasing availability of forms of grey knowledge, or the growing importance of computer-based encoding and management as the standard mode of creating and developing grey literature. Semi-automated terminological analysis of almost twenty years of terminological creativity in the proceedings of eleven GL International Conferences offers the opportunity to pave the way to a bottom-up redefinition of Grey Literature stemming from attested terminological creativity and lexical innovation. In this paper, we focus on a set of automatically-acquired terms obtained by subjecting our reference Corpus to a number of pre-processing steps of automated text analysis, such as concordances, frequency lists and lexical association scores. Acquired terms allow us to throw in sharp relief developing trends and important shifts of emphasis in the current understanding of the notion of Grey Literature},
KEYWORDS = {Grey Literature, Terminology extraction},
PAGES = {19-23},
URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-84869064979\&origin=inward},
VOLUME = {7},
NUMBER = {1},
ISSN = {1574-1796},
JOURNAL = {THE GREY JOURNAL},
}
% NOTE(review): the exported title and abstract had "?" in place of transliteration
% diacritics and of the ligatures in "This" / "tra". The characters below are a
% reconstruction and should be verified against the published article (see URL).
@ARTICLE{NAHLI_2011_ARTICLE_N_222328,
AUTHOR = {Nahli, O.},
TITLE = {Yaḥyā ibn ʿAdī sulla differenza tra la logica greca e la grammatica araba},
YEAR = {2011},
ABSTRACT = {This paper examines the Treatise on the Difference between the two fields of philosophical logic and Arabic grammar (Maqāla fī tabyīn al-faṣl bayna ṣina'atay al-manṭiq al-falsafī wa-l-naḥw al-'arabī) by Abū Zakariyā' Yaḥyā ibn 'Adī, providing also its Italian translation. It will appear that Yaḥyā ibn 'Adī's approach is based on Fārābī's ideas about the relationship between logic and the sciences of language. Even more important is the fact that the difference established by Yaḥyā ibn 'Adī's between logic and grammar both as for the subject (mawḍū') and as for scope (ġarad) counts as the source for Avicenna's distinction between subject (mawḍū') and scope (ġarad) of the metaphysics},
PAGES = {47-67},
URL = {http://www.greekintoarabic.eu/uploads/media/3wafae_utlimo.pdf},
VOLUME = {1},
ISSN = {2239-012X},
JOURNAL = {STUDIA GRAECO-ARABICA},
}
@ARTICLE{PEZZULO_2011_ARTICLE_P_179888,
AUTHOR = {Pezzulo, G.},
TITLE = {Grounding Procedural and Declarative Knowledge in Sensorimotor Anticipation},
YEAR = {2011},
ABSTRACT = {We propose a view of embodied representations that is alternative to both symbolic/linguistic approaches and purely sensorimotor views of cognition, and can account for procedural and declarative knowledge manipulation. In accordance with recent evidence in cognitive neuroscience and psychology, we argue that anticipatory and simulative mechanisms, which arose during evolution for action control and not for cognition, determined the first form of representational content and were exapted for increasingly sophisticated cognitive uses. In particular, procedural and declarative forms of knowledge can be explained, respectively, in terms of on-line sensorimotor anticipation and off-line simulations of potential actions, which can give access to tacit knowledge and make it explicit. That is, mechanisms that evolved for the on-line prediction of the consequences of one's own actions (i.e. forward models) determine a (procedural) form of representation, and became exapted for off-line use. They can therefore be used to produce (declarative) knowledge of the world, by running a simulation of the action that would produce the relevant information. We conclude by discussing how embodied representations afford a form of internal manipulation that can be described as internalized situated action},
KEYWORDS = {anticipation, simulation, representation, internal model, grounding},
PAGES = {78-114},
URL = {https://iris.cnr.it/handle/20.500.14243/179888},
VOLUME = {26},
NUMBER = {1},
ISSN = {0268-1064},
JOURNAL = {MIND \& LANGUAGE},
}
@ARTICLE{PEZZULO_2011_ARTICLE_PBCN_10218,
AUTHOR = {Pezzulo, G. and Baldassarre, G. and Cesta, A. and Nolfi, S.},
TITLE = {Research on Cognitive Robotics at the Institute of Cognitive Sciences and Technologies, National Research Council of Italy},
YEAR = {2011},
ABSTRACT = {ISTC-CNR is a research hub in cognitive robotics as this is the main research focus of several research labs working within it. The interdisciplinary approach used is one of the key characteristics of cognitive robotics studies at ISTC-CNR. This research involves over 30 people (among researchers, Post-Docs, and PhD students) having different backgrounds (ranging from engineering and computer science to psychology, neuroscience, and philosophy) and pursuing research objectives as diverse as (a) the use of computational and robotic models to investigate psychological and neural phenomena, (b) the realization of novel paradigms for robot learning, control, planning, decision making, team making, and human-robot interaction, and (c) the delivery of novel autonomous robotic technologies that act in real-world scenarios},
KEYWORDS = {Cognitive Robotics, Cognitive Systems},
PAGES = {367-374},
URL = {https://iris.cnr.it/handle/20.500.14243/10218},
VOLUME = {12},
DOI = {10.1007/s10339-011-0402-3},
ISSN = {1612-4782},
JOURNAL = {COGNITIVE PROCESSING},
}
@ARTICLE{PEZZULO_2011_ARTICLE_PBCFMS_175341,
AUTHOR = {Pezzulo, G. and Barsalou, L. W. and Cangelosi, A. and Fischer, M. H. and McRae, K. and Spivey, M. J.},
TITLE = {The mechanics of embodiment: A dialogue on embodiment and computational modeling},
YEAR = {2011},
ABSTRACT = {Embodied theories are increasingly challenging traditional views of cognition by arguing that conceptual representations that constitute our knowledge are grounded in sensory and motor experiences, and processed at this sensorimotor level, rather than being represented and processed abstractly in an amodal conceptual system. Given the established empirical foundation, and the relatively underspecified theories to date, many researchers are extremely interested in embodied cognition but are clamoring for more mechanistic implementations. What is needed at this stage is a push toward explicit computational models that implement sensorimotor grounding as intrinsic to cognitive processes. In this article, six authors from varying backgrounds and approaches address issues concerning the construction of embodied computational models, and illustrate what they view as the critical current and next steps toward mechanistic theories of embodiment. The first part has the form of a dialog between two fictional characters: Ernest, the "experimenter," and Mary, the "computational modeler." The dialog consists of an interactive sequence of questions, requests for clarification, challenges, and (tentative) answers, and touches the most important aspects of grounded theories that should inform computational modeling and, conversely, the impact that computational modeling could have on embodied theories. The second part of the article discusses the most important open challenges for embodied computational modeling},
KEYWORDS = {grounded cognition, embodiment, simulation, cognitive robotics, computational modeling},
PAGES = {1-21},
URL = {http://www.frontiersin.org/cognition/10.3389/fpsyg.2011.00005/abstract},
VOLUME = {2},
NUMBER = {5},
DOI = {10.3389/fpsyg.2011.00005},
ISSN = {1664-1078},
JOURNAL = {FRONTIERS IN PSYCHOLOGY},
}
@ARTICLE{PEZZULO_2011_ARTICLE_PC_175345,
AUTHOR = {Pezzulo, G. and Calvi, G.},
TITLE = {Computational explorations of perceptual symbol system theory},
YEAR = {2011},
ABSTRACT = {The aim of this paper is twofold. First, we provide a methodological pathway from theories of situated, embodied cognition to simulations with an eye to empirical evidence, and suggest a possible cross-fertilization between cognitive robotics and psychology. Psychological theories, in particular those formulated at an abstract level, include models which are often severely underspecified at the level of mechanisms. This is true in the synchronic, constructive perspective (how can the effects observed in experiments be concretely generated by the model's mechanisms?) and in the diachronic, developmental perspective (how can such mechanisms be learned and developed?). The synthetic method of artificial cognitive systems research, and in particular of cognitive robotics, can complement research in psychology (and neurosciences) by exploring the constructive and developmental aspects of theories. Our second aim is to provide an example of such a methodology by describing simulations aiming at developing a perceptual symbol system (PSS) (Barsalou, 1999). We then describe the two main theoretical constructs of the PSS, perceptual symbols and simulators, illustrate their development in an artificial system, and test the system in prediction, categorization, and abstraction tasks},
KEYWORDS = {Perceptual symbol system, Schema, Embodiment, Anticipation, Simulation},
PAGES = {275--297},
URL = {http://www.sciencedirect.com/science/article/pii/S0732118X09000336},
VOLUME = {29},
NUMBER = {3},
DOI = {10.1016/j.newideapsych.2009.07.004},
ISSN = {0732-118X},
JOURNAL = {NEW IDEAS IN PSYCHOLOGY},
}
@ARTICLE{PEZZULO_2011_ARTICLE_PD_179908,
AUTHOR = {Pezzulo, G. and Dindo, H.},
TITLE = {What should I do next? Using shared representations to solve interaction problems},
YEAR = {2011},
ABSTRACT = {Studies on how "the social mind" works reveal that cognitive agents engaged in joint actions actively estimate and influence another's cognitive variables, and form shared representations with them. (How) do shared representations enhance coordination? In this paper we provide a probabilistic model of joint action that emphasizes how shared representations help solving interaction problems. We focus on two aspects of the model. First, we discuss how shared representations permit to coordinate at the level of cognitive variables (beliefs, intentions and actions), and determine a coherent unfolding of execution and predictive processes in the brains of two agents. Second, we discuss the importance of signaling actions as part of a strategy for sharing representations and the active guidance of another's actions towards the achievement of a joint goal. Furthermore, we present data from a human-computer experiment (the Tower Game) in which two agents (human and computer) have to build together a tower made of colored blocks, but only the human knows the constellation of the tower to be built (e.g., red-blue-red-blue-...). We report evidence that humans use signaling strategies that take another's uncertainty into consideration, and that in turn our model is able to use humans' actions as cues to "align" its representations and to select complementary actions},
KEYWORDS = {prediction, joint action, signaling},
PAGES = {613--630},
URL = {https://iris.cnr.it/handle/20.500.14243/179908},
VOLUME = {211},
DOI = {10.1007/s00221-011-2712-1},
ISSN = {1432-1106},
JOURNAL = {EXPERIMENTAL BRAIN RESEARCH (INTERNET)},
}
@ARTICLE{PEZZULO_2011_ARTICLE_PR_179915,
AUTHOR = {Pezzulo, G. and Rigoli, F.},
TITLE = {The value of foresight: how prospection affects decision-making},
YEAR = {2011},
ABSTRACT = {Traditional theories of decision-making assume that utilities are based on the intrinsic value of outcomes; in turn, these values depend on associations between expected outcomes and the current motivational state of the decision-maker. This view disregards the fact that humans (and possibly other animals) have prospection abilities, which permit anticipating future mental processes and motivational and emotional states. For instance, we can evaluate future outcomes in light of the motivational state we expect to have when the outcome is collected, not (only) when we make a decision. Consequently, we can plan for the future and choose to store food to be consumed when we expect to be hungry, not immediately. Furthermore, similarly to any expected outcome, we can assign a value to our anticipated mental processes and emotions. It has been reported that (in some circumstances) human subjects prefer to receive an unavoidable punishment immediately, probably because they are anticipating the dread associated with the time spent waiting for the punishment. This article offers a formal framework to guide neuroeconomic research on how prospection affects decision-making. The model has two characteristics. First, it uses model-based Bayesian inference to describe anticipation of cognitive and motivational processes. Second, the utility-maximization process considers these anticipations in two ways: to evaluate outcomes (e.g., the pleasure of eating a pie is evaluated differently at the beginning of a dinner, when one is hungry, and at the end of the dinner, when one is satiated), and as outcomes having a value themselves (e.g., the case of dread as a cost of waiting for punishment). By explicitly accounting for the relationship between prospection and value, our model provides a framework to reconcile the utility-maximization approach with psychological phenomena such as planning for the future and dread},
KEYWORDS = {prediction, prospection, decision-making},
PAGES = {1--15},
URL = {http://www.frontiersin.org/decision_neuroscience/10.3389/fnins.2011.00079/abstract},
VOLUME = {5},
DOI = {10.3389/fnins.2011.00079},
ISSN = {1662-453X},
JOURNAL = {FRONTIERS IN NEUROSCIENCE (ONLINE)},
}
@ARTICLE{THOMPSON_2011_ARTICLE_TMMCDLMMPQRSVRA_175344,
AUTHOR = {Thompson, P. and McNaught, J. and Montemagni, S. and Calzolari, N. and Del Gratta, R. and Lee, V. and Marchi, S. and Monachini, M. and Pezik, P. and Quochi, V. and Rupp, C. and Sasaki, Y. and Venturi, G. and Rebholz-Schuhmann, D. and Ananiadou, S.},
TITLE = {The BioLexicon: a large-scale terminological resource for biomedical text mining},
YEAR = {2011},
ABSTRACT = {Background: Due to the rapidly expanding body of biomedical literature, biologists require increasingly sophisticated and efficient systems to help them to search for relevant information. Such systems should account for the multiple written variants used to represent biomedical concepts, and allow the user to search for specific pieces of knowledge (or events) involving these concepts, e.g., protein-protein interactions. Such functionality requires access to detailed information about words used in the biomedical literature. Existing databases and ontologies often have a specific focus and are oriented towards human use. Consequently, biological knowledge is dispersed amongst many resources, which often do not attempt to account for the large and frequently changing set of variants that appear in the literature. Additionally, such resources typically do not provide information about how terms relate to each other in texts to describe events. Results: This article provides an overview of the design, construction and evaluation of a large-scale lexical and conceptual resource for the biomedical domain, the BioLexicon. The resource can be exploited by text mining tools at several levels, e.g., part-of-speech tagging, recognition of biomedical entities, and the extraction of events in which they are involved. As such, the BioLexicon must account for real usage of words in biomedical texts. In particular, the BioLexicon gathers together different types of terms from several existing data resources into a single, unified repository, and augments them with new term variants automatically extracted from biomedical literature. Extraction of events is facilitated through the inclusion of biologically pertinent verbs (around which events are typically organized) together with information about typical patterns of grammatical and semantic behaviour, which are acquired from domain-specific texts. In order to foster interoperability, the BioLexicon is modelled using the Lexical Markup Framework, an ISO standard. Conclusions: The BioLexicon contains over 2.2 M lexical entries and over 1.8 M terminological variants, as well as over 3.3 M semantic relations, including over 2 M synonymy relations. Its exploitation can benefit both application developers and users. We demonstrate some such benefits by describing integration of the resource into a number of different tools, and evaluating improvements in performance that this can bring},
KEYWORDS = {Text Mining, Information Extraction, Computational Lexicon},
PAGES = {1--29},
URL = {http://www.biomedcentral.com/1471-2105/12/397},
VOLUME = {12},
NUMBER = {397},
DOI = {10.1186/1471-2105-12-397},
ISSN = {1471-2105},
JOURNAL = {BMC BIOINFORMATICS},
}
@ARTICLE{VALENZA_2011_ARTICLE_VPAFSD_559026,
AUTHOR = {Valenza, G. and Pioggia, G. and Armato, A. and Ferro, M. and Scilingo, E. P. and De Rossi, D.},
TITLE = {A neuron-astrocyte transistor-like model for neuromorphic dressed neurons},
YEAR = {2011},
ABSTRACT = {Experimental evidences on the role of the synaptic glia as an active partner together with the bold synapse in neuronal signaling and dynamics of neural tissue strongly suggest to investigate on a more realistic neuron-glia model for better understanding human brain processing. Among the glial cells, the astrocytes play a crucial role in the tripartite synapsis, i.e. the dressed neuron. A well-known two-way astrocyte-neuron interaction can be found in the literature, completely revising the purely supportive role for the glia. The aim of this study is to provide a computationally efficient model for neuron-glia interaction. The neuron-glia interactions were simulated by implementing the Li-Rinzel model for an astrocyte and the Izhikevich model for a neuron. Assuming the dressed neuron dynamics similar to the nonlinear input-output characteristics of a bipolar junction transistor, we derived our computationally efficient model. This model may represent the fundamental computational unit for the development of real-time artificial neuron-glia networks opening new perspectives in pattern recognition systems and in brain neurophysiology. © 2011 Elsevier Ltd},
KEYWORDS = {Astrocyte, Neuron, Neuron-astrocyte interaction model, Synapse},
PAGES = {679--685},
URL = {https://iris.cnr.it/handle/20.500.14243/559026},
VOLUME = {24},
NUMBER = {7},
DOI = {10.1016/j.neunet.2011.03.013},
ISSN = {0893-6080},
JOURNAL = {NEURAL NETWORKS},
}
@ARTICLE{VENTURI_2011_ARTICLE_V_279141,
AUTHOR = {Venturi, G.},
TITLE = {Semantic annotation of Italian legal texts: a FrameNet-based approach},
YEAR = {2011},
PAGES = {46--79},
URL = {https://iris.cnr.it/handle/20.500.14243/279141},
VOLUME = {3},
NUMBER = {1},
DOI = {10.1075/cf.3.1.02ven},
ISSN = {1876-1933},
JOURNAL = {CONSTRUCTIONS AND FRAMES},
}
@BOOK{RATTI_2011_BOOK_RMOM_279036,
AUTHOR = {Ratti, D. and Marconi, L. and Oyee, J. B. and Mosuy, P. N.},
TITLE = {Diccionario Fang-Español Español-Fang},
YEAR = {2011},
ABSTRACT = {Un diccionario es un libro que habla de las palabras, que explica el sentido de las palabras, no es un libro que se lee como un cuento, sino un libro que se abre para buscar información, para aclarar dudas, para saber cómo se dice en fang o en español una determinada palabra. Un diccionario bilingüe además explica el sentido de la palabra de una lengua a la otra y funciona como instrumento para aprender a comunicarse en una lengua nueva y también para afianzar el conocimiento de su propia lengua. Este diccionario tiene la ambición de representar, como lengua escrita, las dos variedades del fang de Guinea, el oka y el ntumu, y contiene 8773 entradas repartidas en 3531 comunes a oka y ntumu, 2690 entradas solo del oka y 2552 solo del ntumu. Además, se presenta como un instrumento de fácil consulta, tanto para los hablantes de fang, como para todo el que quiera aprenderlo. Para la realización de esta obra se han tenido que tomar muchas opciones en el ámbito de la ortografía, de las entradas, de la clasificación de las palabras, de las definiciones, etc., y, por lo tanto, este diccionario se propone como una hipótesis que los hablantes de Guinea y los académicos nativos podrán y tendrán que corregir. El uso de la lengua a lo largo del tiempo sancionará la validez de las reglas y las convenciones o determinará cómo cambiarlas. El conocimiento de cualquier fenómeno no viene dado por la solución de cualesquiera dudas o experiencias, sino por el desarrollo o la negación de lo que ya se conoce: nunca se pasa de la perfecta ignorancia al perfecto conocimiento. El diccionario está dividido en dos partes, la primera contiene las palabras fang como entrada y la traducción española. La segunda parte contiene las palabras españolas con la correspondiente traducción en fang},
KEYWORDS = {dizionario, lingua fang, spagnolo},
PAGES = {1148},
URL = {https://iris.cnr.it/handle/20.500.14243/279036},
PUBLISHER = {2CT Asociación para la Conservación de la Cultura tribal (Pieve Ligure, ITA)},
ISBN = {978-88-906102-0-2},
CONFERENCE_PLACE = {Pieve Ligure},
}
@INCOLLECTION{BOZZI_2011_INCOLLECTION_BD_228537,
AUTHOR = {Bozzi, A. and Del Grosso, A. M.},
TITLE = {Progettazione, sviluppo e gestione di una infrastruttura filologico-computazionale per la produzione, interrogazione e pubblicazione sul web di documenti digitali},
YEAR = {2011},
ABSTRACT = {L'obiettivo precipuo della ricerca è stato quello di favorire lo studio nonché la diffusione di dati, informazioni e lavori scientifici tramite supporti tecnologici, relativi al concetto di "migrazione" in ambito linguistico e culturale. Verrà offerto un lavoro di analisi e specifica dei requisiti, di progettazione, d'implementazione e di manutenzione, di una serie di componenti che andranno a formare la piattaforma tecnologica in grado di favorire lo studio dei testi indicati nelle linee e negli obiettivi di ricerca},
KEYWORDS = {filologia computazionale, piattaforma web},
PAGES = {339--369},
URL = {https://iris.cnr.it/handle/20.500.14243/228537},
PUBLISHER = {McGraw-Hill (Milano, ITA)},
ISBN = {978-88-386-7296-5},
CONFERENCE_PLACE = {Milano},
BOOKTITLE = {Percorsi migranti},
EDITOR = {Bruno, G. C. and Caruso, I. and Sanna, M. and Vellecco, I.},
}
@INCOLLECTION{CALZOLARI_2011_INCOLLECTION_C_279904,
AUTHOR = {Calzolari, N.},
TITLE = {Linguistica Computazionale e Risorse Linguistiche},
YEAR = {2011},
ABSTRACT = {A partire dagli anni '80 le cosiddette Risorse Linguistiche (RL) hanno progressivamente acquisito un ruolo sempre più importante nella linguistica computazionale e nel Trattamento Automatico della Lingua (TAL). Questo processo è iniziato con il diffondersi degli approcci data-driven, all'interno dei quali le RL hanno contribuito in modo decisivo allo sviluppo di sistemi innovativi e soprattutto "robusti", cioè in grado di trattare i fenomeni reali della lingua così come usata dai parlanti piuttosto che i fenomeni ritenuti "interessanti" dal linguista. Si è cominciato allora a riconoscere il ruolo infrastrutturale delle RL: Antonio Zampolli è stato il primo a comprendere questo ruolo e a lui dobbiamo anche l'introduzione del termine stesso "risorse linguistiche"},
URL = {https://iris.cnr.it/handle/20.500.14243/279904},
ISBN = {978-88-311-3505-4},
}
@INCOLLECTION{DELLORLETTA_2011_INCOLLECTION_DMVV_94003,
AUTHOR = {Dell'Orletta, F. and Montemagni, S. and Vecchi, E. M. and Venturi, G.},
TITLE = {Tecnologie linguistico-computazionali per il monitoraggio della competenza linguistica italiana degli alunni stranieri nella scuola primaria e secondaria},
YEAR = {2011},
ABSTRACT = {La possibilità di disporre di tecnologie avanzate e innovative che permettano di monitorare la competenza linguistica degli alunni stranieri e, al contempo, valutare l'adeguatezza dei materiali didattici a loro offerti può essere di supporto all'insegnante nell'orientare la propria azione formativa, rendendo così il processo di integrazione linguistico-culturale meno faticoso e traumatico. In tale ottica, questo studio, realizzato col supporto di una piattaforma ormai consolidata di metodi e strumenti per il trattamento automatico dell'italiano, costituisce il primo tentativo condotto in relazione alla lingua italiana, per mettere a punto una metodologia di monitoraggio linguistico rivolta specificamente agli studenti apprendenti la lingua italiana come L2 ed alle loro produzioni scritte},
KEYWORDS = {Trattamento Automatico del Linguaggio, Stranieri, Lingua italiana},
PAGES = {319--336},
URL = {https://iris.cnr.it/handle/20.500.14243/94003},
PUBLISHER = {McGraw-Hill (Milano, ITA)},
ISBN = {978-88-386-7296-5},
CONFERENCE_PLACE = {Milano},
BOOKTITLE = {Percorsi migranti},
EDITOR = {Bruno, G. C. and Caruso, I. and Sanna, M. and Vellecco, I.},
}
@INCOLLECTION{HAYASHI_2011_INCOLLECTION_HDCMSB_176083,
AUTHOR = {Hayashi, Y. and Declerck, T. and Calzolari, N. and Monachini, M. and Soria, C. and Buitelaar, P.},
TITLE = {Language Service Ontology},
YEAR = {2011},
ABSTRACT = {The Language Grid is a distinctive language service infrastructure in the sense that it accommodates a wide variety of user needs, ranging from technical novices to experts; language resource consumers to language resource providers. As these language services are various in type and each of them can be idiosyncratic in many aspects, the service infrastructure has to address the issue of interoperability. A key to solve this issue is not only to build the services around standardized resources and interfaces, but also to establish a knowledge structure that copes effectively with a range of language services. Given this knowledge structure, referred to as a service ontology, each language service can be systematically classified and its usage specified by a corresponding API. This not only enables the utilization of existing language resources but facilitates the dissemination of newly created language resources as services},
KEYWORDS = {Language grid, ontology},
PAGES = {85--100},
URL = {https://iris.cnr.it/handle/20.500.14243/176083},
DOI = {10.1007/978-3-642-21178-2_6},
PUBLISHER = {Springer-Verlag (Berlin/Heidelberg, DEU)},
ISBN = {978-3-642-21177-5},
CONFERENCE_PLACE = {Berlin/Heidelberg},
BOOKTITLE = {The Language Grid},
EDITOR = {Ishida, T.},
}
@INCOLLECTION{MARINELLI_2011_INCOLLECTION_M_182890,
AUTHOR = {Marinelli, R.},
TITLE = {Costruzione di risorse terminologiche: criteri, risultati e prodotti},
YEAR = {2011},
ABSTRACT = {L'articolo parla della costruzione di tre lessici specialistici organizzati come database di tipo relazionale. I tre database contengono termini appartenenti a tre campi di conoscenza specifici: terminologia marittima (navigazione e trasporti marittimi), terminologia fiscale, terminologia sindacale e del lavoro. Il database di terminologia marittima è stato costruito sulla base del modello del database semantico lessicale ItalWordNet e la metodologia sperimentata è stata applicata per creare gli altri database. Essa fa riferimento i) alla gestione di corpora di linguaggi specialistici, ii) all'uso di database generici per identificare ed estrarre insiemi di parole, potenzialmente appartenenti a domini particolari, che possano essere inseriti nei database terminologici e iii) alla creazione del software e all'utilizzo del tool per la gestione dei database. Vorremo mettere in rilievo nella descrizione delle tre risorse terminologiche i vari tipi di relazioni semantico lessicali che legano ciascun termine agli altri concetti all'interno del singolo database di dominio, ai database generici di lingua Italiana (ItalWordNet) e Inglese (WordNet), e infine ai concetti dell'ontologia generale (Top Ontology) ereditata da IWN e ai concetti dell'ontologia di dominio},
KEYWORDS = {lexical resources, terminology, lexical semantic databases},
PAGES = {129--146},
URL = {https://iris.cnr.it/handle/20.500.14243/182890},
PUBLISHER = {EDUCatt Università Cattolica (Milano, ITA)},
ISBN = {978-88-8311-820-3},
CONFERENCE_PLACE = {Milano},
BOOKTITLE = {Terminologie specialistiche e prodotti terminologici},
EDITOR = {Zanola, M. T. and Bonadonna, M. F.},
}
@INCOLLECTION{OGNIBENE_2011_INCOLLECTION_OVP_175336,
AUTHOR = {Ognibene, D. and Volpi, N. C. and Pezzulo, G.},
TITLE = {Learning to grasp information with your own hands},
YEAR = {2011},
ABSTRACT = {Autonomous robots immersed in a complex world can seldom directly access relevant parts of the environment by only using their sensors. Indeed, finding relevant information for a task can require the execution of actions that explicitly aim at unveiling previously hidden information. Informativeness of an action depends strongly on the current environment and task beyond the architecture of the agent. An autonomous adaptive agent has to learn to exploit the epistemic (e.g., information-gathering) implications of actions that are not architecturally designed to acquire information (e.g. orientation of sensors). The selection of these actions cannot be hardwired as general-purpose information-gathering actions, because differently from sensor control actions they can have effects on the environment and can affect the task execution. In robotics information-gathering actions have been used in navigation [7]; in active vision [4]; and in manipulation [3]. In all these works the informative value of each action was known and exploited at design time while the problem of actively facing unpredicted state uncertainty has not received much},
KEYWORDS = {Artificial Intelligence, Robotics},
PAGES = {398--399},
URL = {https://iris.cnr.it/handle/20.500.14243/175336},
DOI = {10.1007/978-3-642-23232-9_46},
ISBN = {978-3-642-23231-2},
BOOKTITLE = {Towards Autonomous Robotic Systems: 12th Annual Conference, TAROS 2011},
EDITOR = {Groß, R. and Alboul, L. and Melhuish, C. and Witkowski, M. and Prescott, T. J. and Penders, J.},
}
@INCOLLECTION{PAPALEO_2011_INCOLLECTION_PCAC_139482,
AUTHOR = {Papaleo, G. and Chiarella, D. and Aiello, M. and Caviglione, L.},
TITLE = {Analysis, Development and Deployment of Statistical Anomaly Detection Techniques for real e-mail Traffic},
YEAR = {2011},
ABSTRACT = {Even if new interaction paradigms, such as the Voice over IP (VoIP), are becoming popular and widely adopted, the e-mail is still one of the most utilized ways to communicate across the Internet. However, many malicious threats are conveyed via e-mails. Usually, the authors can exploit two different approaches: i) analyzing the logs produced by e-mail servers or ii) reconstruct the e-mail flows by capturing data directly from the network by placing ad-hoc probes. In this vein, this Chapter discusses the analysis, development and deployment of statistical detection techniques aimed at the detection of Internet worms. For what concerns i), they introduce a tool called Log Mail Analyzer (LMA), which allows to overcome the complexity of inspecting multiple logs created from a heterogeneous population of mail servers. In the perspective of ii) they briefly discuss an alternative solution, based on ad-hoc network probes, to be properly placed to collect traffic and then reconstruct the e-mail flow to be monitored. Lastly, the authors introduce a threshold mechanism, based on a simple statistical framework, to automatically detect and identify different worm activities},
PAGES = {47--71},
URL = {http://www.igi-global.com/chapter/attacks-systems-categories-motives/61218},
DOI = {10.4018/978-1-61350-507-6.ch003},
PUBLISHER = {IGI Global (Hershey, USA)},
CONFERENCE_PLACE = {Hershey},
BOOKTITLE = {Information Assurance and Security Technologies for Risk Assessment and Threat Management: Advances},
}
@INCOLLECTION{ROBALDO_2011_INCOLLECTION_RCRG_217953,
AUTHOR = {Robaldo, L. and Caselli, T. and Russo, I. and Grella, M.},
TITLE = {From Italian Text to TimeML Document via Dependency Parsing},
YEAR = {2011},
ABSTRACT = {This paper describes the first prototype for building TimeML xml documents starting from raw text for Italian. First, the text is parsed with the TULE parser, a dependency parser developed at the University of Turin. The parsed text is then used as input to the TimeML rule-based module we have implemented, henceforth called as 'The converter'. So far, the converter identifies and classifies events in the sentence. The results are rather satisfactory, and this leads us to support the use of dependency syntactic relations for the development of higher level semantic tools},
KEYWORDS = {Parsing, TimeML},
PAGES = {177--187},
URL = {https://iris.cnr.it/handle/20.500.14243/217953},
PUBLISHER = {Springer-Verlag (Berlin/Heidelberg, DEU)},
ISBN = {978-3-642-19436-8},
CONFERENCE_PLACE = {Berlin/Heidelberg},
EDITOR = {Gelbukh, A.},
}
@INCOLLECTION{SASSI_2011_INCOLLECTION_SC_182310,
AUTHOR = {Sassi, M. and Cinini, A.},
TITLE = {La banca dati dei provvedimenti della sezione disciplinare del Consiglio Superiore della Magistratura (1990--2007)},
YEAR = {2011},
KEYWORDS = {Linguistica Computazionale, Analisi Sentenze},
PAGES = {129--150},
URL = {https://iris.cnr.it/handle/20.500.14243/182310},
PUBLISHER = {CLUEB (Bologna, ITA)},
ISBN = {978-88-491-3513-8},
CONFERENCE_PLACE = {Bologna},
EDITOR = {Fabri, M.},
}
@EDITORIAL{BELTRAMI_2011_EDITORIAL_BLSABGIGMRVV_146303,
AUTHOR = {Beltrami, P. D. and Larson, P. C. and Squillacioti, P. C. and Artale, E. and Boccellari, A. and Guadagnini, E. and Iorio Fili, D. and Giuliani, M. and Mosti, R. and Ravani, S. and Vaccaro, G. and Verlato, Z.},
TITLE = {TESORO DELLA LINGUA ITALIANA DELLE ORIGINI -- Edizione online: www.vocabolario.org (ISSN 2240-5216) -- Versione 2011},
YEAR = {2011},
ABSTRACT = {Copia in pdf del Tesoro della Lingua Italiana delle Origini (TLIO), dizionario dell'italiano antico in fieri, pubblicato online, alla fine del 2011. Il TLIO è la prima sezione del Dizionario Storico dell'Italiano, la cui realizzazione costituisce la missione dell'OVI},
KEYWORDS = {Lingua italiana, Lessico, Lessicografia},
URL = {http://tlio.ovi.cnr.it/TLIO},
ISSN = {2240-5216},
}
@EDITORIAL{CALZOLARI_2011_EDITORIAL_CBSGMQ_174748,
AUTHOR = {Calzolari, N. and Baroni, P. and Soria, C. and Goggi, S. and Monachini, M. and Quochi, V.},
TITLE = {Proceedings of the 3rd European Language Resources and Technologies Forum: Language Resources in the Sharing Age -- the Strategic Agenda},
YEAR = {2011},
ABSTRACT = {Proceedings of the third FLaReNet forum on the European Language Resources and Technologies, held in Venezia, at the Auditorium Santa Margherita of the Università Ca' Foscari, on 26-27 May 2011},
KEYWORDS = {Language Resources, Language Technologies},
PAGES = {86},
URL = {http://www.flarenet.eu/sites/default/files/FLaReNet_Forum_2011_Proceedings.pdf},
}
@INPROCEEDINGS{CALZOLARI_2011_INPROCEEDINGS_CDFR_214980,
AUTHOR = {Calzolari, N. and Del Gratta, R. and Frontini, F. and Russo, I.},
TITLE = {The Language Library: Many Layers, More Knowledge},
YEAR = {2011},
ABSTRACT = {In this paper we outline the general concept of the Language Library, a new initiative that has the purpose of building a huge archive of structured collection of linguistic information. The Language Library is conceived as a community built repository and as an environment that allows language specialists to share multidimensional and multi-level annotated/processed resources. The first steps towards its implementation are briefly sketched},
KEYWORDS = {Language Resources, Language Library},
PAGES = {93--97},
URL = {https://iris.cnr.it/handle/20.500.14243/214980},
ISBN = {978-974-466-564-5},
CONFERENCE_NAME = {Workshop on Language Resources, Technology and Services in the Sharing Paradigm},
BOOKTITLE = {Workshop on Language Resources, Technology and Services in the Sharing Paradigm},
}
@INPROCEEDINGS{CALZOLARI_2011_INPROCEEDINGS_CMQ_217943,
AUTHOR = {Calzolari, N. and Monachini, M. and Quochi, V.},
TITLE = {Interoperability Framework: The FLaReNet action plan proposal},
YEAR = {2011},
ABSTRACT = {Standards are fundamental to exchange, preserve, maintain and integrate data and language resources, and as an essential basis of any language resource infrastructure. This paper promotes an Interoperability Framework as a dynamic environment of standards and guidelines, also intended to support the provision of language-(web)service interoperability. In the past two decades, the need to define common practices and formats for linguistic resources has been increasingly recognized and sought. Today open, collaborative, shared data is at the core of a sound language strategy, and standardisation is actively on the move. This paper first describes the current landscape of standards, and presents the major barriers to their adoption; then, it describes those scenarios that critically involve the use of standards and provide a strong motivation for their adoption; lastly, a series of actions and steps needed to operationalise standards and achieve a full interoperability for Language Resources and Technologies are proposed},
KEYWORDS = {Language Resources, standards},
PAGES = {41--49},
URL = {https://iris.cnr.it/handle/20.500.14243/217943},
ISBN = {978-974-466-564-5},
CONFERENCE_NAME = {Workshop on Language Resources, Technology and Services in the Sharing Paradigm},
BOOKTITLE = {Workshop on Language Resources, Technology and Services in the Sharing Paradigm},
}
@INPROCEEDINGS{CIGNONI_2011_INPROCEEDINGS_CFCF_214936,
AUTHOR = {Cignoni, L. and Fornaciari, A. and Coschino, F. and Fornaciari, G.},
TITLE = {Step-by-step Organization of a University CLIL Course},
YEAR = {2011},
ABSTRACT = {This paper reports on the organization of CLIL (Content and Language Integrated Learning) University courses in funerary archaeology held at the Division of Palaeopathology of Pisa University. We outline the different steps involved in the practical implementation of the proposed approach, which include choice of topic, linguistic content, tasks and strategies, and we describe the ways in which CLIL can be used both in the classroom and in archaeological fieldwork excavations for teaching of the discipline and practical experience with leading scholars in the field. Each two-hour lesson slot is divided into four parts, devoted to both the receptive (reading, listening) and productive (writing, speaking) skills, which constantly expose the students to language, helping them understand the contents of the discipline. It is necessary to take into account the additional difficulties students attending the courses might have, which are due to their having to learn basic and academic language skills and new subject concepts at the same time. All the material relevant to the course is simplified and adapted to the needs and language of the students, who are supported by authentic materials in the form of text-books, articles, tutorials, illustrations, audio and video recordings, and by a number of activities ranging from gap-filling exercises, matching words with their definitions, jumbled sentences, sentence formation, preparation of posters, powerpoint demonstrations. The trainees are also involved in increasing an ongoing bilingual English-Italian glossary and contextualized English grammar. Working individually, then in pairs and in small groups, they are responsible for the different areas of the discipline. Funerary archaeology is the study of death, ancient burials and human skeletal remains, body disposal, etc., and includes skeleton anthropology, bone diagenesis, taphonomic anthropology, as well as other features comprising excavation phases, techniques and tools employed, field archaeology},
KEYWORDS = {Funerary archaeology},
PAGES = {7},
URL = {https://iris.cnr.it/handle/20.500.14243/214936},
ISBN = {978-88-7647-677-8},
CONFERENCE_NAME = {International Conference-ICT for Language Learning},
BOOKTITLE = {International Conference -- ICT for Language Learning},
PUBLISHER = {Simonelli Editore},
}
@INPROCEEDINGS{CIGNONI_2011_INPROCEEDINGS_CFF_214944,
AUTHOR = {Cignoni, L. and Fornaciari, A. and Fornaciari, G.},
TITLE = {An English Grammar and a bilingual Glossary acting as complementary Tools for a CLIL-based Course},
YEAR = {2011},
ABSTRACT = {This paper describes how two complementary tools, an English grammar and a bilingual (Italian-English) glossary, can be expanded by University students attending a CLIL (Content and Language Integrated Learning) course in which a funerary archaeology lecturer, an English language instructor and an archaeologist work together, integrating content and language. This work is part of a wider project carried out at the Division of Palaeopathology, History of Medicine and Bioethics, and approved by the University of Pisa. Starting from a sample of Italian and English monographic texts and other publications in printed or electronic form dealing with the subject of funerary archaeology and other related research areas (anthropology, field archaeology, anatomy and chemistry, which can provide new insights into past civilizations, cultures and practices so far undiscovered), we have extracted separate, preliminary lists of specialized terms. The students working alone, in pairs or in groups, are asked to expand these lists, tracking down additional words with their definitions and example sentences drawn from other authoritative sources. The information with specification of the authors and detailed bibliographical references should be written in independent appropriately labelled files, and sent to the computer analyst responsible for the computer software editing. The reading of various definitions at different levels of depth will enable the user to understand better, have a clearer and more exhaustive picture of a particular word, concept, or phenomenon. The glossary, addressed to the students who are at the same time creators and users of the product, can also be of interest to professors, scholars or translators who need to dispose of the specialised terms of funerary archaeology in a language other than their own.
Many of the definitions and other types of useful information can be exploited to illustrate the different grammar points and structures of an easy-to-use on-line English intermediate-level grammar book, to study the grammar not in isolation but in meaningful contexts and real-life situations, to encourage the learners to become active explorers of the language. This ongoing grammar can be a valuable resource for students with minimum linguistic knowledge and competence, but also be useful to those wishing to improve the English language, enhancing their learning proficiency. Implementation of the two complementary products-grammar and glossary-will proceed together, contributing to the learning of funerary archaeology on the part of the students, both learners and creators of the two tools. As we know, the possibilities offered by the computer in terms of space, links, cross-references, etc. make it possible to organize and customize the material, meeting as much as possible the users' needs. The technological tools increasingly available in the educational context support both the subject and language teacher in making the learning process easier and more engaging, helping clarify certain concepts in a non-traditional way in order to accomplish various instructional objectives},
KEYWORDS = {funerary archaeology},
PAGES = {1834-1841},
URL = {https://iris.cnr.it/handle/20.500.14243/214944},
ISBN = {978-84-615-0442-8},
CONFERENCE_NAME = {International Conference on Education and Development and New Learning Technologies},
EDITOR = {Gómez Chova, L. and Martí Belenguer, D. and López Martínez, A.},
}
@INPROCEEDINGS{CUTUGNO_2011_INPROCEEDINGS_CCZMM_217014,
AUTHOR = {Cutugno, P. and Chiarella, D. and Zini, V. and Marconi, L. and Morgavi, G.},
TITLE = {CorLES: Corpus e Lessico Elementare Scritto. Realización de un corpus y léxico del italiano escrito en las escuelas},
YEAR = {2011},
PAGES = {935-938},
URL = {https://iris.cnr.it/handle/20.500.14243/217014},
VOLUME = {II},
PUBLISHER = {Centro de Lingüística Aplicada, Ministerio de Ciencia, Tecnología y Medio Ambiente (Santiago de Cuba, CUB)},
ISBN = {9789597174196},
CONFERENCE_NAME = {XII Simposio Internacional de Comunicación Social: Comunicación Social en el siglo XXI},
CONFERENCE_PLACE = {Santiago de Cuba},
BOOKTITLE = {Comunicación Social en el siglo XXI-Vol. II},
EDITOR = {Ruiz Miyares, L. and Alvarez Silva, M. R.},
}
@INPROCEEDINGS{CUTUGNO_2011_INPROCEEDINGS_CZCM_217013,
AUTHOR = {Cutugno, P. and Zini, V. and Chiarella, D. and Marconi, L.},
TITLE = {To tell oneself on the web: the case of the teenager blog},
YEAR = {2011},
PAGES = {939-943},
URL = {https://iris.cnr.it/handle/20.500.14243/217013},
VOLUME = {II},
PUBLISHER = {Centro de Lingüística Aplicada, Ministerio de Ciencia, Tecnología y Medio Ambiente (Santiago de Cuba, CUB)},
ISBN = {9789597174196},
CONFERENCE_NAME = {XII Simposio Internacional de Comunicación Social: Comunicación Social en el siglo XXI},
CONFERENCE_PLACE = {Santiago de Cuba},
BOOKTITLE = {Comunicación Social en el siglo XXI-Vol. II},
EDITOR = {Ruiz Miyares, L. and Alvarez Silva, M. R.},
}
@INPROCEEDINGS{DELLORLETTA_2011_INPROCEEDINGS_DMV_214930,
AUTHOR = {Dell'Orletta, F. and Montemagni, S. and Venturi, G.},
TITLE = {READ-IT: assessing readability of Italian texts with a view to text simplification},
YEAR = {2011},
ABSTRACT = {In this paper, we propose a new approach to readability assessment with a specific view to the task of text simplification: the intended audience includes people with low literacy skills and/or with mild cognitive impairment. READ-IT represents the first advanced readability assessment tool for what concerns Italian, which combines traditional raw text features with lexical, morpho-syntactic and syntactic information. In READ-IT readability assessment is carried out with respect to both documents and sentences where the latter represents an important novelty of the proposed approach creating the prerequisites for aligning the readability assessment step with the text simplification process. READ-IT shows a high accuracy in the document classification task and promising results in the sentence classification scenario},
KEYWORDS = {Readability Assessment, Text Simplification},
PAGES = {73-83},
URL = {http://dl.acm.org/citation.cfm?id=2140511},
ISBN = {978-1-937284-14-5},
CONFERENCE_NAME = {SLPAT '11 Proceedings of the Second Workshop on Speech and Language Processing for Assistive Technologies},
BOOKTITLE = {Proceedings of the Second Workshop on Speech and Language Processing for Assistive Technologies},
}
@INPROCEEDINGS{DELLORLETTA_2011_INPROCEEDINGS_DVM_214925,
AUTHOR = {Dell'Orletta, F. and Venturi, G. and Montemagni, S.},
TITLE = {ULISSE: an unsupervised algorithm for detecting reliable dependency parses},
YEAR = {2011},
ABSTRACT = {In this paper we present ULISSE, an unsupervised linguistically-driven algorithm to select reliable parses from the output of a dependency parser. Different experiments were devised to show that the algorithm is robust enough to deal with the output of different parsers and with different languages, as well as to be used across different domains. In all cases, ULISSE appears to outperform the baseline algorithms},
KEYWORDS = {Dependency Parsing, Selection of Reliable Parses, Unsupervised Algorithm},
PAGES = {115-124},
URL = {http://dl.acm.org/citation.cfm?id=2018950},
ISBN = {978-1-932432-92-3},
CONFERENCE_NAME = {CoNLL '11 Proceedings of the Fifteenth Conference on Computational Natural Language Learning},
BOOKTITLE = {Proceedings of the Fifteenth Conference on Computational Natural Language Learning},
}
@INPROCEEDINGS{DINDO_2011_INPROCEEDINGS_DZP_175774,
AUTHOR = {Dindo, H. and Zambuto, D. and Pezzulo, G.},
TITLE = {Motor simulation via coupled internal models using sequential Monte Carlo},
YEAR = {2011},
ABSTRACT = {We describe a generative Bayesian model for action understanding in which inverse-forward internal model pairs are considered 'hypotheses' of plausible action goals that are explored in parallel via an approximate inference mechanism based on sequential Monte Carlo methods. The reenactment of internal model pairs can be considered a form of motor simulation, which supports both perceptual prediction and action understanding at the goal level. However, this procedure is generally considered to be computationally inefficient. We present a model that dynamically reallocates computational resources to more accurate internal models depending on both the available prior information and the prediction error of the inverse-forward models, and which leads to successful action recognition. We present experimental results that test the robustness and efficiency of our model in real-world scenarios},
KEYWORDS = {prediction, simulation},
PAGES = {2113-2119},
URL = {https://iris.cnr.it/handle/20.500.14243/175774},
PUBLISHER = {AAAI Press (Arlington [VA], USA)},
CONFERENCE_NAME = {Proceedings of the Twenty-Second International Joint Conference on Artificial Intelligence, Barcelona, Catalonia, Spain, 16-22 July 2011},
CONFERENCE_PLACE = {Barcelona},
BOOKTITLE = {Proceedings of the Twenty-Second International Joint Conference on Artificial Intelligence},
EDITOR = {Walsh, T.},
}
@INPROCEEDINGS{FERRO_2011_INPROCEEDINGS_FMP_214910,
  AUTHOR          = {Ferro, M. and Marzi, C. and Pirrelli, V.},
  TITLE           = {T2HSOM: Understanding the Lexicon by Simulating Memory Processes for Serial Order},
  BOOKTITLE       = {First International Workshop on Lexical Resources},
  EDITOR          = {Sagot, B.},
  CONFERENCE_NAME = {First International Workshop on Lexical Resources},
  YEAR            = {2011},
  PAGES           = {32-41},
  URL             = {http://alpage.inria.fr/~sagot/woler2011/WoLeR2011/Program_\&_Proceedings.html},
  KEYWORDS        = {Mental Lexicon, Self-organizing Maps, Morphology},
  ABSTRACT        = {Over the last several years, both theoretical and empirical approaches to lexical knowledge and encoding have prompted a radical reappraisal of the traditional dichotomy between lexicon and grammar. The lexicon is not simply a large waste basket of exceptions and sub-regularities, but a dynamic, possibly redundant repository of linguistic knowledge whose principles of relational organization are the driving force of productive generalizations. In this paper, we overview a few models of dynamic lexical organization based on neural network architectures that are purported to meet this challenging view. In particular, we illustrate a novel family of Kohonen self-organizing maps (T2HSOMs) that have the potential of simulating competitive storage of symbolic time series while exhibiting interesting properties of morphological organization and generalization. The model, tested on training samples of as morphologically diverse languages as Italian, German and Arabic, shows sensitivity to manifold types of morphological structure and can be used to bootstrap morphological knowledge in an unsupervised way},
}
@INPROCEEDINGS{FRONTINI_2011_INPROCEEDINGS_FMGLPFAM_215017,
AUTHOR = {Frontini, F. and Monachini, M. and Gavrilidou, M. and Labropoulou, P. and Piperidis, S. and Francopoulo, G. and Arranz, V. and Mapelli, V.},
TITLE = {A Metadata Schema for the Description of Language Resources (LRs)},
YEAR = {2011},
ABSTRACT = {This paper presents the metadata schema for describing language resources (LRs) currently under development for the needs of META-SHARE, an open distributed facility for the exchange and sharing of LRs. An essential ingredient in its setup is the existence of formal and standardized LR descriptions, cornerstone of the interoperability layer of any such initiative. The description of LRs is granular and abstractive, combining the taxonomy of LRs with an inventory of a structured set of descriptive elements, of which only a minimal subset is obligatory; the schema additionally proposes recommended and optional elements. Moreover, the schema includes a set of relations catering for the appropriate inter-linking of resources. The current paper presents the main principles and features of the metadata schema, focusing on the description of text corpora and lexical / conceptual resources},
KEYWORDS = {metadata, language resources},
PAGES = {84-92},
URL = {https://iris.cnr.it/handle/20.500.14243/215017},
ISBN = {978-974-466-564-5},
CONFERENCE_NAME = {Workshop on Language Resources, Technology and Services in the Sharing Paradigm},
}
@INPROCEEDINGS{GIOVANNETTI_2011_INPROCEEDINGS_GM_244994,
  AUTHOR          = {Giovannetti, E. and Marchi, S.},
  TITLE           = {Cross-Language Boosting in Pattern-based Semantic Relation Extraction from Text},
  BOOKTITLE       = {Proceedings of the Computational Linguistics-Applications Conference},
  EDITOR          = {Jassem, K. and Fuglewicz, P. and Piasecki, M. and Przepiorkowski, A.},
  CONFERENCE_NAME = {Computational Linguistics Application Conference-CLA 2011},
  YEAR            = {2011},
  PAGES           = {29-36},
  ISBN            = {9788360810477},
  URL             = {https://web.archive.org/web/20121101020859/http://www.proceedings2011.cla-conf.info/},
  KEYWORDS        = {Computational Linguistics, Cross Language, semantic relation extraction systems, Ontology Learning from Text},
  ABSTRACT        = {In this work we propose a novel technique called "Cross-Language Boosting" (C-LB), aimed at increasing the accuracy of pattern-based semantic relation extraction systems: given a pair of terms expressed in a "Target Language" (e. g. in Italian), we can translate the terms in a "Support Language" (e. g. in English) and apply the translated term pair to reliable lexico-syntactic patterns expressed in that language to increase the accuracy of the system. Experiments have been conducted by comparing the results obtained by the SemRelEx system, a hybrid unsupervised system for semantic relation extraction from texts, with and without the support of the C-LB technique, applied to a set of candidate semantically related term pairs automatically extracted from a corpus in the History of Art domain},
}
@INPROCEEDINGS{GUADAGNINI_2011_INPROCEEDINGS_G_241024,
  AUTHOR           = {Guadagnini, E.},
  TITLE            = {Lingua francese e francesismi in Zanazzo},
  EDITOR           = {Onorati, F. and Scalessa, G.},
  CONFERENCE_NAME  = {Le voci di Roma. Omaggio a Giggi Zanazzo},
  CONFERENCE_PLACE = {Roma},
  YEAR             = {2011},
  PUBLISHER        = {Il Cubo (Roma, ITA)},
  ISBN             = {9788897431022},
  URL              = {https://iris.cnr.it/handle/20.500.14243/241024},
}
@INPROCEEDINGS{GUADAGNINI_2011_INPROCEEDINGS_GV_241034,
AUTHOR = {Guadagnini, E. and Vaccaro, G.},
TITLE = {"Da mi si inzengia la grammatica a buj": un glossaire de la région médiane du XIVe siècle},
YEAR = {2011},
ABSTRACT = {Per molte aree geografiche dell'Italia mediana, le uniche attestazioni antiche sono costituite da glossari: è questo, per esempio, il caso di alcune località periferiche (come per esempio Roccantica, dove il notaio Ser Iacopo Ursello produsse un dizionario alla fine del Quattrocento). Tuttavia i glossari aumentano spesso le nostre conoscenze anche per l'area cassinese o per quell'area dialettale "perimediana" che si sviluppa intorno Roma. Il glossario è quindi un documento preziosissimo, proprio perché ci consente di conoscere e di documentare delle situazioni altrimenti non più attingibili. Tutti i glossari mediani a noi noti si collocano a cavallo tra la fine del XIV secolo e la prima metà del XVI, ovvero tra l'inizio dell'attrazione centripeta del toscano letterario (che-come ha dimostrato per primo Ernst-affonda le sue radici in Roma già alla metà del Trecento) e il compimento di quell'azione livellatrice e uniformatrice dei grammatici, e ancor più della prassi linguistica petrarchesca, che, con la prima metà del Cinquecento si fa tanto intensa da attaccare e invadere ogni documento della lingua scritta. Si analizza qui in particolare il glossario contenuto nel manoscritto 1895 della Biblioteca Angelica di Roma, dando spazio in particolare all'analisi del lessico dell'agricoltura},
URL = {https://iris.cnr.it/handle/20.500.14243/241034},
PUBLISHER = {Brepols (Turnhout, BEL)},
ISBN = {9782503541754},
CONFERENCE_NAME = {Glossaires et lexiques médiévaux inédits. Bilan et perspectives},
CONFERENCE_PLACE = {Paris},
BOOKTITLE = {Glossaires et lexiques médiévaux inédits. Bilan et perspectives. Actes du Colloque de Paris (7 mai 2010)},
EDITOR = {Hamesse, J. and Meirinhos, J.},
}
@INPROCEEDINGS{GUADAGNINI_2011_INPROCEEDINGS_GV_241048,
AUTHOR = {Guadagnini, E. and Vaccaro, G.},
TITLE = {"Nom de pays: le nom." Parole, paesi e popoli nel Corpus DiVo},
YEAR = {2011},
ABSTRACT = {Un campo privilegiato per saggiare le possibilità offerte da un corpus di volgarizzamenti (come il Corpus DiVo) è quello degli etnici, poiché essi afferiscono alla tipologia lessicale definibile di tipo 'storico e materiale', in quanto si tratta di termini non marcati in latino e la cui prosecuzione volgare è condizionata dalla scomparsa o dalla sostanziale modifica del referente. I nomi latini dei popoli rappresentano dunque una porzione di lessico che ha spesso caratteristiche archeologiche già in epoca medievale: la conoscenza dei gruppi etnici noti in epoca classica è di natura erudita e si basa in misura sostanziale sulla lettura degli autori di storia romana. Accanto al recupero 'semplice', mediante prestito, di nomi di popoli antichi, si danno due casi ulteriori: l'estensione di nomi antichi a nuovi referenti (generalmente nomi vecchi per i nuovi popoli che abitano il medesimo territorio), o il ricorso a nomi nuovi per tradurre popoli antichi, nel tentativo di un'attualizzazione fondata sulla denominazione corrente del territorio, anacronisticamente estesa al popolo antico},
PAGES = {267-281},
URL = {https://iris.cnr.it/handle/20.500.14243/241048},
PUBLISHER = {Éditions de linguistique et de philologie (Strasbourg, FRA)},
ISBN = {2951835582},
CONFERENCE_NAME = {Studio, Archivio e Lessico dei Volgarizzamenti Italiani},
CONFERENCE_PLACE = {Salerno},
BOOKTITLE = {Volgarizzare, tradurre, interpretare nei secc. XIII-XVI. Atti del Convegno internazionale di studio, Studio, Archivio e Lessico dei Volgarizzamenti Italiani (Salerno, 24-25 novembre 2010)},
EDITOR = {Lubello, S.},
}
@INPROCEEDINGS{KHAN_2011_INPROCEEDINGS_K_407582,
AUTHOR = {Khan, A. F. A.},
TITLE = {The Decidability of RPTL},
YEAR = {2011},
ABSTRACT = {In this paper we look at regular path temporal logic, RPTL, a modal logic which combines the ability to quantify over (finite) paths described by regular expressions (a property which characterises PDL) with the addition of temporal operators. The formulation of RPTL was inspired by agent programming verification considerations. In this paper we prove the decidability of RPTL and establish complexity bounds on the satisfiability problem for RPTL by translating it into the theory of alternating tree automata on infinite trees},
URL = {https://iris.cnr.it/handle/20.500.14243/407582},
DOI = {10.3233/978-1-60750-676-8-151},
ISBN = {978-1-60750-675-1},
}
@INPROCEEDINGS{MARINELLI_2011_INPROCEEDINGS_MS_214947,
AUTHOR = {Marinelli, R. and Spadoni, G. P.},
TITLE = {An organized set of generic and specialized lexicons},
YEAR = {2011},
ABSTRACT = {The paper describes the construction of three specialized lexicons organized as databases of a relational type. The databases contain terms belonging to different knowledge fields: the first is a database of maritime terminology (technical-nautical and maritime transport domain) (MDB); in the other two databases terms belonging to the knowledge field of taxation law (TDB) and to the domain of labour law and union labour rules (LDB) are codified. The database of maritime terminology (MDB) was built first, on the basis of the EuroWordNet (EWN) and ItalWordNet (IWN) model, using lexical semantic relations to codify terms, within the framework of the Princeton WordNet (WN) philosophy; it includes about 4000 lemmas. The other two databases (1600 and 1500 lemmas respectively) were structured following similar criteria, in keeping with the methods already successfully experimented to create the MDB and also to enhance it with a subset of terms belonging to the scientific domain of Meteorology, that is an organized set of research phases constituting a true methodology to create terminological databases. These phases are herewith described: i) the corpus approach; ii) the generic database approach. Then the whole terminological network is outlined, highlighting the different kinds of relations linking the terminological and the generic resources},
KEYWORDS = {Linguistic resources, lexical semantic databases, terminology},
PAGES = {944-947},
URL = {http://www.santiago.cu/hosting/linguistica/simposios.php?id=en\&s=12th},
VOLUME = {2},
PUBLISHER = {Centro de lingüística aplicada, Ministerio de ciencia, tecnología y medio ambiente (Santiago de Cuba, CUB)},
ISBN = {978-959-7174-19-6},
CONFERENCE_NAME = {12th International Symposium on Social Communication},
CONFERENCE_PLACE = {Santiago de Cuba},
}
@INPROCEEDINGS{MARZI_2011_INPROCEEDINGS_MPS_159861,
AUTHOR = {Marzi, C. and Pardelli, G. and Sassi, M.},
TITLE = {A terminology based re-definition of Grey Literature},
YEAR = {2011},
ABSTRACT = {The conventionally accepted definition of Grey Literature, as Information produced and distributed by non-commercial publishing, does not take into consideration either the increasing availability of forms of grey knowledge, or the growing importance of computer-based encoding and management as the standard mode of creating and developing grey literature. Semi-automated terminological analysis of almost twenty years of terminological creativity in the proceedings of eleven GL International Conferences offers the opportunity to pave the way to a bottom-up redefinition of Grey Literature stemming from attested terminological creativity and lexical innovation. In this paper, we focus on a set of automatically-acquired terms obtained by subjecting our reference Corpus to a number of pre-processing steps of automated text analysis, such as concordances, frequency lists and lexical association scores. Acquired terms allow us to throw in sharp relief developing trends and important shifts of emphasis in the current understanding of the notion of Grey Literature},
KEYWORDS = {GL conference corpus, Grey literature definition, Terminology extraction},
PAGES = {27-31},
URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-84883303651\&origin=inward},
VOLUME = {12},
PUBLISHER = {TextRelease (Amsterdam, NLD)},
ISSN = {1386-2316},
ISBN = {9789077484166},
CONFERENCE_NAME = {Twelfth International Conference on Grey Literature: Transparency in Grey Literature, Grey Tech Approaches to High Tech Issues},
CONFERENCE_PLACE = {Amsterdam},
BOOKTITLE = {THE GL-CONFERENCE SERIES. CONFERENCE PROCEEDINGS},
EDITOR = {Farace, D. J. and Frantzen, J.},
}
@INPROCEEDINGS{PARDELLI_2011_INPROCEEDINGS_PSOBG_21492,
AUTHOR = {Pardelli, G. and Sassi, M. and Orsolini, P. and Biagioni, S. and Giannini, S.},
TITLE = {An open archive of scientific communication},
YEAR = {2011},
ABSTRACT = {This paper presents the results of a terminological work conducted by the authors on a Digital Archives Net of the Italian National Research Council (CNR) in the field of Computer Science. In particular, the research tends to analyse the use of certain terms in Computer Science in order to verify their change over the time with the aim of retrieving from the net the very essence of documentation. Its main source is a reference corpus made up of 13,500 documents which collects the scientific productions of three CNR research Institutes. They are ISTI (Institute of Information Science and Technologies), IIT (Institute of Informatics and Telematics) and ILC (Institute of Computational Linguistics), all of them born from the "Centro Studi sulle Calcolatrici Elettroniche (CSCE)" and now belonging to the CNR Department of Information \& Communication Technologies and Cultural Identity. This study is divided in three sections: an introductory one dedicated to the data extracted from the scientific documentation: the data have in common the use of some terms proper of the Computer Science lexicon although these term belong to different branches (Linguistics, Informatics and Telematics); the second section is devoted to the description of the contents managed by the PUMA (Publication Management System) system; the third section contains a statistical representation of terms extracted from archive: some comparison tables between the occurrences of the most used terms in the scientific documentation produced by the three Institutes will be created and diagrams with percentages about the most frequently used terms will be displayed too. Lastly, indexes and concordances will allow to reflect on the use of certain terms in this field and give possible keys for having access to the extraction of knowledge in the digital era},
KEYWORDS = {Digital Archives, Communication, Terminology, Open Access},
PAGES = {914-918},
URL = {http://www.santiago.cu/hosting/linguistica/simposios.php?s=XII},
VOLUME = {II},
PUBLISHER = {Centro de lingüística aplicada, Ministerio de ciencia, tecnología y medio ambiente (Santiago de Cuba, CUB)},
ISBN = {978-959-7174-19-6},
CONFERENCE_NAME = {Comunicación Social en el Siglo XXI. XII Simposio Internacional de Comunicación Social},
CONFERENCE_PLACE = {Santiago de Cuba},
BOOKTITLE = {Comunicación social en el siglo XXI, vol. II},
EDITOR = {Ruiz Miyares, L. and Alvarez Silva, M. R.},
}
@INPROCEEDINGS{PEZZULO_2011_INPROCEEDINGS_PR_214961,
AUTHOR = {Pezzulo, G. and Rigoli, F.},
TITLE = {Planning in view of future needs: a bayesian model of anticipated motivation},
YEAR = {2011},
ABSTRACT = {Traditional neuroeconomic theories of decision-making assume that utilities are based on intrinsic values of outcomes and that those values depend on how salient are outcomes in relation to the current motivational state. The fact that humans, and possibly also other animals, are able to plan in view of future motivations is not accounted by this view. So far, it is not clear which are the structures and the computational mechanisms employed by the brain during these processes. In this article, we present a Bayesian computational model that describes how the brain considers future motivations and assigns value to outcomes in relation to this information. We compare our model of anticipated motivation with a model that implements the standard perspective in decision-making and assigns value only based on the animal's current motivations. The results of our simulations indicate an advantage of the model of anticipated motivation in volatile environments. Finally we connect our computational proposal to animal and human studies on prospection and foresight abilities and to neurophysiological investigations on their neural underpinnings},
KEYWORDS = {prospection, foresight, goal-directed decisionmaking, model-based, expected utility},
PAGES = {174-176},
URL = {http://nbu.bg/cogs/eurocogsci2011/proceedings/pdfs/EuroCogSci-paper174.pdf},
ISBN = {978-954-535-660-5},
CONFERENCE_NAME = {European Conference on Cognitive Science 2011},
EDITOR = {Kokinov, B. and Karmiloff-Smith, A. and Nersessian, N. J.},
}
@INPROCEEDINGS{PICCHI_2011_INPROCEEDINGS_PS_214957,
  AUTHOR          = {Picchi, E. and Sassolini, E.},
  TITLE           = {The "Micro Semantics" for intelligent browsing},
  CONFERENCE_NAME = {5th International Congress on "Science and Technology for the Safeguard of Cultural Heritage in the Mediterranean Basin"},
  YEAR            = {2011},
  VOLUME          = {4},
  PAGES           = {117-123},
  ISBN            = {978-88-905639-8-0},
  URL             = {https://iris.cnr.it/handle/20.500.14243/214957},
  KEYWORDS        = {Semantic Analysis, Information Retrieval, Text Mining},
  ABSTRACT        = {Study and development of methodologies to improve systems of "information retrieval". Our approach is based on the integration of techniques, originally created to disciplines such as philology, lexicography, literature, with linguistic and statistical tools for the extraction and analysis of information in the text. Also we experimented a special methodology, for the creation of specific semantic metadata for text materials. In this paper, we describe "SmartCity", a project in which we applied these strategies. The project aims at designing and developing multimedia content (audio-guide for the new generation of interactive media and off-line and on-line) for the use of custom-cultural tourist routes, both physical (in the context of museums and cities) and virtual},
}
@INPROCEEDINGS{PICCHI_2011_INPROCEEDINGS_PS_333710,
AUTHOR = {Picchi, E. and Sassolini, E.},
TITLE = {The "Micro Semantics" for intelligent browsing},
YEAR = {2011},
ABSTRACT = {Study and development of methodologies to improve systems of "information retrieval". Our approach is based on the integration of techniques, originally created to disciplines such as philology, lexicography, literature, with linguistic and statistical tools for the extraction and analysis of information in the text. Also we experimented a special methodology, for the creation of specific semantic metadata for text materials. In this paper, we describe "SmartCity", a project in which we applied these strategies. The project aims at designing and developing multimedia content (audio-guide for the new generation of interactive media and off-line and on-line) for the use of custom-cultural tourist routes, both physical (in the context of museums and cities) and virtual},
URL = {https://iris.cnr.it/handle/20.500.14243/333710},
ISBN = {978-88-905639-8-0},
}
@INPROCEEDINGS{RIGOLI_2011_INPROCEEDINGS_RFP_214968,
AUTHOR = {Rigoli, F. and Pavone, E. F. and Pezzulo, G.},
TITLE = {Interaction of goal-directed and pavlovian systems in aversive domains},
YEAR = {2011},
ABSTRACT = {Recent neuroscientific models of human behavior distinguish between different cognitive controllers: two instrumental systems (goal-directed and habitual) that maximize utility through learned actions, and a so-called Pavlovian system, which implements innate reactive responses. Although the interaction between instrumental and Pavlovian controllers has been suggested as a key process underlying emotional phenomena and surprising forms of misbehavior, few is known about it, especially in the sensorimotor aversive domain. With a combined experimental and computational approach, we study the interactions between instrumental (goal-directed) and Pavlovian processes in the aversive domain. First, we present a human experiment in which goal-directed and Pavlovian systems compete in order to control responses. The results indicate that Pavlovian processes can significantly interfere with goal-directed behavior. Second, we compare four alternative Bayesian models for their accuracy in modeling human performance. The results indicate a better fit for an architecture in which the Pavlovian controller can use both model-based and model-free features},
KEYWORDS = {Goal-directed system, Pavlovian system, Bayesian model, implicit classical conditioning},
PAGES = {3211-3216},
URL = {http://mindmodeling.org/cogsci2011/papers/0739/paper0739.pdf},
ISBN = {978-954-535-660-5},
CONFERENCE_NAME = {European Conference on Cognitive Science 2011 New Bulgarian University Sofia},
BOOKTITLE = {European Perspectives on Cognitive Science},
EDITOR = {Kokinov, B. and Karmiloff-Smith, A. and Nersessian, N. J.},
}
@INPROCEEDINGS{RUSSO_2011_INPROCEEDINGS_RCRBM_217960,
AUTHOR = {Russo, I. and Caselli, T. and Rubino, F. and Boldrini, E. and Martínez-Barco, P.},
TITLE = {EMOCause: An Easy-adaptable Approach to Extract Emotion Cause Contexts},
YEAR = {2011},
ABSTRACT = {In this paper we present a method to automatically identify linguistic contexts which contain possible causes of emotions or emotional states from Italian newspaper articles (La Repubblica Corpus). Our methodology is based on the interplay between relevant linguistic patterns and an incremental repository of common sense knowledge on emotional states and emotion eliciting situations. Our approach has been evaluated with respect to manually annotated data. The results obtained so far are satisfying and support the validity of the methodology proposed},
KEYWORDS = {sentiment analysis},
PAGES = {153--160},
URL = {https://iris.cnr.it/handle/20.500.14243/217960},
CONFERENCE_NAME = {2nd Workshop on Computational Approaches to Subjectivity and Sentiment Analysis},
}
@INPROCEEDINGS{SPADONI_2011_INPROCEEDINGS_STS_214332,
AUTHOR = {Spadoni, F. and Tariffi, F. and Sassolini, E.},
TITLE = {SMARTCITY: Innovative Technologies for customized and dynamic multimedia content production for Tourism applications},
YEAR = {2011},
ABSTRACT = {This paper presents the first results of the SMARTCITY project, co-funded by the Tuscany Region under the POR CREO 1.d program. The project proposes an innovative methodology as well as advanced technologies enabling professional services for cultural tourism applications in urban areas as well as larger archaeological sites},
KEYWORDS = {smartcity project, Tourism Applications, Dynamic Multimedia Content Production},
PAGES = {130--135},
URL = {https://iris.cnr.it/handle/20.500.14243/214332},
PUBLISHER = {Pitagora Editrice Bologna (Bologna, ITA)},
ISBN = {88-371-1837-6},
CONFERENCE_NAME = {EVA 2011 Florence Electronic Imaging and the Visual Arts},
CONFERENCE_PLACE = {Bologna},
EDITOR = {Cappellini, V.},
}
@INPROCEEDINGS{SPADONI_2011_INPROCEEDINGS_STSE_333475,
AUTHOR = {Spadoni, F. and Tariffi, F. and Sassolini, E.},
TITLE = {SMARTCITY: Innovative Technologies for customized and dynamic multimedia content production for Tourism applications},
YEAR = {2011},
ABSTRACT = {This paper presents the first results of the SMARTCITY project, co-funded by the Tuscany Region under the POR CREO 1.d program. The project proposes an innovative methodology as well as advanced technologies enabling professional services for cultural tourism applications in urban areas as well as larger archaeological sites},
URL = {https://iris.cnr.it/handle/20.500.14243/333475},
ISBN = {88-371-1837-6},
}
@INPROCEEDINGS{CUTUGNO_2011_INPROCEEDINGS_CCZRMZCA_277062,
AUTHOR = {Cutugno, P. and Cavioni, V. and Zanetti, M. A. and Renati, R. and Marconi, L. and Zini, V. and Chiarella, D. and Aloisio, V.},
TITLE = {Blog, identità virtuale, narrazione, analisi linguistica, adolescenza},
YEAR = {2011},
PAGES = {91},
URL = {https://iris.cnr.it/handle/20.500.14243/277062},
CONFERENCE_NAME = {CKGB Terzo Congresso Nazionale "Empowerment, Formazione e Tecnologie. L'individuo, il Gruppo e l'Organizzazione"},
}
@INPROCEEDINGS{MARZI_2011_INPROCEEDINGS_M_181884,
AUTHOR = {Marzi, C.},
TITLE = {Knowledge Communities in Grey},
YEAR = {2011},
ABSTRACT = {The dynamic nature of modern human social interactions, and the increasing capability of wireless and mobile devices for creating and sharing contents, open up the opportunity for a wide dissemination of information through complex knowledge sharing systems. The development of digital technologies and the continuous evolution of telecommunication networks are rapidly heading our society towards a culture of participation and to a more and more interactive communication. Adaptive networking protocols and data management systems are fostering pervasive information and communication environments. In this context, subject based communities offer the steadily increasing availability of ubiquitous accessible information. Networking communities, focussed on supporting relationships and content sharing, act at the same time as providers and users of all kind of grey literature materials in a highly distributed and collaborative scenario. Collaboration networks are thus becoming a key element in the advancement and dissemination of knowledge in scientific domains as well as in diverse aspects of everyday human life. In this sense, social media at best enhance new frontier ideas and highly innovative contents; they offer the enormous potential to transform research, and research results, into a knowledge co-creation process. As the shared knowledge components build cognitive ties, there is no real sharing of knowledge without a common understanding of it. Large amounts of structured information have to be managed, and generation and assimilation of knowledge have to be facilitated. The unlimited universe of data and information available on the web need to be identified, classified, analyzed, filtered, so as to enhance the generation and assimilation of new knowledge. Knowledge needs to be represented, standardized and distilled from multiple sources.
Tagging on a web scale provides a potentially useful source of metadata, and paves the way to automated post-processing services such as information retrieval, and acquisition of concepts from large document repositories. In other words it creates an environment conducive to knowledge transfer. In the full version, particular emphasis will be laid on technologies in natural language understanding and knowledge management for providing structured, intelligent access to the continuously evolving content generated on-line in a pervasive collaborative environment. In particular, the work will focus on exploring the interaction/synergy between different modes/tools for knowledge acquisition and representation: from highly structured, standardized and objective knowledge information systems based on ontological hierarchies and relations to more dynamic, subjective tools for volatile knowledge representation such as word clouds and concept maps. This approach will highlight current automated tools for concept acquisition and ontology learning that are conducive to an incremental approach to content access and management, to establish a fruitful bridge between modes of knowledge sharing/creation and dynamic, incremental approaches to automated knowledge acquisition and representation},
KEYWORDS = {Grey Literature, Web communities, Knowledge sharing, Concept Maps},
PAGES = {26--30},
URL = {https://iris.cnr.it/handle/20.500.14243/181884},
ISBN = {978-90-77484-00-5},
CONFERENCE_NAME = {Thirteenth International Conference on Grey Literature: The Grey circuit-From Social networking to Wealth Creation},
BOOKTITLE = {The Grey Circuit-From Social Networking to Wealth Creation},
EDITOR = {Farace, D. J. and Frantzen, J.},
}
@INPROCEEDINGS{MONTEMAGNI_2011_INPROCEEDINGS_MWDN_181899,
AUTHOR = {Montemagni, S. and Wieling, M. and De Jonge, B. and Nerbonne, J.},
TITLE = {Synchronic patterns of Tuscan phonetic variation and diachronic change: evidence from a dialectometric study},
YEAR = {2011},
ABSTRACT = {A careful investigation of synchronic patterns of linguistic variation with underlying linguistic features can lead to important insights into the comprehension of diachronic phonetic processes. Starting from the analysis of synchronic patterns of phonetic variation in Tuscany we tackled one of the main and most debated features of Tuscan dialects, the phenomenon of spirantization with a specific view to the so-called Tuscan "gorgia" (i.e. voiceless spirantization). In particular, we showed that the newly proposed method of spectral partitioning of bipartite graphs applied to synchronic dialectal data can effectively be used to investigate diachronic phonetic processes. From a careful analysis of the sound correspondences involving voiceless and voiced stops, we tracked the evolution of the spirantization phenomenon in several respects. First, we tracked spirantization geographically, across Tuscany from the influential center of Florence to the peripheral areas. Second, we tracked it phonologically, from voiceless to voiced stops, and within each voicing class from velars to dentals and then to bilabials. Finally, we tracked it demographically, with young speakers using the most innovative sound correspondences more than old speakers. The fact that these results are in line with the literature on the topic of Tuscan "gorgia" demonstrates the potential of the method of spectral partitioning of bipartite graphs with respect to the reconstruction of diachronic processes starting from diatopically distributed synchronic dialectal data},
KEYWORDS = {Dialectometry, Phonetic Variation, Tuscan Dialects},
PAGES = {120--121},
URL = {http://westernlinguistics.ca/methods14/files/all_abstracts_one_document.pdf},
CONFERENCE_NAME = {Fourteenth Methods in Dialectology Conference},
}
@INPROCEEDINGS{PARDELLI_2011_INPROCEEDINGS_PSG_218011,
AUTHOR = {Pardelli, G. and Sassi, M. and Goggi, S.},
TITLE = {Grey Literature Between Tradition and Innovation: Is there a Continuum?},
YEAR = {2011},
ABSTRACT = {This study wants to explore ways of social media communication for Grey Literature. In particular it describes the role of social media in relation with traditional channels and how social media applications can be used for Grey},
KEYWORDS = {Grey Literature, Communication networks, Knowledge networking, knowledge exchange},
PAGES = {64--65},
URL = {https://iris.cnr.it/handle/20.500.14243/218011},
ISBN = {978-90-77484-00-5},
CONFERENCE_NAME = {Thirteenth International Conference on Grey Literature: The Grey Circuit, From Social Networking to Wealth Creation},
EDITOR = {Farace, D. J. and Frantzen, J.},
}
@INPROCEEDINGS{QUOCHI_2011_INPROCEEDINGS_Q_225688,
AUTHOR = {Quochi, V.},
TITLE = {The development of Light-'do' Verb Constructions in Italian},
YEAR = {2011},
ABSTRACT = {This contribution presents the results of a study of the development of Light 'do' Verb Constructions in Italian based on naturalistic data. The claim is that there exists a Light Verb pivot schema that accounts for new productive formations and that this pattern is learnt by young children because it constitutes a labeling technique for naming new events, activities and situations. The findings of this research support two hypotheses of language acquisition. The results are based on analysis of longitudinal transcriptions of adult children interactions contained in the CHILDES databank (MacWhinney 2000)},
KEYWORDS = {child language, construction grammar, light verb constructions},
PAGES = {256--257},
URL = {http://sle2011.cilap.es/downloads/book_abstracts.pdf},
CONFERENCE_NAME = {SLE 2011-44TH ANNUAL MEETING},
BOOKTITLE = {SLE 2011-44TH ANNUAL MEETING BOOK OF ABSTRACT},
EDITOR = {Arista, J. M.},
}
@INPROCEEDINGS{TERRANOVA_2011_INPROCEEDINGS_TFCRDGRP_181897,
AUTHOR = {Terranova, G. and Ferro, M. and Carpeggiani, C. and Recchia, V. and Dodaro, A. and Gioffrè, D. and Richard, S. and Picano, E.},
TITLE = {Unreadability of current informed consent forms in cardiology-and how to improve it},
YEAR = {2011},
ABSTRACT = {Guidelines on informed consent for clinical practice and research trials recommend the use of standard plain language to enhance patient comprehension and to facilitate shared decision-making. Aim: To assess readability of our current informed consent forms used in cardiology},
KEYWORDS = {public health, health policy, informed consent, readability},
PAGES = {69--70},
URL = {http://spo.escardio.org/abstract-book/presentation.aspx?id=97162},
VOLUME = {32},
CONFERENCE_NAME = {European Society of Cardiology},
}
@TECHREPORT{ARRANZ_2011_TECHREPORT_ABBCCDFGMQRR_231385,
AUTHOR = {Arranz, V. and Bel, N. and Budin, G. and Caselli, T. and Choukri, K. and Del Gratta, R. and Frontini, F. and Goggi, S. and Monachini, M. and Quochi, V. and Rubino, F. and Russo, I.},
TITLE = {The FLaReNet Databook},
YEAR = {2011},
ABSTRACT = {The FLaReNet Databook is not only the collection of all the factual material collected during the activities of the project, but also a set of innovative initiatives and instruments that will remain in place for the continuous collection of such "facts". The purpose of the Databook is in fact, on one side, to consolidate the analyses carried out in the project and, at the same time, to set up the proper mechanisms that will enable the provision of a continuous stream of relevant factual material, also after the end of the project},
KEYWORDS = {Language Resources (LRs)},
PAGES = {1--8},
URL = {http://www.flarenet.eu/?q=FLaReNet_Databook},
}
@techreport{BARONI_2011_TECHREPORT_B_174805,
  author   = {Baroni, P.},
  title    = {FLaReNet Web Site End Users Guide-Editing of a Group Wiki Doc using FCKeditor},
  year     = {2011},
  abstract = {In this guide you will find most of the common tasks used in FCKeditor, the WYSIWYG (What You See Is What You Get) HTML text editor integrated in the Drupal CMS (Content Management System) to provide most of the commonly used functions from desktop editors like Word to the Web},
  keywords = {WYSIWYG HTML text editor},
  url      = {https://iris.cnr.it/handle/20.500.14243/174805},
}
@techreport{BARONI_2011_TECHREPORT_B_174113,
  author   = {Baroni, P.},
  title    = {ECP-2007-LANG-617001 FLaReNet: Financial Statement},
  year     = {2011},
  abstract = {Final financial statement of the FLaReNet project},
  keywords = {Financial Statement},
  url      = {https://iris.cnr.it/handle/20.500.14243/174113},
}
@techreport{BARONI_2011_TECHREPORT_B_177112,
  author   = {Baroni, P.},
  title    = {FLaReNet Web Statistics: 7th December 2008-31st August 2011},
  year     = {2011},
  abstract = {Statistics relating to the access to the FLaReNet Web site from 7th December 2008 to 31st August 2011},
  keywords = {Language Resources, Web Statistics},
  pages    = {15},
  url      = {https://iris.cnr.it/handle/20.500.14243/177112},
}
@techreport{BARONI_2011_TECHREPORT_B_177114,
  author   = {Baroni, P.},
  title    = {The FLaReNet Consortium and Network: 1st September 2008-31st August 2011},
  year     = {2011},
  abstract = {Some statistics relating to the Individual Subscribers, the Institutional Members and the National Contact Points of the FLaReNet network are reported and analysed},
  keywords = {Language Resources, Statistics},
  pages    = {12},
  url      = {https://iris.cnr.it/handle/20.500.14243/177114},
}
@TECHREPORT{BARONI_2011_TECHREPORT_BSC_174116,
AUTHOR = {Baroni, P. and Soria, C. and Calzolari, N.},
TITLE = {The FLaReNet Databook: http://www.flarenet.eu/?q=FLaReNet_Databook},
YEAR = {2011},
ABSTRACT = {A collection of all the factual material collected during the activities of the FLaReNet project and a set of innovative initiatives and instruments that will remain in place for the continuous collection of such "facts". Editors: Paola Baroni, Claudia Soria, Nicoletta Calzolari. Contributors: Victoria Arranz, Núria Bel, Gerhard Budin, Tommaso Caselli, Khalid Choukri, Riccardo Del Gratta, Elina Desypri, Gil Francopoulo, Francesca Frontini, Sara Goggi, Olivier Hamon, Erhard Hinrichs, Penny Labropoulou, Lothar Lemnitzer, Steven Krauwer, Valerie Mapelli, Joseph Mariani, Monica Monachini, Jan Odijk, Jungyeul Park, Stelios Piperidis, Adam Przepiorkowski, Valeria Quochi, Eva Revilla, Laurent Romary, Francesco Rubino, Irene Russo, Helmut Schmidt, Hans Uszkoreit, Peter Wittenburg},
KEYWORDS = {Language Resources},
URL = {http://www.flarenet.eu/?q=FLaReNet_Databook},
}
@TECHREPORT{BARONI_2011_TECHREPORT_BSC_183062,
AUTHOR = {Baroni, P. and Soria, C. and Calzolari, N.},
TITLE = {The FLaReNet Databook},
YEAR = {2011},
ABSTRACT = {A collection of all the factual material collected during the activities of the FLaReNet project and a set of innovative initiatives and instruments that will remain in place for the continuous collection of such "facts". Editors: Paola Baroni, Claudia Soria, Nicoletta Calzolari. Contributors: Victoria Arranz, Núria Bel, Gerhard Budin, Tommaso Caselli, Khalid Choukri, Riccardo Del Gratta, Elina Desypri, Gil Francopoulo, Francesca Frontini, Sara Goggi, Olivier Hamon, Erhard Hinrichs, Penny Labropoulou, Lothar Lemnitzer, Steven Krauwer, Valerie Mapelli, Joseph Mariani, Monica Monachini, Jan Odijk, Jungyeul Park, Stelios Piperidis, Adam Przepiorkowski, Valeria Quochi, Eva Revilla, Laurent Romary, Francesco Rubino, Irene Russo, Helmut Schmidt, Hans Uszkoreit, Peter Wittenburg},
KEYWORDS = {Language Resources, Language Technologies},
URL = {http://www.flarenet.eu/sites/default/files/FLaReNet_Databook.pdf},
}
@TECHREPORT{BARTOLINI_2011_TECHREPORT_BPHTPRTPB_183058,
AUTHOR = {Bartolini, R. and Poch, M. and Hamon, O. and Toral, A. and Prokopidis, P. and Rubino, F. and Thurmair, G. and Papavassiliou, V. and Bel, N.},
TITLE = {D3.3 Second version (v2) of the integrated platform and documentation},
YEAR = {2011},
ABSTRACT = {the integrated platform and documentation of panacea},
KEYWORDS = {platform},
URL = {https://iris.cnr.it/handle/20.500.14243/183058},
}
@TECHREPORT{BRIGUGLIO_2011_TECHREPORT_BGLTMCEFCBACVPLBSS_173561,
AUTHOR = {Briguglio, L. and Gordea, S. and Lindley, A. and Tzoannos, E. and Meghini, C. and Cardillo, F. A. and Esuli, A. and Falchi, F. and Ceccarelli, D. and Bolettieri, P. and Aloia, N. and Concordia, C. and Valdes, V. and Paytuvi, O. and Lazaridis, M. and Beloued, A. and Spyratos, N. and Sugibuchi, T.},
TITLE = {ASSETS-Interface specifications and system design},
YEAR = {2011},
ABSTRACT = {This internal document provides the following information regarding the Assets Services: the service description; the definition of the interfaces; the data models and data flows exchanged between services. It integrates results from both T2.0.4 "Platform design and implementation guidelines" and T2.0.5 "API Specifications". This documentation is the basis for the development activities, because identifies the components, their responsibilities and, a preliminary definition of data models and interfaces. Through the iteration, the data model models and interfaces will be refined and enriched with further details. In this perspective, this documentation could be considered the most important contribution for the next deliverable D2.0.4 "The ASSETS APIs", expected for month 12},
KEYWORDS = {Interfaces, System design},
URL = {https://iris.cnr.it/handle/20.500.14243/173561},
}
@techreport{CALZOLARI_2011_TECHREPORT_CBCMMOPQS_174181,
  author   = {Calzolari, N. and Bel, N. and Choukri, K. and Mariani, J. and Monachini, M. and Odijk, J. and Piperidis, S. and Quochi, V. and Soria, C.},
  title    = {Final FLaReNet deliverable: Language Resources for the Future-The Future of Language Resources},
  year     = {2011},
  abstract = {Language Technologies (LT), together with their backbone, Language Resources (LR), provide an essential support to the challenge of Multilingualism and ICT of the future. The main task of language technologies is to bridge language barriers and to help creating a new environment where information flows smoothly across frontiers and languages, no matter the country, and the language, of origin. To achieve this goal, all players involved need to act as a community able to join forces on a set of shared priorities. However, until now the field of Language Resources and Technology has long suffered from an excess of individuality and fragmentation, with a lack of coherence concerning the priorities for the field, the direction to move, not to mention a common timeframe. The context encountered by the FLaReNet project was thus represented by an active field needing a coherence that can only be given by sharing common priorities and endeavours. FLaReNet has contributed to the creation of this coherence by gathering a wide community of experts and making them participate in the definition of an exhaustive set of recommendations},
  keywords = {language resources and technologies, infrastructures},
  pages    = {97},
  url      = {https://iris.cnr.it/handle/20.500.14243/174181},
}
@TECHREPORT{CALZOLARI_2011_TECHREPORT_CQS_174758,
AUTHOR = {Calzolari, N. and Quochi, V. and Soria, C.},
TITLE = {FLaReNet Strategic Language Resource Agenda},
YEAR = {2011},
ABSTRACT = {Despite the complexity of handling its languages, the European Union has established that cultural and language differences are a unique asset to be preserved. Europe needs to find means-such as technological ones-to overcome the language barriers to support citizens and industry in a multilingual globalised world. The large majority of industrial technological applications that handle natural language, i.e. Machine Translation, Crosslingual Information Retrieval, Multilingual Information Extraction, Automatic Document Indexing, Question Answering, Natural Language Interfaces, etc., include Language Resources as critical components. Although Language Technologies may consist of language independent engines, they depend on the availability of language-dependent knowledge under the form of Language Resources for their real-life implementation. At the same time, it is proved that a critical mass of Language Resources can make advancement in research and technology development possible and quicker, making Europe the leader of the market related to multilingualism. Companies such as Google or Microsoft play a dominant role in this framework, as they have access to a huge amount of data in many different languages, devote considerable resources to Language Technologies, have massive computing power and a direct research-to-application pipeline using a new business model based on so-called "free" services. The fact that a US company like Google is delivering some of the most comprehensive Language Technology solutions to support multilingualism should raise concern among EU officials},
KEYWORDS = {Language resources, infrastructures},
PAGES = {23},
URL = {https://iris.cnr.it/handle/20.500.14243/174758},
}
@techreport{CALZOLARI_2011_TECHREPORT_CSBG_183063,
  author   = {Calzolari, N. and Soria, C. and Baroni, P. and Goggi, S.},
  title    = {ECP-2007-LANG-617001 FLaReNet: Final Report},
  year     = {2011},
  abstract = {Final report of the FLaReNet project},
  keywords = {Language Resources},
  url      = {http://www.flarenet.eu/sites/default/files/D1.15.pdf},
}
@techreport{CALZOLARI_2011_TECHREPORT_CSBCMOPB_183043,
  author   = {Calzolari, N. and Soria, C. and Bel, N. and Choukri, K. and Mariani, J. and Odijk, J. and Piperidis, S. and Baroni, P.},
  title    = {ECP-2007-LANG-617001 FLaReNet: Progress Report No. 5},
  year     = {2011},
  abstract = {Fifth semestrial report on the progress of the FLaReNet project},
  keywords = {Language Resources},
  url      = {https://iris.cnr.it/handle/20.500.14243/183043},
}
@techreport{CALZOLARI_2011_TECHREPORT_CSBCMOPBG_183065,
  author   = {Calzolari, N. and Soria, C. and Bel, N. and Choukri, K. and Mariani, J. and Odijk, J. and Piperidis, S. and Baroni, P. and Goggi, S.},
  title    = {ECP-2007-LANG-617001 FLaReNet: Progress Report No. 6},
  year     = {2011},
  abstract = {Sixth semestrial report on the progress of the FLaReNet project},
  keywords = {Language Resources},
  url      = {https://iris.cnr.it/handle/20.500.14243/183065},
}
@TECHREPORT{CHIARELLA_2011_TECHREPORT_C_174802,
AUTHOR = {Chiarella, D.},
TITLE = {Uno studio sullo standard 802.11: introduzione di una rete wifi nella rete dell'U.O.S. ILC di Genova},
YEAR = {2011},
ABSTRACT = {Il termine wireless riferito ad una comunicazione indica che il trasferimento di informazioni avviene senza l'utilizzo di conduttori elettrici o cavi; infatti in una rete wireless lo strumento di comunicazione utilizzato è l'aria. Per estensione tutti i dispositivi che utilizzano questa modalità di comunicazione vengono detti wireless. La comunicazione wireless può permettere di portare un servizio dove una comunicazione cablata risulterebbe impossibile da implementare, sia per quanto riguarda la fattibilità tecnica, sia per quanto riguarda i costi oppure può risultare molto utile nel caso la dinamicità del numero di utenti che utilizzano una rete sia molto alta e l'infrastruttura hardware sia sottodimensionata rispetto al numero degli utenti (i.e. le prese ethernet siano esigue rispetto al numero di computer da cablare). Uno dei casi più comuni che rientra nell'estrema dinamicità sono i giorni in cui viene ospitato in una struttura un evento (i.e. una conferenza) che porta con sé diversi visitatori che necessitano di una connessione ad Internet: in questo caso una soluzione ottima sia per trade-off di tempo di fattibilità sia per facilità d'uso per gli utenti è la creazione di una LAN wireless (WLAN). Per queste motivazioni, nell'ambito della ricerca applicata per l'innovazione del networking e della sicurezza dell'Unità Operativa Staccata di Genova dell'Istituto di Linguistica Computazionale, è stata introdotta all'interno della rete cablata preesistente una rete wireless. Il seguente rapporto tecnico tratta nel primo paragrafo della situazione preesistente della rete, nel secondo paragrafo cerca di dare un'esaustiva panoramica delle reti wireless e delle loro tecnologie, nel terzo paragrafo descrive le soluzioni tecniche prese in considerazione e le scelte fatte per la creazione della rete wireless ILC-WIFI},
KEYWORDS = {reti wireless, standard 802.11, WEP, WPA, WPA2},
URL = {https://iris.cnr.it/handle/20.500.14243/174802},
}
@TECHREPORT{CUCURULLO_2011_TECHREPORT_CS_174807,
AUTHOR = {Cucurullo, S. and Sassi, M.},
TITLE = {Archivio Elettronico delle Concordanze Diacroniche dell'Orlando Furioso},
YEAR = {2011},
ABSTRACT = {The project to build a digital electronic archiving of the concordances diachronic Orlando Furioso began in the '70s and had as its objective the study of a computational method for the treatment of variants. The basic text, provided by the "Accademia della Crusca", refers to the latest edition published in 1532 by the author, while the first 2 editions, published respectively in 1516 and in 1521, had not yet been the subject of electronic transcription. This has directed the staff of the project towards a reconstruction of the previous witnesses through accurate recording of the critical apparatus Debenedetti-Segre, 1960},
KEYWORDS = {DBT, Orlando Furioso, banca-dati testuale},
PAGES = {11},
URL = {https://iris.cnr.it/handle/20.500.14243/174807},
}
@techreport{DELGROSSO_2011_TECHREPORT_D_346852,
  author   = {Del Grosso, A. M.},
  title    = {The Web-Based System for the Management of Greek-Arabic Texts},
  year     = {2011},
  abstract = {The work carried out by the ILC-CNR unit in the first period of "Greek into Arabic" has been organized into three main activities, each one devoted to the development of a web-based framework for the study of and collaborative search on the pseudo-Theology of Aristotle and on its Greek sources},
  keywords = {Digital Philology, Digital Humanities},
  url      = {https://iris.cnr.it/handle/20.500.14243/346852},
}
@TECHREPORT{DESIPRI_2011_TECHREPORT_DGLPFMVMFD_174745,
AUTHOR = {Desipri, E. and Gavrilidou, M. and Labropoulou, P. and Piperidis, S. and Frontini, F. and Monachini, M. and Arranz, V. and Mapelli, V. and Francopoulo, G. and Declerck, T.},
TITLE = {Documentation and User Manual of the META-SHARE Metadata Model},
YEAR = {2011},
ABSTRACT = {The current deliverable presents the META-SHARE metadata schema v1.0, as implemented in the META-SHARE XSD's v1.0 released to (META-NET and PSP partners) in July 2011 for text corpora and lexical/conceptual resources and its supplement for audio corpora, tools and language descriptions (simplified/refactored version) as implemented in November. It is meant to act as a user manual, providing explanations on the model contents for LRs providers and LRs curators that wish to describe their resources in accordance to it. Work on the schema is ongoing and changes/updates to the model are constantly being made; where appropriate, some changes that are already under way are documented in this deliverable},
KEYWORDS = {Language resources, metadata, standards},
PAGES = {150},
URL = {https://iris.cnr.it/handle/20.500.14243/174745},
}
@techreport{MARIANI_2011_TECHREPORT_MBS_174118,
  author   = {Mariani, J. and Baroni, P. and Soria, C.},
  title    = {Feedback from Contact Points on National Initiatives in the Area of Language Resources},
  year     = {2011},
  abstract = {A survey of existing initiatives on language resources all over the world promoted by the FLaReNet WG7 and carried out with contributions from the 102 FLaReNet National Contact Points},
  keywords = {Language Resources},
  url      = {http://www.flarenet.eu/?q=Feedback_from_Contact_Points_on_National_Initiatives_in_the_Area_of_Language_Resources},
}
@TECHREPORT{MARZI_2011_TECHREPORT_M_183045,
AUTHOR = {Marzi, C.},
TITLE = {Understanding the Architecture of the Mental Lexicon: Integration of Existing Approaches},
YEAR = {2011},
ABSTRACT = {The 1st NetWordS Workshop, held on the 24th, 25th and 26th of November 2011 in the Research Area of the Italian National Research Council, brought together 37 participants (Scholars, Post-Docs, PhD students) from various European countries. Eighteen speakers, experts of various scientific domain and with different theoretical inclinations, discussed cross-disciplinary approaches to the Understanding of the Architecture of Mental Lexicon, reflecting the interdisciplinarity and synergy fostered by NetWordS, the European Research Networking Programme on Word Structure. The workshop was organised with the ambitious goal of paving the way towards a European interdisciplinary research agenda on the Mental Lexicon for the coming 10 years, with particular emphasis on the three main challenges that NetWordS is intended to address: Lexicon and Rules in the grammar; Word knowledge and word use; Words and meanings. Leading scholars, mostly connected through NetWordS, were invited to address three basic questions: What are, in the speaker's area of expertise, the most pressing open issues concerning the architecture of the Mental Lexicon? What and how can progress in other research areas contribute to addressing these issues? What can advancement in our understanding of these issues contribute to progress in other areas?},
KEYWORDS = {Mental Lexicon, Integration of existing approaches},
URL = {http://www.networds-esf.eu/index.php?page=1st-networds-workshop},
}
@TECHREPORT{MONACHINI_2011_TECHREPORT_MFS_174795,
AUTHOR = {Monachini, M. and Frontini, F. and Soria, C.},
TITLE = {KYOTO-LMF WordNet Representation Format},
YEAR = {2011},
ABSTRACT = {The format described in the following pages is the final revised proposal for representing wordnets inside the Kyoto project (henceforth "Kyoto-LMF wordnet format"). The reference model is Lexical Markup Framework (LMF), version 16, probably one of the most widely recognized standards for the representation of NLP lexicons. The goals of LMF are to provide a common model for the creation and use of such lexical resources, to manage the exchange of data between and among them, and to enable the merging of a large number of individual resources to form extensive global electronic resources. LMF was specifically designed to accommodate as many models of lexical representations as possible. Purposefully, it is designed as a meta-model, i.e. a high-level specification for lexical resources defining the structural constraints of a lexicon},
KEYWORDS = {Wordnets, LMF, ISO, Representation formats, standards},
PAGES = {32},
URL = {https://iris.cnr.it/handle/20.500.14243/174795},
}
@techreport{MONACHINI_2011_TECHREPORT_MQCBBCCFHKLMOPPRSUW_177116,
  author   = {Monachini, M. and Quochi, V. and Calzolari, N. and Bel, N. and Budin, G. and Caselli, T. and Choukri, K. and Francopoulo, G. and Hinrichs, E. and Krauwer, S. and Lemnitzer, L. and Mariani, J. and Odijk, J. and Piperidis, S. and Przepiorkowski, A. and Romary, L. and Schmidt, H. and Uszkoreit, H. and Wittenburg, P.},
  title    = {The Standards' Landscape Towards an Interoperability Framework},
  year     = {2011},
  abstract = {This document proposes an overview of the current scene towards an Interoperability Framework and acts as a reference point for the current standards that the community fosters and encourages to adopt/improve. This initiative is in close synchronization with other relevant initiatives such as CLARIN, ELRA, ISO and TEI and META-Share. The document builds on the CLARIN Standardisation Action Plan and adapts and extends it to the needs of the broader LT Community, beyond the SSH research areas including the industry. The main goal of this document is to give a practical orientation for various LT players, both commercial and academic; the main message being that a harmonized domain of language resources and technology can be achieved stepwise, but that an effort to adopt standards is necessary to overcome fragmentation. NB: This is to be intended by no means as a static, closed document, rather a dynamic one which needs to be constantly/periodically revised and updated by the community itself},
  keywords = {Standards, interoperability},
  pages    = {23},
  url      = {https://iris.cnr.it/handle/20.500.14243/177116},
}
@TECHREPORT{MONTEMAGNI_2011_TECHREPORT_MW_177115,
AUTHOR = {Montemagni, S. and Wieling, M.},
TITLE = {Definizione di un modello computazionale della variazione dialettale basato sull'integrazione di fattori socio-demografici e geografici},
YEAR = {2011},
ABSTRACT = {In this study, we used a mixed-effects logistic regression model in combination with generalized additive logistic modeling to predict lexical differences in Tuscan dialects with respect to standard Italian. We used lexical information for 170 concepts in 213 locations in Tuscany. Although geographical position is an important predictor with locations distant from Florence having lexical forms more likely to differ from standard Italian, several other factors emerged as significant. The model predicts that lexical variants used by older speakers and in smaller as well as poorer communities are more likely to differ from standard Italian. The impact of the demographic variables, however, varied from concept to concept. For a majority of concepts, smaller and poorer communities have lexical forms different from standard Italian. For a smaller minority of concepts, however, larger and richer communities have lexical forms different from standard Italian. Similarly, the effect of speaker age and the average community age also varied per concept. While not significant as a fixed effect, the concept frequency showed significant geographical variation. These results clearly identify important factors involved in dialect variation at the lexical level. In addition, this study illustrates the usefulness of mixed-effects regression techniques together with generalized additive modeling for analyzing lexical dialect data},
KEYWORDS = {Dialettologia toscana, Dialettometria, variazione lessicale},
URL = {https://iris.cnr.it/handle/20.500.14243/177115},
}
@TECHREPORT{PROKOPIDIS_2011_TECHREPORT_PPTPFRT_290521,
AUTHOR = {Prokopidis, P. and Papavassiliou, V. and Toral, A. and Poch Riera, M. and Frontini, F. and Rubino, F. and Thurmair, G.},
TITLE = {WP-4.4: Report on the revised Corpus Acquisition \& Annotation subsystem and its components},
YEAR = {2011},
KEYWORDS = {corpus acquisition, corpus annotation},
URL = {http://www.panacea-lr.eu/system/deliverables/PANACEA_D4.4.pdf},
}
@TECHREPORT{PROKOPIDIS_2011_TECHREPORT_PPTRFRT_290522,
AUTHOR = {Prokopidis, P. and Papavassiliou, V. and Toral, A. and Riera, M. P. and Frontini, F. and Rubino, F. and Thurmair, G.},
TITLE = {WP-4.5: Final Report on the Corpus Acquisition \& Annotation subsystem and its components},
YEAR = {2011},
KEYWORDS = {corpus acquisition, corpus annotation},
URL = {http://www.panacea-lr.eu/system/deliverables/PANACEA_D4.5.pdf},
}
@TECHREPORT{SASSOLINI_2011_TECHREPORT_SC_183039,
AUTHOR = {Sassolini, E. and Cinini, A.},
TITLE = {Metodologie di "thorough indexing" descrittivo, semantico e topologico delle risorse contenutistiche},
YEAR = {2011},
ABSTRACT = {D4 (deliverable) is the final result of task T2.1 of the SmartCity project. It analyzes the principles and methodologies of "Thorough indexing" of the text materials in order to define possible new rules for the application of a systematic approach to the tagging of the knowledge base},
KEYWORDS = {Term extraction, Analisi Semantica},
URL = {https://iris.cnr.it/handle/20.500.14243/183039},
}
@TECHREPORT{SASSOLINI_2011_TECHREPORT_SC_174755,
AUTHOR = {Sassolini, E. and Cinini, A.},
TITLE = {SmartCity-II relazione scientifica: report tecnico},
YEAR = {2011},
ABSTRACT = {This technical report presents the use of NLP techniques (text mining, text analysis) to develop specific tools for creating linguistic resources related to the cultural heritage domain, particularly "Empoli e dintorni"},
KEYWORDS = {Corpus (creation, annotation, etc.), Cultural Heritage},
URL = {https://iris.cnr.it/handle/20.500.14243/174755},
}
@TECHREPORT{SASSOLINI_2011_TECHREPORT_SS_174798,
AUTHOR = {Sassolini, E. and Stefano, S.},
TITLE = {Primo report tecnico: tecnologie per il trattamento delle informazioni multimediali. ILC-CNR e STRAT-CRIT},
YEAR = {2011},
ABSTRACT = {Technologies for semantic annotation, automatic classification, clustering and browsing in textual databases, for realization of a multimedia on-line press review},
KEYWORDS = {Information Extraction, Information Retrieval},
URL = {https://iris.cnr.it/handle/20.500.14243/174798},
}
@TECHREPORT{SORIA_2011_TECHREPORT_SC_174175,
AUTHOR = {Soria, C. and Calzolari, N.},
TITLE = {Project presentation-results},
YEAR = {2011},
ABSTRACT = {International cooperation and re-creation of a community are the most important drivers for a coherent evolution of the Language Resource (LR) area in the next years. FLaReNet has been a European forum to facilitate interaction among LR stakeholders and its structure took into account the fact that LRs present various dimensions and must be approached from many perspectives: technical, but also organisational, economic, legal, political. The Network addressed also multicultural and multilingual aspects, essential when facing access and use of digital content in today's Europe. FLaReNet consolidated existing knowledge, presenting it analytically and visibly, and contributed to structuring the area of LRs of the future by discussing new strategies to: convert existing and experimental technologies related to LRs into useful economic and societal benefits; integrate so far partial solutions into broader infrastructures; consolidate areas mature enough for recommendation of best practices; anticipate the needs of new types of LRs. The outcomes of FLaReNet have been of a directive nature, to help identify those priority areas of LRs of major interest for the public that need public funding to develop or improve. A blueprint of actions has constituted the input to policy development both at EU and national level for identifying new language policies that support linguistic diversity in Europe, in combination with strengthening the language product market, e. g. for new products and innovative services, especially for less technologically advanced languages},
KEYWORDS = {Language resources, infrastructures, international cooperation},
PAGES = {44},
URL = {https://iris.cnr.it/handle/20.500.14243/174175},
}
@TECHREPORT{SORIA_2011_TECHREPORT_SM_174177,
AUTHOR = {Soria, C. and Mariani, J.},
TITLE = {Report on Existing Projects and Initiatives},
YEAR = {2011},
ABSTRACT = {It is of utmost importance for a project such as T4ME to get a comprehensive and reliable overview of the projects and initiatives addressing similar topics, mainly in order to establish relationships, build on previous achievements, and get a reliable and up-to-date view of the current state of the art. This report surveys ongoing and recent projects and initiatives at the national, EU and transnational level addressing Machine Translation, multilingual issues, language resources and technologies, or infrastructural issues at large. Focus is on Europe but relevant initiatives outside Europe have been reviewed as well},
KEYWORDS = {language resources and technologies, infrastructures},
PAGES = {134},
URL = {http://www.meta-net.eu/public_documents/t4me/META-NET-D11.3-Final.pdf},
}
@TECHREPORT{VOSSEN_2011_TECHREPORT_VBRASADHMBF_174121,
AUTHOR = {Vossen, P. and Bosma, W. and Rigau, G. and Agirre, E. and Soroa, A. and Aliprandi, C. and De Jonge, J. and Hielkema, F. and Monachini, M. and Bartolini, R. and Frontini, F.},
TITLE = {KyotoCore: integrated system for knowledge mining from text},
YEAR = {2011},
ABSTRACT = {In this deliverable, we describe KyotoCore, an integrated system for applying text mining. We describe the software architecture of KyotoCore, the single modules and the process flows. Finally, we describe a use case where we apply the complete process to an English database on estuaries},
KEYWORDS = {Knowledge and text mining software},
PAGES = {56},
URL = {https://iris.cnr.it/handle/20.500.14243/174121},
}
@MISC{DELGROSSO_2011_MISC_D_370144,
AUTHOR = {Del Grosso, A. M.},
TITLE = {Moduli e componenti di Pinakes Text},
YEAR = {2011},
ABSTRACT = {Il contributo illustra i moduli dell'applicativo Pinakes Text implementati per il progetto ERC 2009 Advanced Grant n. 249431. Titolo: Greek into Arabic. Philosophical concepts and linguistic bridges},
KEYWORDS = {computational philology, digital philology, software engineering, greek into arabic, erc},
URL = {https://iris.cnr.it/handle/20.500.14243/370144},
}
@MISC{DELLORLETTA_2011_MISC_DM_217961,
AUTHOR = {Dell'Orletta, F. and Montemagni, S.},
TITLE = {Towards an NLP-based approach for measuring syntactic complexity: preliminary experiments with Italian texts from different registers},
YEAR = {2011},
ABSTRACT = {In this paper, we explore how NLP can be used to automatically identify relevant syntactic complexity features in texts with the aim of assessing their correlation with specific linguistic registers. Our final goal is twofold. On the one hand, we demonstrate that automatic morpho-syntactic and syntactic annotation of texts provides sufficiently accurate output for use in the automatic extraction and measurement of syntactic complexity features. On the other hand, we identify the set of syntactic features strongly correlating with considered linguistic registers},
KEYWORDS = {Language Variation, Natural Language Processing, Syntactic Complexity},
URL = {http://www.benszm.net/BSBWWS/Dellorletta_Montemagni.pdf},
CONFERENCE_NAME = {Workshop on "Cross-linguistic and language-internal variation in text and speech: focus on the joint analysis of multiple characteristics"},
}
@MISC{DIDONATO_2011_MISC_D_407974,
AUTHOR = {Di Donato, F.},
TITLE = {Dati pubblici aperti e collegati},
YEAR = {2011},
ABSTRACT = {presentazione al LinuxDay Pisa, Dipartimento di Informatica dell'Università di Pisa, 21 ottobre 2011},
URL = {https://iris.cnr.it/handle/20.500.14243/407974},
}
@MISC{DIDONATO_2011_MISC_D_406282,
AUTHOR = {Di Donato, F.},
TITLE = {Linked Open Data. Definizioni, esempi, esperienze pisane},
YEAR = {2011},
ABSTRACT = {presentazione al Festival Delle Libertà Digitali, Abbazia di San Zeno, Pisa, 7 ottobre 2011},
URL = {https://iris.cnr.it/handle/20.500.14243/406282},
}
@MISC{DIDONATO_2011_MISC_D_406274,
AUTHOR = {Di Donato, F.},
TITLE = {Lo stato trasparente. Il movimento per gli Open Government Data},
YEAR = {2011},
ABSTRACT = {presentazione al ciclo di seminari Krisis-Crisi, Dipartimento di Scienze politiche e sociali dell'Università di Pisa, Pisa, 12 maggio 2011},
URL = {https://iris.cnr.it/handle/20.500.14243/406274},
}
@MISC{FRONTINI_2011_MISC_FM_217962,
AUTHOR = {Frontini, F. and Monachini, M.},
TITLE = {Towards interfacing lexical and ontological resources},
YEAR = {2011},
ABSTRACT = {During the last two decades, the Computational Linguistics community has dedicated considerable effort to the research and development of Lexical Resources (LRs), especially Computational Lexicons. These LRs, even though belonging to different linguistic approaches and theories, share a common element; all of them contain, explicitly or implicitly, an ontology as the means of organizing their structure},
KEYWORDS = {language resources, ontologies},
PAGES = {26},
URL = {https://iris.cnr.it/handle/20.500.14243/217962},
CONFERENCE_NAME = {ONTOLOGIES AND LEXICAL SEMANTICS},
}
@MISC{GUADAGNINI_2011_MISC_G_241062,
AUTHOR = {Guadagnini, E.},
TITLE = {recensione a: Giulio Vaccaro, «Nun c'è lingua come la romana» Voci dell'antico dialetto romanesco},
YEAR = {2011},
URL = {https://iris.cnr.it/handle/20.500.14243/241062},
ISSN = {1826-8234},
}
@MISC{MONTEMAGNI_2011_MISC_M_218003,
AUTHOR = {Montemagni, S.},
TITLE = {Ontology Learning. An introduction},
YEAR = {2011},
ABSTRACT = {The tutorial is organised into two parts: PART 1 is devoted to providing the basic notions underlying Ontology Learning, in particular why it is needed, how it can be carried out and how its results can be evaluated. PART 2 discusses the topic of Ontology Learning in the Legal domain, with particular attention to the specific challenges posed by it. It also provides an overview of different feasibility studies carried out in the legal domain},
KEYWORDS = {Ontology Learning, Legal Information extraction, Natural Language Processing},
URL = {https://iris.cnr.it/handle/20.500.14243/218003},
CONFERENCE_NAME = {Summer School LEX 2011, Ravenna, Italy "Managing Legal Resources in the Semantic Web"},
}
@MISC{PEZZULO_2011_MISC_PB_182898,
AUTHOR = {Pezzulo, G. and Butz, M. V.},
TITLE = {Schema-based architectures of machine learning},
YEAR = {2011},
ABSTRACT = {Schema-based architectures (SBAs) consist of collections of modularly and hierarchically organized schemas, which constitute building blocks for perception, cognition, and action. An SBA organizes these schemas in such a way so that action selection, motor coordination, and cognition in the general sense interact effectively. SBAs were mainly inspired by theories of sensorimotor adaptation and cognitive development and learning. Particularly Jean Piaget's research on and theories of cognitive development in infants and children inspired the design of SBAs. Machine learning develops algorithms to learn, structure, and continuously adapt SBAs. Various forms of representations are used to develop SBAs, including symbolic representations, rule-based representations, as well as neural network representations},
KEYWORDS = {Human Cognitive Architecture},
PAGES = {2942-2945},
URL = {http://www.springerreference.com/docs/html/chapterdbid/319710.html},
PUBLISHER = {Springer (Dordrecht, NLD)},
CONFERENCE_PLACE = {Dordrecht},
EDITOR = {Seel, N. M.},
}
@MISC{PIRRELLI_2011_MISC_P_228505,
AUTHOR = {Pirrelli, V.},
TITLE = {ESF Research Networking Programme: "The European Network on Word Structure. Cross-disciplinary approaches to understanding word structure in the languages of Europe" (NetWordS)},
YEAR = {2011},
URL = {https://iris.cnr.it/handle/20.500.14243/228505},
}
@MISC{VBUTZ_2011_MISC_VP_175356,
AUTHOR = {Butz, M. V. and Pezzulo, G.},
TITLE = {Anticipatory learning},
YEAR = {2011},
ABSTRACT = {Anticipatory learning is sometimes considered synonymous with the general mechanism of learning to generate predictions or learning a predictive or forward model of an encountered environment or problem. However, the term anticipation usually does not simply refer to predictions, but rather to predictions that are expected to be relevant to an organism and that are used to effectively adapt decisions and behaviors of organisms. Therefore, anticipatory learning is not merely about learning to predict, but learning to predict those aspects that are relevant for the learning system. Such predictions may start on a very low sensorimotor level, such as learning how body movements feel in order to be able to focus on other sensory information. On a higher level, action-dependent contingencies may be learned that are highly useful for decision making},
KEYWORDS = {Curious learning, Ideo-motor principle of learning, Learning of predictions, Sensorimotor learning},
PAGES = {263-266},
URL = {http://www.springerreference.com/docs/html/chapterdbid/319709.html},
PUBLISHER = {Springer (Dordrecht, NLD)},
ISBN = {978-1-4419-1427-9},
CONFERENCE_PLACE = {Dordrecht},
}
@MISC{VENTURI_2011_MISC_V_108688,
AUTHOR = {Venturi, G.},
TITLE = {Tecnologie linguistico-computazionali per il monitoraggio della competenza linguistica italiana degli alunni stranieri nella scuola primaria e secondaria},
YEAR = {2011},
URL = {https://iris.cnr.it/handle/20.500.14243/108688},
CONFERENCE_NAME = {Migrazioni / Linguaggi, seminario (Roma, 30 marzo 2011)},
}
@ARTICLE{ARTALE_2010_ARTICLE_AGV_146444,
AUTHOR = {Artale, E. and Guadagnini, E. and Vaccaro, G.},
TITLE = {Per una bibliografia dei volgarizzamenti dei classici (il Corpus DiVo)},
YEAR = {2010},
ABSTRACT = {Viene presentato un primo spoglio bibliografico della bibliografia del Corpus DiVo (il corpus del Dizionario dei Volgarizzamenti, progetto nato nel 2009 all'Opera del Vocabolario Italiano per iniziativa di Elisa Guadagnini e Giulio Vaccaro), corpus che intende comprendere tutti i volgarizzamenti due e trecenteschi di testi latini (o greci) composti in epoca antica e tardoantica, fino a Boezio (che morì nel 525 d. C.). Vi sono inclusi testi tradotti in una qualunque varietà dell'italiano antico, eventualmente attraverso un tramite francese o appartenente ad una diversa varietà italoromanza. Sono state censite soltanto le traduzioni che propongono una resa volgare puntuale del testo latino, escludendo le compilazioni e le enciclopedie. Le schede bibliografiche sono ordinate alfabeticamente, con riferimento al campo "abbreviazione DiVo". La paternità delle schede è segnalata dalla sigla che occupa l'ultimo campo: si indica con [EA] Elena Artale, con [EG] Elisa Guadagnini, con [GV] Giulio Vaccaro},
KEYWORDS = {Volgarizzamenti, classici latini, vocabolari},
PAGES = {309-366},
URL = {https://iris.cnr.it/handle/20.500.14243/146444},
VOLUME = {15},
ISSN = {1591-8254},
JOURNAL = {BOLLETTINO-OPERA DEL VOCABOLARIO ITALIANO},
}
@ARTICLE{CALZOLARI_2010_ARTICLE_C_37720,
AUTHOR = {Calzolari, N.},
TITLE = {FLaReNet-META-NET-CLARIN. La presenza Italiana nei più importanti progetti strategici e infrastrutturali di TAL in Europa},
YEAR = {2010},
URL = {https://iris.cnr.it/handle/20.500.14243/37720},
}
@ARTICLE{CASTELFRANCHI_2010_ARTICLE_CPT_150097,
AUTHOR = {Castelfranchi, C. and Pezzulo, G. and Tummolini, L.},
TITLE = {Behavioral Implicit Communication (BIC): Communicating with smart environments via our practical behaviors and its traces},
YEAR = {2010},
ABSTRACT = {A crucial part of the intelligence that smart environments should display is a specific form of social intelligence: the ability to read human behavior and its traces in terms of the underlying intentions and assumptions. Such ability is crucial to enable human users to tacitly coordinate and negotiate with smart and proactive digital environments. In this paper, we argue that the necessary tool for this is behavioral and stigmergic implicit (i. e. non-conventional) communication. We present the basic theory of such a fundamental interactive means: the theory of Behavioral Implicit Communication (BIC)},
KEYWORDS = {Tacit communication, stigmergy, coordination, mindreading, ambient intelligence, mind-reading, communication},
PAGES = {1-12},
URL = {https://iris.cnr.it/handle/20.500.14243/150097},
VOLUME = {2},
}
@ARTICLE{DIDONATO_2010_ARTICLE_D_384155,
AUTHOR = {Di Donato, F.},
TITLE = {Le sfide dell'Open Access al sistema di comunicazione della scienza},
YEAR = {2010},
ABSTRACT = {Il movimento per l'accesso aperto alla letteratura scientifica ha avviato una campagna in favore della condivisione dell'informazione e della conoscenza nei primi anni novanta del secolo scorso, ma è tra il 2002 e il 2003 che l'Open Access ha cominciato a configurarsi in seno alla comunità accademica come un nuovo paradigma di pubblicazione. Risalgono infatti a quegli anni le due imponenti iniziative, la Budapest Open Access Initiative (2002) e la Conference on Open Access to Knowledge in the Sciences and Humanities (2003), che hanno siglato il riconoscimento internazionale del movimento per una letteratura scientifica Open Access, vale a dire letteratura digitale, on-line, gratuita e libera da alcune restrizioni dettate dalle licenze per i diritti di sfruttamento commerciale},
URL = {https://iris.cnr.it/handle/20.500.14243/384155},
ISSN = {1825-0327},
JOURNAL = {SIFP},
}
@ARTICLE{FERRO_2010_ARTICLE_FOPP_37718,
AUTHOR = {Ferro, M. and Ognibene, D. and Pezzulo, G. and Pirrelli, V.},
TITLE = {Reading as active sensing: a computational model of gaze planning in word recognition},
YEAR = {2010},
ABSTRACT = {We offer a computational model of gaze planning during reading that consists of two main components: a lexical representation network, acquiring lexical representations from input texts (a subset of the Italian CHILDES database), and a gaze planner, designed to recognize written words by mapping strings of characters onto lexical representations. The model implements an active sensing strategy that selects which characters of the input string are to be fixated, depending on the predictions dynamically made by the lexical representation network. We analyze the developmental trajectory of the system in performing the word recognition task as a function of both increasing lexical competence, and correspondingly increasing lexical prediction ability. We conclude by discussing how our approach can be scaled up in the context of an active sensing strategy applied to a robotic setting},
KEYWORDS = {Reading, Language Learning, Mental Lexicon},
PAGES = {1-16},
URL = {https://iris.cnr.it/handle/20.500.14243/37718},
VOLUME = {4},
ISSN = {1662-5218},
JOURNAL = {FRONTIERS IN NEUROROBOTICS},
}
@ARTICLE{FERRO_2010_ARTICLE_FPP_37719,
AUTHOR = {Ferro, M. and Pezzulo, G. and Pirrelli, V.},
TITLE = {Morphology, Memory and the Mental Lexicon},
YEAR = {2010},
ABSTRACT = {Recent experimental evidence on morphological learning and processing has prompted a less deterministic and modular view of the interaction between stored word knowledge and on-line processing. Storing a word in the mental lexicon does not simply entail keeping a faithful memory image of that word in the most compact way. It also requires encoding and manipulating such image through topological structures that are optimally adapted to word production and comprehension. Temporal Self-Organizing Maps (THSOMs) are a novel model of artificial neural network that keeps time serial information through predictive activation chains of receptors encoding both spatial and temporal information of input stimuli. The impact of this model on issues of lexical organization and morphological processing is investigated in detail through a series of simulations shedding light on the dynamics between short-term memory (activation), long-term memory (learning) and morphological organization of stored word forms (topology)},
KEYWORDS = {Morphology, Word Processing, Word Learning, Mental Lexicon},
PAGES = {203-242},
URL = {https://iris.cnr.it/handle/20.500.14243/37719},
VOLUME = {2},
ISSN = {1720-9331},
JOURNAL = {LINGUE E LINGUAGGIO},
}
@ARTICLE{FORNACIARI_2010_ARTICLE_FCF_433730,
AUTHOR = {Fornaciari, A. and Cignoni, L. and Fornaciari, G.},
TITLE = {STUDENTS' PARTICIPATION IN AN ARCHAEOANTHROPOLOGY COURSE USING A CONTENT AND LANGUAGE INTEGRATED LEARNING (CLIL) METHODOLOGY},
YEAR = {2010},
ABSTRACT = {In this paper we present the results of an ongoing archaeoanthropology project which was started in the year 2007 at Benabbio, a village located near Lucca, in northern Tuscany, Italy. Aim of the project is to exhume individuals buried in the medieval cemetery near the church of the Castle of Benabbio (also in course of excavation), and of people who died in the village during the cholera epidemic of the year 1855. Burials and artefacts, ranging between 12th and 19th centuries, have been recorded on a computer database to provide information about the cultural and physical aspects of this ancient human group. The discovery of some well preserved medieval houses led to the decision to examine the settlement in its entirety, exploring the spatial and chronological development of the site. Archaeological exploration of this vast area will involve not only the cemetery of the castle but also the houses and the manor, investigating the origins of the settlement and the early stages of encastlement, by which the local lord could dominate the surrounding countryside and control his neighbours. It will be possible to reconstruct the different phases of organization of the settlement and the life-style and diseases of the inhabitants of the castle. Furthermore, this project is an important testbed for the development of field techniques such as balloon photography, high-resolution georadar survey, GIS, as well as special laboratory techniques for palaeopathology such as computerized tomography (CT), electron microscopy (EM), stable isotope palaeonutrition and ancient DNA (aDNA), that can be used to diagnose ancient diseases. This paper has a dual purpose: on the one hand, it makes the first results of the excavations available to the widest possible audience; on the other hand, it describes the application of a CLIL methodology which uses a foreign language to study a specific discipline. 
In this case, English is used as supporting language to carry out a number of tasks on},
KEYWORDS = {archaeology},
PAGES = {2684-2692},
URL = {https://iris.cnr.it/handle/20.500.14243/433730},
VOLUME = {1},
}
@ARTICLE{FRANCESCONI_2010_ARTICLE_FMPT_50348,
AUTHOR = {Francesconi, E. and Montemagni, S. and Peters, W. and Tiscornia, D.},
TITLE = {Integrating a Bottom-Up and Top-Down Methodology for Building Semantic Resources for the Multilingual Legal Domain},
YEAR = {2010},
ABSTRACT = {This article presents a methodology for multilingual legal knowledge acquisition and modelling. It encompasses two complementary strategies. On the one hand, there is the top-down definition of the conceptual structure of the legal domain under consideration on the basis of expert judgment. This structure is language-independent, modeled as an ontology, and can be aligned with other ontologies that capture similar or complementary knowledge, in order to provide a wider conceptual embedding. Another top-down approach is the exploitation of the explicit structure of legal texts, which enables the targeted identification of text spans that play an ontological role and their subsequent inclusion in the knowledge model. On the other hand, the linguistically motivated, text-based bottom-up population and incremental refinement of this conceptual structure using (semi-)automatic NLP techniques, maximizes the completeness and domain-specificity of the resulting knowledge. The proposed methodology is concerned with the relation between these two differently derived types of knowledge, and defines a framework for interfacing lexical and ontological knowledge, the result of which offers various perspectives on multilingual legal knowledge. Two case-studies combining bottom-up and top-down methodologies for knowledge modelling and learning are presented as illustrations of the methodology},
KEYWORDS = {Knowledge Modelling, Knowledge Acquisition, Natural Language Processing, Ontology Learning},
PAGES = {95-121},
URL = {https://iris.cnr.it/handle/20.500.14243/50348},
VOLUME = {6036},
}
@ARTICLE{GUADAGNINI_2010_ARTICLE_G_275407,
AUTHOR = {Guadagnini, E.},
TITLE = {Scelta di voci del Tesoro della Lingua Italiana delle Origini (quattordicesima serie)},
YEAR = {2010},
ABSTRACT = {Voci forte (1) agg. /avv. /s. m., forte (2) s. m. /s. f., forte (3) s. m., forte (4) s. f. del Tesoro della Lingua Italiana delle Origini (95-131)},
KEYWORDS = {Lessico, Lessicografia, Lingua Italiana},
PAGES = {17-196},
URL = {https://iris.cnr.it/handle/20.500.14243/275407},
VOLUME = {15},
ISSN = {1591-8254},
JOURNAL = {BOLLETTINO-OPERA DEL VOCABOLARIO ITALIANO},
}
@ARTICLE{GUADAGNINI_2010_ARTICLE_G_269525,
AUTHOR = {Guadagnini, E.},
TITLE = {Voce LOCUZIONE s. f. del Tesoro della Lingua Italiana delle Origini},
YEAR = {2010},
KEYWORDS = {Lessico, Lessicografia, Lingua Italiana},
URL = {http://tlio.ovi.cnr.it/voci/024722.htm},
VOLUME = {14},
ISSN = {2240-5216},
JOURNAL = {TESORO DELLA LINGUA ITALIANA DELLE ORIGINI},
}
@ARTICLE{MARINELLI_2010_ARTICLE_MMTM_37716,
AUTHOR = {Marinelli, R. and Mazzocchi, F. and Tiberi, M. and Motta, M.},
TITLE = {Il modello semantico di EuroWordNet come strumento per la strutturazione della relazione associativa nei thesauri},
YEAR = {2010},
ABSTRACT = {Thesauri are tools which semantically organize a domain of knowledge for operational purposes. Their relational semantics is concerned with methods that connect terms with related meanings and it is important to support information retrieval, enhancing the information recall performance and contributing to improve precision. In fact, the network of relations of a thesaurus has an important semantic function, providing a representation of the meaning of each thesaurus term and a map of the conceptual structure of a subject area. The traditional thesaurus format – as described in international standards – includes the hierarchical, associative and equivalence relationships. However, a rather widespread opinion is that this format should be refined, in order to cope with the current needs of information organization. This paper discusses the possibility of refining the associative relation into a number of sub-kinds by adopting the semantic model of EuroWordNet (EWN), as it was used, according to one of its national versions, ItalWordNet (IWN), taking into account the terminological database Mariterm, which contains terms belonging to the maritime domain. It is also stressed how RT designation and refinement appear to be domain dependent, in the sense that they are associated with the specific features of a knowledge field},
KEYWORDS = {terminologia, thesauri, relazione associativa, risorse linguistiche, database semantico-lessicali},
PAGES = {249-263},
URL = {http://www.aib.it/aib/boll/2010/1003263.htm},
VOLUME = {50 (3)},
ISSN = {1121-1490},
JOURNAL = {BOLLETTINO AIB},
}
@ARTICLE{MARZI_2010_ARTICLE_MPS_37721,
AUTHOR = {Marzi, C. and Pardelli, G. and Sassi, M.},
TITLE = {Grey literature and computational linguistics: From paper to net},
YEAR = {2010},
ABSTRACT = {The advent and exponential development of the World Wide Web has led to an increasing availability of unstructured knowledge and distributed information sources, meeting general public requirements that are hardly addressed by other more traditional information channels. This trend has concurrently raised a considerable interest in the application of Computational Linguistics (CL) methodologies to document access and retrieval, as they offer the unprecedented opportunity to make the subjective, user-centred information demands of Net citizens meet the ever changing and heterogeneous information flow of the web. Over the last five years, more and more Italian Universities have introduced CL courses into their Humanities curricula, making available on-line teaching materials, tutorials and language engineering software that appear to supply the lack of offer from traditional Italian publishing houses. In this paper, we consider in some detail the role played by this type of Grey Literature in bringing up a wider and increasingly more aware community of web users in Italy},
KEYWORDS = {Grey Literature},
PAGES = {145-148},
URL = {http://www.scopus.com/record/display.url?eid=2-s2.0-78149461778\&origin=inward},
VOLUME = {6 (3)},
ISSN = {1574-1796},
JOURNAL = {THE GREY JOURNAL},
}
@ARTICLE{OGNIBENE_2010_ARTICLE_OPB_50347,
AUTHOR = {Ognibene, D. and Pezzulo, G. and Baldassarre, G.},
TITLE = {Learning to Look in Different Environments: An Active-Vision Model which Learns and Readapts Visual Routines},
YEAR = {2010},
ABSTRACT = {One of the main claims of the active vision framework is that finding data on the basis of task requirements is more efficient than reconstructing the whole scene by performing a complete visual scan. To be successful, this approach requires that agents learn visual routines to direct overt attention to locations with the information needed to accomplish the task. In ecological conditions, learning such visual routines is difficult due to the partial observability of the world, the changes in the environment, and the fact that learning signals might be indirect. This paper uses a reinforcement-learning actor-critic model to study how visual routines can be formed, and then adapted when the environment changes, in a system endowed with a controllable gaze and reaching capabilities. The tests of the model show that: (a) the autonomously developed visual routines are strongly dependent on the task and the statistical properties of the environment; (b) when the statistics of the environment change, the performance of the system remains rather stable thanks to the re-use of previously discovered visual routines while the visual exploration policy remains for long time sub-optimal. We conclude that the model has a robust behaviour but the acquisition of an optimal visual exploration policy is particularly hard given its complex dependence on statistical properties of the environment, showing another of the difficulties that adaptive active vision agents must face},
KEYWORDS = {adaptive vision, neural networks},
PAGES = {199-210},
URL = {https://iris.cnr.it/handle/20.500.14243/50347},
VOLUME = {6226},
}
@ARTICLE{PEZZULO_2010_ARTICLE_PBLB_50351,
AUTHOR = {Pezzulo, G. and Barca, L. and Lamberti Bocconi, A. and Borghi, A. M.},
TITLE = {When Affordances Climb into your Mind: Advantages of Motor Simulation in a Memory Task Performed by Novice and Expert Rock Climbers},
YEAR = {2010},
ABSTRACT = {Does the sight of multiple climbing holds laid along a path activate motor simulation of climbing that path? One way of testing whether multiple affordances and their displacement influence the formation of a motor simulation is to study acquired motor skills. We used a behavioral task in which expert and novice rock climbers were shown three routes: an easy route, a route impossible to climb but perceptually salient, and a difficult route. After a distraction task, they were then given a recall test in which they had to write down the sequence of holds composing each route. We found no difference between experts and novices on the easy and impossible routes, whereas on the difficult route, the performance of experts was better than that of novices. This suggests that seeing a climbing wall activates a motor, embodied simulation, which relies not on perceptual salience, but on motor competence. More importantly, our results show that the capability to form this simulation is modulated by individuals' motor repertoire and expertise, and that this strongly impacts recall},
KEYWORDS = {Simulation, Affordance, Embodied cognition, Grounded cognition, Canonical neurons, Mirror neurons, Motor memory, Memory for actions, Motor chunks},
PAGES = {68-73},
URL = {https://iris.cnr.it/handle/20.500.14243/50351},
VOLUME = {73},
DOI = {10.1016/j.bandc.2010.03.002},
ISSN = {0278-2626},
JOURNAL = {BRAIN AND COGNITION},
}
@ARTICLE{PROIETTI_2010_ARTICLE_PS_403986,
AUTHOR = {Proietti, C. and Sandu, G.},
TITLE = {Fitch's paradox and ceteris paribus modalities},
YEAR = {2010},
ABSTRACT = {The paper attempts to give a solution to the Fitch's paradox through the strategy of the reformulation of the paradox in temporal logic, and a notion of knowledge which is a kind of ceteris paribus modality. An analogous solution has been offered in a different context to solve the problem of metaphysical determinism},
KEYWORDS = {Verificationism, Modal logic, Knowability, Epistemic logic, Epistemology},
PAGES = {75-87},
URL = {https://iris.cnr.it/handle/20.500.14243/403986},
VOLUME = {173 (1)},
DOI = {10.1007/s11229-009-9677-7},
ISSN = {0039-7857},
JOURNAL = {SYNTHESE},
}
@ARTICLE{RUIMY_2010_ARTICLE_R_37717,
AUTHOR = {Ruimy, N.},
TITLE = {Simple\_PLUS: a network of lexical semantic relations / Simple\_PLUS: una red de relaciones léxico-semánticas},
YEAR = {2010},
ABSTRACT = {Este artículo trata de la base de datos léxico-semántica del italiano, Simple_PLUS, y particularmente de su núcleo central: la red de relaciones léxico-semánticas. Este recurso lexical tiene como base Parole-Simple-Clips, un léxico electrónico con cuatro niveles de descripción, elaborado según el modelo SIMPLE. Simple_PLUS se compone de 30.000 entradas semánticas, sean importadas del léxico fuente, sean recién creadas, todas dotadas de un amplio conjunto de información proporcionado por el modelo subyacente. En Simple_PLUS, aquella representación semántica fue enriquecida con una información relacional esencial, en un proceso semiautomático. Más de 5.000 lazos que relacionan los eventos con sus participantes y los co-participantes entre sí —vínculos que no podían ser descritos antes por falta de medios de representación adecuados— fueron codificados mediante un vocabulario descriptivo apropiado, que fue prestado del modelo EuroWordNet. Estos lazos conceptuales, que enriquecen la representación predicativa del léxico, aportan un conocimiento lexical imprescindible para las tareas de PLN y la Web semántica},
KEYWORDS = {Lexicon, lexical semantic relations, SIMPLE model, EuroWordNet model},
PAGES = {99-106},
URL = {http://www.sepln.org/?page_id=348},
VOLUME = {44},
ISSN = {1989-7553},
JOURNAL = {PROCESAMIENTO DEL LENGUAJE NATURAL},
}
@ARTICLE{TURINI_2010_ARTICLE_TBBFP_261434,
AUTHOR = {Turini, F. and Baglioni, M. and Bellandi, A. and Furletti, B. and Pratesi, C.},
TITLE = {Improving the business plan evaluation process: the role of intangibles},
YEAR = {2010},
ABSTRACT = {One of the main objectives of the European MUSING project is to design and test software tools in order to support the activities of small and medium sized businesses. In this paper we examine financial risk management and, more specifically, the self-assessment of business plans. The role of intangible assets is discussed, and we report on how intangible assets can be collected, how they can be represented, taking into account their semantic relationships, and how they can be used to build an analytical tool for business plans. The basic technology embedded in the tool is the construction of classification trees, a well-known technique in inductive learning. We show how using knowledge of intangible assets can improve the construction of the classifier, as proved by the testing carried out so far},
KEYWORDS = {Bayesian causal map, Classification trees, Intangible assets, Qualitative analysis},
PAGES = {35-50},
URL = {https://www.tandfonline.com/doi/abs/10.1080/16843703.2010.11673217},
VOLUME = {7 (1)},
DOI = {10.1080/16843703.2010.11673217},
ISSN = {1684-3703},
JOURNAL = {QUALITY TECHNOLOGY \& QUANTITATIVE MANAGEMENT},
}
@ARTICLE{TURINI_2010_ARTICLE_TBBFP_248691,
AUTHOR = {Turini, F. and Baglioni, M. and Bellandi, A. and Furletti, B. and Pratesi, C.},
TITLE = {Improving The BP Evaluation Process: The Role Of The Intangibles},
YEAR = {2010},
ABSTRACT = {One of the main objectives of the European MUSING project is to design and test software tools in order to support the activities of small and medium sized businesses. In this paper we examine financial risk management and, more specifically, the self-assessment of business plans. The role of intangible assets is discussed, and we report on how intangible assets can be collected, how they can be represented, taking into account their semantic relationships, and how they can be used to build an analytical tool for business plans. The basic technology embedded in the tool is the construction of classification trees, a well-known technique in inductive learning. We show how using knowledge of intangible assets can improve the construction of the classifier, as proved by the testing carried out so far},
URL = {https://iris.cnr.it/handle/20.500.14243/248691},
ISSN = {1684-3703},
JOURNAL = {QUALITY TECHNOLOGY \& QUANTITATIVE MANAGEMENT},
}
@BOOK{DIDONATO_2010_BOOK_D_384152,
AUTHOR = {Di Donato, F.},
TITLE = {Lo stato trasparente. Linked open data e cittadinanza attiva},
YEAR = {2010},
ABSTRACT = {Sapete quanta parte delle vostre tasse viene spesa per lo smaltimento dei rifiuti o per la ricerca sul cancro? Com'è l'aria che respirate nel tragitto da casa vostra al vostro posto di lavoro? O come vengono ripartiti i finanziamenti alla cultura nella vostra città? Un computer in rete può rispondere a questo e altro, se i dati che conserva e organizza sono strutturati in modo intelligente (Linked Data). Questo libro parla di tale possibilità nell'ambito delle istituzioni politiche e della pubblica amministrazione. Questa innovazione non tocca solo pochi specialisti, ma tutti, perché consente di ottenere informazioni in maniera più diretta e trasparente, rendendoci cittadini più consapevoli e dunque più liberi. L'autrice ricostruisce la storia di questa innovazione, promossa dalla dottrina Open Government dall'amministrazione Obama, che gradualmente si sta diffondendo nelle democrazie occidentali con un movimento che viene dal basso, prima che dall'iniziativa dei governi. Il libro spiega anche tecnicamente che cosa sono gli Open Government Data (OGD) e quali sono i requisiti giuridici e tecnici da rispettare affinché i dati possano essere definiti aperti. Un utile strumento per chi ha responsabilità pubbliche, perché anche la politica italiana scopra, affronti e attui quest'importante opportunità di cittadinanza},
URL = {https://iris.cnr.it/handle/20.500.14243/384152},
}
@BOOK{FERRO_2010_BOOK_F_256852,
AUTHOR = {Ferro, M.},
TITLE = {High Efficiency Real-Time Sensor and Actuator Control and Data Processing: A Framework Solution for Control Systems in Biomimetic Autonomous Robots},
YEAR = {2010},
URL = {https://iris.cnr.it/handle/20.500.14243/256852},
ISBN = {978-3-639-25356-6},
}
@BOOK{FRANCESCONI_2010_BOOK_FMPT_154374,
AUTHOR = {Francesconi, E. and Montemagni, S. and Peters, W. and Tiscornia, D.},
TITLE = {Semantic Processing of Legal Texts: Where the Language of Law Meets the Law of Language},
YEAR = {2010},
ABSTRACT = {The last few years have seen a growing body of research and practice addressing aspects such as automated legal reasoning and argumentation, semantic and cross-language legal information retrieval, document classification, legal drafting, legal knowledge discovery and extraction. This State-of-the-Art Survey contains invited contributions of leading researchers and groups eminently active in the field, which were complemented with selected papers from the Workshop on Semantic Processing of Legal Texts, held in Marrakech, Morocco, in 2008, within the framework of the Sixth International Conference on Language Resources and Evaluation (LREC 2008). These publications mirror the state-of-the-art in linguistic technologies, tools and resources focusing on the automatic extraction of relevant information from legal texts, and the structured organization of this extracted knowledge for legal knowledge representation and scholarly activity, with particular emphasis on the crucial role played by language resources and human language technologies. The contents are organized in three topical sections on information extraction; construction of knowledge resources; and semantic indexing, summarization and translation},
KEYWORDS = {Legal Text Processing, Ontology Learning, Information Extraction},
URL = {https://iris.cnr.it/handle/20.500.14243/154374},
}
@BOOK{NAHLI_2010_BOOK_N_222333,
AUTHOR = {Nahli, O.},
TITLE = {lingua araba, il sistema verbale},
YEAR = {2010},
ABSTRACT = {Questo volume offre una descrizione del verbo arabo, in una prospettiva prevalentemente didattica seguendo la struttura di pensiero e le categorie linguistiche proprie della tradizione grammaticale araba. Emerge e si chiarisce così la logica che domina l'articolato sistema verbale arabo e che funge da cardine nell'organizzazione della sintassi e di buona parte della morfologia nominale. Per di più, al termine del libro, è presente un capitolo dedicato alla "frase araba", ovvero alla "frase verbale" e alla "frase nominale" ed ai loro rispettivi elementi costitutivi},
PAGES = {140},
URL = {https://iris.cnr.it/handle/20.500.14243/222333},
ISBN = {9788867413003},
}
@INCOLLECTION{BOZZI_2010_INCOLLECTION_BS_134823,
AUTHOR = {Bozzi, A. and Sandrucci, V.},
TITLE = {Uno strumento al servizio dell'archiviazione, lo studio, l'edizione e l'interrogazione di documenti digitali},
YEAR = {2010},
KEYWORDS = {Computational Philology},
URL = {https://iris.cnr.it/handle/20.500.14243/134823},
PUBLISHER = {L'Harmattan (Paris, FRA)},
CONFERENCE_PLACE = {Paris},
}
@INCOLLECTION{CALZOLARI_2010_INCOLLECTION_CS_50346,
AUTHOR = {Calzolari, N. and Soria, C.},
TITLE = {Planning the Future of Language Resources: The Role of the FLaReNet Network},
YEAR = {2010},
ABSTRACT = {In this paper we analyse the role of Language Resources (LR) and Language Technologies (LT) in today Human Language Technology field and try to speculate on some of the priorities for the next years, from the particular perspective of the FLaReNet project, that has been asked to act as an observatory to assess current status of the field on Language Resources and Technology and to indicate priorities of action for the future},
KEYWORDS = {Language Resources and Technology, strategic initiatives, priorities},
PAGES = {1-11},
URL = {https://rdcu.be/dfs8V},
DOI = {10.1007/978-3-642-12116-6_1},
PUBLISHER = {Springer (Berlin, DEU)},
ISBN = {978-3-642-12116-6},
CONFERENCE_PLACE = {Berlin},
BOOKTITLE = {Computational Linguistics and Intelligent Text Processing. CICLing 2010},
EDITOR = {Gelbukh, A.},
}
@INCOLLECTION{JEZEK_2010_INCOLLECTION_JF_134822,
AUTHOR = {Jezek, E. and Frontini, F.},
TITLE = {From Pattern Dictionary to Patternbank},
YEAR = {2010},
KEYWORDS = {Ontology, Computational Semantics},
PAGES = {215-237},
URL = {https://iris.cnr.it/handle/20.500.14243/134822},
BOOKTITLE = {A Way with Words: Recent Advances in Lexical Theory and Analysis},
EDITOR = {De Schryver, G. M.},
}
@INCOLLECTION{MARINELLI_2010_INCOLLECTION_MSC_134818,
AUTHOR = {Marinelli, R. and Spadoni, G. and Cucurullo, S.},
TITLE = {Visual information to improve a lexical-semantic terminological resource},
YEAR = {2010},
ABSTRACT = {La base de datos léxico-semántica MariTerm contiene información estructurada sobre terminología especializada del dominio marítimo (navegación marítima y transporte). Este artículo describe las fases principales de un proyecto cuyo objetivo es aumentar la base de datos terminológica con un conjunto de imágenes: a) la estructura de la base de datos terminológica; b) el modelado conceptual del dominio; c) la herramienta de administración de la base de datos que, entre otras características, permite la visualización de la imagen asociada al término que se esté buscando, contribuyendo a aclarar el significado de dicho término y a incrementar su información y potencial de comunicación},
KEYWORDS = {terminology, computational resources, terminological databases, visual information},
PAGES = {493-500},
URL = {https://iris.cnr.it/handle/20.500.14243/134818},
ISBN = {978-84-8427-759-0},
BOOKTITLE = {Modos y formas de la comunicación humana / Ways and modes of human communication},
EDITOR = {Rodriguez, R. C. and Sanz, M. J. P.},
}
@INCOLLECTION{PIRRELLI_2010_INCOLLECTION_PGB_134819,
AUTHOR = {Pirrelli, V. and Guevara, E. and Baroni, M.},
TITLE = {Computational issues in compound processing},
YEAR = {2010},
ABSTRACT = {Understanding compounds is a challenging computational task, cutting across multiple levels of linguistic analysis and touching upon intricate issues of representation, grammar architecture and algorithmic processing. At the same time, compounds raise all these problems in the most direct and exemplar way. From this perspective, they are an ideal probe into core issues of language architecture, making us pause about the need for advanced processing models and multi-disciplinary approaches to long-lasting linguistic cruces. The paper reviews some of the lessons that can be learned from reading twenty years of computational literature on the topic and assesses them against the background of germane theoretical and cognitive issues},
KEYWORDS = {Morphology, Compounding, Natural Language Processing, Mental Lexicon},
PAGES = {271-285},
URL = {https://iris.cnr.it/handle/20.500.14243/134819},
PUBLISHER = {John Benjamins (Amsterdam, NLD)},
ISBN = {9789027248275},
CONFERENCE_PLACE = {Amsterdam},
BOOKTITLE = {Cross-disciplinary issues in compounding},
EDITOR = {Scalise, S. and Vogel, I.},
}
@INCOLLECTION{PROIETTI_2010_INCOLLECTION_P_404003,
AUTHOR = {Proietti, C.},
TITLE = {Carnap e il convenzionalismo semantico},
YEAR = {2010},
ABSTRACT = {La Sintassi logica del linguaggio (Carnap, 1934) rappresentava tra altre cose, nelle intenzioni di Carnap, una spiegazione ed una giustificazione, alla luce degli allora recenti risultati di Gödel, di un punto di vista convenzionalista riguardo ai fondamenti della matematica e del discorso scientifico in generale. L'immagine di convenzionalismo che ne risulta è molto complessa e, per diversi aspetti, di difficile interpretazione. Una prima parte di questo lavoro sarà dedicata all'elucidazione del problema dei fondamenti per come si presentava a Carnap al momento della stesura del suo lavoro, nonché all'analisi delle posizioni filosofiche che determinano il contenuto della Sintassi e, più determinatamente, la scelta dell'opzione metalinguistica. Il metalinguaggio rappresenta infatti, nella visione di Carnap, il corretto metodo della filosofia della scienza e, più in particolare, dell'analisi del problema dei fondamenti. Una seconda sezione sarà dedicata ad enucleare i motivi per cui l'atteggiamento convenzionalista si adatta al punto di vista di un empirista, quale era Carnap, nello spiegare la nozione di analiticità o necessità logico-matematica. Le basi e le ragioni della spiegazione di tale concetto da parte di un logico neo-empirista sono chiaramente molto diverse da quelle che avrebbe fornito un empirista tradizionale. L'ultima sezione mette a confronto la posizione di Carnap, per come si è venuta delineando, con la "refutazione", da parte di Gödel, del punto di vista fondazionale espresso dalla Sintassi e del convenzionalismo in generale. La refutazione è argomentata da Gödel proprio sulla base del significato filosofico dei suoi due celebri risultati metamatematici, ed è proprio sul terreno del metalinguaggio che si gioca il confronto possibile tra le motivazioni dei due},
KEYWORDS = {Carnap, convenzionalismo},
PAGES = {127-141},
URL = {https://iris.cnr.it/handle/20.500.14243/404003},
PUBLISHER = {ETS (Pisa, ITA)},
CONFERENCE_PLACE = {Pisa},
BOOKTITLE = {Quaderni della Ricerca},
EDITOR = {Belotti, L. and Paoletti, G.},
}
@INCOLLECTION{PROIETTI_2010_INCOLLECTION_P_403999,
AUTHOR = {Proietti, C.},
TITLE = {The Kerry-Frege debate about object and concept: some remarks about Kerry's position},
YEAR = {2010},
ABSTRACT = {The controversy between Kerry and Frege on object and concept went down in posterity after Frege's 1891 article Über Begriff und Gegenstand, even if Kerry's objections which sparked Frege's explanation are dated 1887 as they appeared in the IV article of his series Über Anschauung und ihre psychische Verarbeitung. In truth, a real debate between the two philosophers never took place because of Kerry's premature death in 1889. This meant that Kerry could not reply to Frege and above all he could not define the presuppositions of his own positions, thus leaving room for a number of possible exegetic suppositions which I will analyse in this paper},
KEYWORDS = {Benno Kerry, object and concept, Frege},
PAGES = {96-104},
URL = {https://iris.cnr.it/handle/20.500.14243/403999},
PUBLISHER = {ETS (Pisa, ITA)},
CONFERENCE_PLACE = {Pisa},
BOOKTITLE = {First Pisa Colloquium in Logic, Language and Epistemology},
EDITOR = {Marletti, C.},
}
@INCOLLECTION{RONZANO_2010_INCOLLECTION_RMMTC_169557,
AUTHOR = {Ronzano, F. and Monachini, M. and Marchetti, A. and Tesconi, M. and Calzolari, N.},
TITLE = {Bootstrapping and Collaboratively Enriching the Italian Domain WordNet through the WiKyoto Knowledge Editor},
YEAR = {2010},
ABSTRACT = {Enhancing the development of multilingual resources is of utmost importance for use in computer applications. The need of ever growing resources for effective multilingual content processing has given impulse to a radical change in the perspective of language resource (LR) creation, structuring, exploitation and maintenance. The Web has played a key role in this process: indeed the possibility to access growing amounts of structured and unstructured data as well as the ease of creating and sharing contents between distributed communities of users have strongly affected the methodologies and techniques to bootstrap, enrich and access LRs. From static knowledge bases usually created and maintained by groups of experts and tailored to the specific exploitation contexts, LRs have turned into dynamic repositories of linguistic knowledge. Their content is usually easily accessible over the Web and often exploited aggregated and optimized on-the-fly by on-line information mining services. In this context, the adoption of standardized data formats to facilitate interoperability and data exchange is essential. Moreover, the creation and maintenance of these resources has taken great advantage from the possibility to harvest Web data in order to bootstrap or enrich them. Several new frameworks have been proposed to support access, search, integration and interoperability of "new generation" LRs. Wide distributed communities of Web users are more and more directly or indirectly involved in keeping language resources updated or in extending them. After a brief description of modern LRs, we focus our attention on two essential issues involving them: the need for standard formats that support interoperability in a distributed Web context and the possibility for the Web communities to collaboratively maintain and enrich these resources. 
In particular, we present the Italian WordNet (IWN) and its exploitation in the context of the KYOTO Project, as a real-world scenario where standardization, interlinking, enrichment as well as collaborative editing are put into practice},
KEYWORDS = {NLP, collaborative editing, wordnet, knowledge representation, wiki},
PAGES = {181-208},
URL = {http://www.racai.ro/Multilinguality%20and%20Interoperability/TOC.html},
PUBLISHER = {Romanian Academy Publishing House (Bucharest, ROU)},
ISBN = {978-973-27-1972-5},
CONFERENCE_PLACE = {Bucharest},
BOOKTITLE = {Multilinguality and Interoperability in Language Processing with Emphasis on Romanian},
EDITOR = {Tufis, D. and Forascu, I.},
}
@INCOLLECTION{RUIMY_2010_INCOLLECTION_RBCN_134820,
AUTHOR = {Ruimy, N. and Bouillon, P. and Cartoni, B. and Namer, F.},
TITLE = {Construction (semi-)automatique d'un lexique sémantique du français: inférences interlinguistiques et morphologie},
YEAR = {2010},
ABSTRACT = {Nous décrivons deux méthodes complémentaires pour la dérivation semi-automatique d'un lexique du français, suivant le modèle du Lexique Génératif. La première méthode exploite la similitude entre les langues. Les informations lexicales françaises sont dérivées à partir d'un dictionnaire sémantique électronique de l'italien. À cet effet, nous combinons 2 stratégies: pour les mots construits, nous exploitons la cognacité de certains suffixes. Après avoir recherché dans un dictionnaire bilingue la traduction française du mot italien avec le suffixe français correspondant (ex.: costruzione → construction), nous générons l'entrée lexicale française en y transférant les informations sémantiques de l'entrée italienne; pour les mots non construits polysémiques (ex.: frazione [fraction, hameau]), nous utilisons les indicateurs de sens fournis dans les dictionnaires bilingues (pour frazione: (mat.); (centro abitato)) de manière à identifier, dans le lexique électronique italien, l'entrée lexicale appropriée qui donnera naissance à l'entrée du sens français équivalent. La seconde méthode fait appel aux principes de la morphologie constructionnelle du français et permet potentiellement de coder des mots construits dont les équivalents italiens ne figurent pas dans le lexique source. Ces mots nouveaux, extraits de corpus, sont soumis à l'analyseur dérivationnel DériF dont le résultat fournit une grande partie de l'information lexicale permettant la construction de nouvelles entrées françaises},
KEYWORDS = {Computational Lexicography, Computational Morphology},
PAGES = {71-88},
URL = {https://iris.cnr.it/handle/20.500.14243/134820},
PUBLISHER = {Presses de l'Université du Québec (Québec, CAN)},
ISBN = {978-2-7605-2569-6},
CONFERENCE_PLACE = {Québec},
BOOKTITLE = {Multilinguisme et traitement des langues naturelles},
EDITOR = {Biskri, I. and Jebali, A.},
}
@INCOLLECTION{VENTURI_2010_INCOLLECTION_V_50352,
AUTHOR = {Venturi, G.},
TITLE = {Legal Language and Legal Knowledge Management Applications},
YEAR = {2010},
ABSTRACT = {This work is an investigation into the peculiarities of legal language with respect to ordinary language. Based on the idea that a shallow parsing approach can help to provide enough detailed linguistic information, this work presents the results obtained by shallow parsing (i.e. chunking) corpora of Italian and English legal texts and comparing them with corpora of ordinary language. In particular, this paper puts the emphasis on how understanding the syntactic and lexical characteristics of this specialised language has practical importance in the development of domain-specific Knowledge Management applications},
KEYWORDS = {Parsing Legal Texts, Natural Language Processing, Legal Language, Knowledge Management Applications},
PAGES = {3-26},
URL = {https://iris.cnr.it/handle/20.500.14243/50352},
PUBLISHER = {Springer-Verlag (Berlin Heidelberg, DEU)},
ISBN = {3-642-12836-X},
CONFERENCE_PLACE = {Berlin Heidelberg},
BOOKTITLE = {Semantic Processing of Legal Texts. Where the Language of Law Meets the Law of Language},
EDITOR = {Francesconi, E. and Montemagni, S. and Peters, W.},
}
@EDITORIAL{CALZOLARI_2010_EDITORIAL_CBMS_134769,
AUTHOR = {Calzolari, N. and Baroni, P. and Monachini, M. and Soria, C.},
TITLE = {Proceedings of the 2nd European Language Resources and Technologies Forum: Language Resources of the future – the future of Language Resources},
YEAR = {2010},
ABSTRACT = {Proceedings of the second FLaReNet forum on the European Language Resources and Technologies, held in Barcelona, at the Institut d'Estudis Catalans, on 11-12 February 2010},
KEYWORDS = {Language Resources, Language Technologies, Future},
PAGES = {120},
URL = {http://www.flarenet.eu/sites/default/files/FLaReNet_Forum_2010_Proceedings.pdf},
}
@EDITORIAL{DIDONATO_2010_EDITORIAL_D_384157,
AUTHOR = {Di Donato, F.},
TITLE = {Open Access. Contro gli oligopoli nel sapere},
YEAR = {2010},
ABSTRACT = {Guédon illustra come si sono andate configurando le forme della competizione scientifica sul piano nazionale e internazionale. Le definizioni alla base della comunicazione scientifica mondiale dalla nascita dello Science Citation Index (SCI) fino ai nostri giorni, e il sistema di valutazione che ne è derivato, hanno portato nel sapere alla creazione di veri e propri oligopoli, che hanno condizionato e continuano a condizionare il sistema di potere in ambito scientifico. Inoltre, l'autore mostra come le alternative a SCI, proposte da grandi editori e oggi anche dai motori di ricerca, non siano sufficienti a correggere le distorsioni presenti nell'attuale sistema di comunicazione scientifica. Guédon indica piuttosto nell'Open Access una strada che, se esplorata a fondo, appare in grado di superare la divisione tra scienza centrale e scienza periferica — di per sé artificiosa — riportando la competizione scientifica su di un piano che valorizzi qualità ed eccellenza dei ricercatori, indipendentemente dalla loro provenienza geografica e culturale e dall'appartenenza istituzionale e linguistica},
KEYWORDS = {open access, comunicazione scientifica},
URL = {http://www.edizioniets.com/scheda.asp?n=9788846725172},
PUBLISHER = {Edizioni ETS (Pisa, ITA)},
CONFERENCE_PLACE = {Pisa},
}
@EDITORIAL{FRANCESCONI_2010_EDITORIAL_FMPT_223985,
AUTHOR = {Francesconi, E. and Montemagni, S. and Peters, W. and Tiscornia, D.},
TITLE = {Semantic Processing of Legal Texts: Where the Language of Law Meets the Law of Language},
YEAR = {2010},
ABSTRACT = {The last few years have seen a growing body of research and practice addressing aspects such as automated legal reasoning and argumentation, semantic and cross-language legal information retrieval, document classification, legal drafting, legal knowledge discovery and extraction. This State-of-the-Art Survey contains invited contributions of leading researchers and groups eminently active in the field, which were complemented with selected papers from the Workshop on Semantic Processing of Legal Texts, held in Marrakech, Morocco, in 2008, within the framework of the Sixth International Conference on Language Resources and Evaluation (LREC 2008). These publications mirror the state-of-the-art in linguistic technologies, tools and resources focusing on the automatic extraction of relevant information from legal texts, and the structured organization of this extracted knowledge for legal knowledge representation and scholarly activity, with particular emphasis on the crucial role played by language resources and human language technologies. The contents are organized in three topical sections on information extraction; construction of knowledge resources; and semantic indexing, summarization and translation},
PAGES = {249},
URL = {https://iris.cnr.it/handle/20.500.14243/223985},
ISBN = {978-3-642-12836-3},
}
@EDITORIAL{FRANCESCONI_2010_EDITORIAL_FMPW_134826,
AUTHOR = {Francesconi, E. and Montemagni, S. and Peters, W. and Wyner, A.},
TITLE = {Proceedings of the LREC 2010 Workshop on SEMANTIC PROCESSING OF LEGAL TEXTS (SPLeT-2010)},
YEAR = {2010},
KEYWORDS = {Legal Knowledge Extraction, Natural Language Processing},
URL = {https://iris.cnr.it/handle/20.500.14243/134826},
}
@EDITORIAL{FRANCESCONI_2010_EDITORIAL_FMRT_134825,
AUTHOR = {Francesconi, E. and Montemagni, S. and Rossi, P. and Tiscornia, D.},
TITLE = {Proceedings of the 4th Workshop on Legal Ontologies and Artificial Intelligence Techniques (LOAIT 2010)},
YEAR = {2010},
KEYWORDS = {Legal Ontologies, Ontology Learning, Legal Knowledge Extraction, Legal Knowledge Modelling},
URL = {https://iris.cnr.it/handle/20.500.14243/134825},
ISSN = {1613-0073},
}
@EDITORIAL{HUANG_2010_EDITORIAL_HCGLO_183246,
AUTHOR = {Huang, C. and Calzolari, N. and Gangemi, A. and Lenci, A. and Oltramari, A.},
TITLE = {Ontology and the lexicon: a natural language processing perspective},
YEAR = {2010},
URL = {https://iris.cnr.it/handle/20.500.14243/183246},
ISBN = {9780521886598},
}
@EDITORIAL{PIRRELLI_2010_EDITORIAL_P_250731,
AUTHOR = {Pirrelli, V.},
TITLE = {Interdisciplinary Approaches to Understanding Word Processing and Storage},
YEAR = {2010},
ABSTRACT = {The present collection of papers originates from a successful application to the European Science Foundation Exploratory Workshop Programme for the "Words in Action" workshop. The workshop, convened in Pisa on the 12th and 13th of October 2009, brought together experts of various scientific domains and theoretical inclinations to advance the current awareness of theoretical, typological, psycholinguistic, computational and neuro-physiological issues in word processing and storage, with a view to promoting novel methods of research and assessment for grammar architecture and language physiology},
PAGES = {91-240},
URL = {https://iris.cnr.it/handle/20.500.14243/250731},
PUBLISHER = {Societa Editrice il Mulino (Bologna, ITA)},
CONFERENCE_PLACE = {Bologna},
}
@EDITORIAL{DIDONATO_2010_EDITORIAL_D_384171,
AUTHOR = {Di Donato, F.},
TITLE = {L'Open Access tra centro e periferia della scienza},
YEAR = {2010},
ABSTRACT = {Prefazione alla traduzione di "Open Access: contro gli oligopoli nel sapere"},
URL = {https://iris.cnr.it/handle/20.500.14243/384171},
}
@INPROCEEDINGS{AGIRRE_2010_INPROCEEDINGS_ALFHTMVS_151404,
AUTHOR = {Agirre, E. and {Lopez de Lacalle}, O. and Fellbaum, C. and Hsieh, S. and Tesconi, M. and Monachini, M. and Vossen, P. and Segers, R.},
TITLE = {SemEval-2010 task 17: All-words word sense disambiguation on a specific domain},
YEAR = {2010},
ABSTRACT = {Domain portability and adaptation of NLP components and Word Sense Disambiguation systems present new challenges. The difficulties found by supervised systems to adapt might change the way we assess the strengths and weaknesses of supervised and knowledge-based WSD systems. Unfortunately, all existing evaluation datasets for specific domains are lexical-sample corpora. This task presented all-words datasets on the environment domain for WSD in four languages (Chinese, Dutch, English, Italian). 11 teams participated, with supervised and knowledge-based systems, mainly in the English dataset. The results show that in all languages the participants were able to beat the most frequent sense heuristic as estimated from general corpora. The most successful approaches used some sort of supervision in the form of hand-tagged examples from the domain},
KEYWORDS = {I.2.7 Natural Language Processing, Word Sense Disambiguation systems, Semantic Annotation, Word-sense disambiguation},
PAGES = {75-80},
URL = {https://iris.cnr.it/handle/20.500.14243/151404},
ISBN = {978-1-932432-70-1},
CONFERENCE_NAME = {ACL 2010-SemEval 2010: 5th International Workshop on Semantic Evaluation},
EDITOR = {Erk, K. and Strapparava, C.},
}
@INPROCEEDINGS{ATTARDI_2010_INPROCEEDINGS_ADDLMS_65145,
AUTHOR = {Attardi, G. and Dei Rossi, S. and Di Pietro, G. and Lenci, A. and Montemagni, S. and Simi, M.},
TITLE = {A Resource and Tool for Super-sense Tagging of Italian Texts},
YEAR = {2010},
KEYWORDS = {Corpus (creation, annotation, etc.), Tools, Systems, Applications, Statistical and machine learning methods},
URL = {https://iris.cnr.it/handle/20.500.14243/65145},
CONFERENCE_NAME = {Seventh International Conference on Language Resources and Evaluation},
}
@INPROCEEDINGS{ATTIA_2010_INPROCEEDINGS_ATTMV_65154,
AUTHOR = {Attia, M. and Toral, A. and Tounsi, L. and Monachini, M. and Van Genabith, J.},
TITLE = {An Automatically Built Named Entity Lexicon for Arabic},
YEAR = {2010},
ABSTRACT = {We have successfully adapted and extended the automatic Multilingual, Interoperable Named Entity Lexicon approach to Arabic, using Arabic WordNet (AWN) and Arabic Wikipedia (AWK). First, we extract AWN's instantiable nouns and identify the corresponding categories and hyponym subcategories in AWK. Then, we exploit Wikipedia inter-lingual links to locate correspondences between articles in ten different languages in order to identify Named Entities (NEs). We apply keyword search on AWK abstracts to provide for Arabic articles that do not have a correspondence in any of the other languages. In addition, we perform a post-processing step to fetch further NEs from AWK not reachable through AWN. Finally, we investigate diacritization using matching with geonames databases, MADA-TOKAN tools and different heuristics for restoring vowel marks of Arabic NEs. Using this methodology, we have extracted approximately 45,000 Arabic NEs and built, to the best of our knowledge, the largest Named Entity repository available},
KEYWORDS = {Acquisition, Lexicon, database, Named Entity recognition},
URL = {https://iris.cnr.it/handle/20.500.14243/65154},
ISBN = {2-9517408-6-7},
CONFERENCE_NAME = {Seventh International Conference on Language Resources and Evaluation},
}
@INPROCEEDINGS{BARCA_2010_INPROCEEDINGS_BPC_65147,
AUTHOR = {Barca, L. and Pezzulo, G. and Castelli, E.},
TITLE = {Egocentric and allocentric spatial references in children with Cerebral Palsy},
YEAR = {2010},
KEYWORDS = {cerebral palsy, spatial, egocentric, allocentric},
URL = {https://iris.cnr.it/handle/20.500.14243/65147},
CONFERENCE_NAME = {Cogsci 2010-annual meeting of the Cognitive Science Society},
}
@INPROCEEDINGS{BARDUCCI_2010_INPROCEEDINGS_BGLNPMPM_154604,
AUTHOR = {Barducci, A. and Guzzi, D. and Lastri, C. and Nardino, V. and Pippi, I. and Magnani, F. and Pieri, M. and Maselli, F.},
TITLE = {CHRIS/Proba-1 acquisitions on San Rossore test site for the ESA SEN3EXP campaign},
YEAR = {2010},
KEYWORDS = {CHRIS/Proba-1, San Rossore, ESA, SEN3EXP},
URL = {https://iris.cnr.it/handle/20.500.14243/154604},
CONFERENCE_NAME = {Hyperspectral Workshop 2010 from CHRIS/Proba to PRISMA \& EnMAP and beyond},
}
@INPROCEEDINGS{BELLANDI_2010_INPROCEEDINGS_BNTTZ_265112,
AUTHOR = {Bellandi, A. and Nasoni, S. and Tarini, D. and Tommasi, A. and Zavattari, C.},
TITLE = {Redada: Mining Knowledge out of Italian Business News Items},
YEAR = {2010},
ABSTRACT = {The paper describes Redada, a fully-implemented ontology-based relation extraction system that integrates classical NLP techniques with expert knowledge expressed by ontologies. Experimenting with the system for the task of supporting law enforcement and intelligence activities against money laundering and corruption, exploring information out of Italian newspapers to help in the identification of networks of activities, both legal and illegal, we evaluate the proposed system against a standard baseline approach, and we present our first results},
URL = {https://iris.cnr.it/handle/20.500.14243/265112},
}
@INPROCEEDINGS{BELLANDI_2010_INPROCEEDINGS_BNTZ_265111,
AUTHOR = {Bellandi, A. and Nasoni, S. and Tommasi, A. and Zavattari, C.},
TITLE = {Ontology-Driven Relation Extraction by Pattern Discovery},
YEAR = {2010},
ABSTRACT = {In this paper we describe an ontology-driven system that performs relation extraction over textual data. The system exploits expert knowledge of the domain, including lexical resources, in the form of an ontology to drive the extraction of patterns using manually annotated texts. Such patterns are then applied in order to identify candidates for relation extraction. Paired with basic, reliable named-entity-level text annotation, this results in the discovery of relations among entities in Italian newspaper articles. In the paper, we describe the system and measure its performance},
URL = {https://iris.cnr.it/handle/20.500.14243/265111},
}
@INPROCEEDINGS{BONIN_2010_INPROCEEDINGS_BDMV_65162,
AUTHOR = {Bonin, F. and Dell'Orletta, F. and Montemagni, S. and Venturi, G.},
TITLE = {A Contrastive Approach to Multi-word Extraction from Domain-specific Corpora},
YEAR = {2010},
ABSTRACT = {In this paper we present a novel approach to multi-word terminology extraction combining a well-known automatic term recognition approach, the C-NC value method, with a contrastive ranking technique, aimed at refining obtained results either by filtering noise due to common words or by discerning between semantically different types of terms within heterogeneous terminologies. The proposed methodology has been tested in two case studies carried out in the History of Art and Legal domains with promising results},
KEYWORDS = {Terminology Extraction, Domain-specific Corpora, Multi-word Expression},
PAGES = {3222-3229},
URL = {https://iris.cnr.it/handle/20.500.14243/65162},
ISBN = {2-9517408-6-7},
CONFERENCE_NAME = {Seventh International Conference on Language Resources and Evaluation},
}
@INPROCEEDINGS{BONIN_2010_INPROCEEDINGS_BDVM_65168,
AUTHOR = {Bonin, F. and Dell'Orletta, F. and Venturi, G. and Montemagni, S.},
TITLE = {Contrastive filtering of domain specific multi-word terms from different types of corpora},
YEAR = {2010},
ABSTRACT = {In this paper we tackle the challenging task of Multi-word term (MWT) extraction from different types of specialized corpora. Contrastive filtering of previously extracted MWTs results in a considerable increment of acquired domain-specific terms},
KEYWORDS = {multi-word terms extraction, co},
PAGES = {76-79},
URL = {https://iris.cnr.it/handle/20.500.14243/65168},
ISBN = {978-7-900268-00-6},
CONFERENCE_NAME = {The 23rd International Conference on Computational Linguistics (COLING 2010). Multiword Expressions: from Theory to Applications (MWE 2010)},
}
@INPROCEEDINGS{BOSCO_2010_INPROCEEDINGS_BMMDL_65165,
AUTHOR = {Bosco, C. and Montemagni, S. and Mazzei, A. and Dell'Orletta, F. and Lenci, A.},
TITLE = {Evalita'09 Parsing Task: comparing dependency parsers and treebanks},
YEAR = {2010},
KEYWORDS = {dependency parsing, dependency},
URL = {https://iris.cnr.it/handle/20.500.14243/65165},
CONFERENCE_NAME = {Evaluation of NLP and Speech Tools for Italian. EVALITA 2009},
}
@INPROCEEDINGS{BOSCO_2010_INPROCEEDINGS_BMMLDLLASLHNN_65156,
AUTHOR = {Bosco, C. and Montemagni, S. and Mazzei, A. and Lombardo, V. and Dell'Orletta, F. and Lenci, A. and Lesmo, L. and Attardi, G. and Simi, M. and Lavelli, A. and Hall, J. and Nilsson, J. and Nivre, J.},
TITLE = {Comparing the Influence of Different Treebank Annotations on Dependency Parsing},
YEAR = {2010},
KEYWORDS = {Parsing, Corpus (creation, annotation, etc.), Evaluation methodologies},
URL = {https://iris.cnr.it/handle/20.500.14243/65156},
CONFERENCE_NAME = {Seventh International Conference on Language Resources and Evaluation},
}
@INPROCEEDINGS{BOZZI_2010_INPROCEEDINGS_B_435682,
AUTHOR = {Bozzi, A.},
TITLE = {L'archiviazione, lo studio, l'edizione e l'interrogazione di documenti digitali: Pinakes Text},
YEAR = {2010},
KEYWORDS = {Filologia computazionale},
PAGES = {254},
URL = {https://iris.cnr.it/handle/20.500.14243/435682},
VOLUME = {3},
ISSN = {1825-8980},
ISBN = {9788864940205},
CONFERENCE_NAME = {Metodologie Informatiche per le Scienze Umane},
BOOKTITLE = {POLIS (ROMA)},
}
@INPROCEEDINGS{BUNT_2010_INPROCEEDINGS_BACCFHPPRSTL_65160,
AUTHOR = {Bunt, H. and Alexandersson, J. and Carletta, J. and Choe, J. and Fang, A. C. and Hasida, K. and Petukhova, V. and Popescu-Belis, A. and Romary, L. and Soria, C. and Traum, D. and Lee, K.},
TITLE = {Towards an ISO Standard for Dialogue Act Annotation},
YEAR = {2010},
ABSTRACT = {This paper describes an ISO project developing an international standard for annotating dialogue with semantic information, in particular concerning the communicative functions of the utterances, the kind of content they address, and the dependency relations to what was said and done earlier in the dialogue. The project, registered as ISO 24617-2 "Semantic annotation framework, Part 2: Dialogue acts", is currently at DIS stage},
KEYWORDS = {Dialogue, Corpus (creation, annotation, etc.), Semantics},
PAGES = {2548-2555},
URL = {https://iris.cnr.it/handle/20.500.14243/65160},
PUBLISHER = {European Language Resources Association (ELRA)-Evaluations and Language resources Distribution Agency (ELDA) (Paris, FRA)},
ISBN = {2-9517408-6-7},
CONFERENCE_NAME = {Seventh International Conference on Language Resources and Evaluation},
CONFERENCE_PLACE = {Paris},
BOOKTITLE = {Proceedings of the Seventh International Conference on Language Resources and Evaluation (LREC'10)},
EDITOR = {Calzolari, N. and Choukri, K. and Maegaard, B. and Mariani, J. and Odijk, J. and Piperidis, S. and Rosner, M. and Tapias, D.},
}
@INPROCEEDINGS{CALZOLARI_2010_INPROCEEDINGS_CS_65159,
AUTHOR = {Calzolari, N. and Soria, C.},
TITLE = {Preparing the field for an Open Resource Infrastructure: the role of the FLaReNet Network of Excellence},
YEAR = {2010},
ABSTRACT = {In order to overcome the fragmentation that affects the field of Language Resources and Technologies, an Open and Distributed Resource Infrastructure is the necessary step for building on each other achievements, integrating resources and technologies and avoiding dispersed or conflicting efforts. Since this endeavour represents a true cultural turnpoint in the LRs field, it needs a careful preparation, both in terms of acceptance by the community and thoughtful investigation of the various technical, organisational and practical aspects implied. To achieve this, we need to act as a community able to join forces on a set of shared priorities and we need to act at a worldwide level. FLaReNet-Fostering Language Resources Network-is a Thematic Network funded under the EU eContent program that aims at developing the needed common vision and fostering a European and International strategy for consolidating the sector, thus enhancing competitiveness at EU level and worldwide. In this paper we present the activities undertaken by FLaReNet in order to prepare and support the establishment of such an Infrastructure, which is becoming now a reality within the new MetaNet initiative},
KEYWORDS = {LR Infrastructures and Architectures, LR national/international projects, organizational/policy issues},
PAGES = {1295-1300},
URL = {https://iris.cnr.it/handle/20.500.14243/65159},
PUBLISHER = {European Language Resources Association (ELRA)-Evaluations and Language resources Distribution Agency (ELDA) (Paris, FRA)},
ISBN = {2-9517408-6-7},
CONFERENCE_NAME = {Seventh International Conference on Language Resources and Evaluation},
CONFERENCE_PLACE = {Paris},
BOOKTITLE = {Proceedings of the Seventh International Conference on Language Resources and Evaluation (LREC'10)},
EDITOR = {Calzolari, N. and Choukri, K. and Maegaard, B. and Mariani, J. and Odijk, J. and Piperidis, S. and Rosner, M. and Tapias, D.},
}
@INPROCEEDINGS{CALZOLARI_2010_INPROCEEDINGS_CSDGQRCMP_65174,
AUTHOR = {Calzolari, N. and Soria, C. and Del Gratta, R. and Goggi, S. and Quochi, V. and Russo, I. and Choukri, K. and Mariani, J. and Piperidis, S.},
TITLE = {The LREC Map of Language Resources and Technologies},
YEAR = {2010},
ABSTRACT = {In this paper we present the LREC Map of Language Resources (data and tools), an innovative feature introduced in conjunction with the LREC 2010 Conference. The purpose of the Map is to shed light on the vast amount of resources that represent the background of the research presented at LREC, in the attempt to fill in a gap in the community knowledge about the resources that are used or created worldwide. It also aims at a change of culture in the field, actively engaging each researcher in the documentation task about resources. The Map has been developed on the basis of the information provided by LREC authors during the submission of papers to the LREC 2010 conference and the LREC workshops, and contains information about almost 2000 resources. The paper illustrates the motivation behind this initiative, its main characteristics, its relevance and future impact in the field, the metadata used to describe the resources, and finally presents some of the most relevant findings},
KEYWORDS = {LR national/international projects, organizational/policy issues},
PAGES = {949-956},
URL = {http://www.lrec-conf.org/proceedings/lrec2010/index.html},
PUBLISHER = {European Language Resources Association (ELRA)-Evaluations and Language resources Distribution Agency (ELDA) (Paris, FRA)},
ISBN = {2-9517408-6-7},
CONFERENCE_NAME = {LREC 2010 Seventh International Conference on Language Resources and Evaluation},
CONFERENCE_PLACE = {Paris},
BOOKTITLE = {LREC'10-Seventh International Conference on Language Resources and Evaluation. Proceedings},
EDITOR = {Calzolari, N. and Choukri, K. and Maegaard, B. and Mariani, J. and Odijk, J. and Piperidis, S. and Rosner, M. and Tapias, D.},
}
@INPROCEEDINGS{CASELLI_2010_INPROCEEDINGS_CP_65136,
AUTHOR = {Caselli, T. and Prodanof, I.},
TITLE = {Annotating Event Anaphora: A Case Study},
YEAR = {2010},
KEYWORDS = {Anaphora, Coreference, Corpus (creation, annotation, etc.), Semantics},
URL = {https://iris.cnr.it/handle/20.500.14243/65136},
CONFERENCE_NAME = {Seventh International Conference on Language Resources and Evaluation},
}
@INPROCEEDINGS{CIERI_2010_INPROCEEDINGS_CCCLLPIP_65155,
AUTHOR = {Cieri, C. and Choukri, K. and Calzolari, N. and Langendoen, D. T. and Leveling, J. and Palmer, M. and Ide, N. and Pustejovsky, J.},
TITLE = {A Road Map for Interoperable Language Resource Metadata},
YEAR = {2010},
ABSTRACT = {LRs remain expensive to create and thus rare relative to demand across languages and technology types. The accidental re-creation of an LR that already exists is a nearly unforgiveable waste of scarce resources that is unfortunately not so easy to avoid. The number of catalogs the HLT researcher must search, with their different formats, make it possible to overlook an existing resource. This paper sketches the sources of this problem and outlines a proposal to rectify along with a new vision of LR cataloging that will facilitate the documentation and exploitation of a much wider range of LRs than previously considered},
URL = {https://iris.cnr.it/handle/20.500.14243/65155},
ISBN = {2-9517408-6-7},
}
@INPROCEEDINGS{DELGRATTA_2010_INPROCEEDINGS_DDBCEMQSTC_65149,
AUTHOR = {Del Gratta, R. and D'Onofrio, L. and Bartolini, R. and Caselli, T. and Enea, A. and Monachini, M. and Quochi, V. and Soria, C. and Toral, A. and Calzolari, N.},
TITLE = {A Web-based Architecture for Interoperability of Lexical Resources},
YEAR = {2010},
ABSTRACT = {In this paper we present a Web Service Architecture for managing high level interoperability of Language Resources (LRs) by means of a Service Oriented Architecture (SOA) and the use of ISO standards, such as ISO LMF. We propose a layered architecture which separates the management of legacy resources (data collection) from data aggregation (workflow) and data access (user requests). We provide a case study to demonstrate how the proposed architecture is capable of managing data exchange among different lexical services in a coherent way and show how the use of a lexical standard becomes of primary importance when a protocol of interoperability is defined},
KEYWORDS = {Interoperability, Web services, Lexical resources},
PAGES = {53-62},
URL = {http://weblab.iit.cnr.it/kyoto/www2.let.vu.nl/twiki/pub/Kyoto/Publications/icgl2010_DOnofrioetal.pdf},
PUBLISHER = {City university of Hong Kong press (Hong Kong, CHN)},
ISBN = {978-962-442-323-5},
CONFERENCE_NAME = {2nd International Conference on Global Interoperability for Language Resources},
CONFERENCE_PLACE = {Hong Kong},
BOOKTITLE = {2nd International Conference on Global Interoperability for Language Resources, ICGL 2010},
EDITOR = {Fang, A. C. and Ide, N. and Webster, J.},
}
@INPROCEEDINGS{FORNACIARI_2010_INPROCEEDINGS_FCF_716,
AUTHOR = {Fornaciari, A. and Cignoni, L. and Fornaciari, G.},
TITLE = {Students' Participation in an Archaeoanthropology Course Using a Content and Language Integrated Learning (CLIL) Methodology},
YEAR = {2010},
ABSTRACT = {In this paper we present the results of an ongoing archaeoanthropology project which was started in the year 2007 at Benabbio, a village located near Lucca, in northern Tuscany, Italy. Aim of the project is to exhume individuals buried in the medieval cemetery near the church of the Castle of Benabbio (also in course of excavation), and of people who died in the village during the cholera epidemic of the year 1855. Burials and artefacts, ranging between 12th and 19th centuries, have been recorded on a computer database to provide information about the cultural and physical aspects of this ancient human group. The discovery of some well preserved medieval houses led to the decision to examine the settlement in its entirety, exploring the spatial and chronological development of the site. Archaeological exploration of this vast area will involve not only the cemetery of the castle but also the houses and the manor, investigating the origins of the settlement and the early stages of encastlement, by which the local lord could dominate the surrounding countryside and control his neighbours. It will be possible to reconstruct the different phases of organization of the settlement and the life-style and diseases of the inhabitants of the castle. Furthermore, this project is an important testbed for the development of field techniques such as balloon photography, high-resolution georadar survey, GIS, as well as special laboratory techniques for palaeopathology such as computerized tomography (CT), electron microscopy (EM), stable isotope palaeonutrition and ancient DNA (aDNA), that can be used to diagnose ancient diseases. This paper has a dual purpose: on the one hand, it makes the first results of the excavations available to the widest possible audience; on the other hand, it describes the application of a CLIL methodology which uses a foreign language to study a specific discipline. 
In this case, English is used as supporting language to carry out a number of tasks on the archaeological site, within an environment of interaction where the peers, the archaeologist, the content and language teachers are working in collaboration. The language is embedded within the activities, in particular two separate groups of students will be working on the two different sites (the cemetery and the residential complex), communicating in English with students graduating in the same discipline in Great Britain and the United States. The two groups will be asked to keep a running diary of the daily activities, and to document this information, using the blogging features of Office Word, a familiar device offering a wide range of writing tools that can help create an ongoing online record of their experiences. The project, organized and funded by the Division of Palaeopathology of Pisa University, has been approved by the Faculty of Humanities of the University of Pisa},
PAGES = {2684-2692},
URL = {https://iris.cnr.it/handle/20.500.14243/716},
ISBN = {978-84-613-5536-5},
CONFERENCE_NAME = {International Technology, Education and Development Conference},
BOOKTITLE = {Proceedings of International Technology, Education and Development Conference},
EDITOR = {Chova, L. G. and Belenguer, D. M. and Torres, I. C.},
}
@INPROCEEDINGS{GIGLIOTTA_2010_INPROCEEDINGS_GPN_50350,
AUTHOR = {Gigliotta, O. and Pezzulo, G. and Nolfi, S.},
TITLE = {Emergence of an internal model in evolving robots subjected to sensory deprivation},
YEAR = {2010},
ABSTRACT = {In this study we show how simulated robots evolved to display navigation skills can spontaneously develop an internal model and rely on it to complete their task when sensory stimulation is temporarily unavailable. The analysis of some of the best evolved agents indicates that their internal model operates by anticipating functional properties of the next sensory state rather than the exact state that sensors would have assumed. The characteristics of the states that are anticipated and of the sensory-motor rules that determine how the agents react to the experienced states, however, ensure that the agents produce very similar behaviour during normal and blind phases in which sensory stimulation is available or is self-generated by the agent itself, respectively. The characteristics of the agents' internal models also ensure an effective transition during the phases in which agents' internal dynamics is decoupled and re-coupled with the sensory-motor flow},
KEYWORDS = {internal model, neural networks, evolutionary robotics},
PAGES = {575-586},
URL = {https://iris.cnr.it/handle/20.500.14243/50350},
VOLUME = {6226},
DOI = {10.1007/978-3-642-15193-4_54},
ISBN = {978-3-642-15193-4},
CONFERENCE_NAME = {11th International Conference on Simulation of Adaptive Behavior, SAB 2010},
BOOKTITLE = {From Animals to Animats 11},
}
@INPROCEEDINGS{GIOVANNETTI_2010_INPROCEEDINGS_G_65164,
AUTHOR = {Giovannetti, E.},
TITLE = {An unsupervised approach for semantic relation interpretation},
YEAR = {2010},
ABSTRACT = {In this work we propose a hybrid unsupervised approach for semantic relation extraction from Italian and English texts. The system takes as input pairs of "distributionally similar" terms, possibly involved in a semantic relation. To validate and label the anonymous relations holding between the terms in input, the candidate pairs of terms are looked for on the Web in the context of reliable lexico-syntactic patterns. This paper focuses on the definition of the patterns, on the measures used to assess the reliability of the suggested specific semantic relation and on the evaluation of the implemented system},
KEYWORDS = {Information Extraction, Information Retrieval, Knowledge Representation, Ontologies},
PAGES = {3811-3816},
URL = {https://iris.cnr.it/handle/20.500.14243/65164},
PUBLISHER = {European language resources association (ELRA) (Paris, FRA)},
ISBN = {2-9517408-6-7},
CONFERENCE_NAME = {Seventh International Conference on Language Resources and Evaluation},
CONFERENCE_PLACE = {Paris},
BOOKTITLE = {Proceedings of the Seventh International Conference on Language Resources and Evaluation (LREC'10)},
EDITOR = {Calzolari, N. and Choukri, K. and Maegaard, B. and Mariani, J. and Odijk, J. and Piperidis, S. and Rosner, M. and Tapias, D.},
}
@INPROCEEDINGS{HAWAYEK_2010_INPROCEEDINGS_HDC_65163,
AUTHOR = {Hawayek, A. and Del Gratta, R. and Cappelli, G.},
TITLE = {A bilingual dictionary Mexican Sign Language-Spanish/Spanish-Mexican Sign Language},
YEAR = {2010},
ABSTRACT = {We present a three-part bilingual specialized dictionary Mexican Sign Language-Spanish / Spanish-Mexican Sign Language. This dictionary will be the outcome of a three-year agreement between the Italian "Consiglio Nazionale delle Ricerche" and the Mexican Conacyt. Although many other sign language dictionaries have been provided to deaf communities, there are no Mexican Sign Language dictionaries in Mexico, yet. We want to stress on the specialized feature of the proposed dictionary: the bilingual dictionary will contain frequently used general Spanish forms along with scholastic course specific specialized words whose meanings warrant comprehension of school curricula. We emphasize that this aspect of the bilingual dictionary can have a deep social impact, since we will furnish to deaf people the possibility to get competence in official language, which is necessary to ensure access to school curriculum and to become full-fledged citizens. From a technical point of view, the dictionary consists of a relational database, where we have saved the sign parameters and a graphical user interface especially designed to allow deaf children to retrieve signs using the relevant parameters and, thus, the meaning of the sign in Spanish},
KEYWORDS = {Sign Language Recognition/Generation, Lexicon, Lexical database, Acquisition},
PAGES = {3055-3062},
URL = {http://www.lrec-conf.org/proceedings/lrec2010/index.html},
ISBN = {2-9517408-6-7},
CONFERENCE_NAME = {Seventh International Conference on Language Resources and Evaluation},
BOOKTITLE = {Seventh International Conference on Language Resources and Evaluation},
}
@INPROCEEDINGS{JEZEK_2010_INPROCEEDINGS_JQ_65150,
AUTHOR = {Jezek, E. and Quochi, V.},
TITLE = {Capturing Coercions in Texts: a First Annotation Exercise},
YEAR = {2010},
ABSTRACT = {In this paper we report the first results of an annotation exercise of argument coercion phenomena performed on Italian texts. Our corpus consists of ca 4000 sentences from the PAROLE sottoinsieme corpus (Bindi et al. 2000) annotated with Selection and Coercion relations among verb-noun pairs formatted in XML according to the Generative Lexicon Mark-up Language (GLML) format (Pustejovsky et al., 2008). For the purposes of coercion annotation, we selected 26 Italian verbs that impose semantic typing on their arguments in either Subject, Direct Object or Complement position. Every sentence of the corpus is annotated with the source type for the noun arguments by two annotators plus a judge. An overall agreement of 0.87 kappa indicates that the annotation methodology is reliable. A qualitative analysis of the results allows us to outline some suggestions for improvement of the task: 1) a different account of complex types for nouns has to be devised and 2) a more comprehensive account of coercion mechanisms requires annotation of the deeper meaning dimensions that are targeted in coercion operations, such as those captured by Qualia relations},
KEYWORDS = {Corpus (creation, annotation, etc.), Knowledge Discovery/Representation, Semantics},
PAGES = {1464-1471},
URL = {http://www.lrec-conf.org/proceedings/lrec2010/summaries/713.html},
PUBLISHER = {European Language Resources Association ELRA (Paris, FRA)},
ISBN = {2-9517408-6-7},
CONFERENCE_NAME = {Seventh International Conference on Language Resources and Evaluation},
CONFERENCE_PLACE = {Paris},
BOOKTITLE = {Proceedings of the Seventh International Conference on Language Resources and Evaluation-LREC'10},
EDITOR = {Calzolari, N. and Choukri, K. and Maegaard, B. and Mariani, J. and Odijk, J. and Piperidis, S. and Rosner, M. and Tapias, D.},
}
@INPROCEEDINGS{MARINELLI_2010_INPROCEEDINGS_M_150563,
AUTHOR = {Marinelli, R.},
TITLE = {Ontological variation and sense extension in proper names},
YEAR = {2010},
ABSTRACT = {La cobertura lexical de la base de datos léxico-semántica ItalWordNet ha sido extendida añadiendo al primer núcleo de sustantivos y de verbos, un conjunto de adjetivos y de adverbios, además de un conjunto de nombres propios (NPs). Durante la codificación de los nombres propios, se han encontrado casos particulares de polisemia. Se ha estudiado la variación de significado de los NPs en los recursos lexicos y se han creado nuevas relaciones semánticas para representar el fenómeno de la extensión de sentido en la base de datos. La relación entre los NPs presentes en IWN y la clasificación ontológica de sus clases de pertenencia se ha puesto de relieve: se ha examinado la correspondencia entre las variaciones de significado y las variaciones ontológicas, y también la referencia a la estructura ontológica de IWN ha sido muy útil para el reconocimiento de muchos casos de extensión de sentido},
KEYWORDS = {lexical semantic databases, proper names, cognitive linguistics, metaphor, metonymy},
PAGES = {687-698},
URL = {http://dialnet.unirioja.es/servlet/articulo?codigo=3411098},
VOLUME = {1},
ISBN = {978-84-8158-479-0},
CONFERENCE_NAME = {XXVIII AESLA Conference "Analizar datos Describir variacion-Analysing data Describing variation", Vigo, University of Vigo. (Vigo, Spain, 15th-17th April 2010)},
BOOKTITLE = {XXVIII AESLA Conference, "Analizar datos Describir variacion-Analysing data Describing variation", Vigo, University of Vigo. (Vigo, Spain, 15th-17th April 2010). Proceedings, vol. 1},
EDITOR = {Alonso, J. L. B. and Alvarez, D. G. and Torrado, U. K. and Insua, A. E. M. and Guerra, J. P. and Martinez, E. R. and Vasquez, R. R.},
}
@INPROCEEDINGS{MARINELLI_2010_INPROCEEDINGS_M_65169,
AUTHOR = {Marinelli, R.},
TITLE = {Lexical Resources and Ontological Classifications for the Recognition of Proper Names Sense Extension},
YEAR = {2010},
ABSTRACT = {Particular uses of PNs with sense extension are focussed on and inspected taking into account the presence of PNs in lexical semantic databases and electronic corpora. Methodology to select and include PNs in semantic databases is described; the use of PNs in corpora of Italian Language is examined and evaluated, analyzing the behaviour of a set of PNs in different periods of time. Computational resources can facilitate our study in this field in an effective way by helping codify, translate and handle particular cases of polysemy, but also guiding in metaphorical and metonymic sense recognition, supported by the ontological classification of the lexical semantic entities. The relationship between the "abstract" and the "concrete", which is at the basis of the Conceptual Metaphor perspective, can be considered strictly related to the variation of the ontological values found in our analysis of the PNs and their belonging classes which are codified in the ItalWordNet database},
KEYWORDS = {Lexicon, Lexical Database, Corpus creation and annotation, Ontologies},
PAGES = {518--522},
URL = {http://www.lrec-conf.org/proceedings/lrec2010/index.html},
PUBLISHER = {European Language Resources Association (ELRA)-Evaluations and Language resources Distribution Agency (ELDA) (Paris, FRA)},
ISBN = {2-9517408-6-7},
CONFERENCE_NAME = {Seventh International Conference on Language Resources and Evaluation LREC2010},
CONFERENCE_PLACE = {Paris},
BOOKTITLE = {LREC'10-Seventh International Conference on Language Resources and Evaluation (Valletta, Malta, 17-23 May 2010)},
EDITOR = {Calzolari, N. and Choukri, K. and Maegaard, B. and Mariani, J. and Odijk, J. and Piperidis, S. and Rosner, M. and Tapias, D.},
}
@INPROCEEDINGS{MARINELLI_2010_INPROCEEDINGS_MRSC_65140,
AUTHOR = {Marinelli, R. and Roventini, A. and Spadoni, G. and Cucurullo, S.},
TITLE = {Lexical Semantic Resources in a Terminological Network},
YEAR = {2010},
ABSTRACT = {A research has been carried on and is still in progress aimed at the construction of three specialized lexicons organized as databases of relational type. The three databases contain terms belonging to the specialized knowledge fields of maritime terminology (technical-nautical and maritime transport domain), taxation law, and labour law with union labour rules, respectively. The EuroWordNet/ItalWordNet model was firstly used to structure the terminological database of maritime domain. The methodology experimented for its construction was applied to construct the next databases. It consists in i) the management of corpora of specialized languages and ii) the use of generic databases to identify and extract a set of candidate terms to be codified in the terminological databases. The three specialized resources are described highlighting the various kinds of lexical semantic relations linking each term to the others within the single terminological database and to the generic resources WordNet and ItalWordNet. The construction of these specialized lexicons was carried on in the framework of different projects; but they can be seen as a first nucleus of an organized network of generic and specialized lexicons with the purpose of making the meaning of each term clearer from a cognitive point of view},
KEYWORDS = {Lexicon, Semantics, Lexical database, Ontologies},
PAGES = {2288--2291},
URL = {https://iris.cnr.it/handle/20.500.14243/65140},
PUBLISHER = {European Language Resources Association ELRA (Paris, FRA)},
ISBN = {2-9517408-6-7},
CONFERENCE_NAME = {Seventh International Conference on Language Resources and Evaluation},
CONFERENCE_PLACE = {Paris},
BOOKTITLE = {LREC'10-Seventh International Conference on Language Resources and Evaluation (La Valletta, Malta, 17-23 May 2010). Proceedings},
EDITOR = {Calzolari, N. and Choukri, K. and Maegaard, B. and Mariani, J. and Odijk, J. and Piperidis, S. and Rosner, M. and Tapias, D.},
}
@INPROCEEDINGS{MARINELLI_2010_INPROCEEDINGS_MSC_65161,
AUTHOR = {Marinelli, R. and Spadoni, G. and Cucurullo, S.},
TITLE = {Adding information to a terminological database by means of image files},
YEAR = {2010},
ABSTRACT = {A lexical semantic database containing terms belonging to the specialized lexicon of the maritime navigation and maritime transport was built according to WordNet/EuroWordNet model. Our paper present a project planning the enrichment of the terminological database by means of a set of images. A short description is given about a) the structure of the terminological database and the domain conceptual modelling; b) the various features of the database management tool, and, among all, the possibility of visualizing, on demand, the image which is associated with the term being sought, contributing to clarify and refine the meaning of the term, increasing its information and communication effectiveness},
KEYWORDS = {terminology, lexical databases, computational resources, images},
PAGES = {347--353},
URL = {http://www.cfilt.iitb.ac.in/gwc2010/pdfs/30_adding_image_info_to_wordnet__Marinelli.pdf},
PUBLISHER = {Narosa Publishing House (New Delhi, IND)},
ISBN = {978-81-8487-083-1},
CONFERENCE_NAME = {5th Global WordNet Conference},
CONFERENCE_PLACE = {New Delhi},
BOOKTITLE = {Proceedings of the 5th Global WordNet Conference, Mumbai India, 2010},
EDITOR = {Bhattacharyya, P. and Fellbaum, C. and Vossen, P.},
}
@INPROCEEDINGS{MARZI_2010_INPROCEEDINGS_MPS_65157,
AUTHOR = {Marzi, C. and Pardelli, G. and Sassi, M.},
TITLE = {Grey Literature and Computational Linguistics: From Paper to Net},
YEAR = {2010},
ABSTRACT = {The advent and exponential development of the World Wide Web has led to an increasing availability of unstructured knowledge and distributed information sources, meeting general public requirements that are hardly addressed by other more traditional information channels. This trend has concurrently raised a considerable interest in the application of Computational Linguistics (CL) methodologies to document access and retrieval, as they offer the unprecedented opportunity to make the subjective, user-centred information demands of Net citizens meet the ever changing and heterogeneous information flow of the web. Over the last five years, more and more Italian Universities have introduced CL courses into their Humanities curricula, making available on-line teaching materials, tutorials and language engineering software that appear to supply the lack of offer from traditional Italian publishing houses. In this paper, we consider in some detail the role played by this type of Grey Literature in bringing up a wider and increasingly more aware community of web users in Italy},
KEYWORDS = {Computational Linguistics, Grey, Web-based information},
PAGES = {81--84},
URL = {https://iris.cnr.it/handle/20.500.14243/65157},
VOLUME = {11},
PUBLISHER = {TextRelease (Amsterdam, NLD)},
ISSN = {1386-2316},
ISBN = {978-90-77484-13-5},
CONFERENCE_NAME = {Eleventh International Conference on Grey Literature. The Grey Mosaic, Piecing it All Together},
CONFERENCE_PLACE = {Amsterdam},
BOOKTITLE = {THE GL-CONFERENCE SERIES. CONFERENCE PROCEEDINGS},
EDITOR = {Farace, D. J. and Frantzen, J.},
}
@INPROCEEDINGS{MONTEMAGNI_2010_INPROCEEDINGS_M_65142,
AUTHOR = {Montemagni, S.},
TITLE = {Esplorazioni computazionali nello spazio della variazione lessicale in Toscana},
YEAR = {2010},
ABSTRACT = {The paper illustrates the results of experiments carried out on the corpus of dialectal data of an online dialectal resource documenting the language varieties spoken in Tuscany (Italy) with dialectometric techniques. The study focuses on patterns of lexical variation attested in Tuscany},
KEYWORDS = {Computational Dialectology, Lexical Variation},
PAGES = {609--634},
URL = {https://iris.cnr.it/handle/20.500.14243/65142},
PUBLISHER = {Centro Editoriale e Librario (Arcavacata di Rende, ITA)},
ISBN = {9788874581030},
CONFERENCE_NAME = {Convegno 'Parole. Il lessico come strumento per organizzare e trasmettere gli etnosaperi'},
CONFERENCE_PLACE = {Arcavacata di Rende},
BOOKTITLE = {Parole. Il lessico come strumento per organizzare e trasmettere gli etnosaperi},
EDITOR = {Prantera, N. and Mendicino, A. and Citraro, C.},
}
@INPROCEEDINGS{PARETI_2010_INPROCEEDINGS_PP_65153,
AUTHOR = {Pareti, S. and Prodanof, I.},
TITLE = {Annotating Attribution Relations: Towards an Italian Discourse Treebank},
YEAR = {2010},
KEYWORDS = {Information Extraction, Information Retrieval},
URL = {https://iris.cnr.it/handle/20.500.14243/65153},
CONFERENCE_NAME = {Seventh International Conference on Language Resources and Evaluation},
BOOKTITLE = {Proceedings of the Seventh International Conference on Language Resources and Evaluation (LREC'10)},
}
@INPROCEEDINGS{PASSAROTTI_2010_INPROCEEDINGS_PD_65148,
AUTHOR = {Passarotti, M. and Dell'Orletta, F.},
TITLE = {Improvements in Parsing the Index Thomisticus Treebank. Revision, Combination and a Feature Model for Medieval Latin},
YEAR = {2010},
KEYWORDS = {Parsing, Corpus (creation, annotation, etc.)},
URL = {https://iris.cnr.it/handle/20.500.14243/65148},
CONFERENCE_NAME = {Seventh International Conference on Language Resources and Evaluation},
BOOKTITLE = {Proceedings of the Seventh International Conference on Language Resources and Evaluation (LREC'10)},
}
@INPROCEEDINGS{PEZZULO_2010_INPROCEEDINGS_PBLB_65146,
AUTHOR = {Pezzulo, G. and Barca, L. and Lamberti Bocconi, A. and Borghi, A. M.},
TITLE = {Motor Simulation in a Memory Task: Evidence from Rock Climbing},
YEAR = {2010},
KEYWORDS = {simulation, affordance, embodied cognition, grounded cognition, canonical neurons, mirror neurons, motor memory, memory for actions, motor chunks},
URL = {https://iris.cnr.it/handle/20.500.14243/65146},
CONFERENCE_NAME = {Proceedings of the 2010 Annual Meeting of the Cognitive Science Society},
BOOKTITLE = {Proceedings of the 2010 Annual Meeting of the Cognitive Science Society},
}
@INPROCEEDINGS{PICCHI_2010_INPROCEEDINGS_PS_65171,
AUTHOR = {Picchi, E. and Sassolini, E.},
TITLE = {"Text power": Tools for the cultural heritage},
YEAR = {2010},
ABSTRACT = {This article presents NLP techniques (text mining, text analysis) to create tools for the evaluation, analysis and classification of text materials available on the web. In particular we developed tools for the automatic extraction of mistic relevant information related to the cultural heritage domain and tools for linguistic resources creation. On this knowledge basis, we also developed a system for text browsing},
KEYWORDS = {information extraction, named entity recognition, text browsing},
PAGES = {435--439},
URL = {http://www.cairocongress.com/},
ISBN = {978-88-96680-31-5},
CONFERENCE_NAME = {4-th Intl. Congr. Science and Technology for the Safeguard of Cultural Heritage in the Mediterranean Basin},
BOOKTITLE = {Proceedings in: CHC 2010-4-th Intl. Congr. Science and Technology for the Safeguard of Cultural Heritage in the Mediterranean Basin (Il Cairo, 6-7-8/12/2009)},
EDITOR = {Ferrari, A.},
}
@INPROCEEDINGS{PIOGGIA_2010_INPROCEEDINGS_PCATTFDGR_234936,
AUTHOR = {Pioggia, G. and Carbonaro, N. and Anania, G. and Tognetti, A. and Tartarisco, G. and Ferro, M. and De Rossi, D. and Gaggioli, A. and Riva, G.},
TITLE = {Interreality: The use of advanced technologies in the assessment and treatment of psychological stress},
YEAR = {2010},
ABSTRACT = {Stress and its related comorbid diseases are responsible for a large proportion of disability worldwide. In particular, chronic stress is the main responsible for the dramatic increase of premature mortality in the Western countries. However, advanced simulation and sensing technologies, such as virtual reality and mobile biosensors offer interesting opportunities for innovative personal health-care solutions to stress. In this work, we describe a technology-based approach to the assessment and treatment of stress that is based on the vision of Interreality. The main feature of interreality is the creation of a hybrid-augmented experience merging the physical and virtual world. This is achieved through: a) an extended sense of presence: in interreality advanced simulations (3-D virtual worlds) are used to transform health guidelines and provisions into experience; b) an extended sense of community (social presence): interreality uses hybrid social interaction and dynamics of group sessions to provide each user with targeted social support in both the physical and virtual world; c) real-time feedback between the physical and virtual worlds: interreality uses bio and activity sensors and devices (e. g. smartphones) to track both the behavior and the health status of the user in real time and to provide targeted suggestions and guidelines. The feedback activity is twofold: (1) behavior in physical world influences the experience in the virtual one, and (2) behavior in the virtual world influences the experience in the real one},
PAGES = {1047--1051},
URL = {https://iris.cnr.it/handle/20.500.14243/234936},
DOI = {10.1109/ISDA.2010.5687047},
ISBN = {978-1-4244-8134-7},
CONFERENCE_NAME = {Intelligent Systems Design and Applications (ISDA), 2010 10th International Conference on},
BOOKTITLE = {Intelligent Systems Design and Applications (ISDA), 2010 10th International Conference on},
}
@INPROCEEDINGS{PUSTEJOVSKY_2010_INPROCEEDINGS_PRPJBQ_65141,
  AUTHOR           = {Pustejovsky, J. and Rumshisky, A. and Plotnick, A. and Jezek, E. and Batiukova, O. and Quochi, V.},
  TITLE            = {SemEval-2010 Task 7: Argument Selection and Coercion},
  BOOKTITLE        = {Proceedings of the 5th International Workshop on Semantic Evaluation},
  EDITOR           = {Erk, K. and Strapparava, C.},
  YEAR             = {2010},
  PUBLISHER        = {Association for Computational Linguistics (Stroudsburg, USA)},
  ISBN             = {978-1-932432-70-1},
  URL              = {http://www.aclweb.org/anthology/S10-1005},
  CONFERENCE_NAME  = {Fifth International Workshop on Semantic Evaluation (SemEval 2010)},
  CONFERENCE_PLACE = {Stroudsburg},
  KEYWORDS         = {semantic annotation, verb coercion},
  ABSTRACT         = {The paper describes the Argument Selection and Coercion task for the SemEval-2010 evaluation exercise, which involves characterizing the type of compositional operation that exists between a predicate and the arguments it selects. Specifically, the goal is to identify whether the type that a verb selects is satisfied directly by the argument, or whether the argument must change type to satisfy the verb typing},
}
@INPROCEEDINGS{RUIMY_2010_INPROCEEDINGS_R_65151,
AUTHOR = {Ruimy, N.},
TITLE = {Formalizzazione, strutturazione e standardizzazione in lessicografia computazionale: un esempio italiano},
YEAR = {2010},
ABSTRACT = {Descrivere una lingua naturale significa raccogliere un numero sterminato di informazioni. In effetti, per la loro ricchezza e complessità, le lingue naturali richiedono una descrizione linguistica a vari livelli. Per la lingua scritta, ad esempio, le informazioni morfologiche, sintattiche e semantiche sono essenziali. Ad ogni livello di conoscenza linguistica, esiste inoltre un'infinità di informazioni idiosincratiche che, sommate alle proprietà condivise da intere classi di parole, rendono la mole complessiva dei dati ingestibile senza un'adeguata strutturazione. Perché un utente umano possa utilizzare, anche in minima parte, questi dati, la descrizione linguistica deve essere coerente, ordinata e formulata in un metalinguaggio descrittivo esplicito. L'essere umano, tuttavia, possiede la capacità di fare inferenze e di interpretare contenuti non immediatamente afferrabili; se invece la gestione e l'uso di una descrizione linguistica sono demandati ad un elaboratore, i suddetti requisiti diventano imprescindibili. Nell'ambito delle Tecnologie del Linguaggio, lo sviluppo di applicazioni richiede un'infrastruttura di cui le risorse lessicali costituiscono l'elemento fondamentale. I sistemi di reperimento ed estrazione di informazioni da corpora, di question answering, di traduzione automatica, ecc. presuppongono, infatti, l'accesso a vasti depositi di conoscenza lessicale espressa in un linguaggio formale sufficientemente ricco in capacità espressive, sotto forma di una rappresentazione rigorosamente strutturata, univoca e computazionalmente trattabile. La formalizzazione non può tuttavia essere estesa a tutti gli aspetti della lingua; d'altra parte, non tutte le proprietà formalizzabili sono pertinenti ad ogni tipo di applicazione. La formalizzazione deve quindi avvenire in funzione di un obiettivo preciso. Trattamento del linguaggio generico o di specializzazione? Traduzione automatica o indicizzazione di testi? 
I fenomeni da analizzare e le informazioni rilevanti sono diversi a seconda del tipo di linguaggio e di applicazione. Il livello di granularità dell'informazione dipende anch'esso dall'obiettivo, oltre che da fattori di costo, ma è soprattutto determinato dalla capacità di calcolo del sistema: non ha senso introdurre nella descrizione linguistica distinzioni molto sottili ma non computabili. L'assoluta necessità di adottare un formalismo conforme a degli standard internazionali per la costruzione di risorse lessicali è ormai ampiamente riconosciuta nella comunità scientifica. L'uso di un modello formale e standardizzato di rappresentazione permette infatti una formulazione rigorosa e organicamente strutturata della conoscenza lessicale, consentendo quindi la riusabilità del lessico nonché la sua interoperabilità ed integrazione con altre risorse lessicali. Il lessico elettronico PAROLE-SIMPLE-CLIPS è la più vasta risorsa lessicale multilivello dell'italiano; è stato costruito in base agli standard internazionali definiti nel modello lessicale PAROLE-SIMPLE che ha permesso lo sviluppo di dodici lessici per altrettante lingue europee. Il lessico è articolato in quattro moduli indipendenti che corrispondono rispettivamente ai livelli fonologico, morfologico, sintattico e semantico di rappresentazione linguistica. La completa descrizione di un'unità lessicale consta pertanto di un minimo di quattro entrate interrelate, ognuna contenente un ricco insieme strutturato di informazioni inerenti al livello di descrizione che la ospita. I moduli sintattici e semantici, particolarmente ricchi ed innovativi, consentono una descrizione approfondita del comportamento delle unità lessicali che mette in risalto la stretta correlazione tra i due livelli. A livello sintattico, un'entrata descrive un comportamento sintattico di un'unità lessicale, in termini di proprietà inerenti e contestuali. 
Queste ultime sono espresse in un quadro di sottocategorizzazione nel quale sono formalizzate le proprietà sintattiche di ogni complemento. A livello semantico, il quadro teorico è quello del Lessico Generativo (Pustejovsky, 1995). Il lessico semantico è strutturato in base ad un'ontologia i cui tipi sono organizzati secondo principi ortogonali-mediante i quattro ruoli della Struttura Qualia (formale, costitutivo, telico ed agentivo)-al fine di catturare la multidimensionalità del significato. Ogni singolo senso è descritto in un'entrata semantica caratterizzata da un'ampia tipologia di informazioni di cui fanno parte il dominio d'uso, la classe azionale dei verbi, la formalizzazione della polisemia regolare e una fitta rete di relazioni semantiche basate sui ruoli qualia. La struttura argomentale dei termini predicativi è definita in termini di ruolo semantico e preferenze di selezioni sugli argomenti. Il collegamento fra i livelli semantico e sintattico avviene attraverso la proiezione della struttura argomentale sul quadro di sottocategorizzazione, mediante un raffinato sistema di coindicizzazione tra argomenti e complementi},
KEYWORDS = {Lessicografia Computazionale, Formalizzazione, Strutturazione},
PAGES = {246--256},
URL = {https://iris.cnr.it/handle/20.500.14243/65151},
VOLUME = {07},
PUBLISHER = {CUEC Editrice (Cagliari, ITA)},
ISBN = {978-88-8467-597-2},
CONFERENCE_NAME = {Forme e formalizzazioni Atti del XVI congresso nazionale},
CONFERENCE_PLACE = {Cagliari},
BOOKTITLE = {Forme e formalizzazioni},
EDITOR = {Storari, G. P. and Gola, E.},
}
@INPROCEEDINGS{RUSSO_2010_INPROCEEDINGS_R_65144,
AUTHOR = {Russo, I.},
TITLE = {Discovering Polarity for Ambiguous and Objective Adjectives through Adverbial Modification},
YEAR = {2010},
KEYWORDS = {Emotion Recognition/Generation, Corpus (creation, annotation, etc.), Semantics},
URL = {https://iris.cnr.it/handle/20.500.14243/65144},
CONFERENCE_NAME = {Seventh International Conference on Language Resources and Evaluation},
BOOKTITLE = {Proceedings of the Seventh International Conference on Language Resources and Evaluation (LREC'10)},
}
@INPROCEEDINGS{SASSI_2010_INPROCEEDINGS_SPBCG_147512,
AUTHOR = {Sassi, M. and Pardelli, G. and Biagioni, S. and Carlesi, C. and Goggi, S.},
TITLE = {A Digital Archive of Research Papers in Computer Science},
YEAR = {2010},
ABSTRACT = {This paper presents the results of a terminological work conducted by the authors on a Digital Archives Net of the Italian National Research Council (CNR) in the field of Computer Science. In particular, the research tends to analyse the use of certain terms in Computer Science in order to verify their change over the time with the aim of retrieving from the net the very essence of documentation. Its main source is a reference corpus made up of 13,500 documents which collects the scientific productions of three CNR research Institutes. They are ISTI (Institute of Information Science and Technologies), IIT (Institute of Informatics and Telematics) and ILC (Institute of Computational Linguistics), all of them born from the "Centro Studi sulle Calcolatrici Elettroniche (CSCE)" and now belonging to the CNR Department of Information \& Communication Technologies and Cultural Identity. This study is divided in three sections: 1) an introductory one dedicated to the data extracted from the scientific documentation: the data have in common the use of some terms proper of the Computer Science lexicon although these term belong to different branches (Linguistics, Informatics and Telematics); 2) the second section is devoted to the description of the contents managed by the PUMA (Publication Management System) system; 3) the third part contains a statistical representation of terms extracted from archive: some comparison tables between the occurrences of the most used terms in the scientific documentation produced by the three Institutes will be created and diagrams with percentages about the most frequently used terms will be displayed too. Lastly, indexes and concordances will allow to reflect on the use of certain terms in this field and give possible keys for having access to the extraction of knowledge in the digital era},
KEYWORDS = {Digital libraries, Document Classification, Text categorisation, Text mining, Natural Language Processing, Text analysis},
PAGES = {1245--1248},
URL = {http://www.lrec-conf.org/proceedings/lrec2010/summaries/945.html},
PUBLISHER = {European Language Resources Association (ELRA)-Evaluations and Language resources Distribution Agency (ELDA) (Paris, FRA)},
ISBN = {2-9517408-6-7},
CONFERENCE_NAME = {Seventh International Conference on Language Resources and Evaluation},
CONFERENCE_PLACE = {Paris},
BOOKTITLE = {Proceedings of the Seventh International Conference on Language Resources and Evaluation (LREC'10)},
EDITOR = {Calzolari, N. and Choukri, K. and Maegaard, B. and Mariani, J. and Odijk, J. and Piperidis, S. and Rosner, M. and Tapias, D.},
}
@INPROCEEDINGS{SASSOLINI_2010_INPROCEEDINGS_SC_65138,
AUTHOR = {Sassolini, E. and Cinini, A.},
TITLE = {Cultural Heritage: Knowledge Extraction from Web Documents},
YEAR = {2010},
ABSTRACT = {This article presents the use of NLP techniques (text mining, text analysis) to develop specific tools that allow to create linguistic resources related to the cultural heritage domain. The aim of our approach is to create tools for the building of an online "knowledge network", automatically extracted from text materials concerning this domain. A particular methodology was experimented by dividing the automatic acquisition of texts, and consequently, the creation of reference corpus in two phases. In the first phase, on-line documents have been extracted from lists of links provided by human experts. All documents extracted from the web by means of automatic spider have been stored in a repository of text materials. On the basis of these documents, automatic parsers create the reference corpus for the cultural heritage domain. Relevant information and semantic concepts are then extracted from this corpus. In a second phase, all these semantically relevant elements (such as proper names, names of institutions, names of places, and other relevant terms) have been used as basis for a new search strategy of text materials from heterogeneous sources. In this case also specialized crawlers (TP-crawler) have been used to work on a bulk of text materials available on line},
KEYWORDS = {Information Extraction, Information Retrieval, Text mining, Named Entity recognition},
PAGES = {3363--3368},
URL = {https://iris.cnr.it/handle/20.500.14243/65138},
ISBN = {978-2-9517408-6-0},
CONFERENCE_NAME = {Seventh International Conference on Language Resources and Evaluation},
BOOKTITLE = {Proceedings of the Seventh International Conference on Language Resources and Evaluation (LREC'10)},
}
@INPROCEEDINGS{SAVAS_2010_INPROCEEDINGS_SHMSC_65172,
AUTHOR = {Savas, B. and Hayashi, Y. and Monachini, M. and Soria, C. and Calzolari, N.},
TITLE = {An LMF-based Web Service for Accessing WordNet-type Semantic Lexicons},
YEAR = {2010},
ABSTRACT = {This paper describes a Web service for accessing WordNet-type semantic lexicons. The central idea behind the service design is: given a query, the primary functionality of lexicon access is to present a partial lexicon by extracting the relevant part of the target lexicon. Based on this idea, we implemented the system as a RESTful Web service whose input query is specified by the access URI and whose output is presented in a standardized XML data format. LMF, an ISO standard for modeling lexicons, plays the most prominent role: the access URI pattern basically reflects the lexicon structure as defined by LMF; the access results are rendered based on Wordnet-LMF, which is a version of LMF XML-serialization. The Web service currently provides accesses to Princeton WordNet, Japanese WordNet, as well as the EDR Electronic Dictionary as a trial. To accommodate the EDR dictionary within the same framework, we modeled it also as a WordNet-type semantic lexicon. This paper thus propose modifications to LMF},
KEYWORDS = {Standards for LRs, Lexicon, Lexical database, Web Services},
URL = {https://iris.cnr.it/handle/20.500.14243/65172},
ISBN = {2-9517408-6-7},
CONFERENCE_NAME = {Seventh International Conference on Language Resources and Evaluation},
BOOKTITLE = {Proceedings of the Seventh International Conference on Language Resources and Evaluation (LREC'10)},
}
@INPROCEEDINGS{SOROA_2010_INPROCEEDINGS_SALBVMLH_65139,
AUTHOR = {Soroa, A. and Agirre, E. and López De Lacalle, O. and Bosma, W. and Vossen, P. and Monachini, M. and Lo, J. and Hsieh, S.},
TITLE = {Kyoto: An Integrated System for Specific Domain WSD},
YEAR = {2010},
ABSTRACT = {This document describes the preliminary release of the integrated Kyoto system for specific domain WSD. The system uses concept miners (Tybots) to extract domain-related terms and produces a domain-related thesaurus, followed by knowledge-based WSD based on wordnet graphs (UKB). The resulting system can be applied to any language with a lexical knowledge base, and is based on publicly available software and resources. Our participation in Semeval task \#17 focused on producing running systems for all languages in the task, and we attained good results in all except Chinese. Due to the pressure of the time-constraints in the competition, the system is still under development, and we expect results to improve in the near future},
KEYWORDS = {Semantic Annotation, Word-sense disambiguation},
PAGES = {417--420},
URL = {https://iris.cnr.it/handle/20.500.14243/65139},
ISBN = {978-1-932432-70-1},
CONFERENCE_NAME = {SemEval2010-5th International Workshop on Semantic Evaluation},
BOOKTITLE = {Proceedings of the 5th International Workshop on Semantic Evaluation},
EDITOR = {Erk, K. and Strapparava, C.},
}
@INPROCEEDINGS{TORAL_2010_INPROCEEDINGS_TBMS_65143,
AUTHOR = {Toral, A. and Bracale, S. and Monachini, M. and Soria, C.},
TITLE = {Rejuvenating the Italian WordNet: upgrading, standardising, extending},
YEAR = {2010},
ABSTRACT = {This paper reports on recent activities carried out within the KYOTO project aimed at enhancing the Italian WordNet Language Resource. On the one hand we study the formalisation of this lexicon according to the LMF ISO standard and explore its application into a real-world scenario by means of representing it in the WN-LMF dialect. On the other hand, we report on a semiautomatic procedure to upgrade the connections of the lexicon to WordNet, which obtains over 98\% accuracy},
KEYWORDS = {Lexical Resources, Standards for LRs},
URL = {http://www.globalwordnet-iitb2010.in/proceedings.php},
CONFERENCE_NAME = {5th Global Wordnet Conference},
BOOKTITLE = {Proceedings of the 5th Global WordNet Conference, Mumbai India, 2010},
EDITOR = {Bhattacharyya, P. and Fellbaum, C. and Vossen, P.},
}
@INPROCEEDINGS{TORAL_2010_INPROCEEDINGS_TMSCRBV_65167,
AUTHOR = {Toral, A. and Monachini, M. and Soria, C. and Cuadros, M. and Rigau, G. and Bosma, W. and Vossen, P.},
TITLE = {Linking a domain thesaurus to WordNet and conversion to WordNet-LMF},
YEAR = {2010},
ABSTRACT = {We present a methodology to link domain thesauri to general-domain lexica. This is applied in the framework of the KYOTO project to link the Species2000 thesaurus to the synsets of the English WordNet. Moreover, we study the formalisation of this thesaurus according to the ISO LMF standard and its dialect WordNet-LMF. This conversion will allow Species2000 to communicate with the other resources available in the KYOTO architecture},
KEYWORDS = {Lexical Resources, Thesaurus},
PAGES = {157--165},
URL = {https://iris.cnr.it/handle/20.500.14243/65167},
ISBN = {978-962-442-323-5},
CONFERENCE_NAME = {ICGL 2010-The Second International Conference on Global Interoperability for Language Resources},
BOOKTITLE = {ICGL2010-Proceedings of the Second International Conference on Global Interoperability for Language Resources-5th Joint ISO-ACL/SIGSEM Workshop on Interoperable Semantic Annotation},
EDITOR = {Fang, A. C. and Ide, N.},
}
@INPROCEEDINGS{VOSSEN_2010_INPROCEEDINGS_VRASMB_612,
  AUTHOR          = {Vossen, P. and Rigau, G. and Agirre, E. and Soroa, A. and Monachini, M. and Bartolini, R.},
  TITLE           = {KYOTO: an Open Platform for Mining Facts},
  BOOKTITLE       = {ONTOLEX-COLING 2010},
  YEAR            = {2010},
  ISBN            = {978-7-900268-00-6},
  URL             = {https://iris.cnr.it/handle/20.500.14243/612},
  CONFERENCE_NAME = {OntoLex 2010},
  ABSTRACT        = {This paper describes an open text-mining system that was developed for the Asian-European project KYOTO. The KYOTO system uses an open text representation format and a central ontology to enable extraction of knowledge and facts from large volumes of text in many different languages. We implemented a semantic tagging approach that performs off-line reasoning. Mining of facts and knowledge is achieved through a flexible pattern matching module that can work in much the same way for different languages, can handle efficiently large volumes of documents and is not restricted to a specific domain. We applied the system to an English database on estuaries},
}
@INPROCEEDINGS{WITTENBURG_2010_INPROCEEDINGS_WBBBCHKLMPPPSTVVW_65170,
  AUTHOR = {Wittenburg, P. and Bel, N. and Borin, L. and Budin, G. and Calzolari, N. and Hajicova, E. and Koskenniemi, K. and Lemnitzer, L. and Maegaard, B. and Piasecki, M. and Pierrel, J. and Piperidis, S. and Skadina, I. and Tufis, D. and Van Veenendaal, R. and Váradi, T. and Wynne, M.},
  TITLE  = {Resource and Service Centres as the Backbone for a Sustainable Service Infrastructure},
  YEAR   = {2010},
  URL    = {https://iris.cnr.it/handle/20.500.14243/65170},
}
@INPROCEEDINGS{MARINELLI_2010_INPROCEEDINGS_M_254645,
AUTHOR = {Marinelli, R.},
TITLE = {Costruzione di risorse terminologiche: criteri, risultati e prodotti},
YEAR = {2010},
URL = {https://iris.cnr.it/handle/20.500.14243/254645},
CONFERENCE_NAME = {XX Convegno dell'Associazione Italiana per la Terminologia "Terminologie specialistiche e prodotti terminologici"},
BOOKTITLE = {XX Convegno dell'Associazione Italiana per la Terminologia "Terminologie specialistiche e prodotti terminologici"},
}
@INPROCEEDINGS{MARZI_2010_INPROCEEDINGS_MPS_224021,
AUTHOR = {Marzi, C. and Pardelli, G. and Sassi, M.},
TITLE = {A Terminology Based Re-Definition of Grey Literature},
YEAR = {2010},
ABSTRACT = {The Luxembourg Convention on Grey Literature held in 1997 offered the following definition of Grey Literature (expanded in New York, 2004): "Information produced and distributed on all levels of government, academics, business and industry in electronic and print formats not controlled by commercial publishing, i.e. where publishing is not the primary activity of the producing body". Is this definition still valuable? Is it so far completely satisfactory? Or does it rather need important modifications? We suggest that an interesting re-definition of GL can be based upon careful examination of the longitudinal trend of 10 years of terminological creativity in the proceedings of the GL international Conference. Our empirical basis is the Corpus of GreyText Inhouse Archive, available on http://www.greynet.org/opensiglerepository.html consisting of titles, themes, keywords and full abstracts, for a total amount of more than sixty thousand word tokens. In the full version of our paper, we intend to focus on a set of automatically-acquired terms (both single-word and multi-word terms) obtained by subjecting our reference Corpus to a number of pre-processing steps of automated text analysis, such as concordances, frequency lists and lexical association scores (e.g. Mutual Information on word pairs). To anticipate some of our results, the following three terms, that appear to be shared by various disciplinary sub-fields, mark, in our view, important stages in the evolution of our current understanding of GL: digital, access and web. The attribute digital, an increasingly popular synonym of the now obsolete electronic, emphasises the growing importance of computer-based encoding as the standard medium of GL. The noun access (defining the process of accessing text documents) is seen in the company of adjectives like easy, full, grey and open to shape up important conceptual innovations in the way GL material is distributed: e.g. open access focuses on the free accessibility of digital contents. Coupled with information, document and repository (note, however, that repository is generally understood as a technical synonym of open archive), access points to a conception of world-wide available, structured cultural contents. Finally, reference to the web lays emphasis on the huge importance of the World Wide Web as the standard means of disseminating GL. All these aspects are not fully taken into account in the standard definition of GL reported above. Our inquiry is intended to pave the way to a bottom-up re-definition of GL, stemming from the terminological creativity and lexical innovation monitored over ten years of technical work in the field},
KEYWORDS = {Terminology extraction, Grey Literature definition, GL Conference corpus},
PAGES = {24--28},
URL = {https://iris.cnr.it/handle/20.500.14243/224021},
VOLUME = {12},
ISBN = {978-90-77484-15-9},
CONFERENCE_NAME = {Twelfth International Conference on Grey Literature: Transparency in Grey Literature, Grey Tech Approaches to High Tech Issues},
BOOKTITLE = {Transparency in Grey Literature, Grey Tech Approaches to High Tech Issues},
EDITOR = {Farace, D. J. and Frantzen, J.},
}
@INPROCEEDINGS{MONTEMAGNI_2010_INPROCEEDINGS_MWDN_106764,
AUTHOR = {Montemagni, S. and Wieling, M. and De Jonge, B. and Nerbonne, J.},
TITLE = {Modelli di variazione dialettale e analisi dei tratti linguistici sottostanti: un nuovo approccio dialettometrico},
YEAR = {2010},
KEYWORDS = {Computational dialectology},
URL = {https://iris.cnr.it/handle/20.500.14243/106764},
CONFERENCE_NAME = {XI Congresso Silfi-Congresso della Società Internazionale di Linguistica e Filologia Italiana},
}
@INPROCEEDINGS{PICCHI_2010_INPROCEEDINGS_PSBG_86042,
AUTHOR = {Picchi, E. and Sassi, M. and Biagioni, S. and Giannini, S.},
TITLE = {Extending the "Facets" concept by applying NLP tools to catalog records of scientific literature},
YEAR = {2010},
ABSTRACT = {The prototype of an "intelligent" navigation system, which has been implemented on the contents of PUMA (http://puma.isti.cnr.it), a digital library of scientific literature, is presented. The system has been implemented by integrating our core textual search engine (known as DBT) with the TextPower (TP) technology. TP is based on NLP techniques and linguistic resources and provides tools specialized for the evaluation, analysis, classification and browsing of scientific literature. TP extends the facet concept by extracting "field content" pairs not only from structured fields but also from free text, e.g. abstracts, using a linguistic-statistical approach to annotate relevant terminology, named entities, etc. The enriched text can be queried, analysed, and classified using a new version of the DBT System known as "DBT\&Facets". DBT\&Facets has been implemented on the full bibliographic records of the documents archived in the PUMA digital library of the Italian National Research Council (CNR). PUMA is a user-focused, service-oriented infrastructure which manages 30 CNR institutional repositories containing about 25,000 published or open access documents in a wide variety of disciplines. In an open domain like scientific documentation, our approach based on the criteria of "semantic similarity" is useful-and perhaps more objective than one based on hierarchical elements-as it makes it possible to link different types of information, also across domains if necessary. DBT\&Facets is an advanced search tool that permits the user to query and refine their results, and to identify particular relations between them. The aim of the project has been to structure a knowledge system of domain-specific information which assists the user by suggesting possible directions for their search},
KEYWORDS = {NLP tools, Digital libraries},
PAGES = {82--87},
URL = {https://iris.cnr.it/handle/20.500.14243/86042},
ISBN = {978-90-77484-15-9},
CONFERENCE_NAME = {Twelfth International Conference on Grey Literature},
EDITOR = {Farace, D. J. and Frantzen, J. and Greynet},
}
@TECHREPORT{BARONI_2010_TECHREPORT_B_183238,
AUTHOR = {Baroni, P.},
TITLE = {ECP-2007-LANG-617001 FLaReNet: Pre-financing Request No. 1},
YEAR = {2010},
KEYWORDS = {Financial Statement},
URL = {https://iris.cnr.it/handle/20.500.14243/183238},
}
@TECHREPORT{BARONI_2010_TECHREPORT_B_183244,
AUTHOR = {Baroni, P.},
TITLE = {ECP-2007-LANG-617001 FLaReNet: Pre-financing Request No. 2},
YEAR = {2010},
KEYWORDS = {Financial Statement},
URL = {https://iris.cnr.it/handle/20.500.14243/183244},
}
@TECHREPORT{BARONI_2010_TECHREPORT_B_183237,
AUTHOR = {Baroni, P.},
TITLE = {FLaReNet Web Statistics: 7 December 2008-31 August 2010},
YEAR = {2010},
ABSTRACT = {Statistics relating to the access to the FLaReNet Web site from 7 December 2008 to 31 August 2010},
KEYWORDS = {Language Resources, Web Statistics},
PAGES = {8},
URL = {https://iris.cnr.it/handle/20.500.14243/183237},
}
@TECHREPORT{CALZOLARI_2010_TECHREPORT_CSB_183243,
AUTHOR = {Calzolari, N. and Soria, C. and Baroni, P.},
TITLE = {ECP-2007-LANG-617001 FLaReNet: Annual Report No. 2},
YEAR = {2010},
KEYWORDS = {Language Resources},
URL = {https://iris.cnr.it/handle/20.500.14243/183243},
}
@TECHREPORT{CALZOLARI_2010_TECHREPORT_CSBBBCMOP_183240,
AUTHOR = {Calzolari, N. and Soria, C. and Baroni, P. and Bel, N. and Budin, G. and Choukri, K. and Mariani, J. and Odijk, J. and Piperidis, S.},
TITLE = {ECP-2007-LANG-617001 FLaReNet: Progress Report No. 3},
YEAR = {2010},
KEYWORDS = {Language Resources},
URL = {https://iris.cnr.it/handle/20.500.14243/183240},
}
@TECHREPORT{CALZOLARI_2010_TECHREPORT_CSBQBBCMOP_183250,
AUTHOR = {Calzolari, N. and Soria, C. and Baroni, P. and Quochi, V. and Bel, N. and Budin, G. and Choukri, K. and Mariani, J. and Odijk, J. and Piperidis, S.},
TITLE = {ECP-2007-LANG-617001 FLaReNet: Progress Report No. 4},
YEAR = {2010},
KEYWORDS = {Language Resources},
URL = {https://iris.cnr.it/handle/20.500.14243/183250},
}
@TECHREPORT{DELGROSSO_2010_TECHREPORT_DG_315844,
AUTHOR = {Del Grosso, A. M. and Giovannetti, E.},
TITLE = {Sistema di gestione della banca dati lessicale},
YEAR = {2010},
ABSTRACT = {Il documento descrive l'analisi e lo studio preliminare svolto sul sistema di gestione della banca dati lessicale sviluppato nell'ambito dei progetti PAROLE, SIMPLE e CLIPS},
KEYWORDS = {Lessico elettronico, piattaforma web},
PAGES = {21},
URL = {https://iris.cnr.it/handle/20.500.14243/315844},
}
@TECHREPORT{MARINELLI_2010_TECHREPORT_MRC_183241,
AUTHOR = {Marinelli, R. and Roventini, A. and Cucurullo, S.},
TITLE = {Descrizione attività Progetto Servizi innovativi di Business Intelligence e p. m. i.: la costituzione di un Sistema di Aziende Estese (BISAE): il modulo ILC},
YEAR = {2010},
KEYWORDS = {Risorse linguistiche, terminologia, database semantico-lessicali, corpora},
URL = {https://iris.cnr.it/handle/20.500.14243/183241},
}
@TECHREPORT{MARZI_2010_TECHREPORT_MM_183242,
AUTHOR = {Marzi, C. and Marchi, S.},
TITLE = {Procedura Web per la generazione automatica dei bandi di concorso per Assegno di Ricerca in formato pdf},
YEAR = {2010},
ABSTRACT = {Lo sviluppo di una procedura web per la generazione automatica e gestione dei testi dei bandi di concorso per il conferimento di Assegni di Ricerca risponde alla necessità di uniformare i testi dei bandi di concorso al Disciplinare dell'Ente in continuo aggiornamento. Ogni modifica apportata al regolamento viene immediatamente recepita e convertita in modifica al modello automatico di bando. La procedura "Bandi" consente, inoltre, ad ogni Gruppo di ricerca, Laboratorio, o Commessa, o anche singolo Ricercatore, di avviare la richiesta per un Assegno di Ricerca generando autonomamente una bozza di testo in formato pdf, da sottoporre agli utenti Validatori per approvazione, correzione e/o integrazione, e la conseguente generazione e stampa del testo definitivo in formato pdf},
KEYWORDS = {Tool, Procedura web creazione bandi},
URL = {http://bandi.ilc.cnr.it/form/login.php},
}
@TECHREPORT{MONTEMAGNI_2010_TECHREPORT_M_183247,
AUTHOR = {Montemagni, S.},
TITLE = {Computational Models of Dialectal Variation and Underlying Linguistic Features},
YEAR = {2010},
KEYWORDS = {Computational Dialectology, Language Variation},
URL = {https://iris.cnr.it/handle/20.500.14243/183247},
}
@TECHREPORT{PIRRELLI_2010_TECHREPORT_PLMDGM_353288,
AUTHOR = {Pirrelli, V. and Lenci, A. and Montemagni, S. and Dell'Orletta, F. and Giovannetti, E. and Marchi, S.},
TITLE = {ConnectToLife (modulo semantico)-Rapporto tecnico finale},
YEAR = {2010},
ABSTRACT = {Il presente documento costituisce il rapporto tecnico finale del progetto Connect-To-Life (modulo semantico) relativo alle attività svolte dall'unità ILC-CNR},
KEYWORDS = {annotazione linguistica, estrazione di termini, clustering semantico, trattamento automatico della lingua, costruzione di ontologie},
PAGES = {16},
URL = {https://iris.cnr.it/handle/20.500.14243/353288},
}
@TECHREPORT{VOSSEN_2010_TECHREPORT_VHARFMIBHJD_183252,
AUTHOR = {Vossen, P. and Hielkema, F. and Aliprandi, C. and Rigau, G. and Fellbaum, C. and Monachini, M. and Isahara, H. and Bond, F. and Hsieh, S. and Joneswalters, L. and De Boom, K.},
TITLE = {Exploitation and Dissemination Plan},
YEAR = {2010},
KEYWORDS = {Ontologie},
URL = {https://iris.cnr.it/handle/20.500.14243/183252},
}
@TECHREPORT{VOSSEN_2010_TECHREPORT_VSHHRAECLKM_183251,
AUTHOR = {Vossen, P. and Segers, R. and Hicks, A. and Herold, A. and Rigau, G. and Agirre, E. and Estarrona, A. and Cuadros, M. and Laparra, E. and Kanzaki, K. and Monachini, M.},
TITLE = {Wordnets mapped to central ontology-revised},
YEAR = {2010},
KEYWORDS = {Ontologie},
URL = {https://iris.cnr.it/handle/20.500.14243/183251},
}
@MISC{BELTRAMI_2010_MISC_BLSABGIGMRV_463973,
AUTHOR = {Beltrami, P. D. and Larson, P. C. and Squillacioti, P. C. and Artale, E. and Boccellari, A. and Guadagnini, E. and Iorio Fili, D. and Giuliani, M. and Mosti, R. and Ravani, S. and Vaccaro, G.},
TITLE = {TESORO DELLA LINGUA ITALIANA DELLE ORIGINI-Edizione online: www.vocabolario.org-Versione 2010},
YEAR = {2010},
ABSTRACT = {A pdf copy of the Tesoro della Lingua Italiana delle Origini (TLIO), a dictionary of early Italian in progress, published online, as it was at the end of 2010. TLIO is the first section of the Italian Historical Dictionary which is the mission of the OVI Institute},
KEYWORDS = {Lessicografia italiana, Italiano antico},
URL = {https://iris.cnr.it/handle/20.500.14243/463973},
}
@MISC{BONIN_2010_MISC_BDMV_106763,
AUTHOR = {Bonin, F. and Dell'Orletta, F. and Montemagni, S. and Venturi, G.},
TITLE = {Lessico settoriale e lessico comune nell'estrazione di terminologia specialistica da corpora di dominio},
YEAR = {2010},
KEYWORDS = {Automatic Term Extraction},
URL = {https://iris.cnr.it/handle/20.500.14243/106763},
CONFERENCE_NAME = {XLIV Congresso Internazionale di Studi della Società di Linguistica Italiana},
}
@MISC{CALZOLARI_2010_MISC_CSD_106755,
AUTHOR = {Calzolari, N. and Soria, C. and Del Gratta, R.},
TITLE = {The LREC 2010 Map of Language Resources and Tools},
YEAR = {2010},
KEYWORDS = {Linguistic Tools. Language Resources},
URL = {https://iris.cnr.it/handle/20.500.14243/106755},
}
@MISC{CIGNONI_2010_MISC_CF_183248,
AUTHOR = {Cignoni, L. and Fornaciari, G.},
TITLE = {Fondamenti della Lingua Inglese},
YEAR = {2010},
KEYWORDS = {Grammatica inglese},
PAGES = {1--85},
URL = {http://www.paleopatologia.it/Documenti/GrammaticaInglese.pdf},
}
@MISC{DELLORLETTA_2010_MISC_DMVV_155081,
AUTHOR = {Dell'Orletta, F. and Montemagni, S. and Vecchi, E. M. and Venturi, G.},
TITLE = {Tecnologie linguistico-computazionali per il monitoraggio delle competenze linguistiche di apprendenti l'italiano come L2},
YEAR = {2010},
KEYWORDS = {Natural Language Processing, Educational Linguistics, Language Learning},
URL = {https://iris.cnr.it/handle/20.500.14243/155081},
CONFERENCE_NAME = {Congresso "IT. L2: italiano lingua seconda nell'università, nella scuola e sul territorio. Esperienze didattiche e ricerche" Università del Piemonte Orientale "Amedeo Avogadro", Facoltà di Lettere e Filosofia},
}
@MISC{DIDONATO_2010_MISC_D_406272,
AUTHOR = {Di Donato, F.},
TITLE = {Linkedopencamera.it},
YEAR = {2010},
ABSTRACT = {Presentazione del progetto Linkedopencamera.it},
URL = {https://iris.cnr.it/handle/20.500.14243/406272},
}
@MISC{DIDONATO_2010_MISC_D_406265,
AUTHOR = {Di Donato, F.},
TITLE = {Les enjeux politiques du Web},
YEAR = {2010},
ABSTRACT = {presentazione al convegno 2e. Forum International de Philosophie Politique et Sociale, Toulouse, 12 luglio 2010},
URL = {https://iris.cnr.it/handle/20.500.14243/406265},
}
@MISC{DIDONATO_2010_MISC_D_406270,
AUTHOR = {Di Donato, F.},
TITLE = {Everyday digital scholarship: Using web-based tools for research},
YEAR = {2010},
ABSTRACT = {presentazione "Everyday digital scholarship: Using web-based tools for research", COST A32 Final Conference "In Our End are Fresh Beginnings. Perspectives for Open Scholarly Communities on the Web", München, 2 ottobre 2010},
URL = {https://iris.cnr.it/handle/20.500.14243/406270},
}
@MISC{DIDONATO_2010_MISC_D_406269,
AUTHOR = {Di Donato, F.},
TITLE = {Everyday Digital Scholarship: Using Web-Based Tools for Research},
YEAR = {2010},
ABSTRACT = {"Everyday Digital Scholarship: Using Web-Based Tools for Research", convegno The Judaica Europeana Digital Humanities Workshop, Università di Bologna, Ravenna, 30 luglio 2010},
URL = {https://iris.cnr.it/handle/20.500.14243/406269},
}
@MISC{DIDONATO_2010_MISC_D_406261,
AUTHOR = {Di Donato, F.},
TITLE = {Media telematici e democrazia},
YEAR = {2010},
ABSTRACT = {"Media telematici e democrazia", presentazione al Ciclo di incontri "Politica e sapienza", Facoltà di Scienze politiche di Pisa, 11 marzo 2010},
URL = {https://iris.cnr.it/handle/20.500.14243/406261},
}
@MISC{DIDONATO_2010_MISC_D_406263,
AUTHOR = {Di Donato, F.},
TITLE = {Les enjeux politiques de l'open access contre les Oligopoles},
YEAR = {2010},
ABSTRACT = {presentazione al convegno Stage EuroPhilosophie 2010 à l'Ecole Normale Supérieure de Paris, 17 aprile 2010},
URL = {https://iris.cnr.it/handle/20.500.14243/406263},
}
@MISC{FERRO_2010_MISC_FMP_183239,
AUTHOR = {Ferro, M. and Marzi, C. and Pirrelli, V.},
TITLE = {Word self-organization in time and space?: algorithms and evaluation},
YEAR = {2010},
ABSTRACT = {ABSTRACT: Words are time-bound signals and are amenable to temporal processing. The human brain has an innate ability to encode serial events into spatial patterns of neural activity (David Beiser \& James Houk, 1998). Temporal Hebbian SOMs (THSOMs) allow us to take the two assumptions seriously. They provide a novel computational framework accounting for many paradigm-based generalizations in a natural and insightful way. This claim is validated on inflectional data from German, English and Italian},
KEYWORDS = {Morphology, Word Processing and Learning, Mental Lexicon, L1, SOMs},
URL = {https://iris.cnr.it/handle/20.500.14243/183239},
}
@MISC{FRONTINI_2010_MISC_F_106762,
AUTHOR = {Frontini, F.},
TITLE = {Statistical profiling of Italian L2 texts: competence and native language},
YEAR = {2010},
KEYWORDS = {Text categorization},
URL = {https://iris.cnr.it/handle/20.500.14243/106762},
CONFERENCE_NAME = {20th Annual Conference of the European Second Language Association},
}
@MISC{GUADAGNINI_2010_MISC_G_107690,
AUTHOR = {Guadagnini, E.},
TITLE = {Cicéron et Boèce en Orient: quelques réflexions sur la Rectorique de Jean d'Antioche},
YEAR = {2010},
KEYWORDS = {Filologia romanza, Jean d'Antioche, De inventione, Storia della traduzione},
URL = {https://iris.cnr.it/handle/20.500.14243/107690},
CONFERENCE_NAME = {Medieval Translator 2010-In Principio Fuit Interpres-The Cardiff Conference on the Theory and Practice of Translation in the Middle Ages (Padova 23-27 July 2010)},
}
@MISC{MARZI_2010_MISC_MM_159865,
AUTHOR = {Marzi, C. and Marchi, S.},
TITLE = {Procedura Web per la generazione automatica dei bandi di concorso per Assegno di Ricerca},
YEAR = {2010},
ABSTRACT = {Lo sviluppo di una procedura web per la generazione automatica e gestione dei testi dei bandi di concorso per il conferimento di Assegni di Ricerca risponde alla necessità di uniformare i testi dei bandi di concorso al Disciplinare dell'Ente in continuo aggiornamento. Ogni modifica apportata al regolamento viene immediatamente recepita e convertita in modifica al modello automatico di bando. La procedura "Bandi" consente, inoltre, ad ogni Gruppo di ricerca, Laboratorio, o Commessa, o anche singolo Ricercatore, di avviare la richiesta per un Assegno di Ricerca generando autonomamente una bozza di testo in formato pdf, da sottoporre agli utenti Validatori per approvazione, correzione e/o integrazione, e la conseguente generazione e stampa del testo definitivo in formato pdf},
KEYWORDS = {Tool, Procedura web creazione bandi},
URL = {http://bandi.ilc.cnr.it/form/login.php},
}
@MISC{MONTEMAGNI_2010_MISC_M_106758,
AUTHOR = {Montemagni, S.},
TITLE = {The BioLexicon: a Large-Scale Domain-Specific Lexical Resource for Biomedical Text Mining},
YEAR = {2010},
KEYWORDS = {Text Mining, Knowledge Extraction, Lexical Resources},
URL = {https://iris.cnr.it/handle/20.500.14243/106758},
CONFERENCE_NAME = {LREC 2010 2nd Workshop on Building and evaluating resources for biomedical text mining},
}
@MISC{MONTEMAGNI_2010_MISC_M_106757,
AUTHOR = {Montemagni, S.},
TITLE = {Tecnologie linguistico-computazionali per il monitoraggio della lingua italiana},
YEAR = {2010},
KEYWORDS = {Language Variation, Natural Language Processing},
URL = {https://iris.cnr.it/handle/20.500.14243/106757},
CONFERENCE_NAME = {Giornata di Studio "Lo stato della lingua. Il CNR e l'italiano nel terzo millennio" organizzata dal Consiglio Nazionale delle Ricerche-Dipartimento Identità Culturale},
}
@MISC{MONTEMAGNI_2010_MISC_M_435681,
AUTHOR = {Montemagni, S.},
TITLE = {Ontology Learning. An introduction},
YEAR = {2010},
KEYWORDS = {Legal Text Processing, Ontology Learning, NLP},
URL = {https://iris.cnr.it/handle/20.500.14243/435681},
CONFERENCE_NAME = {Summer School LEX2010-Managing Legal Resources in the Semantic Web, Session "Ontology in the Legal Domain"},
}
@MISC{MONTEMAGNI_2010_MISC_M_106760,
AUTHOR = {Montemagni, S.},
TITLE = {Design, Construction and Use of an Italian Dependency Treebank: Methodological Issues and Empirical Results},
YEAR = {2010},
KEYWORDS = {Syntactic Annotation, Treebanks},
URL = {https://iris.cnr.it/handle/20.500.14243/106760},
CONFERENCE_NAME = {The Copenhagen Dependency Treebank Workshop on "Designing Treebanks"},
}
@MISC{PICCHI_2010_MISC_PS_106759,
AUTHOR = {Picchi, E. and Sassolini, E.},
TITLE = {La tecnologia TextPower per la navigazione intelligente},
YEAR = {2010},
ABSTRACT = {Compito dell'ILC è di creare una rete di conoscenza linguistica, terminologica e semantica, estratta dai documenti, fatta di concetti che sintetizzano il valore semantico del documento. Questa rete di conoscenza individuata automaticamente costituisce la base conoscitiva necessaria alla classificazione e alla navigazione "intelligente" e rappresenta la ricchezza dello strumento e del servizio che l'Osservatorio può offrire},
KEYWORDS = {Text power, navigazione intelligente},
PAGES = {419--425},
URL = {http://oraal.ittig.cnr.it/oraal/},
VOLUME = {1},
ISBN = {88-14-17365-6},
CONFERENCE_NAME = {Convegno di inaugurazione dell'Osservatorio sulle Regole dell'Agricoltura e dell'Alimentazione},
EDITOR = {Sirsi, M. G. E.},
}
@MISC{PIRRELLI_2010_MISC_P_183245,
AUTHOR = {Pirrelli, V.},
TITLE = {Interdisciplinary Approaches to Understanding Word Processing and Storage},
YEAR = {2010},
ABSTRACT = {The present collection of papers originates from a successful application to the European Science Foundation Exploratory Workshop Programme for the "Words in Action" workshop. The workshop, convened in Pisa on the 12th and 13th of October 2009, brought together experts of various scientific domains and theoretical inclinations to advance the current awareness of theoretical, typological, psycholinguistic, computational and neuro-physiological issues in word processing and storage, with a view to promoting novel methods of research and assessment for grammar architecture and language physiology},
KEYWORDS = {Morphology, Word Processing, Word Learning, Mental Lexicon},
PAGES = {91--95},
URL = {https://iris.cnr.it/handle/20.500.14243/183245},
VOLUME = {IX},
NUMBER = {2},
ISSN = {1720-9331},
}
@MISC{RUIMY_2010_MISC_RP_183236,
AUTHOR = {Ruimy, N. and Pardelli, G.},
TITLE = {Un modello lessicale da customizzare per lo sviluppo di un thesaurus lessico elettronico della terminologia saussuriana},
YEAR = {2010},
ABSTRACT = {Progetto di ricerca PRIN 2008: Per un'edizione digitale dei manoscritti di Ferdinand de Saussure. Unità di Ricerca Istituto di Linguistica Computazionale Antonio Zampolli CNR-Pisa Linea di attività II},
KEYWORDS = {Ontology. Computational Semantics},
PAGES = {1},
URL = {https://iris.cnr.it/handle/20.500.14243/183236},
}
@ARTICLE{AIELLO_2009_ARTICLE_ACP_36122,
AUTHOR = {Aiello, M. and Chiarella, D. and Papaleo, G.},
TITLE = {Statistical anomaly detection on real e-mail traffic},
YEAR = {2009},
ABSTRACT = {There are many recent studies and proposal in Anomaly Detection Techniques, especially in worm and virus detection. In this field it does matter to answer few important questions like at which ISO/OSI layer data analysis is done and which approach is used. Furthermore these works suffer of scarcity of real data due to lack of network resources or privacy problem: almost every work in this sector uses synthetic (e.g. DARPA) or pre-made set of data. Our study is based on layer seven quantities (number of e-mail sent in a chosen period): we analyzed quantitatively our network e-mail traffic and applied our method on gathered data to detect indirect worm infection (worms which use e-mail to spread infection). The method is a threshold method and, in our dataset, it identified various worm activities. In this document we show our data analysis and results in order to stimulate new approaches and debates in Anomaly Intrusion Detection Techniques},
KEYWORDS = {Anomaly Detection Techniques, indirect worm, real e-mail traffic},
PAGES = {604--611},
URL = {https://iris.cnr.it/handle/20.500.14243/36122},
VOLUME = {4},
NUMBER = {4},
ISSN = {1554-1010},
JOURNAL = {JOURNAL OF INFORMATION ASSURANCE AND SECURITY},
}
@ARTICLE{AIELLO_2009_ARTICLE_ACP_56465,
AUTHOR = {Aiello, M. and Chiarella, D. and Papaleo, G.},
TITLE = {Statistical anomaly detection on real e-mail traffic},
YEAR = {2009},
KEYWORDS = {Anomaly Detection Techniques, indirect worm, real e-mail traffic},
URL = {https://iris.cnr.it/handle/20.500.14243/56465},
}
@ARTICLE{CALZOLARI_2009_ARTICLE_CB_155268,
AUTHOR = {Calzolari, N. and Bel, N.},
TITLE = {FLaReNet: una red para fomentar los recursos lingüísticos (Fostering Language Resources Network: FLaReNet)},
YEAR = {2009},
ABSTRACT = {FLaReNet is a thematic network whose objective is the preparation of strategies and recommendations for the promotion and development of language technologies and the associated language resources because of their importance for minimizing the impact of the linguistic diversity in a digital and multilingual Europe. The results of this joint process of reflection by researchers and professionals of all around the world will be the basis of European agreed policies for funding and promoting this sector},
URL = {https://iris.cnr.it/handle/20.500.14243/155268},
}
@ARTICLE{DIDONATO_2009_ARTICLE_D_384167,
AUTHOR = {Di Donato, F.},
TITLE = {Che cos'è il social software? Architettura delle reti e politiche del nuovo discorso scientifico},
YEAR = {2009},
ABSTRACT = {«Il social software», ha affermato Clay Shirky, docente di New Media alla New York University, «è l'ala sperimentale della filosofia politica, una disciplina inconsapevole di avere un'ala sperimentale». E prosegue: «nei nostri strumenti (tools) stiamo letteralmente codificando i princìpi di libertà di parola e di libertà di espressione. Abbiamo perciò la necessità di discutere gli obiettivi espliciti di quello che stiamo sostenendo e tentando di fare, poiché si tratta di una discussione importante». Questo contributo prende sul serio l'affermazione di Shirky e considera le tecnologie del software sociale da un punto di vista filosofico, sociale e politico a partire da un'analisi della sua filosofia tecnica. L'obiettivo delle pagine che seguono è infatti duplice: in primo luogo, definire le caratteristiche filosofiche, socio-culturali e politiche del social software. In secondo luogo, fare da sponda all'invito di Shirky affrontando la questione del modo in cui si definisce il rapporto tra gli utenti e i produttori (architetti) di tecnologie web},
URL = {https://iris.cnr.it/handle/20.500.14243/384167},
ISSN = {1591-4305},
JOURNAL = {BOLLETTINO TELEMATICO DI FILOSOFIA POLITICA},
}
@ARTICLE{DIDONATO_2009_ARTICLE_D_384160,
AUTHOR = {Di Donato, F.},
TITLE = {Neither Property nor Contracts. On Kant and the Right of the Family},
YEAR = {2009},
ABSTRACT = {"The Right to Persons Akin to Rights to Things" is introduced in the Rechtslehre in order to legitimate family relationships. In fact, according to Kant, family relationships neither can be equated to relations with things, nor are merely contractual. This article considers the implications of family right in Kant's political philosophy and what it can suggest for nowadays issues},
URL = {https://iris.cnr.it/handle/20.500.14243/384160},
ISSN = {1724-6121},
JOURNAL = {HISTORIA PHILOSOPHICA},
}
@ARTICLE{FRANCOPOULO_2009_ARTICLE_FBGCMPS_50345,
AUTHOR = {Francopoulo, G. and Bel, N. and George, M. and Calzolari, N. and Monachini, M. and Pet, M. and Soria, C.},
TITLE = {Multilingual resources for NLP in the Lexical Markup Framework (LMF)},
YEAR = {2009},
ABSTRACT = {Optimizing the production, maintenance and extension of lexical resources is one the crucial aspects impacting Natural Language Processing (NLP). A second aspect involves optimizing the process leading to their integration in applications. With this respect, we believe that a consensual specification on monolingual, bilingual and multilingual lexicons can be a useful aid for the various NLP actors. Within ISO, one purpose of Lexical Markup Framework (LMF, ISO-24613) is to define a standard for lexicons that covers multilingual lexical data},
KEYWORDS = {LMF, Standardization, ISO-TC37},
PAGES = {57--70},
URL = {https://iris.cnr.it/handle/20.500.14243/50345},
VOLUME = {43},
DOI = {10.1007/s10579-008-9077-5},
ISSN = {1574-020X},
JOURNAL = {LANGUAGE RESOURCES AND EVALUATION},
}
@ARTICLE{GUADAGNINI_2009_ARTICLE_G_76222,
AUTHOR = {Guadagnini, E.},
TITLE = {Scelta di voci del Tesoro della Lingua Italiana delle Origini (tredicesima serie)},
YEAR = {2009},
ABSTRACT = {Voci conoscente agg./s.m., conoscenza s.f., freddo agg./s.m. del Tesoro della Lingua Italiana delle Origini (pp. 34-47, 156-166)},
KEYWORDS = {Lessicografia italiana, Italiano antico},
PAGES = {15--186},
URL = {https://iris.cnr.it/handle/20.500.14243/76222},
VOLUME = {14},
ISSN = {1591-8254},
JOURNAL = {BOLLETTINO-OPERA DEL VOCABOLARIO ITALIANO},
}
@ARTICLE{PEZZULO_2009_ARTICLE_P_436877,
AUTHOR = {Pezzulo, G.},
TITLE = {DiPRA: A Layered Agent Architecture which Integrates Practical Reasoning and Sensorimotor Schemas},
YEAR = {2009},
ABSTRACT = {We introduce the layered agent architecture DiPRA (Distributed Practical Reasoning Architecture), composed of an 'intentional' layer, which includes beliefs, plans and goals, and a 'sensorimotor' layer, which includes schemas for situated action. DiPRA's functioning is illustrated and evaluated in a simulated guards-and-thieves scenario. We also discuss the efficacy of the main features of DiPRA, such as the division of labour between off-line planning and on-line specification of action, the grounding of beliefs in sensorimotor interaction and anticipation, the use of bounded resources and knowledge, and the realization of deliberation and means-ends reasoning as intertwined processes},
KEYWORDS = {layered architecture, practical reasoning, grounding, anticipation, schema},
PAGES = {297--326},
URL = {https://iris.cnr.it/handle/20.500.14243/436877},
VOLUME = {21},
DOI = {10.1080/09540090902954170},
ISSN = {0954-0091},
JOURNAL = {CONNECTION SCIENCE},
}
@ARTICLE{PEZZULO_2009_ARTICLE_PBSB_154372,
AUTHOR = {Pezzulo, G. and Butz, M. and Sigaud, O. and Baldassarre, G.},
TITLE = {Anticipatory Behavior in Adaptive Learning Systems: From Psychological Theories to Artificial Cognitive Systems},
YEAR = {2009},
ABSTRACT = {This book constitutes the thoroughly refereed post-workshop proceedings of the 4th International Workshop on Anticipatory Behavior in Adaptive Learning Systems, ABiALS 2008, held in Munich, Germany, in June 2008, in collaboration with the six-monthly Meeting of euCognition 'The Role of Anticipation in Cognition'. The 18 revised full papers presented were carefully selected during two rounds of reviewing and improvement for inclusion in the book. The introductory chapter of this state-of-the-art survey not only provides an overview of the contributions included in this volume but also revisits the current available terminology on anticipatory behavior and relates it to the available system approaches. The papers are organized in topical sections on anticipation in psychology with focus on the ideomotor view, conceptualizations, anticipation and dynamical systems, computational modeling of psychological processes in the individual and social domains, behavioral and cognitive capabilities based on anticipation, and computational frameworks and algorithms},
KEYWORDS = {Adaptive Learning Systems},
URL = {https://iris.cnr.it/handle/20.500.14243/154372},
}
@ARTICLE{PEZZULO_2009_ARTICLE_PC_50344,
AUTHOR = {Pezzulo, G. and Castelfranchi, C.},
TITLE = {Intentional Action: from Anticipation to Goal-Directed Behavior},
YEAR = {2009},
ABSTRACT = {No abstract available},
KEYWORDS = {cognitive modeling},
PAGES = {437-440},
URL = {https://iris.cnr.it/handle/20.500.14243/50344},
VOLUME = {73},
ISSN = {0340-0727},
JOURNAL = {PSYCHOLOGICAL RESEARCH},
}
@ARTICLE{PEZZULO_2009_ARTICLE_PC_436878,
AUTHOR = {Pezzulo, G. and Castelfranchi, C.},
TITLE = {Thinking as the Control of Imagination: a Conceptual Framework for Goal-Directed Systems},
YEAR = {2009},
ABSTRACT = {This paper offers a conceptual framework which (re)integrates goal-directed control, motivational processes, and executive functions, and suggests a developmental pathway from situated action to higher level cognition. We first illustrate a basic computational (control-theoretic) model of goal-directed action that makes use of internal modeling. We then show that by adding the problem of selection among multiple action alternatives motivation enters the scene, and that the basic mechanisms of executive functions such as inhibition, the monitoring of progresses, and working memory, are required for this system to work. Further, we elaborate on the idea that the off-line re-enactment of anticipatory mechanisms used for action control gives rise to (embodied) mental simulations, and propose that thinking consists essentially in controlling mental simulations rather than directly controlling behavior and perceptions. We conclude by sketching an evolutionary perspective of this process, proposing that anticipation leveraged cognition, and by highlighting specific predictions of our model},
KEYWORDS = {cognitive modeling},
PAGES = {559-577},
URL = {https://iris.cnr.it/handle/20.500.14243/436878},
VOLUME = {73},
ISSN = {0340-0727},
JOURNAL = {PSYCHOLOGICAL RESEARCH},
}
@ARTICLE{PIFFERI_2009_ARTICLE_PRPPFMPB_218254,
AUTHOR = {Pifferi, M. and Ragazzo, V. and Previti, A. and Pioggia, G. and Ferro, M. and Macchia, P. and Piacentini, G. L. and Boner, A. L.},
TITLE = {Exhaled Breath Temperature: a key feature to discriminate asthmatic children},
YEAR = {2009},
PAGES = {202-203},
URL = {https://iris.cnr.it/handle/20.500.14243/218254},
VOLUME = {20},
NUMBER = {2},
DOI = {10.1111/j.1399-3038.2008.00839.x},
ISSN = {0905-6157},
JOURNAL = {PEDIATRIC ALLERGY AND IMMUNOLOGY},
}
@ARTICLE{SORIA_2009_ARTICLE_SMBCHHMT_154828,
AUTHOR = {Soria, C. and Monachini, M. and Bertagna, F. and Calzolari, N. and Huang, C. and Hsieh, S. and Marchetti, A. and Tesconi, M.},
TITLE = {Exploring Interoperability of Language Resources: the Case of Cross-lingual Semi-automatic Enrichment of Wordnets},
YEAR = {2009},
ABSTRACT = {In this paper we present an application fostering the integration and interoperability of computational lexicons, focusing on the particular case of mutual linking and cross-lingual enrichment of two wordnets, the ItalWordNet and Sinica BOW lexicons. This is intended as a case study investigating the needs and requirements of semi-automatic integration and interoperability of lexical resources, in the view of developing a prototype web application to support the GlobalWordNet Grid Initiative},
KEYWORDS = {H.3 INFORMATION STORAGE AND RETRIEVAL. Linguistic processing, Distributed language resources, Interoperable lexical resources, Language services},
PAGES = {87-96},
URL = {https://iris.cnr.it/handle/20.500.14243/154828},
VOLUME = {43},
NUMBER = {1},
DOI = {10.1007/s10579-009-9082-3},
ISSN = {1574-020X},
JOURNAL = {LANGUAGE RESOURCES AND EVALUATION},
}
@BOOK{DIDONATO_2009_BOOK_D_384159,
AUTHOR = {Di Donato, F.},
TITLE = {La scienza e la rete. L'uso pubblico della ragione nell'età del Web},
YEAR = {2009},
ABSTRACT = {The advent and spread of Internet and the Web have radically transformed the modes of communication. This book considers a particular ambit of online communication, namely that of science. In the first place, the author reconstructs the circumstances that gave rise to the modern system of scientific communication, and the qualitative and quantitative tools for scientific evaluation. After this, the analysis concentrates on the history, philosophy and architecture of the Web from its inception through to the most recent developments of both a technical (Semantic Web) and a socio-cultural kind (Web 2.0). Finally an open and democratic model for scientific communication is projected and proposed, made possible through the use of transparent, accessible and distributed tools},
URL = {https://iris.cnr.it/handle/20.500.14243/384159},
ISBN = {978-88-8453-494-1},
}
@BOOK{GUADAGNINI_2009_BOOK_G_128770,
AUTHOR = {Guadagnini, E.},
TITLE = {La Rectorique de Cyceron tradotta da Jean d'Antioche. Edizione e glossario},
YEAR = {2009},
KEYWORDS = {Filologia romanza, Jean d'Antioche, Edizione critica, Cicerone},
URL = {https://iris.cnr.it/handle/20.500.14243/128770},
PUBLISHER = {Scuola Normale Superiore (Pisa, ITA)},
ISBN = {9788876423703},
CONFERENCE_PLACE = {Pisa},
}
@INCOLLECTION{AGNOLONI_2009_INCOLLECTION_ABFPMV_165690,
AUTHOR = {Agnoloni, T. and Bacci, L. and Francesconi, E. and Peters, W. and Montemagni, S. and Venturi, G.},
TITLE = {A two-level Knowledge approach to support multilingual legislative drafting},
YEAR = {2009},
KEYWORDS = {DALOS project, Ontological-linguistic},
URL = {https://iris.cnr.it/handle/20.500.14243/165690},
}
@INCOLLECTION{CIGNONI_2009_INCOLLECTION_CF_134816,
AUTHOR = {Cignoni, L. and Fornaciari, G.},
TITLE = {Teaching Funerary Archaeology through a Foreign Language: a Proposal for a Balanced Content and Language Integrated Learning (CLIL)-Based Course},
YEAR = {2009},
ABSTRACT = {Laura Cignoni and Gino Fornaciari's paper outlines a proposal for a CLIL-based University course in Funerary Archaeology, at the University of Pisa. In this case as well, the subject teacher-a university instructor with solid knowledge of the language-will be assisted by a native speaker who will enhance the qualitative dimension of the CLIL methodology being adopted},
KEYWORDS = {CLIL, Teaching, Funerary Archaeology, English},
PAGES = {113-124},
URL = {https://iris.cnr.it/handle/20.500.14243/134816},
PUBLISHER = {Guerra Edizioni (Perugia, ITA)},
ISBN = {978-88-557-0271-3},
CONFERENCE_PLACE = {Perugia},
BOOKTITLE = {CLIL Methodology in University Instruction: online and in the Classroom. An emerging framework},
EDITOR = {Sisti, F.},
}
@INCOLLECTION{DELLORLETTA_2009_INCOLLECTION_DLMMP_233257,
AUTHOR = {Dell'Orletta, F. and Lenci, A. and Marchi, S. and Montemagni, S. and Pirrelli, V.},
TITLE = {Text-2-Knowledge: una piattaforma linguistico-computazionale per l'estrazione di conoscenza da testi},
YEAR = {2009},
ABSTRACT = {The paper describes the automatic extraction of domain knowledge from Italian document collections and presents a fully-implemented ontology learning system (T2K, Text-2-Knowledge) that includes a battery of tools for Natural Language Processing, statistical text analysis and machine learning. Evaluated results show the considerable potential of systems like T2K, exploiting an incremental interleaving of NLP and machine learning techniques for accurate large-scale semi-automatic extraction and structuring of domain-specific knowledge},
KEYWORDS = {Term extraction, Ontology Learning},
PAGES = {285-300},
URL = {https://iris.cnr.it/handle/20.500.14243/233257},
PUBLISHER = {Bulzoni (Roma, ITA)},
ISBN = {978-88-7870-469-5},
CONFERENCE_PLACE = {Roma},
EDITOR = {Ferrari, G. and Benatti, R. and Mosca, M.},
}
@INCOLLECTION{FERRO_2009_INCOLLECTION_FP_256855,
AUTHOR = {Ferro, M. and Pioggia, G.},
TITLE = {A biologically-based framework for distributed sensory fusion and data processing},
YEAR = {2009},
PAGES = {337-364},
URL = {https://iris.cnr.it/handle/20.500.14243/256855},
DOI = {10.5772/6586},
ISBN = {978-3-902613-52-3},
BOOKTITLE = {Sensor and Data Fusion},
EDITOR = {Milisavljevic, N.},
}
@INCOLLECTION{GUADAGNINI_2009_INCOLLECTION_G_128771,
AUTHOR = {Guadagnini, E.},
TITLE = {Amanieu de Sescas, A vos qu'ieu am deszamatz e Dona per cuy planc e sospir},
YEAR = {2009},
KEYWORDS = {Filologia romanza, Provenzalistica, Amanieu de Sescas},
PAGES = {564-605},
URL = {https://iris.cnr.it/handle/20.500.14243/128771},
PUBLISHER = {Salerno (Roma, ITA)},
ISBN = {9788884026545},
CONFERENCE_PLACE = {Roma},
BOOKTITLE = {Salutz d'amor. Edizione critica del corpus occitanico},
EDITOR = {Gambino, F.},
}
@INCOLLECTION{LENCI_2009_INCOLLECTION_LMP_224573,
AUTHOR = {Lenci, A. and Montemagni, S. and Pirrelli, V.},
TITLE = {Annotazione sintattica di corpora: aspetti metodologici},
YEAR = {2009},
ABSTRACT = {Un assunto sempre più condiviso nell'ambito degli studi sull'acquisizione sia di L1 che di L2 è che l'evidenza empirica privilegiata debba essere rappresentata da corpora di produzioni scritte o orali degli apprendenti, estensivamente annotate a molteplici livelli di rappresentazione linguistica. Più in generale, corpora lemmatizzati e annotati a livello morfosintattico fanno ormai parte dello strumentario comune del linguista. Accanto ad essi, si fa però strada l'esigenza di disporre di risorse testuali più sofisticate dal punto di vista delle modalità di esplorazione linguistica, come ad esempio corpora annotati a livello sintattico (le cosiddette treebank). Questi consentono infatti di osservare i processi di convergenza degli apprendenti verso la lingua "obiettivo" anche a livello di specifici tratti grammaticali astratti o di macro-strutture linguistiche. L'articolo propone uno schema di annotazione sintattica caratterizzato da un doppio livello di codifica. Si tratta di un approccio originale che differisce dalla maggior degli schemi di annotazione sintattica esistenti per due aspetti: 1. la separazione della dimensione relazionale da quella a costituenti, che sono trattati a livelli di annotazione indipendenti, ma al tempo stesso correlati, in modo tale che lo stesso testo è simultaneamente interrogabile ai due livelli; 2. la rappresentazione a costituenti fornisce una rappresentazione del testo come sequenza di proto-costituenti sintagmatici non ricorsivi. Questa strategia di annotazione permette una fattorizzazione di diversi aspetti e dimensioni della struttura sintattica che risulta promettente da un lato per l'annotazione di corpora di lingua "non-standard" come quelli contenenti produzioni di apprendenti di L1 o L2, sia come punto di partenza per successivi processi di estrazione di informazione linguistica dal testo. 
Dopo aver illustrato le motivazioni sottostanti allo schema proposto, ciascun livello di rappresentazione (chunking e dipendenze funzionali) viene illustrato in dettaglio, mostrandone anche la possibilità di combinazione sullo stesso testo. L'articolo si chiude con la discussione di prospettive di uso di corpora annotati secondo lo schema di annotazione proposto},
KEYWORDS = {Corpora annotati, annotazione sintattica},
PAGES = {25-46},
URL = {https://iris.cnr.it/handle/20.500.14243/224573},
PUBLISHER = {Guerra Edizioni (Perugia, ITA)},
ISBN = {978-88-557-0168-6},
CONFERENCE_PLACE = {Perugia},
BOOKTITLE = {CORPORA DI ITALIANO L2: TECNOLOGIE, METODI, SPUNTI TEORICI},
EDITOR = {Andorno, C. and Rastelli, S.},
}
@INCOLLECTION{LENCI_2009_INCOLLECTION_LMPV_134815,
AUTHOR = {Lenci, A. and Montemagni, S. and Pirrelli, V. and Venturi, G.},
TITLE = {Ontology learning from Italian legal texts},
YEAR = {2009},
ABSTRACT = {The paper reports on the methodology and preliminary results of a case study in automatically extracting ontological knowledge from Italian legislative texts. We use a fully-implemented ontology learning system (T2K) that includes a battery of tools for Natural Language Processing (NLP), statistical text analysis and machine language learning. Tools are dynamically integrated to provide an incremental representation of the content of vast repositories of unstructured documents. Evaluated results, however preliminary, show the great potential of NLP-powered incremental systems like T2K for accurate large-scale semi-automatic extraction of legal ontologies},
KEYWORDS = {Ontology Learning, document management, legal knowledge extraction},
PAGES = {75-94},
URL = {https://iris.cnr.it/handle/20.500.14243/134815},
DOI = {10.3233/978-1-58603-942-4-75},
ISBN = {978-1-58603-942-4},
BOOKTITLE = {Law, Ontologies and the Semantic Web-Channelling the Legal Information Flood},
EDITOR = {Breuker, J. and Casanovas, P. and Klein, M. C. A. and Francesconi, E.},
}
@INCOLLECTION{MARINELLI_2009_INCOLLECTION_M_134814,
AUTHOR = {Marinelli, R.},
TITLE = {Ontological Structure and Digital Corpora for Metaphorical Sense Recognition},
YEAR = {2009},
ABSTRACT = {Se ha creado una base de datos terminológica que contiene términos que pertenecen al léxico específico de la navegación y el transporte marítimo basada en el modelo EuroWordNet/ItalWordNet. Nuestra investigación lexicográfica tiene como objetivo dar prominencia a la frecuencia de expresiones idiomáticas y metáforas, usadas en el lenguaje común, que provienen de este ámbito cultural. Este artículo trata sobre a) expresiones idiomáticas y metáforas del dominio marítimo, el cual se considera el dominio "fuente", b) el uso y la frecuencia de este tipo de expresiones idiomáticas y metáforas en un corpus extenso del italiano contemporáneo, c) la codificación semántica de las metáforas y las expresiones idiomáticas en la base de datos terminológica, d) la forma en que la estructura ontológica de la base de datos puede contribuir y ayudar en el reconocimiento del sentido metafórico},
KEYWORDS = {Ontology, Corpora, Terminology, Figurative language, Metaphorical sense recognition},
PAGES = {1409-1419},
URL = {https://iris.cnr.it/handle/20.500.14243/134814},
PUBLISHER = {AESLA, Universidad de Almeria (Almeria, ESP)},
ISBN = {978-84-692-1479-4},
CONFERENCE_PLACE = {Almeria},
BOOKTITLE = {Applied Linguistics Now: Understanding Language and Mind / La Lingüística Aplicada actual: Comprendiendo el lenguaje y la mente},
EDITOR = {Callejas, C. M. B. and Sánchez, J. F. F. and Ibáñez, J. R. I. and Sánchez, M. E. G. and De Los Ríos, M. E. C. and Ramiro, S. S. and Martínez, M. S. C. and Honeyman, N. P. and Márquez, B. C.},
}
@INCOLLECTION{PROIETTI_2009_INCOLLECTION_P_403992,
AUTHOR = {Proietti, C.},
TITLE = {Ceteris paribus modalities and the future contingents problem},
YEAR = {2009},
ABSTRACT = {This paper presents two systems of temporal logic, $\Lambda_{CPT}$ and $\Lambda_{CPT@}$, with ceteris paribus modalities. The principal aim is to show how this approach can be useful to give an ockhamist solution to the future contingents problem along the same lines of A. Prior. The interest of this work lies also in the fact that $\Lambda_{CPT@}$ represents an alternative modal account of supervaluationist and post-semantics approaches to temporal reasoning},
KEYWORDS = {temporal logic, future contingents},
PAGES = {304-325},
URL = {https://iris.cnr.it/handle/20.500.14243/403992},
BOOKTITLE = {Logics for Dynamics of Information and Preferences},
EDITOR = {Kuerzen, L. and Quesada, F. V.},
}
@INCOLLECTION{QUOCHI_2009_INCOLLECTION_QDSBMC_50342,
AUTHOR = {Quochi, V. and Del Gratta, R. and Sassolini, E. and Bartolini, R. and Monachini, M. and Calzolari, N.},
TITLE = {A Standard Lexical-Terminological Resource for the Bio Domain},
YEAR = {2009},
ABSTRACT = {The present paper describes a large-scale lexical resource for the biology domain designed both for human and for machine use. This lexicon aims at semantic interoperability and extendability, through the adoption of ISO-LMF standard for lexical representation and through a granular and distributed encoding of relevant information. The first part of this contribution focuses on three aspects of the model that are of particular interest to the biology community: the treatment of term variants, the representation on bio events and the alignment with a domain ontology. The second part of the paper describes the physical implementation of the model: a relational database equipped with a set of automatic uploading procedures. Peculiarity of the BioLexicon is that it combines features of both terminologies and lexicons. A set verbs relevant for the domain is also represented with full details on their syntactic and semantic argument structure},
KEYWORDS = {Lexical representation model, Lexical Database, Computational Lexicography, Special Domains, Standards},
PAGES = {325-335},
URL = {https://link.springer.com/chapter/10.1007/978-3-642-04235-5_28},
VOLUME = {5603},
DOI = {10.1007/978-3-642-04235-5_28},
PUBLISHER = {Springer (Berlin, Heidelberg, DEU)},
ISBN = {978-3-642-04235-5},
CONFERENCE_PLACE = {Berlin, Heidelberg},
BOOKTITLE = {Human Language Technology. Challenges of the Information Society},
}
@EDITORIAL{BELTRAMI_2009_EDITORIAL_BLSABGGIMRV_146301,
AUTHOR = {Beltrami, P. D. and Larson, P. C. and Squillacioti, P. C. and Artale, E. and Boccellari, A. and Giuliani, M. and Guadagnini, E. and Ioriofili, D. and Mosti, R. and Ravani, S. and Vaccaro, G.},
TITLE = {TESORO DELLA LINGUA ITALIANA DELLE ORIGINI-Edizione online: www.vocabolario.org-Versione 2009 di 21000 voci},
YEAR = {2009},
KEYWORDS = {Lessicografia italiana, Italiano antico},
URL = {http://tlio.ovi.cnr.it/TLIO},
ISSN = {2240-5216},
}
@EDITORIAL{CALZOLARI_2009_EDITORIAL_CBBBCGMMOPQST_1087,
AUTHOR = {Calzolari, N. and Baroni, P. and Bel, N. and Budin, G. and Choukri, K. and Goggi, S. and Mariani, J. and Monachini, M. and Odijk, J. and Piperidis, S. and Quochi, V. and Soria, C. and Toral, A.},
TITLE = {Proceedings of the 1st European Language Resources and Technologies Forum: Shaping the Future of the Multilingual Digital Europe},
YEAR = {2009},
ABSTRACT = {Proceedings of the first FLaReNet Forum on the European Language Resources and Technologies, held in Vienna, at the Austrian Academy of Science, on 12-13 February 2009},
KEYWORDS = {Language Resources, Language Technologies, Multilingual, Digital},
PAGES = {105},
URL = {http://www.flarenet.eu/sites/default/files/Vienna09_Proceedings.pdf},
}
@EDITORIAL{CASELLAS_2009_EDITORIAL_CFHM_89193,
AUTHOR = {Casellas, N. and Francesconi, E. and Hoekstra, R. and Montemagni, S. E.},
TITLE = {Proceedings of the 3rd Workshop on Legal Ontologies and Artificial Intelligence Techniques (LOAIT '09) joint with the 2nd Workshop on Semantic Processing of Legal Texts},
YEAR = {2009},
URL = {https://iris.cnr.it/handle/20.500.14243/89193},
ISSN = {2013-5017},
}
@EDITORIAL{WITTENBURG_2009_EDITORIAL_WAFC_183232,
AUTHOR = {Wittenburg, P. and Arppe, A. and Forsstrom, P. and Calzolari, N.},
TITLE = {NEERI 09 Report},
YEAR = {2009},
URL = {https://iris.cnr.it/handle/20.500.14243/183232},
}
@INPROCEEDINGS{ATTARDI_2009_INPROCEEDINGS_AD_65126,
AUTHOR = {Attardi, G. and Dell'Orletta, F.},
TITLE = {Reverse Revision and Linear Tree Combination for Dependency Parsing},
YEAR = {2009},
KEYWORDS = {Dependency parsing, revision parsing, dependency parsing combination},
URL = {https://iris.cnr.it/handle/20.500.14243/65126},
CONFERENCE_NAME = {North American Chapter of the Association for Computational Linguistics-Human Language Technologies},
}
@INPROCEEDINGS{ATTARDI_2009_INPROCEEDINGS_ADSDV_65133,
AUTHOR = {Attardi, G. and Dell'Orletta, F. and Simi, M. and Dei Rossi, S. and Vecchi, E. M.},
TITLE = {The Tanl Named Entity Recognizer at Evalita 2009},
YEAR = {2009},
KEYWORDS = {Named Entity Recognizer},
URL = {https://iris.cnr.it/handle/20.500.14243/65133},
CONFERENCE_NAME = {Evaluation of NLP and Speech Tools for Italian 2009},
}
@INPROCEEDINGS{ATTARDI_2009_INPROCEEDINGS_ADST_65108,
AUTHOR = {Attardi, G. and Dell'Orletta, F. and Simi, M. and Turian, J.},
TITLE = {Accurate Dependency Parsing with a Stacked Multilayer Perceptron},
YEAR = {2009},
KEYWORDS = {Dependency Parsing, Parsing, Multilayer Perceptron},
URL = {https://iris.cnr.it/handle/20.500.14243/65108},
CONFERENCE_NAME = {Evaluation of NLP and Speech Tools for Italian 2009},
}
@INPROCEEDINGS{BELLANDI_2009_INPROCEEDINGS_BT_265113,
AUTHOR = {Bellandi, A. and Turini, F.},
TITLE = {Extending Ontology Queries with Bayesian Network Reasoning},
YEAR = {2009},
URL = {https://iris.cnr.it/handle/20.500.14243/265113},
}
@INPROCEEDINGS{BOSMA_2009_INPROCEEDINGS_BVSRTMMA_158945,
AUTHOR = {Bosma, W. and Vossen, P. and Soroa, A. and Rigau, G. and Tesconi, M. and Marchetti, A. and Monachini, M. and Aliprandi, C.},
TITLE = {KAF: a generic semantic annotation format},
YEAR = {2009},
ABSTRACT = {We present KAF, the KYOTO Annotation Format. KAF is a layered and extendible linguistic annotation format that is specifically developed to arrive at semantic interoperability. KAF is used in seven languages in several applications throughout the KYOTO (Knowledge Yielding Ontologies for Transition-based Organization) project. The goal of these applications is to derive semantic data from linguistically processed text. Separate annotation layers are defined for each annotation process but these can be combined to arrive at a higher level of semantic representation. This paper gives an outline of KAF and a description of how it is applied in the KYOTO project},
KEYWORDS = {I.2.7 Natural Language Processing, Natural language processing, Semantic annotation, Text mining, Standard Formats},
PAGES = {145-152},
URL = {https://iris.cnr.it/handle/20.500.14243/158945},
CONFERENCE_NAME = {5th International Conference on Generative Approaches to the Lexicon},
}
@INPROCEEDINGS{CALZOLARI_2009_INPROCEEDINGS_CS_65131,
AUTHOR = {Calzolari, N. and Soria, C.},
TITLE = {The FLaReNet Thematic Network: a Global Forum for Cooperation},
YEAR = {2009},
KEYWORDS = {Language Resources, Language Technologies},
URL = {https://iris.cnr.it/handle/20.500.14243/65131},
CONFERENCE_NAME = {ACL-IJCNLP 2009-7th Workshop on Asian Language Resources},
}
@INPROCEEDINGS{CASELLI_2009_INPROCEEDINGS_CDP_65129,
AUTHOR = {Caselli, T. and Dell'Orletta, F. and Prodanof, I.},
TITLE = {Temporal Relations with Signals: the Case of Italian Temporal Prepositions},
YEAR = {2009},
KEYWORDS = {temporal relations, taggers, information extraction},
URL = {https://iris.cnr.it/handle/20.500.14243/65129},
CONFERENCE_NAME = {16th International Symposium on Temporal Representation and Reasoning},
}
@INPROCEEDINGS{CASELLI_2009_INPROCEEDINGS_CDP_65128,
AUTHOR = {Caselli, T. and Dell'Orletta, F. and Prodanof, I.},
TITLE = {TETI: a TimeML Compliant TimEx Tagger for Italian},
YEAR = {2009},
KEYWORDS = {temporal expression, information extraction},
URL = {https://iris.cnr.it/handle/20.500.14243/65128},
CONFERENCE_NAME = {International Multiconference on Computer Science and Information Technology},
}
@INPROCEEDINGS{CIGNONI_2009_INPROCEEDINGS_CF_65111,
AUTHOR = {Cignoni, L. and Fornaciari, G.},
TITLE = {Combining different Technologies in a Funerary Archaeology content and language integrated Learning (CLIL) Course},
YEAR = {2009},
KEYWORDS = {Funerary archaeology, CLIL, Language teaching, Computer technology, Field archaeology},
PAGES = {4284-4293},
URL = {https://iris.cnr.it/handle/20.500.14243/65111},
ISBN = {978-84-612-9802-0},
CONFERENCE_NAME = {International Conference on Education and New Learning Technologies},
BOOKTITLE = {International Conference on Education and New Learning Technologies},
EDITOR = {Chova, L. G. and Belenguer, D. M. and Torres, I. C.},
}
@INPROCEEDINGS{CIGNONI_2009_INPROCEEDINGS_CPS_65114,
AUTHOR = {Cignoni, L. and Pardelli, G. and Sassi, M.},
TITLE = {Grey Literature for Natural Language Processing: a Terminological and Statistical Approach},
YEAR = {2009},
ABSTRACT = {This paper presents the results of a study on grey literature (GL) in the field of Natural Language Processing (NLP). Our data has been collected in a corpus of ca 13,000 records corresponding to the titles of papers presented at International Conferences from 1950 to June 2008. A statistical representation of the most significant terms relative to GL in NLP and other interrelated disciplines associates old and new words, highlighting the terminological changes that have taken place in the course of time. Aim of our study is to contribute to the creation of language resources for the extraction of GL coming from the Web in order to help prevent the disappearance of documents containing NLP words that have undergone rapid development over the last decades. This paper is organised as follows: after a general introduction to our work, section 2 provides a historical overview of NLP; sections 3 and 4 offer an account of the most relevant terms used by specialists in different periods, and indicative of the changes that have taken place; section 5 describes the methodology we have used and also contains information on our GL database and a graphical representation of the data. Finally, the conclusions stress the need to integrate pre-existing or obsolete words and expressions, creating NLP synonym relations},
KEYWORDS = {Computational Linguistics, Terminology, Grey Literature},
PAGES = {93-100},
URL = {https://iris.cnr.it/handle/20.500.14243/65114},
PUBLISHER = {TextRelease (Amsterdam, NLD)},
ISSN = {1386-2316},
ISBN = {978-90-77484-11-1},
CONFERENCE_NAME = {Tenth International Conference on Grey Literature: Designing the Grey Grid for Information Society},
CONFERENCE_PLACE = {Amsterdam},
BOOKTITLE = {THE GL-CONFERENCE SERIES. CONFERENCE PROCEEDINGS},
EDITOR = {Farace, D. J. and Frantzen, J.},
}
@INPROCEEDINGS{DELLORLETTA_2009_INPROCEEDINGS_D_65107,
AUTHOR = {Dell'Orletta, F.},
TITLE = {Ensemble system for Part-of-Speech tagging},
YEAR = {2009},
KEYWORDS = {Part-of-Speech tagging, Ensemble system},
URL = {https://iris.cnr.it/handle/20.500.14243/65107},
CONFERENCE_NAME = {Evaluation of NLP and Speech Tools for Italian 2009},
}
@INPROCEEDINGS{GIGLIOTTA_2009_INPROCEEDINGS_GPN_65115,
AUTHOR = {Gigliotta, O. and Pezzulo, G. and Nolfi, S.},
TITLE = {How internal modeling arises when 'the world is not enough': an evolutionary robotics study},
YEAR = {2009},
KEYWORDS = {cognitive robotics},
URL = {https://iris.cnr.it/handle/20.500.14243/65115},
CONFERENCE_NAME = {Ninth International Conference on Epigenetic Robotics: Modeling Cognitive Development in Robotic Systems},
}
@INPROCEEDINGS{IDE_2009_INPROCEEDINGS_IPCS_65132,
AUTHOR = {Ide, N. and Pustejovsky, J. and Calzolari, N. and Soria, C.},
TITLE = {The SILT and FLaReNet International Collaboration for Interoperability},
YEAR = {2009},
KEYWORDS = {Interoperability, Language Resources, Language Technologies},
URL = {https://iris.cnr.it/handle/20.500.14243/65132},
CONFERENCE_NAME = {ACL-IJCNLP 2009-3rd Linguistic Annotation Workshop},
}
@INPROCEEDINGS{JEZEK_2009_INPROCEEDINGS_JQC_65125,
AUTHOR = {Jezek, E. and Quochi, V. and Calzolari, N.},
TITLE = {Relevance of Qualia Relations in Coercive Contexts},
YEAR = {2009},
KEYWORDS = {annotation, annotation scheme, semantics, type shift},
URL = {https://iris.cnr.it/handle/20.500.14243/65125},
CONFERENCE_NAME = {5th International Conference on Generative Approaches to the Lexicon},
}
@INPROCEEDINGS{MARINELLI_2009_INPROCEEDINGS_M_65120,
AUTHOR = {Marinelli, R.},
TITLE = {La terminologia condivisa: uno strumento trasversale di lavoro},
YEAR = {2009},
KEYWORDS = {Terminologia, Data Base Semantico Lessicale},
URL = {https://iris.cnr.it/handle/20.500.14243/65120},
CONFERENCE_NAME = {Arte di Ascoltare Laboratorio Interattivo},
}
@INPROCEEDINGS{MARINELLI_2009_INPROCEEDINGS_M_145358,
AUTHOR = {Marinelli, R.},
TITLE = {Costruzione di un database terminologico di dominio fiscale: descrizione e metodologia},
YEAR = {2009},
KEYWORDS = {Terminologia, Database relazionale, Data Base Semantico Lessicale},
URL = {https://iris.cnr.it/handle/20.500.14243/145358},
CONFERENCE_NAME = {Ottava giornata REI: Le parole per dirlo: terminologia e normalizzazione linguistica. Presentazione dei risultati dei gruppi di lavoro REI},
}
@INPROCEEDINGS{MORGAVI_2009_INPROCEEDINGS_MMCMTB_144763,
AUTHOR = {Morgavi, G. and Marconi, L. and Cutugno, P. and Morando, M. and Turrini, G. and Baroni, P.},
TITLE = {WIKIMEMO: A Portal for Italian Language and Culture Heritage Conservation},
YEAR = {2009},
ABSTRACT = {Since 150 years Italian people migrated abroad. Today the community with people with Italian origin add up to 10 million of people, including immigrant descendants in different countries. For these community the link with their original root can be useful for maintaining the self identity. In this paper we present the architecture for the design of Wikimemo, a portal for Italian Language and Culture Heritage conservation. From one side it aims to supply instruments to retrieve the records of the immigration experiences allowing their story telling through voices, sounds, pictures, documents, objects, from the others it offers didactical instruments (like texts, frequency lexicon, form vocabulary, anagrams lists etc.) useful for ameliorating the language knowledge. The whole project is focused on the autobiographical writing, the importance of free sharing of experiences and memories, of linguistic and cultural resources, of tools supporting the Italian language learning. The problems connected with the importance of a friendly user interface and of the usage of security tools is underlined},
KEYWORDS = {Patrimonio Culturale, Italiano},
PAGES = {298-302},
URL = {http://www.santiago.cu/hosting/linguistica/descargar.php?d=634},
PUBLISHER = {Centro de linguística aplicada, Ministerio de ciencia, tecnología y medio ambiente (Santiago de Cuba, CUB)},
ISBN = {978-959-7174-14-1},
CONFERENCE_NAME = {XI simposio Internacional de Comunicación Social Santiago de Cuba},
CONFERENCE_PLACE = {Santiago de Cuba},
BOOKTITLE = {Actas, XI Simposio Internacional Comunicación Social},
EDITOR = {Alvarez Silva, M. R. and Alvares Moreno, C. and Ruiz Miyares, L.},
}
@INPROCEEDINGS{MORGAVI_2009_INPROCEEDINGS_MMMC_56525,
AUTHOR = {Morgavi, G. and Marconi, L. and Morando, M. and Cutugno, P.},
TITLE = {From creative cognitive learning to adaptable artificial system design},
YEAR = {2009},
ABSTRACT = {Background: Over the last decade, a number of researchers have suggested a developmental perspective on AI and robotics. The ultimate shared goal among them seems to be the idea of bootstrapping high-level cognition through a process in which the agent interacts with a real physical environment over extended periods of time [2]. These studies generated epigenetic robotics, a new AI/ robotics field which includes the two-fold goal of understanding biological systems by the interdisciplinary integration between social/life and engineering sciences and, simultaneously, that of enabling robots and other artificial systems to autonomously develop skills for any particular environment (instead of programming them to solve particular goals for a specific environment). Interdisciplinary theory and empirical evidence are used to inform epigenetic robotic models, and these models can be used as theoretical tools to make experimental predictions in developmental psychology and other disciplines studying cognitive development in living systems. One of the fundamental methodological assumptions is that cognition is embodied, which means that it arises from bodily interactions with the real world[1]. The next logical step along the road towards truly autonomous robots that can dive in unpredictable environments is to investigate how one might design robots that are capable of `growing up' through experience. A living artifact grows up when its capabilities, abilities/knowledge, shift to a further level of complexity [3]. Following different psychological points of view, growing up implies: adaptation, change of functional meaning; increased complexity; enlargement of the internal knowledge map; abstraction and insight},
KEYWORDS = {creative processes, abstraction, growing up},
PAGES = {257-260},
URL = {http://www.isefc.rnu.tn/cem09/Downloads/Cem09_Abstracts_Book.pdf},
ISBN = {978-9973-13-009-9},
CONFERENCE_NAME = {CEM09 International Congress on Cognition, Emotion \& Motivation},
EDITOR = {Masmoudi, S. and Naceur, A.},
}
@INPROCEEDINGS{NAMER_2009_INPROCEEDINGS_NBJR_65123,
  AUTHOR          = {Namer, F. and Bouillon, P. and Jacquey, E. and Ruimy, N.},
  TITLE           = {Morphology-based Enhancement of a French SIMPLE Lexicon},
  YEAR            = {2009},
  ABSTRACT        = {In this paper, we propose a semi-automatic methodology for acquiring a French SIMPLE lexicon based on the morphological properties of complex words. This method combines the results of the French morphological analyzer DériF with information from general lexical resources and corpora, when available. It is evaluated on a set of neologisms extracted from Le Monde newspaper corpora},
  KEYWORDS        = {Morphology, SIMPLE, French electronic lexicon, Italian electronic lexicon},
  URL             = {https://iris.cnr.it/handle/20.500.14243/65123},
  CONFERENCE_NAME = {5th International Conference on Generative Approaches to the Lexicon},
}
@INPROCEEDINGS{OGNIBENE_2009_INPROCEEDINGS_OPB_65113,
  AUTHOR          = {Ognibene, D. and Pezzulo, G. and Baldassarre, G.},
  TITLE           = {How Are Representations Affected by Scene Statistics in an Adaptive Active Vision System?},
  YEAR            = {2009},
  KEYWORDS        = {cognitive robotics},
  URL             = {https://iris.cnr.it/handle/20.500.14243/65113},
  CONFERENCE_NAME = {Ninth International Conference on Epigenetic Robotics: Modeling Cognitive Development in Robotic Systems},
}
@INPROCEEDINGS{PARDELLI_2009_INPROCEEDINGS_PSGO_65112,
  AUTHOR           = {Pardelli, G. and Sassi, M. and Goggi, S. and Orsolini, P.},
  TITLE            = {Computational Linguistics Terminology},
  YEAR             = {2009},
  ABSTRACT         = {The aim of this article is to provide a statistical representation of significant terms used in the field of Natural Language Processing from the 1960's till nowadays, in order to draft a survey on the most significant research trends in that period. By retrieving these keywords it should be possible to highlight the ebb and flow of some thematic topics. The NLP terminological sample derives from a database-created for this purpose using the DBT software (Textual Data Base, ILC patent). Scientific presentations at the above-mentioned conferences point out a frequent recurrence of expressions such as mécanisation des études lexicologique, les machines à cartes perforées et leurs application lexicologique which trace back to the origin of electronic processing of linguistic data and to some solutions of linguistic-literary problems, to lexicographic researches, to the scientific terminology, to automatic dictionaries, to homographs, synonyms and the possibility of producing indexes and concordances by means of an electronic processor: Terms such as meccanizzazione, mechanical translation, machine à traduire used by experts of the field in the 1950s and 1960s seem to well testify the change, the shift, the beginning and then the final consecration of a rapidly evolving field: Natural Language Processing},
  KEYWORDS         = {Computational Linguistics, Terminology},
  PAGES            = {303-307},
  URL              = {https://iris.cnr.it/handle/20.500.14243/65112},
  PUBLISHER        = {Centro de linguística aplicada, Ministerio de ciencia, tecnología y medio ambiente (Santiago de Cuba, CUB)},
  ISBN             = {978-959-7174-14-1},
  CONFERENCE_NAME  = {XI Simposio Internacional de Comunicación Social},
  CONFERENCE_PLACE = {Santiago de Cuba},
  EDITOR           = {Alvarez Silvia, M. R. and Alvarez Moreno, C. and Ruiz Miyares, L.},
}
@INPROCEEDINGS{RUIMY_2009_INPROCEEDINGS_R_65134,
  AUTHOR           = {Ruimy, N.},
  TITLE            = {Une Ressource Lexicale Exploitable},
  YEAR             = {2009},
  ABSTRACT         = {Cet article se propose de donner une vue d'ensemble d'un vaste lexique électronique de l'italien qui fournit un grand nombre d'informations concernant quatre niveaux de description linguistique. Les modules syntaxique et sémantique sont particulièrement riches et intéressants; ils offrent une représentation très fine du comportement des lexèmes et mettent en relief les rapports étroits existant entre ces deux niveaux de description. Grâce à la richesse de son contenu et à l'excellence de son modèle, ce lexique peut être exploité dans différents secteurs, tant dans les applications de TAL que pour la dérivation de lexiques analogues dans d'autres langues},
  KEYWORDS         = {Lexique électronique, syntaxe, Lexique Génératif, sémantique, structure argumentale},
  PAGES            = {290-300},
  URL              = {https://iris.cnr.it/handle/20.500.14243/65134},
  PUBLISHER        = {University of Bergen (Bergen, NOR)},
  ISSN             = {1890-4580},
  CONFERENCE_NAME  = {The 28th Conference on Lexis and Grammar},
  CONFERENCE_PLACE = {Bergen},
  BOOKTITLE        = {ARENA ROMANISTICA},
  EDITOR           = {Skogseth Clausen, C. and Alvsåker Didriksen, A. and Müller Gjesdal, A. and Moss, B.},
}
@INPROCEEDINGS{SASSI_2009_INPROCEEDINGS_S_65119,
  AUTHOR          = {Sassi, M.},
  TITLE           = {La obra de Alejo Carpentier en versión digital: historial, descripción y propuestas},
  YEAR            = {2009},
  KEYWORDS        = {Banca dati Testuale, Alejo Carpentier},
  URL             = {https://iris.cnr.it/handle/20.500.14243/65119},
  CONFERENCE_NAME = {XI Simposio Internacional de Comunicación Social},
}
@INPROCEEDINGS{SASSI_2009_INPROCEEDINGS_SPG_65130,
  AUTHOR          = {Sassi, M. and Pardelli, G. and Goggi, S.},
  TITLE           = {Terminology Extraction from the web},
  YEAR            = {2009},
  ABSTRACT        = {This paper presents the results of a study on textual resources in the field of Human Language Technology (HLT). A statistical representation of the most significant terms in HLT and other interrelated disciplines associates old and new words, highlighting the terminological changes that have taken place in the course of time. Aim of our study is to contribute to the creation of language resources for the extraction of documentation coming from the Web in order to help preventing the disappearance of documents containing HLT words that have undergone rapid development over the last decades. This paper is organised as follows: after a general introduction to our work, section 2 provides a historical overview of HLT; sections 3 and 4 offer an account of the most relevant terms used by specialists in different periods, and those indicative of the changes that have taken place; section 5 describes the methodology we have used and also contains information on our database and a graphical representation of the data. Finally, the conclusions stress the need to integrate pre-existing or obsolete words and expressions, creating HLT synonym relations},
  KEYWORDS        = {Terminology, Computational Linguistics, Web-based information},
  PAGES           = {417-420},
  URL             = {https://iris.cnr.it/handle/20.500.14243/65130},
  ISBN            = {978-83-7177-746-2},
  CONFERENCE_NAME = {4th Language Technology Conference: Human Language Technology as a challenge for Computer Science and Linguistics},
  EDITOR          = {Vetulani, Z.},
}
% NOTE(review): CONFERENCE_NAME holds only 4, which looks truncated - confirm the venue against the repository record.
@INPROCEEDINGS{SASSOLINI_2009_INPROCEEDINGS_SP_65122,
  AUTHOR          = {Sassolini, E. and Picchi, E.},
  TITLE           = {Text Power: tools for the Cultural Heritage},
  YEAR            = {2009},
  KEYWORDS        = {Text power, Text mining, Cultural Heritage},
  URL             = {https://iris.cnr.it/handle/20.500.14243/65122},
  CONFERENCE_NAME = {4},
}
@INPROCEEDINGS{SASSOLINI_2009_INPROCEEDINGS_SPEG_65116,
  AUTHOR          = {Sassolini, E. and Picchi, E. and Ensini, M. and Guerriero, L.},
  TITLE           = {Il progetto SUBITO e l'analisi semantica come strumento utile all'innovazione biomedica},
  YEAR            = {2009},
  KEYWORDS        = {Biomedicina, Analisi Semantica, Progetto "Subito"},
  URL             = {https://iris.cnr.it/handle/20.500.14243/65116},
  CONFERENCE_NAME = {10° Congresso Nazionale @ITIM 2009, Monserrato, Cagliari, Italy},
}
@INPROCEEDINGS{SORIA_2009_INPROCEEDINGS_SMV_65135,
  AUTHOR           = {Soria, C. and Monachini, M. and Vossen, P.},
  TITLE            = {Wordnet-LMF: Fleshing out a Standardized Format for Wordnet Interoperability},
  YEAR             = {2009},
  ABSTRACT         = {In this paper we present Wordnet-LMF, a dialect of ISO Lexical Markup Framework that instantiates LMF for representing wordnets. Wordnet-LMF was developed in the framework of the EU KYOTO project for the specific purpose of endowing a set of wordnets with a standardized interoperability format allowing the interchange of lexicosemantic information encoded in each of them. The aim of this format is twofold: a) to give a preliminary assessment of LMF, by large-scale application to real lexical resources; b) to endow WordNet with a format representation that will allow easier integration among resources sharing the same structure (i.e. other wordnets) and, more importantly, across resources with different theoretical and implementation approaches},
  KEYWORDS         = {Standards, Lexical Markup Framework, Lexical resources, Wordnets, Intercultural collaboration},
  PAGES            = {139-146},
  URL              = {https://iris.cnr.it/handle/20.500.14243/65135},
  PUBLISHER        = {ACM, Association for computing machinery (New York, USA)},
  ISBN             = {978-1-60558-198-9},
  CONFERENCE_NAME  = {International Workshop on Intercultural Collaboration},
  CONFERENCE_PLACE = {New York},
  BOOKTITLE        = {Proceedings of the International Workshop on Intercultural Collaboration},
}
@INPROCEEDINGS{SPINOSA_2009_INPROCEEDINGS_SGCMVM_1330,
  AUTHOR           = {Spinosa, P. and Giardiello, G. and Cherubini, M. and Marchi, S. and Venturi, G. and Montemagni, S.},
  TITLE            = {NLP based Metadata Extraction for Legal Text Consolidation},
  YEAR             = {2009},
  ABSTRACT         = {The paper describes a system for the automatic consolidation of Italian legislative texts to be used as a support of an editorial consolidating activity and dealing with the following typology of textual amendments: repeal, substitution and integration. The focus of the paper is on the semantic analysis of the textual amendment provisions and the formalized representation of the amendments in terms of metadata. The proposed approach to consolidation is metadata-oriented and based on Natural Language Processing (NLP) techniques: we use XML-based standards for metadata annotation of legislative acts and a flexible NLP architecture for extracting metadata from parsed texts. An evaluation of achieved results is also provided},
  KEYWORDS         = {Natural Language Processing, textual amendments, XML representation, metadata extraction, consolidation of legal text},
  PAGES            = {40-49},
  URL              = {https://iris.cnr.it/handle/20.500.14243/1330},
  DOI              = {10.1145/1568234.1568240},
  PUBLISHER        = {Association for Computing Machinery (ACM) (New York, USA)},
  ISBN             = {978-1-60558-597-0},
  CONFERENCE_NAME  = {Twelfth International Conference on Artificial Intelligence and Law (ICAIL 2009)},
  CONFERENCE_PLACE = {New York},
  BOOKTITLE        = {Proceedings of the 12th International Conference on Artificial Intelligence and Law},
  EDITOR           = {Hafner, C. D. and Casanovas, P.},
}
@INPROCEEDINGS{TOKUNAGA_2009_INPROCEEDINGS_TKCMSSCTXHHK_65124,
  AUTHOR          = {Tokunaga, T. and Kaplan, D. and Calzolari, N. and Monachini, M. and Soria, C. and Sornlertlamvanich, V. and Charoenporn, T. and Tesconi, M. and Xia, Y. and Huang, C. and Hsieh, S. and Shirai, K.},
  TITLE           = {Query Expansion using LMF-Compliant Lexical Resources},
  YEAR            = {2009},
  ABSTRACT        = {This paper reports prototype multilingual query expansion system relying on LMF compliant lexical resources. The system is one of the deliverables of a three-year project aiming at establishing an international standard for language resources which is applicable to Asian languages. Our important contributions to ISO 24613, standard Lexical Markup Framework (LMF) include its robustness to deal with Asian languages, and its applicability to cross-lingual query tasks, as illustrated by the prototype introduced in this paper},
  KEYWORDS        = {Lexical resources, Lexical Markup Framework (LMF), Standards},
  PAGES           = {145-152},
  URL             = {https://iris.cnr.it/handle/20.500.14243/65124},
  ISBN            = {978-1-932432-56-5},
  CONFERENCE_NAME = {ACL-IJCNLP 2009-7th Workshop on Asian Language Resources},
}
@INPROCEEDINGS{TORAL_2009_INPROCEEDINGS_TMSR_65127,
  AUTHOR          = {Toral, A. and Monachini, M. and Soroa, A. and Rigau, G.},
  TITLE           = {Studying the role of Qualia Relations for Word Sense Disambiguation},
  YEAR            = {2009},
  KEYWORDS        = {Generative Lexicon, Semantic Information Extraction, Word Sense Disambiguation},
  URL             = {https://iris.cnr.it/handle/20.500.14243/65127},
  CONFERENCE_NAME = {5th International Conference on Generative Approaches to the Lexicon},
}
@INPROCEEDINGS{VENTURI_2009_INPROCEEDINGS_VLMVSTA_155070,
  AUTHOR          = {Venturi, G. and Lenci, A. and Montemagni, S. and Vecchi, E. M. and Sagri, M. T. and Tiscornia, D. and Agnoloni, T.},
  TITLE           = {Towards a FrameNet Resource for the Legal Domain},
  YEAR            = {2009},
  KEYWORDS        = {Frame Semantics, Legal Ontologies, Knowledge Representation, Corpus Annotation},
  URL             = {https://iris.cnr.it/handle/20.500.14243/155070},
  CONFERENCE_NAME = {3rd Workshop on Legal Ontologies and Artificial Intelligence Techniques joint with 2nd Workshop on Semantic Processing of Legal text},
}
@INPROCEEDINGS{VENTURI_2009_INPROCEEDINGS_VMMSTMA_65110,
  AUTHOR           = {Venturi, G. and Montemagni, S. and Marchi, S. and Sasaki, Y. and Thompson, P. and McNaught, J. and Ananiadou, S.},
  TITLE            = {Bootstrapping a Verb Lexicon for Biomedical Information Extraction},
  YEAR             = {2009},
  ABSTRACT         = {The extraction of information from texts requires resources that contain both syntactic and semantic properties of lexical units. As the use of language in specialized domains, such as biology, can be very different to the general domain, there is a need for domain-specific resources to ensure that the information extracted is as accurate as possible. We are building a large-scale lexical resource for the biology domain, providing information about predicate-argument structure that has been bootstrapped from a biomedical corpus on the subject of E. Coli. The lexicon is currently focussed on verbs, and includes both automatically-extracted syntactic subcategorization frames, as well as semantic event frames that are based on annotation by domain experts. In addition, the lexicon contains manually-added explicit links between semantic and syntactic slots in corresponding frames. To our knowledge, this lexicon currently represents a unique resource within in the biomedical domain},
  KEYWORDS         = {domain-specific lexical resources, Biological Language Processing, syntax-semantic linking},
  PAGES            = {137-148},
  URL              = {https://iris.cnr.it/handle/20.500.14243/65110},
  DOI              = {10.1007/978-3-642-00382-0_11},
  PUBLISHER        = {Springer-Verlag (Berlin Heidelberg, DEU)},
  ISBN             = {9783642003813},
  CONFERENCE_NAME  = {10th International Conference on Intelligent Text Processing and Computational Linguistics},
  CONFERENCE_PLACE = {Berlin Heidelberg},
}
% NOTE(review): same title and authors as ZAMPONI_2009_INPROCEEDINGS_ZMMC_67789 - presumably a duplicate record; confirm before merging.
@INPROCEEDINGS{ZAMPONI_2009_INPROCEEDINGS_ZMCM_65118,
  AUTHOR          = {Zamponi, R. and Marconi, L. and Cutugno, P. and Morgavi, G.},
  TITLE           = {La lengua fang de la oralidad al diccionario: cuestiones y problemas atados a la realización de un diccionario bilingüe fang-español y español-fang},
  YEAR            = {2009},
  ABSTRACT        = {El fang es una lengua bantú de Africa centro-occidental a tradición oral y a fuerte fragmentación dialectal, sin un estandard y una norma ortográfica de referencia, que muestra hoy día, en Guinea Ecuatorial, país en que reside más allá de la mitad de los suyos ca. 450.000 hablantes, señales de desintegración bajo el empuje del español (lengua oficial y hegemónica). En las notas que siguen se delinean algunas cuestiones y problemas emergidos en la compilación de un diccionario bilingue fang-español y español-fang atados a el estatus sociolinguístico del fang, a la ausencia de estudios gramaticales detallados y de diccionarios modernos de esta lengua y, en fin, a la traducción del material léxico recogido por nosotros},
  URL             = {https://iris.cnr.it/handle/20.500.14243/65118},
  ISBN            = {978-959-7174-14-1},
  CONFERENCE_NAME = {XI Simposio Internacional de Comunicación Social},
}
@INPROCEEDINGS{ZAMPONI_2009_INPROCEEDINGS_ZMMC_67789,
  AUTHOR          = {Zamponi, R. and Marconi, L. and Morgavi, G. and Cutugno, P.},
  TITLE           = {La lengua fang de la oralidad al diccionario: cuestiones y problemas atados a la realización de un diccionario bilingüe fang-español y español-fang},
  YEAR            = {2009},
  URL             = {https://iris.cnr.it/handle/20.500.14243/67789},
  CONFERENCE_NAME = {XI Simposio Internacional de Comunicación Social},
}
@INPROCEEDINGS{MARINELLI_2009_INPROCEEDINGS_MSC_106753,
  AUTHOR          = {Marinelli, R. and Spadoni, G. and Cucurullo, S.},
  TITLE           = {Visual information to improve a lexical-semantic terminological resource},
  YEAR            = {2009},
  ABSTRACT        = {The lexical semantic database MariTerm contains structured information about the specialized terminology of the maritime domain (maritime navigation and transport). This paper describes the main phases of a project which aims to enhance the terminological database by means of a set of images: a) the structure of the terminological database; b) the domain conceptual modelling; c) the database management tool which, among its various features, allows visualization on demand of the image which is associated with the term being sought, contributing to clarification of the meaning of the term and increasing its information and communication potential},
  KEYWORDS        = {Lexical Semantic Data Bases, Visual Information, Terminology},
  PAGES           = {159-160},
  URL             = {https://iris.cnr.it/handle/20.500.14243/106753},
  CONFERENCE_NAME = {XXVII AESLA Conference "Modos y formas de la comunicación humana-Ways and modes of human communication"},
}
@INPROCEEDINGS{MARZI_2009_INPROCEEDINGS_MPS_106754,
  AUTHOR          = {Marzi, C. and Pardelli, G. and Sassi, M.},
  TITLE           = {Grey Literature and Computational Linguistics: From Paper to Net},
  YEAR            = {2009},
  ABSTRACT        = {The advent and exponential development of the World Wide Web has led to an increasing availability of unstructured knowledge and distributed information sources, meeting general public requirements that are hardly addressed by other more traditional information channels. This trend has concurrently raised a considerable interest in the application of Computational Linguistics (CL) methodologies to document access and retrieval, as they offer the unprecedented opportunity to make the subjective, user-centred information demands of Net citizens meet the ever changing and heterogeneous information flow of the web. Over the last five years, more and more Italian Universities have introduced CL courses into their Humanities curricula, making available on-line teaching materials, tutorials and language engineering software that appear to supply the lack of offer from traditional Italian publishing houses. In this paper, we consider in some detail the role played by this type of Grey Literature in bringing up a wider and increasingly more aware community of web users in Italy. Theme: Impact of Grey Literature on Net Citizens},
  KEYWORDS        = {Computational Linguistics, Grey Literature, Web-based information},
  PAGES           = {81-84},
  URL             = {https://iris.cnr.it/handle/20.500.14243/106754},
  ISBN            = {978-90-77484-14-2},
  CONFERENCE_NAME = {Eleventh International Conference on Grey Literature "The Grey Mosaic, Piecing it All Together"},
  BOOKTITLE       = {Eleventh International Conference on Grey Literature "The Grey Mosaic, Piecing it All Together"},
  EDITOR          = {Farace, D. J. and Frantzen, J.},
}
@INPROCEEDINGS{MORGAVI_2009_INPROCEEDINGS_MMMC_236954,
  AUTHOR          = {Morgavi, G. and Marconi, L. and Morando, M. and Cutugno, P.},
  TITLE           = {From creative cognitive learning to adaptable artificial system design},
  YEAR            = {2009},
  ABSTRACT        = {Background: Over the last decade, a number of researchers have suggested a developmental perspective on AI and robotics. The ultimate shared goal among them seems to be the idea of bootstrapping high-level cognition through a process in which the agent interacts with a real physical environment over extended periods of time [2]. These studies generated epigenetic robotics, a new AI/ robotics field which includes the two-fold goal of understanding biological systems by the interdisciplinary integration between social/life and engineering sciences and, simultaneously, that of enabling robots and other artificial systems to autonomously develop skills for any particular environment (instead of programming them to solve particular goals for a specific environment). Interdisciplinary theory and empirical evidence are used to inform epigenetic robotic models, and these models can be used as theoretical tools to make experimental predictions in developmental psychology and other disciplines studying cognitive development in living systems. One of the fundamental methodological assumptions is that cognition is embodied, which means that it arises from bodily interactions with the real world[1]. The next logical step along the road towards truly autonomous robots that can dive in unpredictable environments is to investigate how one might design robots that are capable of `growing up' through experience. A living artifact grows up when its capabilities, abilities/knowledge, shift to a further level of complexity [3]. Following different psychological points of view, growing up implies: adaptation, change of functional meaning; increased complexity; enlargement of the internal knowledge map; abstraction and insight},
  KEYWORDS        = {creative processes, abstraction, growing up},
  PAGES           = {257-260},
  URL             = {http://www.isefc.rnu.tn/cem09/Downloads/Cem09_Abstracts_Book.pdf},
  ISBN            = {978-9973-13-009-9},
  CONFERENCE_NAME = {CEM09 International Congress on Cognition, Emotion \& Motivation},
  BOOKTITLE       = {Cognition Emotion Motivation Percept-Concept-Decision: Application to Learning Activities},
  EDITOR          = {Masmoudi, S. and Naceur, A.},
}
@TECHREPORT{ALIPRANDI_2009_TECHREPORT_ANMRTSMVBAADRS_183221,
  AUTHOR   = {Aliprandi, C. and Neri, F. and Marchetti, A. and Ronzano, F. and Tesconi, M. and Soria, C. and Monachini, M. and Vossen, P. and Bosma, W. and Agirre, E. and Artola, X. and Diaz de Ilarraza, A. and Rigau, G. and Soroa, A.},
  TITLE    = {Database Models and Data Formats},
  YEAR     = {2009},
  KEYWORDS = {XML data format, TMF, SEMAF, OWL/KIF, FACTAF},
  URL      = {https://iris.cnr.it/handle/20.500.14243/183221},
}
@TECHREPORT{BARONI_2009_TECHREPORT_B_247455,
  AUTHOR   = {Baroni, P.},
  TITLE    = {FLaReNet Web Statistics: 7 December 2008-31 August 2009},
  YEAR     = {2009},
  ABSTRACT = {Statistics relating to the access to the FLaReNet Web site from 7 December 2008 to 31 August 2009},
  KEYWORDS = {Language Resources, Web Statistics},
  PAGES    = {6},
  URL      = {https://iris.cnr.it/handle/20.500.14243/247455},
}
@TECHREPORT{CALZOLARI_2009_TECHREPORT_CBGMQST_183227,
  AUTHOR   = {Calzolari, N. and Baroni, P. and Goggi, S. and Monachini, M. and Quochi, V. and Soria, C. and Toral, A.},
  TITLE    = {ECP-2007-LANG-617001 FLaReNet: Dissemination Plan},
  YEAR     = {2009},
  KEYWORDS = {Language Resources},
  URL      = {https://iris.cnr.it/handle/20.500.14243/183227},
}
@TECHREPORT{CALZOLARI_2009_TECHREPORT_CBGMQST_183230,
  AUTHOR   = {Calzolari, N. and Baroni, P. and Goggi, S. and Monachini, M. and Quochi, V. and Soria, C. and Toral, A.},
  TITLE    = {ECP-2007-LANG-617001 FLaReNet: Progress Report No. 1},
  YEAR     = {2009},
  KEYWORDS = {Language Resources},
  URL      = {https://iris.cnr.it/handle/20.500.14243/183230},
}
@TECHREPORT{CALZOLARI_2009_TECHREPORT_CMSBGQT_183229,
  AUTHOR   = {Calzolari, N. and Monachini, M. and Soria, C. and Baroni, P. and Goggi, S. and Quochi, V. and Toral, A.},
  TITLE    = {ECP-2007-LANG-617001 FLaReNet: Progress Report No. 2},
  YEAR     = {2009},
  KEYWORDS = {Language Resources},
  URL      = {https://iris.cnr.it/handle/20.500.14243/183229},
}
@TECHREPORT{CALZOLARI_2009_TECHREPORT_CSBCGMQTBBCMOP_183224,
  AUTHOR   = {Calzolari, N. and Soria, C. and Baroni, P. and Caselli, T. and Goggi, S. and Monachini, M. and Quochi, V. and Toral, A. and Bel, N. and Budin, G. and Choukri, K. and Mariani, J. and Odijk, J. and Piperidis, S.},
  TITLE    = {ECP-2007-LANG-617001 FLaReNet: Action Plan},
  YEAR     = {2009},
  KEYWORDS = {Language Resources},
  URL      = {https://iris.cnr.it/handle/20.500.14243/183224},
}
@TECHREPORT{CALZOLARI_2009_TECHREPORT_CSBGMQT_183228,
  AUTHOR   = {Calzolari, N. and Soria, C. and Baroni, P. and Goggi, S. and Monachini, M. and Quochi, V. and Toral, A.},
  TITLE    = {ECP-2007-LANG-617001 FLaReNet: Evaluation Plan for the functioning of the Network},
  YEAR     = {2009},
  KEYWORDS = {Language Resources},
  URL      = {https://iris.cnr.it/handle/20.500.14243/183228},
}
@TECHREPORT{CALZOLARI_2009_TECHREPORT_CSBMQ_183225,
  AUTHOR   = {Calzolari, N. and Soria, C. and Baroni, P. and Monachini, M. and Quochi, V.},
  TITLE    = {ECP-2007-LANG-617001 FLaReNet: Annual Report No. 1},
  YEAR     = {2009},
  KEYWORDS = {Language Resources},
  URL      = {https://iris.cnr.it/handle/20.500.14243/183225},
}
@TECHREPORT{CALZOLARI_2009_TECHREPORT_CSBMQT_183231,
  AUTHOR   = {Calzolari, N. and Soria, C. and Baroni, P. and Monachini, M. and Quochi, V. and Toral, A.},
  TITLE    = {ECP-2007-LANG-617001 FLaReNet: Project Presentation},
  YEAR     = {2009},
  KEYWORDS = {Language Resources},
  URL      = {https://iris.cnr.it/handle/20.500.14243/183231},
}
@TECHREPORT{CALZOLARI_2009_TECHREPORT_CSBBCCMMOPQT_183226,
  AUTHOR   = {Calzolari, N. and Soria, C. and Bel, N. and Budin, G. and Caselli, T. and Choukri, K. and Mariani, J. and Monachini, M. and Odijk, J. and Piperidis, S. and Quochi, V. and Toral, A.},
  TITLE    = {ECP-2007-LANG-617001 FLaReNet: Blueprint of actions and infrastructures No. 1},
  YEAR     = {2009},
  KEYWORDS = {Language Resources, Infrastructures, Recommendations},
  URL      = {https://iris.cnr.it/handle/20.500.14243/183226},
}
@TECHREPORT{ENEA_2009_TECHREPORT_ES_183220,
  AUTHOR   = {Enea, A. and Sandri, L.},
  TITLE    = {L'Archivio dell'Ospedale degli Innocenti di Firenze e il suo inventario on line},
  YEAR     = {2009},
  ABSTRACT = {Sono descritti i passaggi intervenuti per la realizzazione di un sito internet dedicato alla consultazione dell'inventario dell'Archivio dell'antico Ospedale degli Innocenti di Firenze},
  KEYWORDS = {Archivistica, Beni Culturali},
  URL      = {https://iris.cnr.it/handle/20.500.14243/183220},
}
@TECHREPORT{HEROLD_2009_TECHREPORT_HHSVRALMTS_183234,
  AUTHOR   = {Herold, A. and Hicks, A. and Segers, R. and Vossen, P. and Rigau, G. and Agirre, E. and Laparra, E. and Monachini, M. and Toral, A. and Soria, C.},
  TITLE    = {WordNets mapped to Central Ontology},
  YEAR     = {2009},
  KEYWORDS = {Ontology},
  URL      = {https://iris.cnr.it/handle/20.500.14243/183234},
}
@TECHREPORT{PICCHI_2009_TECHREPORT_PSCE_183235,
  AUTHOR   = {Picchi, E. and Sassolini, E. and Cucurullo, S. and Ensini, M.},
  TITLE    = {WP3.1 Tecniche di analisi semantica per l'estrazione di ontologie bio-medicali},
  YEAR     = {2009},
  KEYWORDS = {Ontologie, Semantica computazionale, Terminologia medica},
  URL      = {https://iris.cnr.it/handle/20.500.14243/183235},
}
@TECHREPORT{PIRRELLI_2009_TECHREPORT_PM_159853,
  AUTHOR   = {Pirrelli, V. and Marzi, C.},
  TITLE    = {Words In Action: Interdisciplinary Approaches to Understanding Word Processing and Storage},
  YEAR     = {2009},
  ABSTRACT = {Almost all levels of language knowledge and processing (from phonology, to syntax and semantics) are known to be affected by knowledge of word structure at varying degrees. A better understanding of the human strategies involved in learning and processing word structure thus lies at the heart of our comprehension of the basic mechanisms serving both language and cognition and is key to addressing some fundamental challenges for the study of the physiology of grammar. On the 12th and 13th of October 2009, in the Research Area of the Italian National Research Council (CNR) in Pisa, 26 scholars from Europe, Canada and the United States were convened to take part in the European Science Foundation Exploratory Workshop "Words in Action: Interdisciplinary Approaches To Understanding Word Processing And Storage". The workshop brought together experts of various scientific domains and different theoretical inclinations to advance the current awareness of theoretical, historical, psycholinguistic, computational and neurophysiological issues in morphological processing and learning, with a view to assessing levels of research convergence and exploring the potential for synergy and strategic co-operation},
  KEYWORDS = {Morphology, Word Processing, Word Learning, Mental Lexicon},
  URL      = {https://iris.cnr.it/handle/20.500.14243/159853},
}
@TECHREPORT{SASSI_2009_TECHREPORT_SC_183218,
  AUTHOR   = {Sassi, M. and Cinini, A.},
  TITLE    = {Dieci anni di informazione sanitaria. Analisi di tre quotidiani a tiratura nazionale},
  YEAR     = {2009},
  ABSTRACT = {L'Istituto di Linguistica Computazionale (ILC-CNR) ha realizzato In collaborazione con L'Osservatorio della Comunicazione Sanitaria (OCS) una Banca Dati Testuale composta dagli articoli che trattano Informazione Sanitaria, pubblicati a partire dall'anno 1999 su tre quotidiani a diffusione nazionale: Corriere della Sera (C), Repubblica (R) e Stampa (S)},
  KEYWORDS = {Analisi Informazione sanitaria, Banca dati Testuale},
  PAGES    = {1-31},
  URL      = {https://iris.cnr.it/handle/20.500.14243/183218},
}
@TECHREPORT{SASSOLINI_2009_TECHREPORT_SH_333479,
  AUTHOR   = {Sassolini, E. and Haines, M.},
  TITLE    = {Gli Anni della Cupola: NewDBT},
  YEAR     = {2009},
  ABSTRACT = {programma NewDBT per l'Opera di Santa Maria del Fiore di Firenze. Sviluppo di una nuova versione di DBT strutturato per OPA in grado di indicizzare, gestire e interrogare il complesso archivio digitale riguardante la costruzione della cupola di Brunelleschi},
  URL      = {https://iris.cnr.it/handle/20.500.14243/333479},
}
@MISC{BARBERA_2009_MISC_BDD_406249,
  AUTHOR   = {Barbera, M. and Di Donato, F. and D'Alfonso, M.},
  TITLE    = {A Quick Start Guide to create Open Scholarly Communities on the Web},
  YEAR     = {2009},
  ABSTRACT = {Final results of a study conducted within the A32 COST Action "Open Scholarly Communities on the Web"},
  URL      = {https://iris.cnr.it/handle/20.500.14243/406249},
}
@MISC{BOZZI_2009_MISC_B_106751,
  AUTHOR          = {Bozzi, A.},
  TITLE           = {Edizione critica elettronica di fonti manoscritte antiche digitali},
  YEAR            = {2009},
  KEYWORDS        = {Computational Philology},
  URL             = {https://iris.cnr.it/handle/20.500.14243/106751},
  CONFERENCE_NAME = {Archivi e Biblioteche: dalla memoria del passato al web},
}
@MISC{CALZOLARI_2009_MISC_CBBBCGMMOPQST_183233,
  AUTHOR   = {Calzolari, N. and Baroni, P. and Bel, N. and Budin, G. and Choukri, K. and Goggi, S. and Mariani, J. and Monachini, M. and Odijk, J. and Piperidis, S. and Quochi, V. and Soria, C. and Toral, A.},
  TITLE    = {The European Language Resources and Technologies Forum: Shaping the Future of the Multilingual Digital Europe},
  YEAR     = {2009},
  KEYWORDS = {Language Resources, Language Technologies},
  URL      = {https://iris.cnr.it/handle/20.500.14243/183233},
}
@MISC{CALZOLARI_2009_MISC_CBBCMOPBGMQST_183222,
  AUTHOR   = {Calzolari, N. and Bel, N. and Budin, G. and Choukri, K. and Mariani, J. and Odijk, J. and Piperidis, S. and Baroni, P. and Goggi, S. and Monachini, M. and Quochi, V. and Soria, C. and Toral, A.},
  TITLE    = {Short Report of The European Language Resources and Technologies Forum: Shaping the Future of the Multilingual Digital Europe},
  YEAR     = {2009},
  KEYWORDS = {Language Resources, Language Technologies},
  URL      = {https://iris.cnr.it/handle/20.500.14243/183222},
}
@MISC{CALZOLARI_2009_MISC_CBBCMOPBGMQST_183219,
  AUTHOR   = {Calzolari, N. and Bel, N. and Budin, G. and Choukri, K. and Mariani, J. and Odijk, J. and Piperidis, S. and Baroni, P. and Goggi, S. and Monachini, M. and Quochi, V. and Soria, C. and Toral, A.},
  TITLE    = {Extended Report of: The European Language Resources and Technologies Forum: Shaping the Future of the Multilingual Digital Europe},
  YEAR     = {2009},
  KEYWORDS = {Language Resources, Language Technologies},
  URL      = {https://iris.cnr.it/handle/20.500.14243/183219},
}
@MISC{CASELLAS_2009_MISC_CFHM_183223,
  AUTHOR   = {Casellas, N. and Francesconi, E. and Hoekstra, R. and Montemagni, S.},
  TITLE    = {3rd Workshop on Legal Ontologies and Artificial Intelligence Techniques joint with 2nd Workshop on Semantic Processing of Legal text},
  YEAR     = {2009},
  KEYWORDS = {Legal Ontologies, Computational Semantics},
  URL      = {https://iris.cnr.it/handle/20.500.14243/183223},
}
@MISC{DIDONATO_2009_MISC_D_406246,
  AUTHOR   = {Di Donato, F.},
  TITLE    = {Introduzione all'Open Access: storia, filosofia, strumenti},
  YEAR     = {2009},
  ABSTRACT = {Un'introduzione all'Open Access: la storia del movimento, le definizioni, l'evoluzione del concetto e delle politiche},
  URL      = {https://iris.cnr.it/handle/20.500.14243/406246},
}
@misc{DIDONATO_2009_MISC_D_406255,
  author   = {Di Donato, F.},
  title    = {Open Access in Italia},
  year     = {2009},
  abstract = {Una ricognizione sullo stato del movimento OA in Italia},
  url      = {https://iris.cnr.it/handle/20.500.14243/406255},
}
@misc{DIDONATO_2009_MISC_D_406248,
  author   = {Di Donato, F.},
  title    = {Una questione di qualità? Credibilità, prestigio e potere nel sistema di valutazione della scienza},
  year     = {2009},
  abstract = {Una riflessione sul sistema di valutazione della scienza},
  url      = {https://iris.cnr.it/handle/20.500.14243/406248},
}
@misc{DIDONATO_2009_MISC_D_406254,
  author   = {Di Donato, F.},
  title    = {Philosophie politique, publications en ligne et droits d'auteur},
  year     = {2009},
  abstract = {Un'introduzione alle tematiche dell'accesso aperto e alle questioni collegate},
  url      = {https://iris.cnr.it/handle/20.500.14243/406254},
}
@misc{DIDONATO_2009_MISC_D_406259,
  author   = {Di Donato, F.},
  title    = {Open Access. La valutazione della ricerca oltre le divisioni tra le scienze},
  year     = {2009},
  abstract = {Incontro organizzato a partire dalla pubblicazione del volume di J. C. Guédon, Open Access. Contro gli oligopoli del sapere, a cura di F. Di Donato, ETS, 2009. Presiede B. Henry, ne discutono: M. C. Carrozza, G. Comandè, Eloisa Cristiani, A. Loretoni, P. Perata, F. Strazzari, P. Tonutti, Scuola Superiore Sant'Anna di Pisa, 20 gennaio 2010},
  url      = {https://iris.cnr.it/handle/20.500.14243/406259},
}
@misc{DIDONATO_2009_MISC_D_406257,
  author   = {Di Donato, F.},
  title    = {Introduzione al Keynotespeech Jean-Claude Guédon},
  year     = {2009},
  abstract = {Introduzione al Keynotespeech Jean-Claude Guédon e moderatrice del dibattito},
  url      = {https://iris.cnr.it/handle/20.500.14243/406257},
}
@misc{ENEA_2009_MISC_E_106750,
  author          = {Enea, A.},
  title           = {Comunicazione orale},
  year            = {2009},
  conference_name = {Un archivio on line. Presentazione dell'inventario della sezione storica dell'Archivio dell'Istituto degli Innocenti di Firenze (1218-1996)},
  keywords        = {Archivistica, Beni Culturali},
  url             = {https://iris.cnr.it/handle/20.500.14243/106750},
}
@misc{ENEA_2009_MISC_E_450683,
  author   = {Enea, A.},
  title    = {Gli ARCHIVI CARTOLINE degli Istituti per la storia della Resistenza e della società contemporanea in Italia},
  year     = {2009},
  abstract = {Gli ARCHIVI CARTOLINE degli Istituti per la storia della Resistenza e della società contemporanea in Italia consentono una consultazione delle descrizioni delle cartoline del fondo Giulio Fiocchi conservato presso l'Istituto Nazionale "F. Parri" di Milano. Il fondo è organizzato in serie e sottoserie e la descrizione è a livello del singolo documento. Le immagini di tutti i documenti sono riprodotte e consultabili},
  keywords = {archivistica, beni culturali},
  url      = {http://www.reteparri.it/risorse-on-line/servizi-archivistici},
}
@misc{ENEA_2009_MISC_E_123701,
  author   = {Enea, A.},
  title    = {Il METAOPAC ARCHIVISTICO degli Istituti per la storia della Resistenza e della società contemporanea in Italia},
  year     = {2009},
  abstract = {Il METAOPAC ARCHIVISTICO degli Istituti per la storia della Resistenza e della società contemporanea in Italia consente una ricerca simultanea alle banche dati Guida, Foto e Carto},
  keywords = {archivistica, beni culturali},
  url      = {http://www.reteparri.it/risorse-on-line/servizi-archivistici},
}
@misc{ENEA_2009_MISC_ES_126290,
  author   = {Enea, A. and Sandri, L.},
  title    = {L'Inventario della sezione storica dell'Archivio dell'Ospedale degli Innocenti di Firenze},
  year     = {2009},
  keywords = {Archivistica, Beni Culturali},
  url      = {http://www.istitutodeglinnocenti.it/?q=content/inventario},
}
@misc{GIOVANNETTI_2009_MISC_G_244995,
  author   = {Giovannetti, E.},
  title    = {Semantic relation labelling in ontology learning from texts},
  year     = {2009},
  abstract = {Semantic relation extraction is a crucial task for Ontology Learning from Texts. In literature, statistical unsupervised systems are used for semantic relation extraction: these systems typically detect pairs of semantically related terms (on the basis of their distribution in texts) without specifying the semantic relation holding between them. In this work I propose a fully unsupervised approach for semantic relation validation and extraction from texts. A statistical component (CLASS, CLustering through Analogy-based Semantic Similarity) is used to obtain a set of pairs of "distributionally similar" terms occurring in similar contexts, and possibly involved in "paradigmatic" relations (as, for instance, the words "car" and "motorcycle" in the sentences "I drive my car" and "Bob drives his motorcycle"). To validate and label the anonymous relations obtained through the statistical module, occurrences of the candidate pairs of terms are looked for in the Web in the context of "reliable" lexico-syntactic patterns, where they are involved in a "syntagmatic relation" (such as, for example, the words "steer" and "car" in the sentence "steer is part of the car"). This work focuses on the definition and application of the lexico-syntactic patterns and on the measures used to assess the reliability of the specific semantic relation the system suggests. The chosen semantic relations are hyponymy, meronymy, co-hyponymy and co-meronymy, for the relevance they have in ontology construction. Different lexico-syntactic patterns are used for different kinds of relations. In particular, patterns including both terms are used for hyponymy and meronymy discovery, (e.g. "cyclosporine is a medicine"): the number of occurrences of the pattern on the Web will indicate the confidence of the candidate semantic relation. Concerning co-hyponymy and co-meronymy, explorative "open" patterns, including just one term, are used.
For example, given the term pair "electron-nucleus", we can see if a co-meronymy relation holds between them by applying the following two patterns: "electron is part of" and "nucleus is part of" and then by looking for common holonyms (e.g. "atom"). Concerning evaluation, two different measures have been defined, one for hypernymy and meronymy relations and the other for co-hyponymy and co-meronymy. The measures are basically built upon the number of occurrences of the patterns on the Web and, concerning co-hyponymy and co-meronymy, on the number of common hypernyms (or holonyms) shared between the terms},
  url      = {https://iris.cnr.it/handle/20.500.14243/244995},
}
@misc{MARCHI_2009_MISC_MM_458600,
  author   = {Marchi, S. and Montemagni, S.},
  title    = {BOOTSTREP: the information extractor},
  year     = {2009},
  abstract = {Software per l'estrazione di informazione linguistica (sottocategorizzazione sintattica e quadri argomentali) da corpora di dominio biomedico in lingua inglese},
  url      = {https://iris.cnr.it/handle/20.500.14243/458600},
}
@misc{MONACHINI_2009_MISC_M_106749,
  author          = {Monachini, M.},
  title           = {A 15-year journey in Standards for Lexical Resources},
  year            = {2009},
  conference_name = {New horizons for Linguistic Resources in a Global Context},
  keywords        = {Standards, Lexicon},
  url             = {https://iris.cnr.it/handle/20.500.14243/106749},
}
@misc{MONACHINI_2009_MISC_M_435680,
  author          = {Monachini, M.},
  title           = {The WordNet-LMF Representation Format},
  year            = {2009},
  conference_name = {The First KYOTO Workshop Environmental Knowledge Transition and Exchange},
  keywords        = {Standards, Lexicon},
  url             = {https://iris.cnr.it/handle/20.500.14243/435680},
}
@misc{PIRRELLI_2009_MISC_PV_228601,
  author          = {Pirrelli, V.},
  title           = {Comprendere un documento con il computer},
  year            = {2009},
  abstract        = {In this talk, I shall deal with the complex process of computer reading and understanding of text documents as the result of the interleaving of a number of levels of processing, both linguistic and extra-linguistic, such as parsing, classifying, learning and knowing. In real tasks, there exists no parsing without classifying, no classifying without learning, no learning without knowing and eventually no knowing without "doing things with words". Only through robust integration and co-operation of less than optimal components and inter-disciplinary cross-fertilization we can hope to develop general and comprehensive solutions which are more than the sums of their parts},
  keywords        = {Gestione documentale, annotazione linguistica, indicizzazione},
  conference_name = {Documentazione, terminologia e Scienze delle Informazione},
  url             = {https://iris.cnr.it/handle/20.500.14243/228601},
}
@misc{QUOCHI_2009_MISC_Q_227948,
  author = {Quochi, V.},
  title  = {Usage scenarios and basic workflows},
  year   = {2009},
  volume = {6},
  pages  = {5},
  url    = {http://www.clarin.eu/sites/default/files/CLARIN_Newsletter_no_6.pdf},
}
@misc{RUIMY_2009_MISC_RBP_106752,
  author          = {Ruimy, N. and Bozzi, A. and Pardelli, G.},
  title           = {Modèle lexical pour un thésaurus-lexique électronique de la terminologie saussurienne},
  year            = {2009},
  abstract        = {Le modèle lexical SIMPLE que nous nous proposons d'adopter pour la création d'un thésaurus-lexique de la terminologie linguistique saussurienne a été créé dans le cadre du projet européen éponyme et a permis le développement de lexiques sémantiques monolingues harmonisés pour douze langues de l'Union Européenne. Dès sa création, il s'est imposé comme standard de facto et a ainsi inspiré de manière déterminante le standard international ISO pour les lexiques du Traitement Automatique des Langues. Dans le panorama de la Lexicographie Computationnelle, ce modèle lexical se distingue par certains aspects particulièrement novateurs. L'approche théorique adoptée pour la représentation de l'information sémantique est basée sur les principes fondamentaux de la théorie du Lexique Génératif (J. Pustejovsky, 1995; 2001). L'architecture flexible du modèle ainsi que la méthodologie de construction du lexique permettent d'encoder dans les entrées lexicales une ample gamme d'informations hautement structurées couvrant tous les aspects de la sémantique lexicale des mots; ceci de manière cohérente, et au degré de granularité souhaité. La structuration conceptuelle du lexique est confiée à une ontologie linguistique mettant en relief le caractère multidimensionnel du sens lexical. L'ontologie SIMPLE est formée de types sémantiques indépendants des langues et a été conçue en prévision d'expansions ou de spécialisations visant à satisfaire aux exigences de domaines d'intérêt particuliers. Outre la classification ontologique et un certain nombre de traits sémantiques, les unités lexicales sont caractérisées par un réseau de relations sémantiques qui sont en majeure partie le fruit d'une relecture de la structure des qualia que Pustejovsky emprunte à Moravcsik, 1975. Ces relations permettent de modéliser l'information concernant les différentes composantes sémantiques qui concourent à définir la structure interne d'une unité lexicale.
Elles explicitent ses liens hyperonymiques et méronymiques mais aussi, sur l'axe syntagmatique, les liens aux différents prédicats qui contribuent à éclairer son sens, et en particulier l'origine et la fonction de l'entité dénotée. D'autres relations, telles que la synonymie, la polysémie logique et la dérivation morphologique sont également définies. Les lexèmes prédicatifs, et en particulier les verbes, sont de surcroît caractérisés par le scénario sémantique dans lequel ils sont impliqués. Celui-ci est décrit en termes de classe aspectuelle et de structure argumentale du prédicat, avec indication du rôle sémantique et des restrictions de sélection de chacun des arguments},
  keywords        = {Computational Lexicon, Thesaurus},
  pages           = {1--17},
  conference_name = {Séminaire international "Publier les manuscrits de Ferdinand de Saussure"},
  url             = {https://iris.cnr.it/handle/20.500.14243/106752},
}
@misc{SPINOSA_2009_MISC_SGCMVM_90828,
  author          = {Spinosa, P. and Giardiello, G. and Cherubini, M. and Marchi, S. and Venturi, G. and Montemagni, S.},
  title           = {NLP based Metadata Extraction for Legal Text Consolidation},
  year            = {2009},
  conference_name = {Twelfth International Conference on Artificial Intelligence and Law (ICAIL 2009)},
  keywords        = {Natural Language Processing, textual amendments, XML representation, metadata extraction, consolidation of legal text},
  url             = {https://iris.cnr.it/handle/20.500.14243/90828},
}
@misc{VENTURI_2009_MISC_VMMSTMA_106756,
  author          = {Venturi, G. and Montemagni, S. and Marchi, S. and Sasaki, Y. and Thompson, P. and McNaught, J. and Ananiadou, S.},
  title           = {Bootstrapping a Verb Lexicon for Biomedical Information Extraction},
  year            = {2009},
  abstract        = {The extraction of information from texts requires resources that contain both syntactic and semantic properties of lexical units. As the use of language in specialized domains, such as biology, can be very different to the general domain, there is a need for domain-specific resources to ensure that the information extracted is as accurate as possible. We are building a large-scale lexical resource for the biology domain, providing information about predicate-argument structure that has been bootstrapped from a biomedical corpus on the subject of E. Coli. The lexicon is currently focussed on verbs, and includes both automatically-extracted syntactic subcategorization frames, as well as semantic event frames that are based on annotation by domain experts. In addition, the lexicon contains manually-added explicit links between semantic and syntactic slots in corresponding frames. To our knowledge, this lexicon currently represents a unique resource within the biomedical domain},
  keywords        = {domain-specific lexical resources, lexical acquisition, syntax-semantics linking, Information Extraction, Biological Language Processing},
  editor          = {Gelbukh, A.},
  conference_name = {International Conference on Intelligent Text Processing and Computational Linguistics (CICLing 2009)},
  volume          = {5449},
  pages           = {137--148},
  isbn            = {978-3-642-00381-3},
  url             = {https://iris.cnr.it/handle/20.500.14243/106756},
}
@article{BAGLIONI_2008_ARTICLE_BGMRS_63020,
  author   = {Baglioni, M. and Giovannetti, E. and Masserotti, M. V. and Renso, C. and Spinsanti, L.},
  title    = {Ontology-supported Querying of Geographical Databases},
  journal  = {TRANSACTIONS IN GIS (ONLINE)},
  year     = {2008},
  volume   = {12},
  number   = {SUPPL. 1},
  pages    = {31--44},
  abstract = {Querying geographical information systems has been recognized as a difficult task for non-expert users. Furthermore, user queries are often characterized by semantic aspects not directly managed by traditional spatial databases or GIS. Examples of such semantic geospatial queries are the use of implicit spatial relations between objects, or the reference of domain concepts not explicitly represented in data. To handle such queries, we envisage a system that translates natural language queries into spatial SQL statements on a database, thus improving standard GIS with new semantic capabilities. Within this general objective, the contribution of this article is to introduce a methodology to handle semantic geospatial queries issued over a spatial database. This approach captures semantics from an ontology built upon the spatial database and enriched by domain concepts and properties specifically defined to represent the localization of objects. Some examples of the use of the methodology in the urban domain are presented},
  keywords = {H.2.8 Database Applications, Ontology extraction, Spatial databases},
  issn     = {1467-9671},
  url      = {https://iris.cnr.it/handle/20.500.14243/63020},
}
@article{CALZOLARI_2008_ARTICLE_C_50341,
  author   = {Calzolari, N.},
  title    = {Initiatives, Tendencies and Driving Forces for a 'Lexical Web' as Part of a 'Language Infrastructure'},
  year     = {2008},
  abstract = {While highlighting the infrastructural role of Language Resources (LR) I sketch my perception of the current situation in the LR field. I underline some of the priority areas of concern today with respect to implementing an open Language Infrastructure, and specifically what we could call a "Lexical Web". My objective is to show that it is imperative that there is an underlying global strategy behind the set of initiatives which are/can be launched in Europe and world-wide, and that a global vision and cooperation among different communities is necessary to achieve more coherent and useful results. I end up mentioning two new European initiatives that go on this direction and promise to be influential in shaping the future of the LR area},
  doi      = {10.1007/978-3-540-78159-2_10},
  url      = {https://iris.cnr.it/handle/20.500.14243/50341},
}
@article{CALZOLARI_2008_ARTICLE_CC_230711,
  author   = {Calzolari, N. and Choukri, K.},
  title    = {LREC2008-The Language Resources and Evaluation Conference},
  journal  = {ERCIM NEWS},
  year     = {2008},
  abstract = {LREC, launched in 1998 in Granada as a visionary idea of Antonio Zampolli and other colleagues, celebrated its tenth birthday in the wonderful city of Marrakech. The conference had the honour of receiving the Royal Patronage of His Majesty Mohammed VI, King of Morocco, highlighting the importance assigned to multilingual and multicultural issues},
  issn     = {0926-4981},
  url      = {https://iris.cnr.it/handle/20.500.14243/230711},
}
@article{CIGNONI_2008_ARTICLE_C_37712,
  author   = {Cignoni, L.},
  title    = {'Yummy Yummy! Per giocare con l'inglese', Inglese Educazione alimentare},
  journal  = {SCUOLA DELL'INFANZIA},
  year     = {2008},
  number   = {4},
  pages    = {1--32},
  abstract = {No abstract available},
  keywords = {Insegnamento lingua inglese, bambini, educazione alimentare, scuola dell'infanzia},
  issn     = {1590-3206},
  url      = {https://iris.cnr.it/handle/20.500.14243/37712},
}
@article{CLAUDET_2008_ARTICLE_COBDGPBBBBCDFGMSSSVVP_14600,
  author   = {Claudet, J. and Osenberg, C. W. and Benedetti Cecchi, L. and Domenici, P. and Garcia Charton, J. A. and Perez Ruzafa, A. and Badalamenti, F. and Bayle Sempere, J. and Brito, A. and Bulleri, F. and Culioli, J. M. and Dimech, M. and Falcon, J. M. and Guala, I. and Milazzo, M. and Sanchez Meca, J. and Somerfield, P. J. and Stobart, B. and Vandeperre, F. and Valle, C. and Planes, S.},
  title    = {Marine reserves: size and age do matter},
  journal  = {ECOLOGY LETTERS},
  year     = {2008},
  volume   = {11},
  pages    = {481--489},
  abstract = {Marine reserves are widely used throughout the world to prevent overfishing and conserve biodiversity, but uncertainties remain about their optimal design. The effects of marine reserves are heterogeneous. Despite theoretical findings, empirical studies have previously found no effect of size on the effectiveness of marine reserves in protecting commercial fish stocks. Using 58 datasets from 19 European marine reserves, we show that reserve size and age do matter: Increasing the size of the no-take zone increases the density of commercial fishes within the reserve compared with outside; whereas the size of the buffer zone has the opposite effect. Moreover, positive effects of marine reserve on commercial fish species and species richness are linked to the time elapsed since the establishment of the protection scheme. The reserve size-dependency of the response to protection has strong implications for the spatial management of coastal areas because marine reserves are used for spatial zoning},
  keywords = {Asymmetrical analysis of variance, coastal marine ecosystems, commercial species, fish assemblages, heterogeneity, marine protected area, marine reserve age, marine reserve design, marine reserve network, marine reserve size, weighted meta-analysis},
  doi      = {10.1111/j.1461-0248.2008.01166.x},
  issn     = {1461-023X},
  url      = {https://iris.cnr.it/handle/20.500.14243/14600},
}
@article{DELLORLETTA_2008_ARTICLE_DLMMPV_37713,
  author   = {Dell'Orletta, F. and Lenci, A. and Marchi, S. and Montemagni, S. and Pirrelli, V. and Venturi, G.},
  title    = {Dal testo alla conoscenza e ritorno: estrazione terminologica e annotazione semantica di basi documentali di dominio},
  journal  = {AIDA INFORMAZIONI (ONLINE)},
  year     = {2008},
  volume   = {26},
  number   = {1--2},
  pages    = {197--218},
  abstract = {The paper focuses on the automatic extraction of domain knowledge from Italian legal texts and presents a fully-implemented ontology learning system (T2K, Text-2-Knowledge) that includes a battery of tools for Natural Language Processing, statistical text analysis and machine learning. Evaluated results show the considerable potential of systems like T2K, exploiting an incremental interleaving of NLP and machine learning techniques for accurate large-scale semi-automatic extraction and structuring of domain-specific knowledge},
  keywords = {Natural Language Processing, Machine Learning, Knowledge extraction from texts, Ontology learning, Legal ontologies},
  issn     = {1594-2201},
  url      = {https://iris.cnr.it/handle/20.500.14243/37713},
}
@article{DIDONATO_2008_ARTICLE_D_384178,
  author   = {Di Donato, F.},
  title    = {Università, scienza e politica nel Conflitto delle facoltà di Kant},
  journal  = {BOLLETTINO TELEMATICO DI FILOSOFIA POLITICA},
  year     = {2008},
  abstract = {Una riflessione sul rapporto tra scienza e politica nel Conflitto delle facoltà di Kant},
  issn     = {1591-4305},
  url      = {https://iris.cnr.it/handle/20.500.14243/384178},
}
@article{GUADAGNINI_2008_ARTICLE_G_75455,
  author   = {Guadagnini, E.},
  title    = {Scelta di voci del Tesoro della Lingua Italiana delle Origini (dodicesima serie)},
  journal  = {BOLLETTINO-OPERA DEL VOCABOLARIO ITALIANO},
  year     = {2008},
  volume   = {13},
  pages    = {15--349},
  abstract = {Voci calda s. f., caldetto agg., caldità s. f., caldo agg. /s. m., calefattorio s. m., calere v., calidamente avv., calidezza s. f., calidità s. f., càlido agg. /s. m., calore s. m., calura s. f., calurare v., coperta s. f., coperto agg. /s. m. /avv., copertura s. f., coprimento s. m., coprire v., copritura s. f. del Tesoro della Lingua Italiana delle Origini (pp. 84-118, 124-159)},
  keywords = {Lessicografia italiana, Italiano antico},
  issn     = {1591-8254},
  url      = {https://iris.cnr.it/handle/20.500.14243/75455},
}
@article{MONTEMAGNI_2008_ARTICLE_M_433729,
  author   = {Montemagni, S.},
  title    = {The space of Tuscan dialectal variation. A correlation study},
  journal  = {INTERNATIONAL JOURNAL OF HUMANITIES AND ARTS COMPUTING},
  year     = {2008},
  volume   = {2},
  number   = {1--2},
  pages    = {135--152},
  abstract = {The paper illustrates the results of a correlation study focusing on linguistic variation in an Italian region, Tuscany. By exploiting a multi-level representation scheme of dialectal data, the study analyses attested patterns of phonetic and morpho-lexical variation with the aim of testing the degree of correlation between a) phonetic and morpho-lexical variation, and b) linguistic variation and geographic distance. The correlation analysis was performed by combining two complementary approaches proposed in dialectometric literature, namely by computing both global and place-specific correlation measures and by inspecting their spatial distribution. Achieved results demonstrate that phonetic and morpho-lexical variations in Tuscany seem to follow a different pattern than encountered in previous studies},
  keywords = {Computational dialectology, Dialectometry},
  doi      = {10.3366/E1753854809000354},
  issn     = {1753-8548},
  url      = {http://www.euppublishing.com/doi/abs/10.3366/E1753854809000354},
}
@article{PIOGGIA_2008_ARTICLE_PISFMAD_1032,
  author   = {Pioggia, G. and Igliozzi, R. and Sica, M. and Ferro, M. and Muratori, F. and Ahluwalia, A. and De Rossi, D.},
  title    = {Exploring emotional and imitational android-based interactions in autistic spectrum disorders},
  journal  = {JOURNAL OF CYBERTHERAPY AND REHABILITATION},
  year     = {2008},
  volume   = {1},
  number   = {1},
  pages    = {49--62},
  abstract = {Individuals with Autistic Spectrum Disorders (ASDs) have impairments in processing of social and emotional information. To widen emotive responsiveness, the employment of robotic systems to engage proactive interactive responses in children with ASDs has been recently suggested. Understanding and teaching the processing of socio-emotional abilities is the inspiring principle of this novel approach and could be of tremendous clinical significance. Encouraging studies with robotic dolls, mobile robots and humanoids acting as social mediators have provided important insights and demonstrate the necessity of long term studies. In this study we report on a series of experiments on four subjects affected by ASDs as they interact with a biomimetic android. We assessed both their spontaneous behavior and reactions to therapist presses in correlation with the time course of the physiological and behavioral data, as well as the focusing of attention towards the android's eye movements and the spontaneous ability to imitate gesture and facial expressions. Overall, subjects demonstrated a decrease in dysfunction in the areas of social communication, implying a marked improvement in these areas after interacting with the android},
  issn     = {1784-9934},
  url      = {https://iris.cnr.it/handle/20.500.14243/1032},
}
@article{PROIETTI_2008_ARTICLE_PC_403989,
  author   = {Proietti, C.},
  title    = {Natural Numbers and Infinitesimals: A Discussion between Benno Kerry and Georg Cantor},
  journal  = {HISTORY AND PHILOSOPHY OF LOGIC},
  year     = {2008},
  volume   = {29},
  number   = {4},
  pages    = {343--359},
  abstract = {During the first months of 1887, while completing the drafts of his Mitteilungen zur Lehre vom Transfiniten, Georg Cantor maintained a continuous correspondence with Benno Kerry. Their exchange essentially concerned two main topics in the philosophy of mathematics, namely, (a) the concept of natural number and (b) the infinitesimals. Cantor's and Kerry's positions turned out to be irreconcilable, mostly because of Kerry's irremediably psychologistic outlook, according to Cantor at least. In this study, I will examine and reconstruct the main points in the discussion around (a) and (b) and stress some interesting aspects of the philosophical and mathematical thought of Benno Kerry},
  keywords = {history of mathematics, history of logic, Frege, infinitesimals, natural numbers, Benno Kerry},
  doi      = {10.1080/01445340802025768},
  issn     = {0144-5340},
  url      = {https://iris.cnr.it/handle/20.500.14243/403989},
}
@incollection{BACCIU_2008_INCOLLECTION_BBFGR_248696,
  author = {Bacciu, D. and Bellandi, A. and Furletti, B. and Grossi, V. and Romei, A.},
  title  = {Discovering Strategic Behaviors in Multi-Agent Scenarios by Ontology-Driven Mining},
  year   = {2008},
  isbn   = {978-953-7619-16-9},
  url    = {https://iris.cnr.it/handle/20.500.14243/248696},
}
@incollection{MARINELLI_2008_INCOLLECTION_M_165205,
  author           = {Marinelli, R.},
  title            = {Analisi di metafore e espressioni idiomatiche per mezzo di risorse computazionali e corpora elettronici},
  booktitle        = {Critica del testo. L'Europa dei proverbi},
  editor           = {Punzi, A. and Tomassetti, I.},
  publisher        = {Viella (Roma, ITA)},
  year             = {2008},
  pages            = {469--488},
  abstract         = {Sulla base del modello di database semantico lessicale EWN e IWN è stato creato un database terminologico che contiene circa 3000 termini appartenenti al lessico specializzato del dominio marittimo},
  keywords         = {Metafore, corpora, database semantici, ontologia},
  conference_place = {Roma},
  isbn             = {978-88-8334-431-2},
  url              = {https://iris.cnr.it/handle/20.500.14243/165205},
}
@incollection{MARINELLI_2008_INCOLLECTION_M_134812,
  author           = {Marinelli, R.},
  title            = {Idiomatic Expressions and Metaphors from the Maritime Domain},
  booktitle        = {Lenguaje figurado y motivacion. Una perspectiva desde la fraseologia},
  editor           = {De La Granja, M. A.},
  publisher        = {Peter Lang Internationaler Verlag der Wissenschaften (Francoforte, DEU)},
  year             = {2008},
  pages            = {209--220},
  abstract         = {According to EuroWordNet/ItalWordNet model, a terminological database has been created which contains terms belonging to the specialized lexicon of the technical-nautical and maritime transport domain. We want to give prominence to the frequency of idiomatic expressions and metaphors coming from this cultural environment used in everyday language. Our lexicographic research aims at: i) analyzing the relationship between the maritime domain as "source domain" and the concepts described in the "target domain"; ii) structuring the semantic code of idiomatic expressions in the terminological database as well as the link with the equivalent or closest expressions in English; iii) checking the use and the frequency of this type of idiomatic expressions and metaphors in a large corpus of Italian contemporary language},
  keywords         = {Terminology, Idiomatic Expressions, Metaphors, Lexical databases},
  conference_place = {Francoforte},
  isbn             = {978-3-631-57419-5},
  url              = {https://iris.cnr.it/handle/20.500.14243/134812},
}
@incollection{MAZZOCCHI_2008_INCOLLECTION_MMT_134813,
  author   = {Mazzocchi, F. and Marinelli, R. and Tiberi, M.},
  title    = {Refining the Thesaural Associative Relationship by Applying the EuroWordNet Semantic Model},
  year     = {2008},
  keywords = {Thesaurus},
  url      = {https://iris.cnr.it/handle/20.500.14243/134813},
}
@incollection{MONTEMAGNI_2008_INCOLLECTION_M_134811,
  author           = {Montemagni, S.},
  title            = {Analisi linguistico-computazionali del corpus dialettale dell'Atlante Lessicale Toscano. Primi risultati sul rapporto toscano-italiano},
  publisher        = {Pacini (Pisa, ITA)},
  year             = {2008},
  keywords         = {Corpus dialettale},
  conference_place = {Pisa},
  url              = {https://iris.cnr.it/handle/20.500.14243/134811},
}
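@comment{Export-tool diagnostics, not bibliographic data (presumably emitted while generating the next, author-less entry; confirm against the exporter):
Warning: Undefined array key 0 in /mnt/resources/apps/pipol_v5/lib_pipol.php on line 7034
Deprecated: strtoupper(): Passing null to parameter #1 ($string) of type string is deprecated in /mnt/resources/apps/pipol_v5/lib_pipol.php on line 7034}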
@editorial{_2008_EDITORIAL__181029,
  title = {Language Resources and Evaluation},
  year  = {2008},
  url   = {https://iris.cnr.it/handle/20.500.14243/181029},
}
@editorial{BELTRAMI_2008_EDITORIAL_BLSABGGIMRV_146302,
  author   = {Beltrami, P. D. and Larson, P. C. and Squillacioti, P. C. and Artale, E. and Boccellari, A. and Giuliani, M. and Guadagnini, E. and Ioriofili, D. and Mosti, R. and Ravani, S. and Vaccaro, G.},
  title    = {TESORO DELLA LINGUA ITALIANA DELLE ORIGINI-Edizione online: www.vocabolario.org-Versione 2008 di 19000 voci},
  year     = {2008},
  keywords = {Lingua italiana, Lessico, Lessicografia},
  issn     = {2240-5216},
  url      = {http://tlio.ovi.cnr.it/TLIO},
}
@inproceedings{AIELLO_2008_INPROCEEDINGS_ACMP_68638,
  author          = {Aiello, M. and Chiarella, D. and Merlo, A. and Papaleo, G.},
  title           = {Improvements in physical intrusion detection on LAN. PRISE 2008},
  year            = {2008},
  conference_name = {Prise 2008},
  url             = {https://iris.cnr.it/handle/20.500.14243/68638},
}
@inproceedings{ANANIADOU_2008_INPROCEEDINGS_AMNS_65088,
  author          = {Ananiadou, S. and Monachini, M. and Nenadic, G. and Su, J.},
  title           = {Foreword},
  year            = {2008},
  conference_name = {LREC 2008, Sixth International Conference on Language Resources and Evaluation-Workshop},
  abstract        = {Key resources of interest in biomedical text mining are lexical and knowledge repositories (controlled vocabularies, terminologies, thesauri, ontologies) and annotated corpora, including both task-specific resources and repositories reengineered from biomedical or general language resources. Of particular interest is the process of building annotated resources, including designing guidelines and annotation schemas (aiming at both syntactic and semantic interoperability) and relying on language engineering standards. Challenging aspects are updates and evolution management of resources, as well as their documentation, dissemination and evaluation},
  keywords        = {Biomedical text mining, Corpora annotated},
  isbn            = {2-9517408-4-0},
  url             = {https://iris.cnr.it/handle/20.500.14243/65088},
}
@inproceedings{BAGLIONI_2008_INPROCEEDINGS_BBFST_265115,
  author   = {Baglioni, M. and Bellandi, A. and Furletti, B. and Spinsanti, L. and Turini, F.},
  title    = {Ontology-Based Business Plan Classification},
  year     = {2008},
  abstract = {The problem of providing Small and Medium Enterprises (SMEs) with good self-assessment tools is becoming more and more urgent every day, not only because of increasing market competition, but also because of new rules for credit granting, as for example the ones referred to as Basel II. One of the critical issues in designing supporting tools is the quality of the knowledge embedded in them. We maintain that a better quality of decisions can be obtained by exploiting not only quantitative information but also qualitative information and expert knowledge. Here we present a system able to classify the quality of innovation plans of SMEs by exploiting both quantitative and qualitative knowledge embedded in ontology. The ontological approach allows representing qualitative knowledge in a very natural way and, as a consequence, we are able to elicit it by means that are natural for SME officers, as for example questionnaires},
  url      = {https://iris.cnr.it/handle/20.500.14243/265115},
}
@INPROCEEDINGS{BELLANDI_2008_INPROCEEDINGS_BFGR_265114,
AUTHOR = {Bellandi, A. and Furletti, B. and Grossi, V. and Romei, A.},
TITLE = {Ontological Support For Association Rule Mining},
YEAR = {2008},
ABSTRACT = {This paper describes some improvements of our previous work that realizes an integrated framework for extracting constraint based multilevel association rules with an ontology support. The ontology is not the repository of the data, but it models the application domain describing the metadata. Furthermore, it permits to focus the analysis only on a subset of data and to express multi level constraints on them. In this context, we report some theoretical notion already introduced and a detailed description of the recent improvements: the introduction of the object properties in the framework, and the implementation of a user interface},
KEYWORDS = {Association Rules, Ontology, Data mining},
PAGES = {110-115},
URL = {http://dl.acm.org/citation.cfm?id=1712781},
PUBLISHER = {Acta Press (Anaheim, USA)},
ISBN = {978-0-88986-710-9},
CONFERENCE_NAME = {26th IASTED International Conference on Artificial Intelligence and Applications, 2008},
CONFERENCE_PLACE = {Anaheim},
}
@INPROCEEDINGS{BROEDER_2008_INPROCEEDINGS_BDHPRCW_65090,
AUTHOR = {Broeder, D. and Declerck, T. and Hinrichs, E. and Piperidis, S. and Romary, L. and Calzolari, N. and Wittenburg, P.},
TITLE = {Foundation of a Component-based Flexible Registry for Language Resources and Technology},
YEAR = {2008},
URL = {https://iris.cnr.it/handle/20.500.14243/65090},
}
@INPROCEEDINGS{CASELLI_2008_INPROCEEDINGS_CIB_65075,
AUTHOR = {Caselli, T. and Ide, N. and Bartolini, R.},
TITLE = {A Bilingual Corpus of Inter-linked Events},
YEAR = {2008},
ABSTRACT = {This paper describes the creation of a bilingual corpus of inter-linked events for Italian and English. Linkage is accomplished through the Inter-Lingual Index (ILI) that links ItalWordNet with WordNet. The availability of this resource, on the one hand, enables contrastive analysis of the linguistic phenomena surrounding events in both languages, and on the other hand, can be used to perform multilingual temporal analysis of texts. In addition to describing the methodology for construction of the inter-linked corpus and the analysis of the data collected, we demonstrate that the ILI could potentially be used to bootstrap the creation of comparable corpora by exporting layers of annotation for words that have the same sense},
KEYWORDS = {Corpus (creation, annotation, etc.), Semantics, Validation of LRs},
PAGES = {2424-2429},
URL = {http://www.lrec-conf.org/proceedings/lrec2008/pdf/610_paper.pdf},
PUBLISHER = {European Language Resources Association (ELRA)-Evaluations and Language resources Distribution Agency (ELDA) (Paris, FRA)},
ISBN = {2-9517408-4-0},
CONFERENCE_NAME = {LREC 2008, Sixth International Conference on Language Resources and Evaluation},
CONFERENCE_PLACE = {Paris},
BOOKTITLE = {LREC 2008, Sixth International Conference on Language Resources and Evaluation},
EDITOR = {Calzolari, N. and Choukri, K. and Maegaard, B. and Mariani, J. and Odijk, J. and Piperidis, S. and Tapias, D.},
}
@INPROCEEDINGS{CIGNONI_2008_INPROCEEDINGS_C_65087,
AUTHOR = {Cignoni, L.},
TITLE = {Filling the gap: a three-language philological dictionary based on contexts from authoritative sources},
YEAR = {2008},
ABSTRACT = {This paper describes the methodology adopted for the creation of a multilingual—English-Italian-French—philological dictionary, designed to meet as far as possible the requirements of users in the field of philology, who need to use specific terms in a language other than their own. The project is addressed to graduate and post-graduate students, tutors and scholars, translators and interpreters for whom a glossary of specialised terms relative to a given universe of discourse is essential. The dictionary defines a variety of terms associated with philology and extends to other closely connected disciplines such as textual criticism, codicology, palaeography, epigraphy, papyrology, genetic criticism, etc. The three-language glossary is arranged in conventional form—each lexical entry listed alphabetically—and the English terms are followed by their equivalents in Italian and French. The Greek or Latin words from which many philological words have derived and frequently used to refer to a particular concept or phenomenon are also included. The project involves recording not just the term but also a brief contextualized definition in each language, accurately quoting the source, certified and scientifically reliable, from which the information was drawn. Alongside these definitions, a number of other contextualizations appear, also derived from authoritative sources, and different types of illustrations—e.g. manuscripts, stems, images of people and places—relative to the terminology are provided. The textual data and images will be included into an application (Alpha version) of the PINAKES project, released in March 2007, which is able to deal with different types of information—text, scientific objects, tables or graphics. This ongoing dictionary project, at present covering a total of around 1000 words, is constantly enriched with new entries, definitions and contextualizations in the different languages},
KEYWORDS = {Computational Philology, Terminology, Di},
PAGES = {947-955},
URL = {https://iris.cnr.it/handle/20.500.14243/65087},
PUBLISHER = {IULA-Institut Universitari de Lingüística Aplicada (Barcelona, ESP)},
ISBN = {978-84-96742-67-3},
CONFERENCE_NAME = {XIII Euralex International Congress},
CONFERENCE_PLACE = {Barcelona},
BOOKTITLE = {XIII Euralex International Congress},
EDITOR = {Bernal, E. and Decesaris, J.},
}
@INPROCEEDINGS{DELGRATTA_2008_INPROCEEDINGS_DBCMSC_65103,
AUTHOR = {Del Gratta, R. and Bartolini, R. and Caselli, T. and Monachini, M. and Soria, C. and Calzolari, N.},
TITLE = {UFRA: a UIMA-based Approach to Federated Language Resource Architecture},
YEAR = {2008},
ABSTRACT = {In this paper we address the issue of developing an interoperable infrastructure for language resources and technologies. In our approach, called UFRA, we extend the Federate Database Architecture System adding typical functionalities coming from UIMA. In this way, we capitalize the advantages of a federated architecture, such as autonomy, heterogeneity and distribution of components, monitored by a central authority responsible for checking both the integration of components and user rights on performing different tasks. We use the UIMA approach to manage and define one common front-end, enabling users and clients to query, retrieve and use language resources and technologies. The purpose of this paper is to show how UIMA leads from a Federated Database Architecture to a Federated Resource Architecture, adding to a registry of available components both static resources such as lexicons and corpora and dynamic ones such as tools and general purpose language technologies. At the end of the paper, we present a case-study that adopts this framework to integrate the SIMPLE lexicon and TIMEML annotation guidelines to tag natural language texts},
KEYWORDS = {LR Infrastructures and Architectures, LR web services, Lexicon, Lexical database},
PAGES = {2634-2639},
URL = {http://www.lrec-conf.org/proceedings/lrec2008/pdf/656_paper.pdf},
PUBLISHER = {European Language Resources Association ELRA (Paris, FRA)},
ISBN = {2-9517408-4-0},
CONFERENCE_NAME = {LREC 2008, Sixth International Conference on Language Resources and Evaluation},
CONFERENCE_PLACE = {Paris},
BOOKTITLE = {LREC 2008, Sixth International Conference on Language Resources and Evaluation},
}
@INPROCEEDINGS{DELGRATTA_2008_INPROCEEDINGS_DCCR_65098,
AUTHOR = {Del Gratta, R. and Caselli, T. and Calzolari, N. and Ruimy, N.},
TITLE = {TimeML: An ontological mapping onto UIMA Type Systems},
YEAR = {2008},
ABSTRACT = {TimeML is a markup language for events},
KEYWORDS = {Infrastructure, UIMA, Event detection},
URL = {https://iris.cnr.it/handle/20.500.14243/65098},
CONFERENCE_NAME = {ICGL 2008, The First International Conference on Global Interoperability for Language Resources},
BOOKTITLE = {ICGL 2008, The First International Conference on Global Interoperability for Language Resources},
}
@INPROCEEDINGS{DELGRATTA_2008_INPROCEEDINGS_DRT_65102,
AUTHOR = {Del Gratta, R. and Ruimy, N. and Toral, A.},
TITLE = {Simple-Clips ongoing research: more information with less data by implementing inheritance},
YEAR = {2008},
ABSTRACT = {This paper presents the application of inheritance to the formal taxonomy (is-a) of a semantically rich Lexical Resource (LR) based on the Generative Lexicon theory, SIMPLE-CLIPS. The aim is to lighten the representation of its semantic layer by reducing the number of encoded relations. A prediction calculation on the impact of introducing inheritance as regards space occupancy is carried out, which yields a significant space reduction of 22%. This is corroborated by its actual application that reduces the number of explicitly encoded relations in this lexicon by 18.4%. Later on, we study the issues that inheritance poses to the Lexical Resources and discuss sensitive solutions, illustrated by examples, to tackle each of them. Finally, we present a discussion on the application of inheritance, from which two advantages arise: consistency enhancement and inference capabilities},
KEYWORDS = {Lexicon, Knowle, Lexical database},
PAGES = {2380-2385},
URL = {https://iris.cnr.it/handle/20.500.14243/65102},
ISBN = {2-9517408-4-0},
CONFERENCE_NAME = {LREC 2008, Sixth International Conference on Language Resources and Evaluation},
BOOKTITLE = {LREC 2008, Sixth International Conference on Language Resources and Evaluation},
}
@INPROCEEDINGS{DELLORLETTA_2008_INPROCEEDINGS_DLMMPV_65083,
AUTHOR = {Dell'Orletta, F. and Lenci, A. and Marchi, S. and Montemagni, S. and Pirrelli, V. and Venturi, G.},
TITLE = {Dal testo alla conoscenza e ritorno: estrazione terminologica e annotazione semantica di basi documentali di dominio},
YEAR = {2008},
ABSTRACT = {The paper focuses on the automatic extraction of domain knowledge from Italian legal texts and presents a fully-implemented ontology learning system (T2K, Text-2-Knowledge) that includes a battery of tools for Natural Language Processing, statistical text analysis and machine learning. Evaluated results show the considerable potential of systems like T2K, exploiting an incremental interleaving of NLP and machine learning techniques for accurate large-scale semi-automatic extraction and structuring of domain-specific knowledge},
KEYWORDS = {Natural Language Processing, Machine Learning, Knowledge extraction from texts, Ontology learning, Legal ontologies},
PAGES = {197-218},
URL = {http://www.assiterm91.it/wp-content/uploads/2010/11/Convegno-2008.pdf},
VOLUME = {ANNO 26, NUMERO 1-2},
ISSN = {1121-0095},
CONFERENCE_NAME = {Atti del Convegno Nazionale Ass.I.Term},
BOOKTITLE = {AIDA INFORMAZIONI},
}
@INPROCEEDINGS{DELLORLETTA_2008_INPROCEEDINGS_DLMMPV_65074,
AUTHOR = {Dell'Orletta, F. and Lenci, A. and Montemagni, S. and Marchi, S. and Pirrelli, V. and Venturi, G.},
TITLE = {Acquiring Legal Ontologies from Domain-specific Texts},
YEAR = {2008},
ABSTRACT = {The paper reports on methodology and preliminary results of a case study in automatically extracting ontological knowledge from Italian legislative texts in the environmental domain. We use a fully-implemented ontology learning system (T2K) that includes a battery of tools for Natural Language Processing (NLP), statistical text analysis and machine language learning. Tools are dynamically integrated to provide an incremental representation of the content of vast repositories of unstructured documents. Evaluated results, however preliminary, are very encouraging, showing the great potential of NLP-powered incremental systems like T2K for accurate large-scale semi-automatic extraction of legal ontologies},
KEYWORDS = {Ontology learning, Document management, knowledge extraction from texts, Natural Language Processing},
PAGES = {98-101},
URL = {https://iris.cnr.it/handle/20.500.14243/65074},
CONFERENCE_NAME = {LangTech 2008},
}
@INPROCEEDINGS{FRANCOPOULO_2008_INPROCEEDINGS_FDSDM_65084,
AUTHOR = {Francopoulo, G. and Declerck, T. and Sornlertlamvanich, V. and De La Clergerie, E. and Monachini, M.},
TITLE = {Data Category Registry: Morpho-syntactic and Syntactic Profiles},
YEAR = {2008},
ABSTRACT = {After a brief presentation of the data model, we describe a work in progress to define an initial set of morpho-syntactic and syntactic data categories dedicated to NLP applications. The aim is to improve interoperability among language resources and to optimize the process leading to their integration in applications. The main point is to be sure that when a language resource makes use of a value, the other language resources and programs have the same interpretation for this given value. From a practical point of view, these values are collected from existing lists, discussed, extended, and then recorded within a freely accessible data base: the ISO Data Category Registry},
KEYWORDS = {Data Category, Language resources, ISO},
PAGES = {31-39},
URL = {https://iris.cnr.it/handle/20.500.14243/65084},
ISBN = {2-9517408-4-0},
CONFERENCE_NAME = {LREC 2008, Sixth International Conference on Language Resources and Evaluation-Workshop: Use and usage of language resource-related standards},
}
@INPROCEEDINGS{GIOVANNETTI_2008_INPROCEEDINGS_GMM_65082,
AUTHOR = {Giovannetti, E. and Marchi, S. and Montemagni, S.},
TITLE = {Combining statistical techniques and lexico-syntactic patterns for semantic relations extraction from text},
YEAR = {2008},
ABSTRACT = {We describe here a methodology to combine two different techniques for Semantic Relation Extraction from texts. On the one hand, generic lexicosyntactic patterns are applied to the linguistically analyzed corpus to detect a first set of pairs of co-occurring words, possibly involved in "syntagmatic" relations. On the other hand, a statistical unsupervised association system is used to obtain a second set of pairs of "distributionally similar" terms, that appear to occur in similar contexts, thus possibly involved in "paradigmatic" relations. The approach aims at learning ontological information by filtering the candidate relations obtained through generic lexico-syntactic patterns and by labelling the anonymous relations obtained through the statistical system. The resulting set of relations can be used to enrich existing ontologies and for semantic annotation of documents or web pages},
KEYWORDS = {Ontology Learning from Text, Semantic Relation Extraction, Lexico-syntactic Patterns, Distributional Similarity},
URL = {http://sunsite.informatik.rwth-aachen.de/Publications/CEUR-WS/Vol-426/swap2008_submission_54.pdf},
CONFERENCE_NAME = {SWAP 2008-Semantic Web Applications and Perspectives},
EDITOR = {Gangemi, A. and Keizer, J. and Presutti, V. and Stoermer, H.},
}
@INPROCEEDINGS{GIOVANNETTI_2008_INPROCEEDINGS_GMMB_65100,
AUTHOR = {Giovannetti, E. and Marchi, S. and Montemagni, S. and Bartolini, R.},
TITLE = {Ontology Learning and Semantic Annotation: a Necessary Symbiosis},
YEAR = {2008},
ABSTRACT = {Semantic annotation of text requires the dynamic merging of linguistically structured information and a "world model", usually represented as a domain-specific ontology. On the other hand, the process of engineering a domain-ontology through semi-automatic ontology learning system requires the availability of a considerable amount of semantically annotated documents. Facing this bootstrapping paradox requires an incremental process of annotation-acquisition-annotation, whereby domain-specific knowledge is acquired from linguistically-annotated texts and then projected back onto texts for extra linguistic information to be annotated and further knowledge layers to be extracted. The presented methodology is a first step in the direction of a full "virtuous" circle where the semantic annotation platform and the evolving ontology interact in symbiosis. As a case study we have chosen the semantic annotation of product catalogues. We propose a hybrid approach, combining pattern matching techniques to exploit the regular structure of product descriptions in catalogues, and Natural Language Processing techniques which are resorted to analyze natural language descriptions. The semantic annotation involves the access to the ontology, semi-automatically bootstrapped with an ontology learning tool from annotated collections of catalogues},
KEYWORDS = {Information Extraction, Information Retrieval, Ontologies, Tools, Systems},
PAGES = {2079-2085},
URL = {http://www.lrec-conf.org/proceedings/lrec2008/},
PUBLISHER = {European Language Resources Association (ELRA)-Evaluations and Language resources Distribution Agency (ELDA) (Paris, FRA)},
ISBN = {2-9517408-4-0},
CONFERENCE_NAME = {LREC 2008, Sixth International Conference on Language Resources and Evaluation},
CONFERENCE_PLACE = {Paris},
BOOKTITLE = {LREC 2008, Sixth International Conference on Language Resources and Evaluation},
EDITOR = {Calzolari, N. and Choukri, K. and Maegaard, B. and Mariani, J. and Odijk, J. and Piperidis, S. and Tapias, D.},
}
@INPROCEEDINGS{HAYASHI_2008_INPROCEEDINGS_HDBM_65097,
AUTHOR = {Hayashi, Y. and Declerck, T. and Buitelaar, P. and Monachini, M.},
TITLE = {Ontologies for a Global Language Infrastructure},
YEAR = {2008},
ABSTRACT = {Given a situation where human language technologies have been maturing considerably and a rapidly growing range of language data resources being now available, together with natural language processing (NLP) tools/systems, a strong need for a global language infrastructure (GLI) is becoming more and more evident, if one wants to ensure re-usability of the resources. A GLI is essentially an open and web-based software platform on which tailored language services can be efficiently composed, disseminated and consumed. An infrastructure of this sort is also expected to facilitate further development of language data resources and NLP functionalities. The aims of this paper are twofold: (1) to discuss necessity of ontologies for a GLI, and (2) to draw a high-level configuration of the ontologies, which are integrated into a comprehensive language service ontology. To these ends, this paper first explores dimensions of GLI, and then draws a triangular view of a language service, from which necessary ontologies are derived. This paper also examines relevant ongoing international standardization efforts such as LAF, MAF, SynAF, DCR and LMF, and discusses how these frameworks are incorporated into our comprehensive language service ontology. The paper concludes in stressing the need for an international collaboration on the development of a standardized language service ontology},
KEYWORDS = {Ontology, Global language infrastructure (GLI)},
PAGES = {105-112},
URL = {https://iris.cnr.it/handle/20.500.14243/65097},
CONFERENCE_NAME = {ICGL 2008-The First International Conference on Global Interoperability for Language Resources},
EDITOR = {Webster, J. and Ide, N. and Fang, A.},
}
@INPROCEEDINGS{HAYASHI_2008_INPROCEEDINGS_HNMSC_65099,
AUTHOR = {Hayashi, Y. and Narawa, C. and Monachini, M. and Soria, C. and Calzolari, N.},
TITLE = {Ontologizing Lexicon Access Functions based on an LMF-based Lexicon Taxonomy},
YEAR = {2008},
ABSTRACT = {This paper discusses ontologization of lexicon access functions in the context of a service-oriented language infrastructure, such as the Language Grid. In such a language infrastructure, an access function to a lexical resource, embodied as an atomic Web service, plays a crucially important role in composing a composite Web service tailored to a user's specific requirement. To facilitate the composition process involving service discovery, planning and invocation, the language infrastructure should be ontology-based; hence the ontologization of a range of lexicon functions is highly required. In a service-oriented environment, lexical resources however can be classified from a service-oriented perspective rather than from a lexicographically motivated standard. Hence to address the issue of interoperability, the taxonomy for lexical resources should be ground to principled and shared lexicon ontology. To do this, we have ontologized the standardized lexicon modeling framework LMF, and utilized it as a foundation to stipulate the service-oriented lexicon taxonomy and the corresponding ontology for lexicon access functions. This paper also examines a possible solution to fill the gap between the ontological descriptions and the actual Web service API by adopting a W3C recommendation SAWSDL, with which Web service descriptions can be linked with the domain ontology},
KEYWORDS = {Lexicon, LR web services, Standards for LRs, Lexical database},
PAGES = {916-922},
URL = {https://iris.cnr.it/handle/20.500.14243/65099},
ISBN = {2-9517408-4-0},
CONFERENCE_NAME = {LREC 2008, Sixth International Conference on Language Resources and Evaluation},
}
@INPROCEEDINGS{LENCI_2008_INPROCEEDINGS_LMPM_65104,
AUTHOR = {Lenci, A. and McGillivray, B. and Pirrelli, V. and Montemagni, S.},
TITLE = {Unsupervised Acquisition of Verb Subcategorization Frames from Shallow-Parsed Corpora},
YEAR = {2008},
KEYWORDS = {Acquisition, Machine Learning, Corpus (creation, annotation, etc.), Lexicon, Lexical database},
URL = {https://iris.cnr.it/handle/20.500.14243/65104},
CONFERENCE_NAME = {LREC 2008, Sixth International Conference on Language Resources and Evaluation},
}
@INPROCEEDINGS{MAGNINI_2008_INPROCEEDINGS_MCTBMLBCTBSS_63164,
AUTHOR = {Magnini, B. and Cappelli, A. and Tamburini, F. and Bosco, C. and Mazzei, A. and Lombardo, V. and Bertagna, F. and Calzolari, N. and Toral, A. and Bartalesi Lenzi, V. and Sprugnoli, R. and Speranza, M.},
TITLE = {Evaluation of natural language tools for Italian: EVALITA 2007},
YEAR = {2008},
ABSTRACT = {EVALITA 2007, the first edition of the initiative devoted to the evaluation of Natural Language Processing tools for Italian, provided a shared framework where participants' systems had the possibility to be evaluated on five different tasks, namely Part of Speech Tagging (organised by the University of Bologna), Parsing (organised by the University of Torino), Word Sense Disambiguation (organised by CNR-ILC, Pisa), Temporal Expression Recognition and Normalization (organised by CELCT, Trento), and Named Entity Recognition (organised by FBK, Trento). We believe that the diffusion of shared tasks and shared evaluation practices is a crucial step towards the development of resources and tools for Natural Language Processing. Experiences of this kind, in fact, are a valuable contribution to the validation of existing models and data, allowing for consistent comparisons among approaches and among representation schemes. The good response obtained by EVALITA, both in the number of participants and in the quality of results, showed that pursuing such goals is feasible not only for English, but also for other languages},
KEYWORDS = {Natural language evaluation, Standards for LRs, Evaluation methodologies},
PAGES = {2536-2543},
URL = {http://www.lrec-conf.org/proceedings/lrec2008/},
PUBLISHER = {European Language Resources Association ELRA (Paris, FRA)},
ISBN = {2-9517408-4-0},
CONFERENCE_NAME = {Proceedings of LREC 2008},
CONFERENCE_PLACE = {Paris},
BOOKTITLE = {Proceedings of LREC 2008},
EDITOR = {Calzolari, N. and Choukri, K. and Maegaard, B.},
}
@INPROCEEDINGS{MAGNINI_2008_INPROCEEDINGS_MCTBMLBCTBSS_148288,
AUTHOR = {Magnini, B. and Cappelli, A. and Tamburini, F. and Bosco, C. and Mazzei, A. and Lombardo, V. and Bertagna, F. and Calzolari, N. and Toral, R. A. and Bartalesi, L. V. and Sprugnoli, R. and Speranza, M.},
TITLE = {Evaluation of natural language tools for Italian: EVALITA 2007},
YEAR = {2008},
ABSTRACT = {EVALITA 2007, the first edition of the initiative devoted to the evaluation of Natural Language Processing tools for Italian, provided a shared framework where participants' systems had the possibility to be evaluated on five different tasks, namely Part of Speech Tagging (organised by the University of Bologna), Parsing (organised by the University of Torino), Word Sense Disambiguation (organised by CNR-ILC, Pisa), Temporal Expression Recognition and Normalization (organised by CELCT, Trento), and Named Entity Recognition (organised by FBK, Trento). We believe that the diffusion of shared tasks and shared evaluation practices is a crucial step towards the development of resources and tools for Natural Language Processing. Experiences of this kind, in fact, are a valuable contribution to the validation of existing models and data, allowing for consistent comparisons among approaches and among representation schemes. The good response obtained by EVALITA, both in the number of participants and in the quality of results, showed that pursuing such goals is feasible not only for English, but also for other languages},
KEYWORDS = {Natural language evaluation, Standards for LRs, Evaluation methodologies, H.3 INFORMATION STORAGE AND RETRIEVAL. Linguistic processing},
PAGES = {2536-2543},
URL = {https://iris.cnr.it/handle/20.500.14243/148288},
CONFERENCE_NAME = {LREC 2008, Sixth International Conference on Language Resources and Evaluation},
}
@INPROCEEDINGS{MARCHETTI_2008_INPROCEEDINGS_MTVARCMFHIKNRV_158927,
AUTHOR = {Marchetti, A. and Tesconi, M. and Vossen, P. and Agirre, E. and Rigau, G. and Calzolari, N. and Monachini, M. and Fellbaum, C. and Hsieh, S. and Isahara, H. and Kanzaki, K. and Neri, F. and Raffaelli, R. and Vangent, J.},
TITLE = {KYOTO: A System for Mining, Structuring, and Distributing Knowledge Across Languages and Cultures},
YEAR = {2008},
ABSTRACT = {We outline work to be carried out within the framework of an impending EC project. The goal is to construct a language-independent information system for a specific domain (environment/ecology) anchored in a language-independent ontology that is linked to WordNets in several languages. For each language, information extraction and identification of lexicalized concepts with ontological entries will be done by text miners ("Kybots"). The mapping of language-specific lexemes to the ontology allows for crosslinguistic identification and translation of equivalent terms. The infrastructure developed within this project will enable long-range knowledge sharing and transfer to many languages and cultures, addressing the need for global and uniform transition of knowledge beyond the domain of ecology and environment addressed here},
KEYWORDS = {Global WordNet Grid, Ontologies and WordNets, Multilinguality, Semantic indexing and search, Text mining},
PAGES = {474-484},
URL = {https://iris.cnr.it/handle/20.500.14243/158927},
ISBN = {978-963-482-854-9},
CONFERENCE_NAME = {GWC2008-The Fourth Global WordNet Conference},
EDITOR = {Tanács, A. and Csendes, D. and Vincze, V. and Fellbaum, C. and Vossen, P.},
}
@INPROCEEDINGS{MARINELLI_2008_INPROCEEDINGS_M_65086,
AUTHOR = {Marinelli, R.},
TITLE = {Enhancing a Terminological Database with Terms from a Scientific Domain},
YEAR = {2008},
ABSTRACT = {This paper reports on the enhancing of a maritime terminological database by means of a set of terms belonging to meteorology. The main phases of this research are described and the initial results outlined: the model of the terminological database, following EWN/IWN; the criteria used to build corpora of specialized texts to be employed as the source for term selection and extraction; the use of a semantic database (IWN) as source for exporting synsets to be coded in the terminological resource and as reference (WN 3.0) for comparing and evaluating synsets. The set of semantic relations useful for codifying new terms belonging to the discipline of meteorology is described; in addition to the semantic relations provided by the IWN model, new relations are introduced which are more suitably tailored to specific needs either scientific or pragmatic},
KEYWORDS = {Terminology, Corpus linguistics, Semantics, Lexical databases, Semantic relations},
PAGES = {165-172},
URL = {https://iris.cnr.it/handle/20.500.14243/65086},
PUBLISHER = {Vytautas Magnus University, Institute of the Lithuanian Language (Kaunas, LTU)},
ISBN = {978-9955-704-53-9},
CONFERENCE_NAME = {The Third Baltic Conference on Human Language Technologies},
CONFERENCE_PLACE = {Kaunas},
BOOKTITLE = {The Third Baltic Conference on Human Language Technologies},
EDITOR = {Cermak, F. and Marcinkevičienė, R. and Rimkutė, E. and Zabarskaitė, J.},
}
@INPROCEEDINGS{MARINELLI_2008_INPROCEEDINGS_MB_65106,
AUTHOR = {Marinelli, R. and Bindi, R.},
TITLE = {Uso metaforico e metonimico dei nomi propri: una verifica su un corpus di italiano contemporaneo},
YEAR = {2008},
KEYWORDS = {Italian Corpus, Proper Names},
URL = {https://iris.cnr.it/handle/20.500.14243/65106},
CONFERENCE_NAME = {Prospettive nello studio del lessico italiano: atti del IX Congresso SILFI, Firenze, 14-17 giugno 2006},
}
@INPROCEEDINGS{MARINELLI_2008_INPROCEEDINGS_MBMSCCC_106747,
AUTHOR = {Marinelli, R. and Bindi, R. and Marchi, S. and Santarcangelo, L. E. and Cavallaro, I. F. and Castellani, E. and Carli, G.},
TITLE = {Suscettibilità ipnotica e linguaggio},
YEAR = {2008},
KEYWORDS = {Psycholinguistics},
PAGES = {10},
URL = {https://iris.cnr.it/handle/20.500.14243/106747},
PUBLISHER = {Bulzoni (Roma, ITA)},
ISBN = {978-88-7870-652-1},
CONFERENCE_NAME = {XLII Congresso Internazionale di Studi della Società di Linguistica Italiana},
CONFERENCE_PLACE = {Roma},
}
@INPROCEEDINGS{MARINELLI_2008_INPROCEEDINGS_MTB_65085,
AUTHOR = {Marinelli, R. and Tiberi, M. and Bindi, R.},
TITLE = {Encoding Terms from a Scientific Domain in a Terminological Database: Methodology and Criteria},
YEAR = {2008},
KEYWORDS = {Knowledge representation, Lexicon, Corpus (creation, annotation, etc.), Lexical database},
URL = {https://iris.cnr.it/handle/20.500.14243/65085},
CONFERENCE_NAME = {LREC 2008, Sixth International Conference on Language Resources and Evaluation},
}
@INPROCEEDINGS{MAZZOCCHI_2008_INPROCEEDINGS_MMT_435019,
AUTHOR = {Mazzocchi, F. and Marinelli, R. and Tiberi, M.},
TITLE = {Refining the thesaural associative relationship by applying the EuroWordnet semantic model},
YEAR = {2008},
ABSTRACT = {Thesauri are tools which semantically organize a domain of knowledge for operational purposes. Their relational semantics is concerned with methods that connect terms with related meanings and are designed to support information retrieval, namely enhancing the information recall performance and contributing to improve precision, too. The network of relations of a thesaurus has a semantic function: by means of it, in fact, a representation of the meaning of each thesaurus term is provided, as well as of the conceptual structure of a subject area. The traditional thesaurus format—as described in international standards—includes three basic relationships, two of them at a conceptual level, hierarchical and associative relations, the other mostly at a lexical level, relation of equivalence. However, a rather widespread opinion is that this format should be refined in order to cope with the current needs of information organization. This refinement is necessary to enhance thesaurus suitability for uses in artificial intelligence (AI) and in the Semantic Web environments, as well as to increase possibilities for IR. This paper discusses the possibility of refining the associative relation into a number of sub-kinds by adopting the semantic model of EuroWordNet (EWN), as it was used, according to one of its national versions, ItalWordNet (IWN), to structure a terminological resource for a specific domain. A number of issues that such a work of refinement could imply, and in particular its domain dependence, are also discussed},
KEYWORDS = {thesaurus, lexical database, semantic relations},
PAGES = {61-77},
URL = {https://iris.cnr.it/handle/20.500.14243/435019},
ISBN = {978-3-89913-644-9},
CONFERENCE_NAME = {TKE2008, Managing Ontologies and Lexical Resources: 8th International Conference on Terminology and Knowledge Engineering},
BOOKTITLE = {Proceedings of the 8th International Conference on Terminology and Knowledge Engineering (TKE 2008), "Managing Ontologies and Lexical Resources"},
EDITOR = {Madsen, B. N. and Thomsen, H. E.},
}
@INPROCEEDINGS{MONACHINI_2008_INPROCEEDINGS_MQDC_65105,
AUTHOR = {Monachini, M. and Quochi, V. and Del Gratta, R. and Calzolari, N.},
TITLE = {Using LMF to Shape a Lexicon for the Biomedical Domain},
YEAR = {2008},
ABSTRACT = {This paper describes the design, implementation and population of the BioLexicon in the framework of BootStrep, an FP6 project. The BioLexicon (BL) is a lexical resource designed for text mining in the bio-domain. It has been conceived to meet both domain requirements and upcoming ISO standards for lexical representation. The data model and data categories are compliant to the ISO Lexical Markup Framework and the Data Category Registry. The BioLexicon integrates features of lexicons and terminologies: term entries (and variants) derived from existing resources are enriched with linguistic features, including sub-categorization and predicate-argument information, extracted from texts. Thus, it is an extendable resource. Furthermore, the lexical entries will be aligned to concepts in the BioOntology, the ontological resource of the project. The BL implementation is an extensible relational database with automatic population procedures. Population relies on a dedicated input data structure allowing to upload terms and their linguistic properties and "pull-and-push" them in the database. The BioLexicon teaches that the state-of-the-art is mature enough to aim at setting up a standard in this domain. Being conformant to lexical standards, the BioLexicon is interoperable and portable to other areas},
KEYWORDS = {Domain terminologies, Computational lexicons, Lexical standards, Lexical architectures},
PAGES = {153-157},
URL = {https://iris.cnr.it/handle/20.500.14243/65105},
CONFERENCE_NAME = {LangTech 2008-Tecnologia applicata alla linguistica},
BOOKTITLE = {LangTech 2008-Tecnologia applicata alla linguistica},
EDITOR = {Delogu, C. and Falcone, M.},
}
@INPROCEEDINGS{MORGAVI_2008_INPROCEEDINGS_MM_170503,
AUTHOR = {Morgavi, G. and Marconi, L.},
TITLE = {Growing Up of Autonomous Agents: an Emergent Phenomenon},
YEAR = {2008},
ABSTRACT = {A fundamental research challenge is the design of robust artifacts that are capable of operating under changing environments and noisy input, and yet exhibit the desired behavior and response time. These systems should be able to adapt and learn how to react to unforeseen scenarios as well as to display properties comparable to biological entities. The turn to nature has brought us many unforeseen great concepts. Biological systems are able to handle many of these challenges with an elegance and efficiency still far beyond current human artifacts. A living artifact grows up when its capabilities, abilities/knowledge, shift to a further level of complexity, i. e. the complexity rank of its internal capabilities performs a step forward. In the attempt to define an architecture for autonomous growing up agents [1]. We conducted an experiment on the abstraction process in children as natural parts of a cognitive system. We found that linguistic growing up involve a number of different trial processes. We identified a fixed number of distinct paths that were crossed by children. Once a given interpretation paths was discovered useless, they tried to follow another path, until the new meaning was emerging. This study generates suggestion about the evolutionary conditions conducive to the emergence of growing up in robots and provides guidelines for designing artificial evolutionary systems displaying spontaneous adaptation abilities. The importance of multi-sensor perception, motivation and emotional drives are underlined and, above all, the growing up insights shows similarities to emergent self-organized behaviors},
KEYWORDS = {growing up, emergence, adaptive systems, living artifacts, epigenetic robotics},
PAGES = {177-186},
URL = {https://iris.cnr.it/handle/20.500.14243/170503},
DOI = {10.1063/1.3020657},
ISBN = {978-0-7354-0579-0},
CONFERENCE_NAME = {CASYS2007 Eighth International Conference on Computing Anticipatory Systems},
BOOKTITLE = {Computing Anticipatory Systems},
EDITOR = {Dubois, D. M.},
}
@INPROCEEDINGS{MORGAVI_2008_INPROCEEDINGS_MMM_67788,
AUTHOR = {Morgavi, G. and Marconi, L. and Morando, M.},
TITLE = {A contribution to specification toward truly autonomous robots},
YEAR = {2008},
ABSTRACT = {A great deal of current research work in robotics and autonomous systems is still focused on getting an agent to learn to do some task such as recognizing an object or going to a specific place. The learning process may be supervised, unsupervised or a process of occasional reinforcement, but the whole aim in such work is to get the robot to achieve the task that was predefined by the researcher. The next logical step along the road towards truly autonomous robots that can dive in unpredictable environments is to investigate how one might design robots that are capable of `growing up' through experience. A living artifact grows up when its capabilities, abilities/knowledge, shift to a further level of complexity, i. e. the complexity rank of its internal capabilities performs a step forward. Robotics researchers increasingly agree that ideas from nature and self-organization can strongly benefit the design of autonomous robots. In this paper we studied the modalities through which pre-school children (from 4 to 5) tackle with a growing up process: the abstraction. Children of these ages are not supposed to be able to perform the abstraction process, but they have a sufficient knowledge of the natural language that allow the description of the processes they are using when they try to reach the meaning of an abstract sentence. This experiment resulted in some very interesting suggestions on what can be useful for the architecture of an adaptive and evolving robot. The importance of multi-sensor perception, motivation and emotional drives are underlined and, above all, the growing up insights shows similarities to emergent self-organized behaviors},
KEYWORDS = {growing up, emergence, adaptive systems, living artifacts, epigenetic robotics},
PAGES = {153-158},
URL = {http://www.eurasip.org/Proceedings/Ext/CIP2008/CIP08%20Authors.html},
CONFERENCE_NAME = {IAPR Workshop on Cognitive Information Processing},
}
@INPROCEEDINGS{PICCHI_2008_INPROCEEDINGS_PSCB_65093,
AUTHOR = {Picchi, E. and Sassolini, E. and Cucurullo, S. and Bertagna, F.},
TITLE = {Mining the News with Semantic Press},
YEAR = {2008},
KEYWORDS = {Text mining, Press review},
URL = {https://iris.cnr.it/handle/20.500.14243/65093},
CONFERENCE_NAME = {LangTech 2008},
}
@INPROCEEDINGS{PICCHI_2008_INPROCEEDINGS_PSCBB_65101,
AUTHOR = {Picchi, E. and Sassolini, E. and Cucurullo, S. and Bertagna, F. and Baroni, P.},
TITLE = {Semantic Press},
YEAR = {2008},
ABSTRACT = {In this paper Semantic Press, a tool for the automatic press review, is introduced. It is based on Text Mining technologies and is tailored to meet the needs of the eGovernment and eParticipation communities. First, a general description of the application demands emerging from the eParticipation and eGovernment sectors is offered. Then, an introduction to the framework of the automatic analysis and classification of newspaper content is provided, together with a description of the technologies underlying it},
KEYWORDS = {Text Mining, Tools, Systems, Applications},
PAGES = {2752-2756},
URL = {http://www.lrec-conf.org/proceedings/lrec2008/},
PUBLISHER = {European Language Resources Association (ELRA)-Evaluations and Language resources Distribution Agency (ELDA) (Paris, FRA)},
ISBN = {2-9517408-4-0},
CONFERENCE_NAME = {LREC 2008-Sixth International Conference on Language Resources and Evaluation},
CONFERENCE_PLACE = {Paris},
BOOKTITLE = {Proceedings of the Sixth International Conference on Language Resources and Evaluation},
EDITOR = {Calzolari, N. and Choukri, K. and Maegaard, B. and Mariani, J. and Odijk, J. and Piperidis, S. and Tapias, D.},
}
@INPROCEEDINGS{QUOCHI_2008_INPROCEEDINGS_QC_227370,
AUTHOR = {Quochi, V. and Calderone, B.},
TITLE = {Learning properties of Noun Phrases: from data to functions},
YEAR = {2008},
ABSTRACT = {The paper presents two experiments of unsupervised classification of Italian noun phrases. The goal of the experiments is to identify the most prominent contextual properties that allow for a functional classification of noun phrases. For this purpose, we used a Self Organizing Map trained with syntactically-annotated contexts containing noun phrases. The contexts are defined by means of a set of features representing morpho-syntactic properties of both nouns and their wider contexts. Two types of experiments have been run: one based on noun types and the other based on noun tokens. The results of the type simulation show that when frequency is the most prominent classification factor, the network isolates idiomatic or fixed phrases. The results of the token simulation experiment, instead, show that, of the 36 attributes represented in the original input matrix, only a few of them are prominent in the re-organization of the map. In particular, key features in the emergent macro-classification are the type of determiner and the grammatical number of the noun. An additional but not less interesting result is an organization into semantic/pragmatic micro-classes. In conclusions, our result confirm the relative prominence of determiner type and grammatical number in the task of noun (phrase) categorization},
KEYWORDS = {cognitive linguistics, noun phrase},
PAGES = {2596-2602},
URL = {http://www.lrec-conf.org/proceedings/lrec2008/summaries/644.html},
ISBN = {2-9517408-4-0},
CONFERENCE_NAME = {Sixth International Conference on Language Resources and Evaluation (LREC'08)},
}
@INPROCEEDINGS{QUOCHI_2008_INPROCEEDINGS_QMDC_65076,
AUTHOR = {Quochi, V. and Monachini, M. and Del Gratta, R. and Calzolari, N.},
TITLE = {A lexicon for biology and bioinformatics: the BOOTStrep experience},
YEAR = {2008},
ABSTRACT = {This paper describes the design, implementation and population of a lexical resource for biology and bioinformatics (the BioLexicon) developed within an ongoing European project. The aim of this project is text-based knowledge harvesting for support to information extraction and text mining in the biomedical domain. The BioLexicon is a large-scale lexical-terminological resource encoding different information types in one single integrated resource. In the design of the resource we follow the ISO/DIS 24613 "Lexical Mark-up Framework" standard, which ensures reusability of the information encoded and easy exchange of both data and architecture. The design of the resource also takes into account the needs of our text mining partners who automatically extract syntactic and semantic information from texts and feed it to the lexicon. The present contribution first describes in detail the model of the BioLexicon along its three main layers: morphology, syntax and semantics; then, it briefly describes the database implementation of the model and the population strategy followed within the project, together with an example. The BioLexicon database in fact comes equipped with automatic uploading procedures based on a common exchange XML format, which guarantees that the lexicon can be properly populated with data coming from different sources},
KEYWORDS = {Lexicon, Ontologies, Lexical database},
PAGES = {2285-2292},
URL = {http://www.lrec-conf.org/proceedings/lrec2008/pdf/576_paper.pdf},
PUBLISHER = {European Language Resources Association ELRA (Paris, FRA)},
ISBN = {2-9517408-4-0},
CONFERENCE_NAME = {LREC 2008, Sixth International Conference on Language Resources and Evaluation},
CONFERENCE_PLACE = {Paris},
BOOKTITLE = {LREC 2008, Sixth International Conference on Language Resources and Evaluation},
}
@INPROCEEDINGS{ROVENTINI_2008_INPROCEEDINGS_RR_65094,
AUTHOR = {Roventini, A. and Ruimy, N.},
TITLE = {Mapping Events and Abstract Entities from PAROLE-SIMPLE-CLIPS to ItalWordNet},
YEAR = {2008},
KEYWORDS = {Lexicon, Lexical database, Semantics, Ontologies},
URL = {https://iris.cnr.it/handle/20.500.14243/65094},
CONFERENCE_NAME = {LREC 2008, Sixth International Conference on Language Resources and Evaluation},
}
@INPROCEEDINGS{RUIMY_2008_INPROCEEDINGS_RRMU_65092,
AUTHOR = {Ruimy, N. and Roventini, A. and Marinelli, R. and Ulivieri, M.},
TITLE = {Linking and Integrating two Electronic Lexicons},
YEAR = {2008},
KEYWORDS = {Electronic Lexicons, Language Resources},
URL = {https://iris.cnr.it/handle/20.500.14243/65092},
CONFERENCE_NAME = {The First International Conference on Global Interoperability for Language Resources},
}
@INPROCEEDINGS{RUIMY_2008_INPROCEEDINGS_RT_65095,
AUTHOR = {Ruimy, N. and Toral Ruiz, A.},
TITLE = {More semantic links in the SIMPLE-CLIPS database},
YEAR = {2008},
ABSTRACT = {Notwithstanding its acknowledged richness, the SIMPLE semantic model does not offer the representational vocabulary for encoding some conceptual links holding between events and their participants and among co-participants in events. Although critical for boosting performance in many NLP application tasks, such deep lexical information is therefore only partially encoded in the SIMPLE-CLIPS Italian semantic database. This paper reports on the enrichment of the SIMPLE relation set by some expressive means, namely semantic relations, borrowed from the EuroWordNet model and their implementation in the SIMPLE-CLIPS lexicon. The original situation existing in the database, as to the expression of this type of information is described and the loan descriptive vocabulary presented. Strategies based on the exploitation of the source lexicon data were adopted to induce new information: a wide range of semantic—but also syntactic—information was investigated for singling out word senses candidate to be linked by the new relations. The lexicon enrichment by 5,000 new relations instantiated so far has therefore been carried out as a largely automated, low-effort and cost-free process, with no heavy human intervention. The redundancy set off by such an extension of information is being addressed by the implementation of inheritance in the SIMPLE-CLIPS database (Del Gratta et al., 2008)},
KEYWORDS = {Lexicon, Knowledge representation, Semantics, Lexical database},
PAGES = {3555-3560},
URL = {http://www.lrec-conf.org/proceedings/lrec2008/},
PUBLISHER = {European Language Resources Association (ELRA)-Evaluations and Language resources Distribution Agency (ELDA) (Paris, FRA)},
ISBN = {2-9517408-4-0},
CONFERENCE_NAME = {LREC 2008, Sixth International Conference on Language Resources and Evaluation},
CONFERENCE_PLACE = {Paris},
EDITOR = {Calzolari, N. and Choukri, K. and Maegaard, B. and Mariani, J. and Odijk, J. and Piperidis, S. and Tapias, D.},
}
@INPROCEEDINGS{SASAKI_2008_INPROCEEDINGS_SMPRMA_65079,
AUTHOR = {Sasaki, Y. and Montemagni, S. and Pezik, P. and Rebholz-Schuhmann, D. and McNaught, J. and Ananiadou, S.},
TITLE = {BioLexicon: A Lexical Resource for the Biology Domain},
YEAR = {2008},
KEYWORDS = {BioLexicon, Terminological verbs},
URL = {https://iris.cnr.it/handle/20.500.14243/65079},
CONFERENCE_NAME = {Third International Symposium on Semantic Mining in Biomedicine},
}
@INPROCEEDINGS{TAKENOBU_2008_INPROCEEDINGS_TKHHCMSSSCY_65077,
AUTHOR = {Tokunaga, T. and Kaplan, D. and Huang, C. and Hsieh, S. and Calzolari, N. and Monachini, M. and Soria, C. and Shirai, K. and Sornlertlamvanich, V. and Charoenporn, T. and Xia, Y.},
TITLE = {Adapting International Standard for Asian Language Technologies},
YEAR = {2008},
ABSTRACT = {Corpus-based approaches and statistical approaches have been the main stream of natural language processing research for the past two decades. Language resources play a key role in such approaches, but there is an insufficient amount of language resources in many Asian languages. In this situation, standardisation of language resources would be of great help in developing resources in new languages. This paper presents the latest development efforts of our project which aims at creating a common standard for Asian language resources that is compatible with an international standard. In particular, the paper focuses on i) lexical specification and data categories relevant for building multilingual lexical resources for Asian languages; ii) a core upper-layer ontology needed for ensuring multilingual interoperability and iii) the evaluation platform used to test the entire architectural framework},
KEYWORDS = {LR national/international projects, Organizational/policy issues, LR Infrastructures and Architectures, Lexicon, Lexical database},
PAGES = {1663},
URL = {http://www.lrec-conf.org/proceedings/lrec2008/pdf/422_paper.pdf},
PUBLISHER = {European Language Resources Association ELRA (Paris, FRA)},
ISBN = {2-9517408-4-0},
CONFERENCE_NAME = {LREC 2008, Sixth International Conference on Language Resources and Evaluation},
CONFERENCE_PLACE = {Paris},
}
@INPROCEEDINGS{THOMPSON_2008_INPROCEEDINGS_TCAMMTV_65080,
AUTHOR = {Thompson, P. and Cotter, P. and Ananiadou, S. and McNaught, J. and Montemagni, S. and Trabucco, A. and Venturi, G.},
TITLE = {Building a Bio-Event Annotated Corpus for the Acquisition of Semantic Frames from Biomedical Corpora},
YEAR = {2008},
KEYWORDS = {Corpus (creation, annotation, etc.), Text mining, Semantics, Event Extraction},
PAGES = {2159-2166},
URL = {https://iris.cnr.it/handle/20.500.14243/65080},
ISBN = {2-9517408-4-0},
CONFERENCE_NAME = {LREC 2008, Sixth International Conference on Language Resources and Evaluation},
}
@INPROCEEDINGS{THOMPSON_2008_INPROCEEDINGS_TVMMA_65081,
AUTHOR = {Thompson, P. and Venturi, G. and McNaught, J. and Montemagni, S. and Ananiadou, S.},
TITLE = {Categorising Modality in Biomedical Texts},
YEAR = {2008},
ABSTRACT = {The accurate recognition of modal information is vital for the correct interpretation of statements. In this paper, we report on the collection a list of words and phrases that express modal information in biomedical texts, and propose a categorisation scheme according to the type of information conveyed. We have performed a small pilot study through the annotation of 202 MEDLINE abstracts according to our proposed scheme. Our initial results suggest that modality in biomedical statements can be predicted fairly reliably though the presence of particular lexical items, together with a small amount of contextual information},
KEYWORDS = {Biomedical texts, Modality},
PAGES = {27-34},
URL = {https://iris.cnr.it/handle/20.500.14243/65081},
ISBN = {2-9517408-4-0},
CONFERENCE_NAME = {LREC 2008, Sixth International Conference on Language Resources and Evaluation: Workshop 'Building and Evaluating Resources for Biomedical Text Mining'},
}
@INPROCEEDINGS{TORALRUIZ_2008_INPROCEEDINGS_TQDMSC_65089,
AUTHOR = {Toral Ruiz, A. and Quochi, V. and Del Gratta, R. and Monachini, M. and Soria, C. and Calzolari, N.},
TITLE = {Lexically-based Ontologies and Ontologically Based Lexicons},
YEAR = {2008},
ABSTRACT = {This paper deals with the relations between ontologies and lexicons. We study the role of these two components and their evolution during the last years in the field of Computational Linguistics. Subsequently, we survey the current lines of research at ILC-CNR which tackle this topic. They involve (I) the reuse of already existing Lexical Resources to derive formal ontologies, (II) the conversion and combination of terminologies into rich and formal Lexical Resources and (III) the use of formal ontologies as the backbone of multilingual Lexical Resources},
KEYWORDS = {Resource Infrastructure, UIMA, Clarin},
PAGES = {49-59},
URL = {https://iris.cnr.it/handle/20.500.14243/65089},
CONFERENCE_NAME = {AI*IA 2008-10th Congress of Italian Association for Artificial Intelligence},
BOOKTITLE = {AI*IA 2008-10th Congress of Italian Association for Artificial Intelligence},
}
@INPROCEEDINGS{TORAL_2008_INPROCEEDINGS_TMM_65096,
AUTHOR = {Toral Ruiz, A. and Muñoz, R. and Monachini, M.},
TITLE = {Named Entity WordNet},
YEAR = {2008},
ABSTRACT = {This paper presents the automatic extension of Princeton WordNet with Named Entities (NEs). This new resource is called Named Entity WordNet. Our method maps the noun is-a hierarchy of WordNet to Wikipedia categories, identifies the NEs present in the latter and extracts different information from them such as written variants, definitions, etc. This information is inserted into a NE repository. A module that converts from this generic repository to the WordNet specific format has been developed. The paper explores different aspects of our methodology such as the treatment of polysemous terms, the identification of hyponyms within the Wikipedia categorization system, the identification of Wikipedia articles which are NEs and the design of a NE repository compliant with the LMF ISO standard. So far, this procedure enriches WordNet with 310,742 NEs and 381,043 "instance of" relations},
KEYWORDS = {Lexicon, Named Entity recognition, Ontologies, Lexical database},
PAGES = {741-747},
URL = {https://iris.cnr.it/handle/20.500.14243/65096},
ISBN = {2-9517408-4-0},
CONFERENCE_NAME = {LREC 2008, Sixth International Conference on Language Resources and Evaluation},
}
@INPROCEEDINGS{VOSSEN_2008_INPROCEEDINGS_VACFHHIKMMNRRTV_65091,
AUTHOR = {Vossen, P. and Agirre, E. and Calzolari, N. and Fellbaum, C. and Hsieh, S. and Huang, C. and Isahara, H. and Kanzaki, K. and Marchetti, A. and Monachini, M. and Neri, F. and Raffaelli, R. and Rigau, G. and Tesconi, M. and van Gent, J.},
TITLE = {KYOTO: A System for Mining, Structuring, and Distributing Knowledge Across Languages and Cultures},
YEAR = {2008},
ABSTRACT = {We outline work performed within the framework of a current EC project. The goal is to construct a language-independent information system for a specific domain (environment/ecology/biodiversity) anchored in a language-independent ontology that is linked to wordnets in seven languages. For each language, information extraction and identification of lexicalized concepts with ontological entries is carried out by text miners ("Kybots"). The mapping of language-specific lexemes to the ontology allows for crosslinguistic identification and translation of equivalent terms. The infrastructure developed within this project enables long-range knowledge sharing and transfer across many languages and cultures, addressing the need for global and uniform transition of knowledge beyond the specific domains addressed here},
KEYWORDS = {Information Extraction, Information Retrieval, Digital libraries, Lexicon, Lexical database},
URL = {https://iris.cnr.it/handle/20.500.14243/65091},
ISBN = {2-9517408-4-0},
CONFERENCE_NAME = {LREC 2008, Sixth International Conference on Language Resources and Evaluation},
}
@INPROCEEDINGS{CARLI_2008_INPROCEEDINGS_CMBMCCS_106745,
AUTHOR = {Carli, G. and Marinelli, R. and Bindi, R. and Marchi, S. and Cavallaro, F. I. and Castellani, E. and Santarcangelo, E. L.},
TITLE = {Language modulation by hypnotizability},
YEAR = {2008},
KEYWORDS = {Psychotherapy, Neurorehabilitation},
URL = {https://iris.cnr.it/handle/20.500.14243/106745},
CONFERENCE_NAME = {59° Congresso Nazionale della Società Italiana di Fisiologia},
}
@INPROCEEDINGS{CIGNONI_2008_INPROCEEDINGS_CPS_435679,
AUTHOR = {Cignoni, L. and Pardelli, G. and Sassi, M.},
TITLE = {Grey Literature for Natural Language Processing: a Terminological and Statistical Approach},
YEAR = {2008},
ABSTRACT = {This paper presents the results of a study on grey literature (GL) in the field of Natural Language Processing (NLP). Our data has been collected in a corpus of ca 13,000 records corresponding to the titles of papers presented at International Conferences from 1950 to June 2008. A statistical representation of the most significant terms relative to GL in NLP and other interrelated disciplines associates old and new words, highlighting the terminological changes that have taken place in the course of time. Aim of our study is to contribute to the creation of language resources for the extraction of GL coming from the Web in order to help prevent the disappearance of documents containing NLP words that have undergone rapid development over the last decades. This paper is organised as follows: after a general introduction to our work, section 2 provides a historical overview of NLP; sections 3 and 4 offer an account of the most relevant terms used by specialists in different periods, and indicative of the changes that have taken place; section 5 describes the methodology we have used and also contains information on our GL database and a graphical representation of the data. Finally, the conclusions stress the need to integrate pre-existing or obsolete words and expressions, creating NLP synonym relations},
KEYWORDS = {Computational Linguistics, Grey Literature},
PAGES = {116-120},
URL = {https://iris.cnr.it/handle/20.500.14243/435679},
ISBN = {978-90-77484-12-8},
CONFERENCE_NAME = {Tenth International Conference on Grey Literature: Designing the Grey Grid for Information Society},
EDITOR = {Farace, D. G. and Frantzen, J.},
}
@INPROCEEDINGS{MARINELLI_2008_INPROCEEDINGS_M_106746,
AUTHOR = {Marinelli, R.},
TITLE = {Ontological Structure and Digital Corpora for Metaphorical Sense Recognition},
YEAR = {2008},
KEYWORDS = {Ontology},
URL = {https://iris.cnr.it/handle/20.500.14243/106746},
CONFERENCE_NAME = {XXVI AESLA Conference 'From Applied Linguistics to the Linguistics of the Mind: Issues, Practices and Trends'},
}
@INPROCEEDINGS{MONTEMAGNI_2008_INPROCEEDINGS_M_106744,
AUTHOR = {Montemagni, S.},
TITLE = {Exploring the correlation between phonetic and lexical variation in Tuscany},
YEAR = {2008},
KEYWORDS = {Dialectal variation, ALT-Web},
URL = {https://iris.cnr.it/handle/20.500.14243/106744},
CONFERENCE_NAME = {Thirteenth International Conference on Methods in Dialectology},
}
@INPROCEEDINGS{REBHOLZSCHUHMANN_2008_INPROCEEDINGS_RPLDKSMMMCA_106743,
AUTHOR = {Rebholz-Schuhmann, D. and Pezik, P. and Lee, V. and Del Gratta, R. and Kim, J. and Sasaki, Y. and McNaught, J. and Montemagni, S. and Monachini, M. and Calzolari, N. and Ananiadou, S.},
TITLE = {BioLexicon: Towards a reference terminological resource in the biomedical domain},
YEAR = {2008},
ABSTRACT = {The BioLexicon is a publicly available large-scale terminological resource which brings together potential terms from several resources representing selected semantic types (genes, proteins, chemicals, species, enzymes, selected ontological terms). The schema of the BioLexicon enables improved resolution of term ambiguity and follows lexical standards for terminological resources},
KEYWORDS = {BioLexicon},
URL = {https://iris.cnr.it/handle/20.500.14243/106743},
ISBN = {978-1-61567-371-1},
CONFERENCE_NAME = {16th Annual International Conference on Intelligent Systems for Molecular Biology},
BOOKTITLE = {16th Annual International Conference on Intelligent Systems for Molecular Biology},
}
@TECHREPORT{AIELLO_2008_TECHREPORT_ACMQ_190692,
AUTHOR = {Aiello, M. and Chiarella, D. and Martini, C. and Quarati, A.},
TITLE = {Introduzione del mail-gateway ESVA nella rete ARiGe},
YEAR = {2008},
ABSTRACT = {Con la crescita esponenziale di Internet e l'utilizzo sempre più pervasivo di strumenti di telecomunicazione mediata dal computer, i veicoli di trasmissione più comuni per virus e worm sono costituiti dal traffico Web e dalla posta elettronica. Inoltre, il crescente volume di e-mail non richieste, classificabili prevalentemente come spamming e phishing, costituisce un'evidente minaccia per la sicurezza dei dati personali e per la produttività sia dei singoli che delle realtà produttive. Per questi motivi, un sistema di sicurezza a livello di gateway, in grado di garantire una efficace protezione contro malware (virus e worm) ed e-mail indesiderate (spamming e phishing), è un elemento indispensabile negli attuali ambienti di rete collegati a Internet. In questo scenario il gruppo Servizio Infrastrutture Reti (SIR) del C.N.R., Area della Ricerca di Genova (ARiGe), con l'intento di fornire una protezione completa del traffico di posta elettronica, ha effettuato una valutazione delle principali classi tecnologiche di prodotti mail-gateway attualmente disponibili: appliance, software commerciale e opensource. L'esame comparato costi/benefici di alcuni tra i più noti di questi strumenti, ha permesso di individuare nel mail-gateway opensource ESVA (E-mail Scanning and Security Virtual Appliance), la soluzione più appropriata. L'inserimento di ESVA in ARiGe è avvenuto in due fasi. Alla versione standard, basata su un approccio a macchina virtuale, installata inizialmente, ha fatto seguito, con l'obbiettivo di aumentarne le prestazioni, lo studio e la realizzazione di una sua versione de-virtualizzata (ESDA). ESDA ha difatti permesso di ottenere un ulteriore miglioramento a livello di performance (e.g. riduzione del carico dei server), dei servizi di posta elettronica supportati, che affianca la già ottima risposta in termini di fruibilità fornita agli utenti (e.g. diminuita quantità di spam e virus, di e-mail non giunte a destinazione) dalla versione virtualizzata},
URL = {https://iris.cnr.it/handle/20.500.14243/190692},
}
@TECHREPORT{ALIPRANDI_2008_TECHREPORT_ANMRTSMVBAAARS_195958,
AUTHOR = {Aliprandi, C. and Neri, F. and Marchetti, A. and Ronzano, F. and Tesconi, M. and Soria, C. and Monachini, M. and Vossen, P. and Bosma, W. and Agirre, E. and Artola, X. and Arantza, D. and Rigau, G. and Soroa, A.},
TITLE = {Database models and data formats},
YEAR = {2008},
KEYWORDS = {XML data format, TMF, SEMAF, OWL/KIF, FACTAF},
URL = {https://iris.cnr.it/handle/20.500.14243/195958},
}
@TECHREPORT{BINDI_2008_TECHREPORT_BMGP_457845,
AUTHOR = {Bindi, R. and Marinelli, R. and Goggi, S. and Picchi, E.},
TITLE = {LE-PAROLE, Italian Corpus Description, Part Available for Distribution. Updated Version},
YEAR = {2008},
KEYWORDS = {Corpus, Corpus linguistics, Databases},
URL = {https://iris.cnr.it/handle/20.500.14243/457845},
}
@TECHREPORT{CININI_2008_TECHREPORT_CS_344160,
AUTHOR = {Cinini, A. and Sassi, M.},
TITLE = {Aggiornamento della Banca Dati del CSM},
YEAR = {2008},
ABSTRACT = {Aggiornamento della Banca dati delle sentenze e ordinanze della Sezione Disciplinare del Consiglio Superiore della Magistratura, realizzata in collaborazione con l'Istituto di Ricerca sui Sistemi Giudiziari (IRSIG-CNR), con i documenti relativi agli anni 2004-2007. Sperimentazione di nuove funzioni di estrazione dell'informazione tramite software di trattamento automatico del linguaggio (TAL), con particolare riferimento ad analisi diacroniche dei risultati di ricerche complesse su dati testuali},
KEYWORDS = {Informatica giuridica documentale, Analisi Sentenze, DBT},
PAGES = {1-17},
URL = {https://iris.cnr.it/handle/20.500.14243/344160},
}
@TECHREPORT{MARCHETTI_2008_TECHREPORT_MRTSMVB_183217,
AUTHOR = {Marchetti, A. and Ronzano, F. and Tesconi, M. and Soria, C. and Monachini, M. and Vossen, P. and Bosma, W.},
TITLE = {XML Schema for Wordnet and Ontology},
YEAR = {2008},
ABSTRACT = {This deliverable describes the XML schema adopted to represent all the data related to the management of the multi-language wordnets and the ontology; they constitute the set of linguistic and semantic resources of KYOTO system},
KEYWORDS = {XML Schema, Wordnet, Ontology, LMF, TMF},
URL = {https://iris.cnr.it/handle/20.500.14243/183217},
}
@TECHREPORT{MARINELLI_2008_TECHREPORT_M_195955,
AUTHOR = {Marinelli, R.},
TITLE = {Descrizione dei criteri e dei metodi per la costruzione di un database di terminologia},
YEAR = {2008},
KEYWORDS = {Terminology},
URL = {https://iris.cnr.it/handle/20.500.14243/195955},
}
@TECHREPORT{MARINELLI_2008_TECHREPORT_MT_195956,
AUTHOR = {Marinelli, R. and Tiberi, M.},
TITLE = {L'ampliamento del db semantico lessicale terminologico Mariterm con un insieme di termini di meteorologia},
YEAR = {2008},
KEYWORDS = {Terminology},
URL = {https://iris.cnr.it/handle/20.500.14243/195956},
}
@TECHREPORT{MONACHINI_2008_TECHREPORT_MS_183214,
AUTHOR = {Monachini, M. and Soria, C.},
TITLE = {Report on use of TMF and LMF for representing raw terms},
YEAR = {2008},
KEYWORDS = {Terminological Data Collection, Terminological Markup Framework, Terminological Markup Language},
URL = {https://iris.cnr.it/handle/20.500.14243/183214},
}
@TECHREPORT{MONACHINI_2008_TECHREPORT_MS_184110,
AUTHOR = {Monachini, M. and Soria, C.},
TITLE = {Report on use of LMF for representing WordNets},
YEAR = {2008},
KEYWORDS = {WordNets},
URL = {https://iris.cnr.it/handle/20.500.14243/184110},
}
@TECHREPORT{MONACHINI_2008_TECHREPORT_MSC_183216,
AUTHOR = {Monachini, M. and Soria, C. and Calzolari, N.},
TITLE = {The Lexical Grid: Lexical Resources in Language Infrastructures},
YEAR = {2008},
ABSTRACT = {Language Resources are recognized as central and strategic for the development of any Human Language Technology system and application product. They play a critical role as horizontal technology and have been recognized in many occasions as a priority also by national and supra-national bodies funding a number of initiatives (such as EAGLES, ISLE, ELRA) to establish some sort of coordination of LR activities, and a number of large LR creation projects, both in the written and in the speech areas},
KEYWORDS = {Human Language Technology, Language Resources},
URL = {https://iris.cnr.it/handle/20.500.14243/183216},
}
@TECHREPORT{MONTEMAGNI_2008_TECHREPORT_M_195957,
AUTHOR = {Montemagni, S.},
TITLE = {Augmented version of the bio-lexicon extended with bio event information and term-to-term weighted links},
YEAR = {2008},
KEYWORDS = {Bio-lexicon},
URL = {https://iris.cnr.it/handle/20.500.14243/195957},
}
@TECHREPORT{PARDELLI_2008_TECHREPORT_PSOP_185974,
AUTHOR = {Pardelli, G. and Sassi, M. and Orsolini, P. and Parrinelli, V.},
TITLE = {Verso la costruzione di una Biblioteca Digitale},
YEAR = {2008},
ABSTRACT = {A database of the "Antonio Zampolli Fund" has been created and the respective catalogue has been published. The work of analysis and selection of texts for cataloguing helped in creating this bibliography, in large part built on references extracted from books and journals. Very old bibliographical references have also been retrieved from curricula prepared by Professor Zampolli for various projects and commissions},
URL = {https://iris.cnr.it/handle/20.500.14243/185974},
}
@TECHREPORT{SORIA_2008_TECHREPORT_SM_195959,
AUTHOR = {Soria, C. and Monachini, M.},
TITLE = {KYOTO-LMF WordNet Representation Format},
YEAR = {2008},
KEYWORDS = {Ontology linked to wordnets},
URL = {https://iris.cnr.it/handle/20.500.14243/195959},
}
@TECHREPORT{TOKUNAGA_2008_TECHREPORT_TCHKSYCCHKMPS_183215,
AUTHOR = {Tokunaga, T. and Calzolari, N. and Huang, C. and Kiyoaki, S. and Sornlertlamvanich, V. and Yingju, X. and Charoenporn, T. and Chung, S. and Hsieh, S. and Kaplan, D. and Monachini, M. and Prévot, L. and Soria, C.},
TITLE = {Developing International Standards of Language Resources for Semantic Web Applications-Research Report of the International Joint Research Program NEDO},
YEAR = {2008},
ABSTRACT = {This report describes a three-year project aiming at an international standard for language resources that includes Asian languages. We summarise our contribution to an international standard of lexical markup framework (LMF) and introduce a prototype query expansion system using LMF-compliant lexical resources. Since ISO 24613 was in the FDIS stage and fairly stable, we built sample lexicons in Chinese, English, Italian, Japanese, and Thai based on ISO24613. At the same time, we implemented a query expansion system utilising rich linguistic resources including lexicons described in the ISO 24613 framework. We confirmed that a system was feasible which worked on the tested languages (including both Western and Eastern languages) when given lexicons are compliant with the framework},
KEYWORDS = {International standards, Language resources, Semantic web applications},
URL = {https://iris.cnr.it/handle/20.500.14243/183215},
}
@MISC{BARONI_2008_MISC_B_312504,
AUTHOR = {Baroni, P.},
TITLE = {ECP-2007-LANG-617001 FLaReNet: Project Web Site},
YEAR = {2008},
ABSTRACT = {Web site of the project FLaReNet-Fostering Language Resources Network (eContentplus Programme | Grant Agreement No. ECP-2007-LANG-617001), powered by Drupal, developed in English},
KEYWORDS = {Sito web},
URL = {http://www.flarenet.eu},
}
@MISC{CUCURULLO_2008_MISC_CPB_192749,
AUTHOR = {Cucurullo, S. and Picchi, E. and Biffi, M.},
TITLE = {Lessico italiano radiofonico 1995-2003},
YEAR = {2008},
KEYWORDS = {Lessico radiofonico, Corpus parlato},
URL = {https://iris.cnr.it/handle/20.500.14243/192749},
}
@MISC{CUCURULLO_2008_MISC_CPSSMM_192750,
AUTHOR = {Cucurullo, S. and Picchi, E. and Sassi, M. and Segre, C. and Martignoni, C. and Morini, L.},
TITLE = {Le concordanze diacroniche dell'Orlando Furioso},
YEAR = {2008},
KEYWORDS = {Furioso, Orlando, Concordanze diacroniche},
URL = {https://iris.cnr.it/handle/20.500.14243/192750},
}
@MISC{DIDONATO_2008_MISC_D_406243,
AUTHOR = {Di Donato, F.},
TITLE = {The Evaluation in the Republic of Science. From peer review to open soft peer review},
YEAR = {2008},
ABSTRACT = {"No university teacher likes to be reminded of discussions of appointments, for they are seldom agreeable. And yet I may say that in the numerous cases known to me there was, without exception, the good will to allow purely objective reasons to be decisive. However, the decision over academic fates is too often largely a 'hazard'". In his well-known lecture Wissenschaft als Beruf (1918), Science as a Vocation, Max Weber underlined the limitations of an appointment procedure based on building consensus among peers. However, his reflection can also be interpreted as a specific instance of the more general problem of the relationship between objectivity and evaluation. In his lecture, Weber sees Science as both a vocation and a profession. His analysis starts from the differences and analogies of the career and retirement system in German and American universities, which he considers respectively "plutocratic" and bureaucratic. This presentation isn't focused on studying appointment procedures but rather scholarly peer review. Hence, the link with the arguments of the German sociologist, may not appear so evident at a first sight. However, it suddenly becomes visible if we consider the topic from a philosophical and sociological point of view. From this perspective, peer review procedures are clearly connected both to the role of science within the academia and its influence on the society in general. A reflection on evaluation procedures involves scientific and moral issues concerning knowledge production and its dissemination. It also involves careers, funding and the basic structure of the "Republic of Science" itself. The reviewing procedures used today are almost exclusively based on the good will of the reviewers to keep the evaluation on an objective ground. A premise that I consider, like Weber does, largely insufficient and hazardous. 
This presentation has three objectives. Firstly, it aims at clarifying the motivations and the historical context that led to the birth of peer review. Secondly, it aims at reflecting, from a political philosophy perspective, on the impact of evaluation procedures on the government of the Republic of Science. To put it in simple terms: Is the Republic of Science a proper Republic? Which form of government should be chosen for an Open Scholarly Community on the web? Thirdly, it aims at proposing a novel approach to peer review that could be adopted in Open Scholarly Communities on the Web. I call this approach "open soft peer review"},
URL = {https://iris.cnr.it/handle/20.500.14243/406243},
}
@MISC{DIDONATO_2008_MISC_D_406245,
AUTHOR = {Di Donato, F.},
TITLE = {Neither property nor contracts. The need of Das persönliche Recht auf dingliche Art in The Metaphysics of Morals},
YEAR = {2008},
ABSTRACT = {Presentation held at PSA Workshops in Political Theory-Kant on Economic Justice, Manchester Metropolitan University (2008)},
URL = {https://iris.cnr.it/handle/20.500.14243/406245},
}
@MISC{DIDONATO_2008_MISC_D_384175,
AUTHOR = {Di Donato, F.},
TITLE = {Polanyi, Michael, Scienza, fede e società},
YEAR = {2008},
URL = {https://iris.cnr.it/handle/20.500.14243/384175},
ISSN = {1826-4654},
}
@MISC{DIDONATO_2008_MISC_D_384172,
AUTHOR = {Di Donato, F.},
TITLE = {Kant I., Riproposizione della questione: se il genere umano sia in costante progresso verso il meglio},
YEAR = {2008},
ABSTRACT = {Traduzione dall'originale tedesco},
URL = {https://iris.cnr.it/handle/20.500.14243/384172},
ISSN = {1591-4305},
}
@MISC{GIOVANNETTI_2008_MISC_G_244997,
AUTHOR = {Giovannetti, E.},
TITLE = {Combining statistical techniques and lexico-syntactic patterns for semantic relations extraction from text},
YEAR = {2008},
ABSTRACT = {Semantic relation extraction is a crucial task for Ontology Learning from Texts. In literature, statistical unsupervised systems are used for semantic relation extraction: these systems typically detect pairs of semantically related terms (on the basis of their distribution in texts) without specifying the semantic relation holding between them. In this work we propose a fully unsupervised approach for semantic relation validation and extraction from texts. A statistical component (CLASS, CLustering through Analogy-based Semantic Similarity) is used to obtain a set of pairs of distributionally-similar terms occurring in similar contexts, and possibly involved in paradigmatic relations (as, for instance, the words "car" and "motorcycle" in the sentences "I drive my car" and "Bob drives his motorcycle"). To validate and label the anonymous relations obtained through the statistical module, occurrences of the candidate pairs of terms are looked for in the Web in the context of reliable lexico-syntactic patterns, where they are involved in a syntagmatic relation (such as, for example, the words "steer" and "car" in the sentence "steer is part of the car"). This work focuses on the definition and application of the lexico-syntactic patterns and on the measures used to assess the reliability of the specific semantic relation the system suggests. The chosen semantic relations are hyponymy, meronymy, co-hyponymy and co-meronymy, for the relevance they have in ontology construction. Different lexico-syntactic patterns are used for different kinds of relations. In particular, patterns including both terms are used for hyponymy and meronymy discovery, (e.g. "cyclosporine is a medicine"): the number of occurrences of the pattern on the Web will indicate the confidence of the candidate semantic relation. Concerning co-hyponymy and co-meronymy, explorative open patterns, including just one term, are used. 
For example, given the term pair "electron-nucleus", we can see if a co-meronymy relation holds between them by applying the following two patterns: "electron is part of" and "nucleus is part of" and then by looking for common holonyms (e.g. "atom"). Concerning evaluation, two different measures have been defined, one for hypernymy and meronymy relations and the other for co-hyponymy and co-meronymy. The measures are basically built upon the number of occurrences of the patterns on the Web and, concerning co-hyponymy and co-meronymy, on the number of common hypernyms (or holonyms) shared between the terms},
URL = {https://iris.cnr.it/handle/20.500.14243/244997},
}
@MISC{MARINELLI_2008_MISC_M_106748,
AUTHOR = {Marinelli, R.},
TITLE = {Analisi di metafore e espressioni idiomatiche per mezzo di risorse computazionali e corpora elettronici},
YEAR = {2008},
KEYWORDS = {risorse computazionali, terminologia, linguaggio figurativo, corpora, ontologia},
URL = {https://iris.cnr.it/handle/20.500.14243/106748},
}
@MISC{PICCHI_2008_MISC_PCS_192752,
AUTHOR = {Picchi, E. and Cucurullo, S. and Sassolini, E.},
TITLE = {Semantic Press},
YEAR = {2008},
KEYWORDS = {Rassegna stampa, Estrazione di informazione},
URL = {https://iris.cnr.it/handle/20.500.14243/192752},
}
@MISC{PIRRELLI_2008_MISC_P_228606,
AUTHOR = {Pirrelli, V.},
TITLE = {Morphology Learning as Paradigm Learning: Developmental and Computational Evidence from Romance Languages},
YEAR = {2008},
ABSTRACT = {In a comprehensive comparison of the developmental stages in the acquisition of inflection in nearly two dozen languages (in the Indo-European, Ugro-Finnic and Semitic families plus Turkish), Bittner et al. (2003) arrive at the conclusion that the transition from lexical processing to morphological patterning is not the automatic outcome of rote lexical storage, but rather the result of an active construction of the child, crucially conditioned by typological factors such as richness, uniformity and transparency of inflectional paradigms. In the present talk I intend to assess this hypothesis by observing the dynamics of a purely morphological acquisition of Romance verb paradigms through a family of Artificial Neural Networks known as Self-Organizing Maps (Kohonen 2002). I shall show that the interplay between built-in principles of acquisition of time-coded sequences and morphology-specific principles of organization of inflectional paradigms can go a long way in accounting for the typological trends highlighted in Bittner et al. (2003). Reported results allow us to draw some general conclusions concerning the process of morphology acquisition as paradigm-based learning and lead to a reappraisal of the traditional one-route vs. dual-route debate in morphology processing and learning},
URL = {http://www.mod-langs.ox.ac.uk/romance-morphology/oxmorph1.html},
CONFERENCE_NAME = {First Oxford Workshop on Romance Verb Morphology},
}
@MISC{PIRRELLI_2008_MISC_PM_192753,
AUTHOR = {Pirrelli, V. and Montemagni, S.},
TITLE = {AnITA},
YEAR = {2008},
KEYWORDS = {NLP Tools},
URL = {https://iris.cnr.it/handle/20.500.14243/192753},
}
@MISC{SASSOLINI_2008_MISC_SPBP_192751,
AUTHOR = {Sassolini, E. and Picchi, E. and Bellone, G. and Porquier, E.},
TITLE = {Progetto per lo studio e la realizzazione di un sistema di erogazione on line in modalità multicanale, dei servizi sanitari prioritari per cittadini e imprese},
YEAR = {2008},
KEYWORDS = {Studi statistici, Patologia},
URL = {https://iris.cnr.it/handle/20.500.14243/192751},
}
@MISC{SASSOLINI_2008_MISC_SPH_464694,
AUTHOR = {Sassolini, E. and Picchi, E. and Haines, M.},
TITLE = {Gli anni della Cupola},
YEAR = {2008},
KEYWORDS = {Corpus trilingue di documenti antichi},
URL = {https://iris.cnr.it/handle/20.500.14243/464694},
}
@ARTICLE{BARONI_2007_ARTICLE_BGP_433727,
AUTHOR = {Baroni, M. and Guevara, E. and Pirrelli, V.},
TITLE = {NN Compounds in Italian: Modelling Category Induction and Analogical Extension},
YEAR = {2007},
ABSTRACT = {Dopo un inquadramento teorico del problema della composizione nelle scienze cognitive e in linguistica, presentiamo una serie di esperimenti sui composti nominali in italiano che mettono alla prova l'ipotesi che ci sia una distinzione fondamentale tra composti relazionali (legittimati da proprietà della testa) e composti attributivi (legittimati dal modificatore). Un'analisi computazionale basata su un corpus conferma che tale distinzione può in linea di principio venire indotta da dati di tipo distribuzionale. Inoltre, dati sperimentali mostrano che il modello è in grado di predire almeno in parte l'accettabilità di nuovi composti formati cambiando testa e modificatore di composti esistenti},
KEYWORDS = {Morphology, Compounding, Mental Lexicon, Lexical Semantics},
PAGES = {263-290},
URL = {https://iris.cnr.it/handle/20.500.14243/433727},
VOLUME = {2},
ISSN = {1720-9331},
JOURNAL = {LINGUE E LINGUAGGIO},
}
@ARTICLE{BERTAGNA_2007_ARTICLE_BTC_37706,
AUTHOR = {Bertagna, F. and Toral, A. and Calzolari, N.},
TITLE = {Evalita 2007: The All-Words WSD Task},
YEAR = {2007},
ABSTRACT = {This report describes the Italian all-words sense disambiguation task organized for EVALITA. The objectives of the task and the type of data prepared and distributed to participants are presented. Moreover, evaluation measures and the results obtained by the participating systems are introduced},
URL = {https://iris.cnr.it/handle/20.500.14243/37706},
}
@ARTICLE{BOZZI_2007_ARTICLE_BCF_37707,
AUTHOR = {Bozzi, A. and Cignoni, L. and Fedele, G.},
TITLE = {Linguistic Tools for Navigation in a Virtual Museum},
YEAR = {2007},
ABSTRACT = {Introduction. The digital and Virtual Reality technologies introduced in recent years in the world of museums have promoted the development of innovative products able to provide users and visitors with access modes very different from the traditional ones. Basically, such products are constituted by interactive information units set up in the display rooms, or by digital devices (CDs, DVDs) simulating the path followed by the visitors; they are suitable for didactic purposes and can sell very well if supplied with multilingual audio guides available at the bookshops of the museums. However, if we consider the information available on the net and try to enter a museum of this type which either corresponds to a real one or reflects a typological set of objects actually housed in different and even geographically distant sites, we will certainly be unsatisfied for a number of reasons. Firstly, the few cases available can be looked upon as only partially virtual since the correlated information such as catalogue identification, inventory number, description, etc., has simply been converted into the new condition of digital format. It is true that an artifact that a visitor can see in a low resolution icon catalogue simplifies the information retrieval operations, but it offers no innovative approach capable of justifying the considerable resources invested to produce the digitized objects consultable on-line. Another problem we would like to face is represented by the possible interaction between digital objects and their linguistic captions which we think could highly contribute to the development of a real virtual museum, as long as the environment of navigation and interaction with the user occurs with appropriate paradigms. A number of simple suggestions on this matter will be provided below. 
The work described here refers to an experiment that was carried out in order to make the visit to a painting gallery, represented by iconographical objects collected in an imaginary space, at the same time virtual and independent of cultural prejudices. Our virtual museum is thus considered as a series of undefined places, e.g. Internet sites or addresses relative to image files in .jpg format, eventually stored in directories available on one or more discs. For each painting it was necessary to produce a text format description of about 400 words, therefore much longer than that of an ordinary caption, but shorter than a monographic essay. In particular, we wanted to check whether and to what extent the element represented by a text would make it possible to create a logical and conceptual association even among elements with apparently no relation (at least for users with low or medium level of culture), as well as among those with evident relations that anybody could identify easily. The system, therefore, functions regardless of the cultural background of the visitor, with the result that anybody, experts and non-experts alike, can see the associations between the iconographic works and the linguistic reasons taken into account by the system for their realization. Let us first anticipate that technology makes it possible nowadays to intervene automatically so that iconographic elements can be identified by digital image analysis; therefore, no linguistic description is actually necessary to associate paintings which have a number of elements in common. However, it should be pointed out that such methods can only highlight the similarities among chromatic elements, graphical patterns, well evident features in the foreground of the image, while many other aspects impossible to capture are missed, thus reducing the number of feasible associations. 
On the other hand, the associations carried out on linguistic grounds have sometimes shown to be excessive, owing to the considerable amount of information (in particular the profuse sequence of diversified adjectives) contained in historical and artistic works. This negative element which emerged from the experiment can however be exploited to find suitable solutions aimed at reducing the production of partially useless results},
KEYWORDS = {Information extraction, Data mining, Self Organising Maps},
PAGES = {209-220},
URL = {https://iris.cnr.it/handle/20.500.14243/37707},
VOLUME = {1},
ISSN = {1120-6861},
JOURNAL = {ARCHEOLOGIA E CALCOLATORI},
}
@ARTICLE{CALDERONE_2007_ARTICLE_CHP_37709,
AUTHOR = {Calderone, B. and Herreros, I. and Pirrelli, V.},
TITLE = {Learning Inflection: The Importance of Starting Big},
YEAR = {2007},
ABSTRACT = {Perchè i sistemi verbali morfologicamente più "ricchi" vengono appresi da un bambino con maggiore facilità di sistemi più "poveri", caratterizzati da maggiore suppletivismo e da un minor numero di marcatori flessionali? Studi recenti condotti nel quadro della Morfologia Naturale (Bittner et al. 2003) hanno evidenziato il ruolo centrale svolto in questo apparente paradosso dal "contrasto morfologico" e dalla relazione biunivoca tra forma e contenuto all'interno del paradigma flessionale. Il presente lavoro illustra da questo punto di vista il comportamento di un modello originale di reti neurali artificiali auto-organizzanti con architettura "a cascata" e apprendimento asincrono, addestrato su forme verbali codificate fonologicamente. Il modello addestrato è in grado di memorizzare sia configurazioni morfologiche astratte, corrispondenti alle terminazioni flessionali di forme verbali regolari e irregolari, sia forme flesse piene, in funzione della loro frequenza per tipo e per unità nel corpus di addestramento. Il comportamento del modello è valutato su due differenti corpora di addestramento, italiano e inglese, entrambi campionati dal database CHILDES. L'analisi della topologia delle informazioni memorizzate dal modello addestrato consente di trarre alcune conclusioni generali sull'interazione tra processi di acquisizione di sequenze fonotattiche e principi di acquisizione paradigmatica. Le implicazioni teoriche dei risultati vengono inoltre discusse alla luce del tradizionale dibattito tra modelli "a meccanismo singolo" e "a meccanismo doppio" di acquisizione morfologica},
PAGES = {175-200},
URL = {https://iris.cnr.it/handle/20.500.14243/37709},
VOLUME = {2},
ISSN = {1720-9331},
JOURNAL = {LINGUE E LINGUAGGIO},
}
@ARTICLE{CIGNONI_2007_ARTICLE_C_37711,
AUTHOR = {Cignoni, L.},
TITLE = {'The magic tree', Natale in Festa},
YEAR = {2007},
ABSTRACT = {Le feste natalizie possono essere un pretesto per svolgere in maniera divertente ma costruttiva una serie di attività costituite da recite, canti, filastrocche e realizzazioni manuali, tutte legate al tema del Natale. Il racconto che viene presentato, dal titolo "The Magic Tree", fa da filo conduttore a tutte le altre attività, in un'atmosfera piacevole e familiare. Si inizia con l'organizzazione della recita, e la definizione del contesto in cui questa si svolgerà, poi si continua con la preparazione degli addobbi. La costruzione di piccoli oggetti da utilizzare per la drammatizzazione di una storia e l'allestimento dell'ambiente natalizio costituiscono un'attività socializzante e gratificante che aiuta il bambino a comunicare, a collaborare con i compagni, a creare esperienze comuni durante le quali la lingua inglese viene usata in maniera divertente. Il "fare finta di" è un'attività importante per lo sviluppo del bambino: la maestra racconta la storia e poi incoraggia i bambini a recitarla sviluppando così il loro vocabolario. Le canzoncine e le filastrocche, ascoltate più volte, permettono ai bambini di divertirsi attraverso il movimento e la mimica, ma allo stesso tempo gli offrono la possibilità di ripetere e consolidare il lessico e le strutture più semplici. La maestra abitua i bambini ad accompagnare le parole che pronunciano al gesto corrispondente, acquisendo così familiarità con i suoni della lingua inglese, favorendo la comprensione orale dei bambini, la loro partecipazione attiva, l'interesse e la motivazione a apprendere. Il metodo adottato è quello sviluppato da James Usher del Total Physical Response, secondo cui il bambino per la sua naturale capacità di apprendere è in grado di eseguire o mimare delle azioni sulla base di comandi impartiti dalla maestra. 
La festa del Natale offre anche la possibilità di coinvolgere i bambini di altre nazionalità: ognuno dei bambini può cantare, oppure portare, o preparare con l'aiuto degli altri qualcosa di caratteristico del proprio paese},
URL = {https://iris.cnr.it/handle/20.500.14243/37711},
ISSN = {1590-3206},
JOURNAL = {SCUOLA DELL'INFANZIA},
}
@ARTICLE{DELLORLETTA_2007_ARTICLE_DFLMP_37710,
AUTHOR = {Dell'Orletta, F. and Federico, M. and Lenci, A. and Montemagni, S. and Pirrelli, V.},
TITLE = {Maximum Entropy for Italian PoS Tagging},
YEAR = {2007},
ABSTRACT = {L'articolo illustra le prestazioni del ILC-UniPi MaxEnt PoS Tagger in Evalita 2007. The report contains a description of the ILC-UniPi MaxEnt PoS Tagger performance in Evalita 2007},
PAGES = {10-11},
URL = {https://iris.cnr.it/handle/20.500.14243/37710},
VOLUME = {IV(2)},
}
@ARTICLE{DIDONATO_2007_ARTICLE_D_384174,
AUTHOR = {Di Donato, F.},
TITLE = {Come si valuta la qualità nella Repubblica della Scienza? Una riflessione sul concetto di peer review},
YEAR = {2007},
ABSTRACT = {Peer reviewing is often called for as an essential divide between scientific knowledge and bare opinion. In general terms, it is an evaluation tool consisting in the formula through which an academic submits a text to the opinion of other academics (the so-called "peers") who state its legitimacy; as a technical term, it amounts to the specific evaluation process that comes before publication on a scientific journal, a presentation's approval to a conference or funding and grant allocation by funding agencies. In the abstract, peer review is required for appraising the quality of knowledge while it helps assuring its truthfulness and reputation; significantly, in the current transition between print and digital era, peer review itself is evoked as an element of continuity with the past and as a guarantee of scientific quality: while technology continuously upgrades, it is claimed, the knowledge validation process remains the same. Actually, it is one of the engines propelling research funding: as a filter by which it is decided whether to publish a scientific result, it influences both recruitment and career in the Republic of Science phaenomenon (that is, both in the academia and within research institutions), and public and private research funding. In practice, it often leaves room for abuses and frauds, allowing the darkest exertion of academic power. It may be for these reasons that peer review is acknowledged as the distinguishing feature of the modern academic system and, although legally unbinding, not only it is embraced (as a tool of the trade) by generations of scholars, but also it is very often deemed as the establishing and distinguishing feature of scientific knowledge. In the following pages I will examine the current praxis of peer review, to meditate then on the evolution and the future of this tool and, eventually, I will cast a glance at the historical and technological framework in which it first came to light},
URL = {https://iris.cnr.it/handle/20.500.14243/384174},
ISSN = {1591-4305},
JOURNAL = {BOLLETTINO TELEMATICO DI FILOSOFIA POLITICA},
}
@ARTICLE{GUADAGNINI_2007_ARTICLE_G_75439,
AUTHOR = {Guadagnini, E.},
TITLE = {Scelta di voci del Tesoro della Lingua Italiana delle Origini (undicesima serie)},
YEAR = {2007},
ABSTRACT = {Voci fàvola s. f., fiaba s. f., fola s. f., folletto (1) s. m., folletto (2) agg., fumo s. m., fuoco s. m. del Tesoro della Lingua Italiana delle Origini (pp. 108-112, 148-149, 163-212)},
KEYWORDS = {Lessicografia, Vocabolario storico, Italiano antico},
PAGES = {9-246},
URL = {https://iris.cnr.it/handle/20.500.14243/75439},
VOLUME = {12},
ISSN = {1591-8254},
JOURNAL = {BOLLETTINO-OPERA DEL VOCABOLARIO ITALIANO},
}
@ARTICLE{PIRRELLI_2007_ARTICLE_P_37708,
AUTHOR = {Pirrelli, V.},
TITLE = {Psycho-Computational Issues in Morphology Learning and Processing: An Overture},
YEAR = {2007},
PAGES = {131-138},
URL = {https://iris.cnr.it/handle/20.500.14243/37708},
VOLUME = {2},
}
@BOOK{SABA_2007_BOOK_S_134809,
AUTHOR = {Saba, A.},
TITLE = {El Léxico del Arte de la verdadera Navegación de Pedro de Siria},
YEAR = {2007},
ABSTRACT = {El Arte de la verdadera Navegación de Pedro de Siria, cuyas concordancias aquí presentamos, forma parte de un corpus de textos del siglo XVI preparado para la construcción del Léxico Náutico del Español del Siglo de Oro (LéNESO*). Este corpus, que consta de quince textos, se ha llevado a cabo con la contribución del Istituto di Linguistica Computazionale del Consiglio Nazionale delle Ricerche e del Dipartimento di Lingue Romanze dell'Università di Pisa, del Departamento de Lengua Española y Lingüística General, y de la Sección de Medios Impresos de la UNED de Madrid que está atendiendo a la publicación de los varios léxicos por separado. Con el descubrimiento de América, España adquirió gran renombre y prestigio internacional en todos los campos, especialmente en las técnicas de navegación y en las disciplinas relacionadas con el arte de marear. En este período el horizonte geográfico se amplió, se produjeron nuevas cartas y se perfeccionaron las existentes y varios fueron los alcances en los campos de la astronomía, de la geografía, de la meteorología, etc. La necesidad de favorecer el comercio con el Nuevo Mundo creó la exigencia de multiplicar los viajes de exploración en el Atlántico y al mismo tiempo garantizar una mayor seguridad a los barcos y a sus tripulaciones durante la navegación, por lo cual fue necesario redactar textos de teoría y de práctica marinera que sirviesen de guía a los navegantes en los derroteros transoceánicos. La obra de Siria Arte de la verdadera Navegación se imprimió en 1602, pero su realización es más antigua, como revela al lector el mismo autor "Los muchos ruegos de algunos amigos, a los quales es justo obedecer, me han movido a que sacasse a luz este libro, que ya casi tenía olvidado". El texto abarca muchos temas, hablando de "... 
de la máchina del mundo, es a saber, cielos y elementos, de las mareas y señales de tempestades, del aguja de marear, del modo de hazer cartas de navegar, del uso dellas, de la declinación y rodeo que comúnmente hazen los pilotos, del modo verdadero de navegar por círculo menor, por línea recta sin declinación ni rodeo, el modo cómo se sabrá el camino, y leguas que ha navegado el piloto por qualquier rumbo, y últimamente el saber tomar el altura del polo". Este volumen, al cuidado de Antonina Saba**, contiene la concordancia lematizada, los índices de frecuencia de los lemas, los índices de los nombres propios, el diccionario inverso del Arte de la verdadera Navegación, y un CD-ROM con un sistema de consulta del texto que constituyen una novedad y un estímulo para toda investigación sobre el texto del autor valenciano},
KEYWORDS = {analisi linguistica, lessicografia},
PAGES = {IX-LXIII},
URL = {https://iris.cnr.it/handle/20.500.14243/134809},
ISBN = {9788436254877},
CONFERENCE_PLACE = {Madrid},
EDITOR = {Saba, A.},
}
@INCOLLECTION{CALZOLARI_2007_INCOLLECTION_C_134805,
AUTHOR = {Calzolari, N.},
TITLE = {Corpus-based lexicon building: an overview across projects, problems, approaches},
YEAR = {2007},
URL = {https://iris.cnr.it/handle/20.500.14243/134805},
ISBN = {0415338964},
}
@INCOLLECTION{DELLORLETTA_2007_INCOLLECTION_DLMP_134810,
AUTHOR = {Dell'Orletta, F. and Lenci, A. and Montemagni, S. and Pirrelli, V.},
TITLE = {Corpus-based Modelling of Grammar Variation},
YEAR = {2007},
KEYWORDS = {Grammar variation, stochastic parsing, linguistic typology},
PAGES = {38--55},
URL = {https://iris.cnr.it/handle/20.500.14243/134810},
PUBLISHER = {Angeli (Milano, ITA)},
ISBN = {9788846489449},
CONFERENCE_PLACE = {Milano},
BOOKTITLE = {Language resources and linguistic theory},
EDITOR = {Sansò, A.},
}
@EDITORIAL{NARDI_2007_EDITORIAL_NPQ_166678,
AUTHOR = {Nardi, A. and Peters, C. and Quochi, V.},
TITLE = {CLEF 2007. Editorial},
YEAR = {2007},
ABSTRACT = {These Working Notes contain descriptions of the experiments conducted within CLEF 2007 organised by the Cross-Language Evaluation Forum. The final papers—revised and extended as a result of the discussions at the Workshop—together with a comparative analysis of the results will appear in the CLEF 2007 Proceedings, to be published by Springer in their Lecture Notes for Computer Science series. CLEF organises a series of evaluation tracks designed to test different aspects of mono- and cross-language information retrieval system development. The intention is to encourage systems to move from monolingual text retrieval to the implementation of a full multilingual multimedia search service},
KEYWORDS = {Information Retrieval},
PAGES = {9},
URL = {https://iris.cnr.it/handle/20.500.14243/166678},
}
@INPROCEEDINGS{AGNOLONI_2007_INPROCEEDINGS_ABFSTMV_143465,
AUTHOR = {Agnoloni, T. and Bacci, L. and Francesconi, E. and Spinosa, P. and Tiscornia, D. and Montemagni, S. and Venturi, G.},
TITLE = {Building an ontological support for multilingual legislative drafting},
YEAR = {2007},
PAGES = {9--18},
URL = {https://iris.cnr.it/handle/20.500.14243/143465},
CONFERENCE_NAME = {International Conference on Legal Knowledge and Information Systems (JURIX 2007)},
BOOKTITLE = {Legal Knowledge and Information Systems},
EDITOR = {Lodder, A. R. and Mommers, L.},
}
@INPROCEEDINGS{BARONI_2007_INPROCEEDINGS_BGP_65050,
AUTHOR = {Baroni, M. and Guevara, E. and Pirrelli, V.},
TITLE = {Sulla tipologia dei composti N+N in italiano: principi categoriali ed evidenza distribuzionale a confronto},
YEAR = {2007},
KEYWORDS = {Morphology, Compounding, Mental Lexicon, Lexical Semantics},
URL = {https://iris.cnr.it/handle/20.500.14243/65050},
ISBN = {978-88-7870-469-5},
CONFERENCE_NAME = {XL Congresso Internazionale di Studi della Società di Linguistica Italiana (SLI 2006)},
BOOKTITLE = {Linguistica e modelli tecnologici della ricerca},
EDITOR = {Ferrari, G. and Benatti, R. and Mosca, M.},
}
@INPROCEEDINGS{BELLANDI_2007_INPROCEEDINGS_BFGR_265117,
AUTHOR = {Bellandi, A. and Furletti, B. and Grossi, V. and Romei, A.},
TITLE = {Pushing Constraint in Association Rules Mining: an Ontology-Based Approach},
YEAR = {2007},
ABSTRACT = {This paper proposes an integrated framework for the extraction of constraint-based multi-level association rules with the aid of an ontology. The latter, that represents an enriched taxonomy, is used to describe the application domain by means of data properties. Defining or updating these properties is a simple task and does not imply changing the items hierarchy, or the implementation level of our framework. The system enables the definition of domain-specific constraints by using the ontology to filter the instances used in the association rule mining process. This can improve the quality of the extracted association rules and make them more interesting and easy to understand. We describe our framework, also including examples of queries based on real-data},
URL = {https://iris.cnr.it/handle/20.500.14243/265117},
}
@INPROCEEDINGS{BELLANDI_2007_INPROCEEDINGS_BFGR_265116,
AUTHOR = {Bellandi, A. and Furletti, B. and Grossi, V. and Romei, A.},
TITLE = {Ontology-Driven Association Rule Extraction: A Case Study},
YEAR = {2007},
ABSTRACT = {This paper proposes an integrated framework for extracting Constraint-based Multi-level Association Rules with an ontology support. The system permits the definition of a set of domain-specific constraints on a specific domain ontology, and to query the ontology for filtering the instances used in the association rule mining process. This method can improve the quality of the extracted association rules in terms of relevance and understandability},
KEYWORDS = {Association Rules, Ontology, Data mining},
PAGES = {10--19},
URL = {https://iris.cnr.it/handle/20.500.14243/265116},
PUBLISHER = {CEUR-WS.org (Aachen, DEU)},
CONFERENCE_NAME = {C\&O: RR-2007-International Workshop on Contexts and Ontologies: Representation and Reasoning},
CONFERENCE_PLACE = {Aachen},
}
@INPROCEEDINGS{BERTAGNA_2007_INPROCEEDINGS_BMSCRTM_145342,
  AUTHOR          = {Bertagna, F. and Monachini, M. and Soria, C. and Calzolari, N. and Ronzano, N. and Tesconi, M. and Marchetti, A.},
  TITLE           = {Cooperative Building of Semantic Resources},
  YEAR            = {2007},
  ISBN            = {3-540-74781-8},
  CONFERENCE_NAME = {10th Congress of Italian Association for Artificial Intelligence-Cooperative construction of linguistic knowledge bases Workshop},
  KEYWORDS        = {semantic resources, cooperative knowledge definition, semantic tagging},
  ABSTRACT        = {In this paper we present LexFlow, a framework for the automatic and cooperative enrichment, integration and exploitation of semantic resources. Borrowing from techniques used in the domain of document workflows, we model the activity of lexicon management as a particular case of workflow instance, where lexical entries move across agents and become dynamically updated. We also give an important exploitation example of the semantic resources managed or built thanks to LexFlow, describing its integration with SemKey, a system for semantic collaborative tagging},
  URL             = {https://iris.cnr.it/handle/20.500.14243/145342},
}
@INPROCEEDINGS{BERTAGNA_2007_INPROCEEDINGS_BMSMTHH_154420,
AUTHOR = {Bertagna, F. and Monachini, M. and Soria, C. and Marchetti, A. and Tesconi, M. and Huang, C. and Hsieh, S.},
TITLE = {Fostering Intercultural Collaboration: a Web Service Architecture for Cross-Fertilization of Distributed Wordnets},
YEAR = {2007},
ABSTRACT = {Enhancing the development of multilingual lexicons is of foremost importance for intercultural collaboration to take place, as multilingual lexicons are the cornerstone of several multilingual applications. However, the development and maintenance of large-scale, robust multilingual dictionaries is a tantalizing task. In this paper we present a tool, based on a web service architecture, enabling semi-automatic generation of bilingual lexicons through linking of distributed monolingual lexical resources. In addition to lexicon development, the architecture also allows enrichment of monolingual source lexicons through exploitation of the semantic information encoded in corresponding entries. In the paper we describe our case study applied to the Italian and Chinese wordnets, and we illustrate how the architecture can be extended to access distributed multilingual WordNets over the Internet, paving the way to exploitation in a cross-lingual framework of the wealth of information built over the last decade},
KEYWORDS = {distributed language resources, interoperable lexical resources, integration of WordNets},
PAGES = {185--198},
URL = {https://iris.cnr.it/handle/20.500.14243/154420},
VOLUME = {4568},
DOI = {10.1007/978-3-540-74000-1_11},
PUBLISHER = {Springer (Berlin, DEU)},
ISBN = {978-3-540-74000-1},
CONFERENCE_NAME = {IWIC 2007-The First International Workshop on Intercultural Collaboration},
CONFERENCE_PLACE = {Berlin},
}
@INPROCEEDINGS{BOMBARA_2007_INPROCEEDINGS_BCCCGMRST_456882,
  AUTHOR          = {Bombara, M. and Calì, D. and Calì, I. and Cartelli, V. and Giovannetti, E. and Masserotti, M. and Renso, C. and Spinanti, L. and Tropea, G.},
  TITLE           = {Tecnologie open-source nel progetto FuLL (Fuzzy Logic and Language)},
  BOOKTITLE       = {Atti del Meeting Utenti Italiani GRASS e GFOSS-VIII Edizione 2007},
  YEAR            = {2007},
  PAGES           = {5},
  CONFERENCE_NAME = {GRASS \& GFOSS Meeting 2007},
  KEYWORDS        = {Interoperabilità, Linguaggio naturale, GIS, Standardizzazione},
  ABSTRACT        = {FuLL (Fuzzy Logic and Language) è un progetto di ricerca della Software Company BC, finanziato dal MAP e sviluppato in collaborazione con partner di ricerca del CNR e universitari, che aveva come obiettivo lo sviluppo di una tecnologia software che innova i sistemi di interrogazione dei database tramite l'utilizzo di un'interfaccia in linguaggio naturale. Nell'ambito del progetto, l'impiego di strumenti e tecnologie open-source ha consentito la sperimentazione del prototipo in tempi brevi e senza legare il sistema ad una specifica tecnologia proprietaria. L'interfaccia in linguaggio naturale FuLL, alla base del progetto, è stata sperimentata collegandola a due distinti database GIS di due province italiane, Bologna e Catania. I dati originali sono stati importati all'interno di un DB PostgreSQL con estensioni PostGIS e collegati fra loro con l'impiego di funzioni spaziali e relazioni di natura semantica, per consentirne la consultazione in linguaggio naturale. Per visualizzare i dati geografici su web è stata integrata una web-application GIS, sviluppata con MapServer in tecnologia JSP e pienamente compatibile con PostGIS. Un risultato importante della scelta di tecnologie standard, come le estensioni OpenGIS spaziali di PostgreSQL, è la piena portabilità verso altri sistemi DBMS spaziali},
  URL             = {https://geomatica.icar.cnr.it/grass_meeting/articoli/bc_grass2007_full.pdf},
}
@INPROCEEDINGS{CARPI_2007_INPROCEEDINGS_CS_65048,
AUTHOR = {Carpi, E. and Saba, A.},
TITLE = {El Corpus del Léxico Náutico del Siglo de Oro},
YEAR = {2007},
ABSTRACT = {El desarrollo de la tecnología informática ha revolucionado la investigación y la práctica lexicográfica de estas últimas décadas. Debido a la difusión de instrumentos cada vez más sofisticados para el tratamiento automático de los materiales lingüísticos, se han abierto para los investigadores perspectivas cada vez más interesantes. Con la difusión de las computadoras personales, y aunque al principio el proceso de informatización en el campo humanístico ha sido más lento que en otros, los lingüistas utilizan cada vez más los nuevos medios electrónicos; por esta razón, sobrevino la exigencia de estudiar nuevos programas de fácil acceso y uso que fuesen manejables por la mayoría de los usuarios, incluso los menos informatizados. Por lo tanto, en el Instituto de Lingüística Computacional del CNR de Pisa se ha realizado un sistema de análisis de textos automático, AyDA, y otros instrumentos para su consulta interactiva (COR) y la producción de índices de frecuencia de los lemas y de las formas de cada texto y de un corpus completo (CLE). Estos programas han permitido llevar a cabo un proyecto para la constitución de un corpus de textos náuticos españoles del Siglo de Oro, cuyo objetivo es la producción de un diccionario del léxico de la navegación, denominado LÉNESO},
KEYWORDS = {linguaggio scientifico e tecnico, strumenti informatici, lessicografia},
PAGES = {61--73},
URL = {http://www.edizioniets.com},
VOLUME = {27},
PUBLISHER = {Edizioni ETS (Pisa, ITA)},
ISBN = {9788846712264},
CONFERENCE_NAME = {GIORNATE DI STUDIO DI LESSICOGRAFIA ROMANZA Il linguaggio scientifico e tecnico (medico, botanico, farmaceutico e nautico) fra Medioevo e Rinascimento},
CONFERENCE_PLACE = {Pisa},
BOOKTITLE = {Giornate di Studio di Lessicografia romanza: Il linguaggio scientifico e tecnico fra Medioevo e Rinascimento},
EDITOR = {Corradini, M. S. and Periñán, B.},
}
@INPROCEEDINGS{CASELLI_2007_INPROCEEDINGS_CPRC_65049,
  AUTHOR          = {Caselli, T. and Prodanof, I. and Ruimy, N. and Calzolari, N.},
  TITLE           = {Mapping SIMPLE and TimeML: improving event identification and classification using a semantic lexicon},
  YEAR            = {2007},
  CONFERENCE_NAME = {GL2007: Fourth International Workshop on Generative Approaches to the Lexicon},
  URL             = {https://iris.cnr.it/handle/20.500.14243/65049},
}
@INPROCEEDINGS{CASELLI_2007_INPROCEEDINGS_CQ_65051,
AUTHOR = {Caselli, T. and Quochi, V.},
TITLE = {Inferring the semantics of temporal prepositions in Italian},
YEAR = {2007},
KEYWORDS = {Italian, prepositions, computational linguistics},
PAGES = {38--44},
URL = {http://www.aclweb.org/anthology/W07-1606},
PUBLISHER = {Association for Computational Linguistics (Stroudsburg, USA)},
CONFERENCE_NAME = {Fourth ACL-SIGSEM Workshop on Prepositions},
CONFERENCE_PLACE = {Stroudsburg},
BOOKTITLE = {Proceedings of the Fourth ACL-SIGSEM Workshop on Prepositions},
EDITOR = {Costello, F. and Kelleher, J. and Volk, M.},
}
@INPROCEEDINGS{CIGNONI_2007_INPROCEEDINGS_CR_65052,
  AUTHOR          = {Cignoni, L. and Ruffolo, P.},
  TITLE           = {Verso un dizionario filologico multilingue contestualizzato},
  YEAR            = {2007},
  CONFERENCE_NAME = {XXV CILPR Congrès International de Linguistique et de Philologie Romanes},
  URL             = {https://iris.cnr.it/handle/20.500.14243/65052},
}
@INPROCEEDINGS{CUTUGNO_2007_INPROCEEDINGS_CMMM_155325,
AUTHOR = {Cutugno, P. and Marconi, L. and Morgavi, G. and Morando, M.},
TITLE = {CoLFIS: sistemas de interrogación online},
YEAR = {2007},
ABSTRACT = {CoLFIS: sistemas de interrogación online. CoLFIS es una base de datos de la lengua italiana escrita de 3.798.275 palabras, formada de textos escritos de varios generes pesados oportunamente y selecionados en tres distintos sectores: diarios, periodicos y libros. El producto realizado representa el italiano leido mas bien que toda la lengua italiana escrita. Esta eleccion se justifica en cuanto se deseaba construir un corpus, y en consecuencia un lexico de frecuencia, que se acercara los mas posible al lexico mental de un hablante de media cultura y no a un diccionario de la lengua italiana. Los diarios con 1.836.119 palabras se han extraido de los tres diarios mas importantes y leidos en Italia: Il Corriere Della Sera, Repubblica, La Stampa. En cada diario se han elegidos textos de 9 diferentes subsectores: economia, cronica local, cronica mundana, cronica negra, politica exterior, politica interior, ciencia, espectaculo y deporte. El sector de los periodicos es constituido por 1.306.653 palabras elejdas entre 12 differentes subsectores: arte-ciencia-tecnica, auto-nautica, ninos-muchachos, casa-hobby, femenino, fotonovelas, informacion general, cronica mundana, radio-television, deporte, viajes-ecologia y otro. El sector de los libros es constituido por 655.503 palabras elejdas entre 13 generos literarios: arte, ninos, ficcion, gialli espionaje, hobby y viajes, narrativa clasica, narrativa moderna, rosa, ensaystica, ciencias naturales y exactas, ciencias sociales y humanas, teatro y poesia. El corpus CoLFIS ha sido sometido a una lematizacion completa y se han desarrollado paquetes software de analisis estadistico para producir los lexicos de frecuencia relativos al corpus total y a los distintos sectores para cada lema y formas relativas. 
En este trabajo seran explicados los metodos de interogacion realizados para ayudar el usuario que quiere acercarse al corpus, puesto a disposicion en internet, y obtener informaciones del corpus, del corpus con lematizacion, de los lexicos de frecuencia. Ademas se ensenarà un estudio sobre los adverbios derivados, es decir los adverbios que terminan en -mente, como ejemplo de posibles investigaciones permitidas del material linguistico y del sistema de interogacion a disposicion. Se presenteran los porcentajes de las distintas tipologias adverbiales y se analizara la posicion del adverbio en la oracion buscando evaluar sus posibilidades combinatorias},
KEYWORDS = {Corpora, Lessico, Italiano},
PAGES = {505--510},
URL = {http://www.santiago.cu/hosting/linguistica/descargar.php?d=425},
PUBLISHER = {Centro de linguística aplicada, Ministerio de ciencia, tecnología y medio ambiente (Santiago de Cuba, CUB)},
ISBN = {959-7174-08-1},
CONFERENCE_NAME = {X Simposio Internacional Comunicacion Social},
CONFERENCE_PLACE = {Santiago de Cuba},
BOOKTITLE = {Actas-I X Simposio Internacional Comunicación Social},
EDITOR = {Miyares, L. R. and Alvarado, A. M. and Moreno, C. A.},
}
@INPROCEEDINGS{DELLORLETTA_2007_INPROCEEDINGS_DFLMP_65073,
  AUTHOR          = {Dell'Orletta, F. and Federico, M. and Lenci, A. and Montemagni, S. and Pirrelli, V.},
  TITLE           = {Maximum Entropy for Italian PoS Tagging},
  YEAR            = {2007},
  CONFERENCE_NAME = {Evaluation of NLP Tools for Italian-EVALITA 2007},
  URL             = {https://iris.cnr.it/handle/20.500.14243/65073},
}
@INPROCEEDINGS{DELLORLETTA_2007_INPROCEEDINGS_DLMMP_65065,
AUTHOR = {Dell'Orletta, F. and Lenci, A. and Marchi, S. and Montemagni, S. and Pirrelli, V.},
TITLE = {Text-2-Knowledge: una piattaforma linguistico-computazionale per l'estrazione di conoscenza da testi},
YEAR = {2007},
URL = {https://iris.cnr.it/handle/20.500.14243/65065},
CONFERENCE_NAME = {XL Congresso Internazionale di Studi della Società di Linguistica Italiana (SLI 2006)},
}
@INPROCEEDINGS{FRANCOPOULO_2007_INPROCEEDINGS_FBGCMPS_65053,
AUTHOR = {Francopoulo, G. and Bel, N. and George, M. and Calzolari, N. and Monachini, M. and Pet, M. and Soria, C.},
TITLE = {Lexical Markup Framework: an ISO Standard for Semantic Information in NLP Lexicons},
YEAR = {2007},
ABSTRACT = {Lexical Markup Framework (LMF) is a model that provides a common standardized framework for Natural Language Processing (NLP) lexicons. The goals of LMF are to provide a common model for the creation and use of such lexical resources to manage the exchange of data between and among these resources, and to enable the merging of a large number of individual resources to form extensive global electronic resources},
URL = {https://iris.cnr.it/handle/20.500.14243/65053},
ISBN = {978-3-8233-6314-9},
CONFERENCE_NAME = {GLDV2007-Lexical-Semantic and Ontological Resources of the GLDV Working Group on Lexicography at the Biennial Spring Conference},
}
@INPROCEEDINGS{GIOVANNETTI_2007_INPROCEEDINGS_GMMB_65068,
AUTHOR = {Giovannetti, E. and Marchi, S. and Montemagni, S. and Bartolini, R.},
TITLE = {Ontology-based Semantic Annotation of Product Catalogues},
YEAR = {2007},
ABSTRACT = {This paper describes a methodology for the semantic annotation of product catalogues. We propose a hybrid approach, combining pattern matching techniques to exploit the regular structure of product descriptions in catalogues, and Natural Language Processing techniques which are resorted to analyze natural language descriptions. It also includes the access to an application ontology, semi-automatically bootstrapped from collections of catalogues with an ontology learning tool, which is used to drive the semantic annotation process},
KEYWORDS = {Semantic Annotation of texts, Ontology Learning, Information Extraction for e-commerce},
PAGES = {235--239},
URL = {https://iris.cnr.it/handle/20.500.14243/65068},
CONFERENCE_NAME = {Recent Advances in Natural Language Processing (RANLP-2007)},
BOOKTITLE = {Proceedings of the International Conference "Recent Advances in Natural Language Processing"},
}
@INPROCEEDINGS{LENCI_2007_INPROCEEDINGS_LMPV_65070,
AUTHOR = {Lenci, A. and Montemagni, S. and Pirrelli, V. and Venturi, G.},
TITLE = {NLP-based ontology learning from legal texts. A case study},
YEAR = {2007},
ABSTRACT = {The paper reports on the methodology and preliminary results of a case study in automatically extracting ontological knowledge from Italian legislative texts in the environmental domain. We use a fully-implemented ontology learning system (T2K) that includes a battery of tools for Natural Language Processing (NLP), statistical text analysis and machine language learning. Tools are dynamically integrated to provide an incremental representation of the content of vast repositories of unstructured documents. Evaluated results, however preliminary, are very encouraging, showing the great potential of NLP-powered incremental systems like T2K for accurate large-scale semi-automatic extraction of legal ontologies},
PAGES = {113--129},
URL = {https://iris.cnr.it/handle/20.500.14243/65070},
CONFERENCE_NAME = {II Workshop on Legal Ontologies and Artificial Intelligence Techniques (LOAIT'07)},
}
@INPROCEEDINGS{MARINELLI_2007_INPROCEEDINGS_MB_65054,
  AUTHOR          = {Marinelli, R. and Bindi, R.},
  TITLE           = {Creativity and Fixation Processes in Proper Names Sense Extensions},
  YEAR            = {2007},
  CONFERENCE_NAME = {XXIX International Conference of Functional Linguistics},
  URL             = {https://iris.cnr.it/handle/20.500.14243/65054},
}
@INPROCEEDINGS{MARINELLI_2007_INPROCEEDINGS_MS_65055,
AUTHOR = {Marinelli, R. and Spadoni, G.},
TITLE = {Modeling a Maritime Domain Ontology},
YEAR = {2007},
ABSTRACT = {The users' demand has determined the need to manage the growing new technical maritime terminology which includes very different domains such as the juridical or commercial ones. A terminological database was built by exploiting the computational tools of ItalWordNet (IWN) and its lexical-semantic model EuroWordNet. This paper concerns the development of database structure and data coding, relevance of the concepts of 'term' and 'domain', information potential of the terms, complexity of this domain and detailed ontology structuring recently undertaken and still in progress. Our domain structure is described defining a core set of terms representing the two main sub-domains specified in 'technical-nautical' and 'maritime transport' terminology. These terms are sufficiently general to be the root nodes of the core ontology we are developing. They are mostly domain-dependent, but the link with the Top Ontology of IWN remains, endorsing either general and 'foundation' information, or detailed description directly connected with the specific domain. This structure seems to be the most appropriate to characterize the main conceptual schemas that people of the technical-nautical or maritime transport "world" actually use, namely activity plans, navigation management, etc. Also a set of acronyms has been codified to represent their ever increasing use in maritime terminology. Through the semantic relations linking the synsets, every term 'inherits' the IWN Top Ontology definitions and becomes itself an integral part of the structure. While codifying a term in the maritime database, the reference is at the same time allowed to the Base Concepts of the terminological ontology embedding the term in the semantic network, showing that upper and core ontologies make it possible for the framework to integrate different views on the same domain in a meaningful way},
KEYWORDS = {terminology, lexical databases, ontology, computational resources},
PAGES = {511--515},
URL = {http://www.santiago.cu/hosting/linguistica/detalles.php?id=en&d=316},
PUBLISHER = {Centre for applied linguistics (Santiago de Cuba, CUB)},
ISBN = {959-7174-08-1},
CONFERENCE_NAME = {Tenth International Symposium on Social Communication. Santiago de Cuba January 22-26, 2007},
CONFERENCE_PLACE = {Santiago de Cuba},
BOOKTITLE = {Proceedings of the Tenth International Symposium on Social Communication. Santiago de Cuba, 2007},
EDITOR = {Miyares, L. and Miyares, E. B.},
}
@INPROCEEDINGS{MONACHINI_2007_INPROCEEDINGS_MQRC_65056,
AUTHOR = {Monachini, M. and Quochi, V. and Ruimy, N. and Calzolari, N.},
TITLE = {Lexical Relations and Domain Knowledge: The BioLexicon Meets the Qualia Structure},
YEAR = {2007},
URL = {https://iris.cnr.it/handle/20.500.14243/65056},
CONFERENCE_NAME = {GL2007: Fourth International Workshop on Generative Approaches to the Lexicon},
EDITOR = {Bouillon, P. and Danlos, L. and Kanzaki, K.},
}
@INPROCEEDINGS{MONTEMAGNI_2007_INPROCEEDINGS_M_65072,
  AUTHOR          = {Montemagni, S.},
  TITLE           = {Acquisizione automatica di termini da testi: primi esperimenti di estrazione e strutturazione di terminologia metalinguistica},
  YEAR            = {2007},
  CONFERENCE_NAME = {DLM su Lessicologia e metalinguaggio},
  URL             = {https://iris.cnr.it/handle/20.500.14243/65072},
}
@INPROCEEDINGS{MONTEMAGNI_2007_INPROCEEDINGS_M_65069,
  AUTHOR          = {Montemagni, S.},
  TITLE           = {Patterns of phonetic variation in Tuscany: using dialectometric techniques on multi-level representations of dialectal data},
  YEAR            = {2007},
  CONFERENCE_NAME = {International Workshop on Computational Phonology},
  URL             = {https://iris.cnr.it/handle/20.500.14243/65069},
}
@INPROCEEDINGS{MONTEMAGNI_2007_INPROCEEDINGS_M_65071,
AUTHOR = {Montemagni, S.},
TITLE = {Aree fonetiche e lessicali toscane a confronto: prime elaborazioni computazionali dei dati dell'Atlante Lessicale Toscano},
YEAR = {2007},
URL = {https://iris.cnr.it/handle/20.500.14243/65071},
CONFERENCE_NAME = {XL Congresso Internazionale di Studi della Società di Linguistica Italiana},
}
@INPROCEEDINGS{MORGAVI_2007_INPROCEEDINGS_MMMC_150322,
AUTHOR = {Morgavi, G. and Morando, M. and Marconi, L. and Cutugno, P.},
TITLE = {Instruments for evaluating communication processes},
YEAR = {2007},
ABSTRACT = {When humans want to use language to communicate orally with each other, they are faced with a sort of coordination problem: no one monopolizes the floor but the participants take turns to speak. This important concept in linguistic interaction is called "turn-taking". Recent studies showed that turn taking depends on whether speakers have a specific task and role. Often the turn taking is guided by a set of rules that speakers in a conversation adhere to. In the Psychological interviews, i.e., speakers have a non-symmetric role in the conversation; one speaker is supposed to provide information about a certain task, while the other speaker should carefully listen to the interviewee, giving a set of accepting feedbacks. Usually, we evaluate this whole communication process focusing our attention on semantic meanings of pronounced words, but actually this analysis cannot be automatically performed. In this paper we propose the extraction of some information on the evolution of the interview process through simple turn taking quantitative measurements. Over 1000 research interviews made from students during their psychology university course have been analyzed. Each whole interview process has been considered as a complex system evolving in the time. Our approach founds on analogies between interviews and mathematical chaotic processes. The proposed procedure allows the extraction of information on the conversation evolution: phase portraits with anomalous paths indicate situations where the communication has been troubled from external references. Some parameters showing very good indication on the process evolution are proposed},
KEYWORDS = {turn taking, chaotic modeling, linguistic interaction},
PAGES = {485--489},
URL = {http://www.santiago.cu/hosting/linguistica/descargar.php?d=415},
PUBLISHER = {Centro de linguística aplicada, Ministerio de ciencia, tecnología y medio ambiente (Santiago de Cuba, CUB)},
ISBN = {959-7174-08-1},
CONFERENCE_NAME = {X Simposio Internacional Comunicacion Social},
CONFERENCE_PLACE = {Santiago de Cuba},
BOOKTITLE = {Actas-I X Simposio Internacional Comunicación Social},
EDITOR = {Miyares, L. R. and Alvarado, A. M. and Moreno, C. A.},
}
@INPROCEEDINGS{PARDELLI_2007_INPROCEEDINGS_PSG_65057,
AUTHOR = {Pardelli, G. and Sassi, M. and Goggi, S.},
TITLE = {A survey on Human Language Technology Terminology},
YEAR = {2007},
ABSTRACT = {This article originates from the revision of a 1969 unpublished article by Professor Antonio Zampolli carried out by Gabriella Pardelli and Manuela Sassi, two of his collaborators at the Institute of Computational Linguistics in Pisa. It is a technical report titled "Due Conversazioni sul Panorama Attuale della Linguistica Computazionale", drawn up by Zampolli on the occasion of two lectures at the Istituto di Matematica Ulisse Dini of Florence in June 1969. A synthesis of the introductory part—mainly based on some classifications for the various areas of Computational Linguistics—is reported here because the most interesting from the point of view of the relationship between automatic processing of linguistic data and other sciences. The rich bibliographic part has been extracted as well from the report and used for a terminological statistical analysis. Some sections, for example those on the International Conference on Computational Linguistics of 1969 and on the "Sezione Linguistica" of CNUCE in Pisa, have not—or only partly—been taken into account because already published by Zampolli in other books and journals (and not because considered less important). The whole revised technical report will soon be published in the "Quaderni di Linguistica Computazionale" edited by the Istituto di Linguistica Computazionale. The paper is divided in three parts: the first section is a terminological overview on the use of terms such like Computational Linguistics, Applied Linguistics and Mathematical Linguistics; the second has a statistical approach and shows the graphical representation of terms extracted from bibliographies and used in the 1960s; lastly, the conclusions. This contribution is a "historical" document which places itself at the beginning of a field which afterwards knew an exceptional development and it highlights both the continuity and the change which brought to the present Human Language Technology},
KEYWORDS = {Human Language Technology, Terminology},
PAGES = {364--368},
URL = {https://iris.cnr.it/handle/20.500.14243/65057},
PUBLISHER = {Wydawnictwo Poznanskie Sp. z o.o. (Poznan, POL)},
ISBN = {978-90-77484-17-3},
CONFERENCE_NAME = {3rd Language \& Technology Conference},
CONFERENCE_PLACE = {Poznan},
BOOKTITLE = {Human Language Technologies as a Challenge for Computer Science and Linguistics},
EDITOR = {Vetulani, Z.},
}
@INPROCEEDINGS{PIOGGIA_2007_INPROCEEDINGS_PFZCD_234919,
AUTHOR = {Pioggia, G. and Ferro, M. and Zupone, G. and Chirulli, L. and De Rossi, D.},
TITLE = {Development of a sensing seat for human authentication},
YEAR = {2007},
ABSTRACT = {In this work the development of a sensing seat for human authentication is reported. Such a system can be used in all the critical scenarios where a seat is available to the human subject. In order to face the authentication task, the sensing seat was developed by means of a novel unobtrusive sensing technology. This is mainly due to two aspects: the unavailability of an existing sensing seat system for human authentication and the inadequacy of the existing sensor technology in order to address the human subject recognition as well as the integration of the sensors in the seat. Thanks to the development of a redundant sensor network, we adopted a hierarchical architecture. Three cooperating classifiers (a distance-based classifier, a KSOM and a MLP) shares the input data and supplying three different classification results. A final classifier (a weighted averager) performs the fusion of the results and supplies the final response},
PAGES = {481--485},
URL = {https://iris.cnr.it/handle/20.500.14243/234919},
DOI = {10.1049/cp:20070412},
ISSN = {0537-9989},
ISBN = {978-0-86341-853-2},
CONFERENCE_NAME = {Intelligent Environments, 2007. IE 07. 3rd IET International Conference on},
BOOKTITLE = {IEE CONFERENCE PUBLICATION},
}
@INPROCEEDINGS{PIOGGIA_2007_INPROCEEDINGS_PSFIMAD_234889,
AUTHOR = {Pioggia, G. and Sica, M. and Ferro, M. and Igliozzi, R. and Muratori, F. and Ahluwalia, A. and De Rossi, D.},
TITLE = {Human-Robot Interaction in Autism: FACE, an Android-based Social Therapy},
YEAR = {2007},
ABSTRACT = {In human-machine social interaction, the intersection between biology and engineering needs a context which allows for the development of adapting dynamics. The android FACE is able to interact with the external environment, interpreting and conveying emotions through non verbal communication. FACE captures expressive and psychophysical correlates from its interlocutor and actuates behaviours following two communicative modalities of semeiology. FACE interacts with kinesics, non verbal communication conveyed by body part movements, or facial expressions, and so on, taking into account the proxemic space. FACE's goal is to define and test a therapeutic protocol for autism in order to enhance social and emotive abilities in people with autism. Data regarding our latest clinical study are reported. The clinical study was aimed at verifying FACE's capabilities in enhancing imitative skills and shared attention in subjects with autism. In particular, we monitored their attention towards FACE and then we checked if the android remains a restricted and repetitive interest or an object to share with the therapist. The study involved an experimental group, composed of 4 children with autism. The participants were diagnosed using ADI-R and ADOS-G, two specific diagnostic instruments. The experimental set up consisted of a specially equipped room provided with two remotely orientable cameras in which the subject, under the supervision of a therapist, can interact with FACE. During twenty minutes sessions, we observed both spontaneous behavior of the participants and their reactions to therapists presses in correlation with the time course of the physiological and behavioural data. The participants showed a spontaneous ability of imitation of the head and facial movements of the android. Moreover we observed that the children with autism focused their attention towards FACE's eye movements following verbal suggestions from the therapist},
PAGES = {605-612},
URL = {https://iris.cnr.it/handle/20.500.14243/234889},
DOI = {10.1109/ROMAN.2007.4415156},
ISBN = {978-1-4244-1634-9},
CONFERENCE_NAME = {Robot and Human interactive Communication, 2007. RO-MAN 2007. The 16th IEEE International Symposium on},
}
@INPROCEEDINGS{PIRRELLI_2007_INPROCEEDINGS_P_65066,
AUTHOR = {Pirrelli, V.},
TITLE = {On the cognitive autonomy of morphological processing},
YEAR = {2007},
ABSTRACT = {La connaissance morphologique définit-elle un domaine linguistique autonome dans la grammaire ou est-ce plutôt le sous-produit de principes et représentations basés sur la syntaxe ? Nous traitons la question en prenant en considération un grand ensemble de preuves linguistiques et cognitives, en nous fondant sur la manière dont les locuteurs apprennent, structurent, ont accès et utilisent leur lexique mental pour analyser et produire des mots. Conformément à l'idée que l'observation empirique de productions linguistiques concrètes peut donner des indications sur des domaines spécifiques à l'intérieur de la grammaire, nous concluons qu'il est difficile de concilier les preuves linguistiques fondées sur l'usage avec une approche qui consisterait à voir la morphologie comme la syntaxe des morphèmes. Cependant, il serait également erroné et inutile du point de vue logique de caractériser l'autonomie fonctionnelle de la morphologie par rapport à la syntaxe en termes de modularité de procès},
KEYWORDS = {Theoretical Morphology, Mental Lexicon, Language Learning, Self-Organizing Maps},
PAGES = {245-269},
URL = {https://iris.cnr.it/handle/20.500.14243/65066},
PUBLISHER = {LINCOM academic publishers (LINCOM GmbH) (München, DEU)},
ISBN = {9783895865046},
CONFERENCE_NAME = {Actes du colloque international de Morphologie 4èmes Décembrettes},
CONFERENCE_PLACE = {München},
BOOKTITLE = {Morphologie à Toulouse},
EDITOR = {Hathout, N. and Montermini, F.},
}
@INPROCEEDINGS{PIRRELLI_2007_INPROCEEDINGS_PH_65067,
AUTHOR = {Pirrelli, V. and Herreros, I.},
TITLE = {Learning Inflection by Itself},
YEAR = {2007},
ABSTRACT = {The paper reports on a few experimental results of a computer simulation of learning the verb morphology of Italian, English and Arabic with the same type of neural architecture based on Kohonen's self-organizing maps. Issues of the mental organization of the resulting morphological lexica are explored in some detail and discussed in the light of the differential distribution of regular and irregular inflections in the three languages. It is shown that typologically diverse, non trivial aspects of the underlying paradigmatic structure of the three verb systems effectively emerge through sheer exposure to realistic distributions of verb forms devoid of morpho-syntactic content. We argue that these results go a long way towards explaining how global organization effects in the mental morphological lexicon may eventually result from local word processing steps},
KEYWORDS = {Theoretical Morphology, Mental Lexicon, Language Learning, Self-Organizing Maps},
PAGES = {269-290},
URL = {http://mmm.lingue.unibo.it/},
ISSN = {1826-7491},
CONFERENCE_NAME = {V Mediterranean Morphology Meeting},
BOOKTITLE = {ONLINE PROCEEDINGS OF THE MEDITERRANEAN MORPHOLOGY MEETINGS},
EDITOR = {Booij, G. and Ducceschi, L. and Fradin, B. and Guevara, E. and Ralli, A. and Scalise, S.},
}
@INPROCEEDINGS{QUOCHI_2007_INPROCEEDINGS_QDSMC_65109,
AUTHOR = {Quochi, V. and Del Gratta, R. and Sassolini, E. and Monachini, M. and Calzolari, N.},
TITLE = {Toward a Standard Lexical Resource in the Bio Domain},
YEAR = {2007},
ABSTRACT = {The present paper describes a large-scale lexical resource for the biology domain designed both for human and for machine use. This lexicon aims at semantic interoperability and extendability, through the adoption of ISO-LMF standard for lexical representation and through a granular and distributed encoding of relevant information. The first part of this contribution focuses on three aspects of the model that are of particular interest to the biology community: the treatment of term variants, the representation of bio events and the alignment with a domain ontology. The second part of the paper describes the physical implementation of the model: a relational database equipped with a set of automatic uploading procedures. Peculiarity of the BioLexicon is that it combines features of both terminologies and lexicons. A set of verbs relevant for the domain is also represented with full details on their syntactic and semantic argument structure},
KEYWORDS = {Lexical representation model, Lexical Database, Computational Lexicography, Special Domains, Standards},
PAGES = {295-299},
PUBLISHER = {Fundacja Uniwersytetu im A. Mickiewicza (Poznan, POL)},
ISBN = {978-83-7177-413-3},
CONFERENCE_NAME = {LTC07-3rd Language and Technology Conference: Human Language Technology. Challenges of the Information Society},
CONFERENCE_PLACE = {Poznan},
}
@INPROCEEDINGS{ROVENTINI_2007_INPROCEEDINGS_RRMUM_65058,
AUTHOR = {Roventini, A. and Ruimy, N. and Marinelli, R. and Ulivieri, M. and Mammini, M.},
TITLE = {Mapping Concrete Entities from PAROLE-SIMPLE-CLIPS to ItalWordNet: Methodology and Results},
YEAR = {2007},
URL = {https://iris.cnr.it/handle/20.500.14243/65058},
CONFERENCE_NAME = {45th Annual Meeting of the Association for Computational Linguistics},
}
@INPROCEEDINGS{RUIMY_2007_INPROCEEDINGS_R_65059,
AUTHOR = {Ruimy, N.},
TITLE = {Enhancing SIMPLE Semantic Relations: A Proposal},
YEAR = {2007},
ABSTRACT = {Semantic relations play a prominent role and have considerable expressive power in the SIMPLE model. Yet, some conceptual links are still too vaguely expressed or not even captured through lack of appropriate representational vocabulary. In this paper, the relations that were added to the Extended Qualia Structure in the framework of the CLIPS project are first illustrated. Then, a proposal is made to further enrich the relation network by borrowing from the EuroWordNet model some conceptual links holding between events and their participants and among co-participants in events, with a view to enhancing the understanding of the relationships among word senses in a sentence},
URL = {https://iris.cnr.it/handle/20.500.14243/65059},
PUBLISHER = {Wydawnictwo Poznanskie Sp. z o. o (Poznan, POL)},
ISBN = {978-83-7177-413-3},
CONFERENCE_NAME = {3rd Language \& Technology Conference},
CONFERENCE_PLACE = {Poznan},
BOOKTITLE = {Proceedings of 3rd Language \& Technology Conference},
EDITOR = {Vetulani, Z.},
}
@INPROCEEDINGS{SGAMBELLURI_2007_INPROCEEDINGS_SVFPSDB_234906,
AUTHOR = {Sgambelluri, N. and Valenza, G. and Ferro, M. and Pioggia, G. and Scilingo, E. and De Rossi, D. and Bicchi, A.},
TITLE = {An Artificial Neural Network approach for Haptic Discrimination in Minimally Invasive Surgery},
YEAR = {2007},
ABSTRACT = {In this paper we investigate the possibility of processing the tactile perception by using a novel biomimetic approach for the pattern recognition module. The goal is to enhance the perception in complex virtual environments deriving from haptic displays mimicking human tactile discrimination. To do this we explored a Minimally Invasive Surgery application where the tactile information is strictly limited. In fact, this promising technique suffers from some evident limitations due to the surgeon's loss of tactile perception during palpation of internal organs. This is basically due to the mechanical transmission of the elongated tools used during operation. We propose to integrate an Artificial Neural Network in an electronic board capable of processing data provided by a sensorized laparoscopic tool. The capabilities of several pattern recognition techniques present in literature, the Principal Component Analysis (PCA), a Multilayer Perceptron (MLP) and a Kohonen Self-Organising Map (KSOM) are investigated. The results are compared with those obtained psychophysically on five viscoelastic materials},
URL = {https://iris.cnr.it/handle/20.500.14243/234906},
DOI = {10.1109/ROMAN.2007.4415048},
ISBN = {978-1-4244-1634-9},
}
@INPROCEEDINGS{SORIA_2007_INPROCEEDINGS_SBLMP_65060,
AUTHOR = {Soria, C. and Bartolini, R. and Lenci, A. and Montemagni, S. and Pirrelli, V.},
TITLE = {Automatic Extraction of Semantics in Law Documents},
YEAR = {2007},
URL = {https://iris.cnr.it/handle/20.500.14243/65060},
CONFERENCE_NAME = {V Legislative XML Workshop},
}
@INPROCEEDINGS{TORAL_2007_INPROCEEDINGS_TM_65062,
AUTHOR = {Toral, A. and Monachini, M.},
TITLE = {Formalising and bottom-up enriching the ontology of a Generative Lexicon},
YEAR = {2007},
ABSTRACT = {This paper presents on-going research to formalise the ontology of a computational lexicon in OWL (W3C standard) as well as to enrich it by applying a bottom-up approach that extracts semantic information from the lexicon. The resource used follows the Generative Lexicon (GL) theory and therefore (1) puts a challenge to ontology design as its semantic types are multidimensional and (2) enables the acquisition of further knowledge on concepts from semantic units. The formalisation allows the ontology to be processed by Description Logics reasoners as well as to be employed in Semantic Web applications. Moreover, the lexicon-driven enrichment increases the semantic information present in the ontology making it appropriate for ontology-driven Natural Language Processing. Finally, the paper studies the application of these procedures to a subsequent GL-based biological resource},
KEYWORDS = {Ontologies, Generative Lexicon, Qualia Structure, Semantic Web},
PAGES = {599-603},
URL = {https://iris.cnr.it/handle/20.500.14243/65062},
PUBLISHER = {INCOMA Ltd (Shoumen, BGR)},
ISBN = {978-954-91743-7-3},
CONFERENCE_NAME = {RANLP-2007-International Conference on Recent Advances in Natural Language Processing},
CONFERENCE_PLACE = {Shoumen},
EDITOR = {Angelova, G. and Bontcheva, K. and Mitkov, R. and Nicolov, N.},
}
@INPROCEEDINGS{TORAL_2007_INPROCEEDINGS_TM_65063,
AUTHOR = {Toral, A. and Monachini, M.},
TITLE = {SIMPLE-OWL: a Generative Lexicon Ontology for NLP and the Semantic Web},
YEAR = {2007},
ABSTRACT = {This research deals with the modelling of a Generative Lexicon based ontology to be used in the Semantic Web and Natural Language Processing semantic tasks. This ontology is imported from an existing computational Lexical Resource and is converted to the W3C standard Web Ontology Language. This presents some challenges, as for example the multidimensionality of the original ontology, which are covered in the current paper. The result of this research is an OWL compliant semantically rich and linguistically-based ontology, thus useful to the automatic processing of text within the Semantic Web paradigm},
KEYWORDS = {Owl, Ontologies, Generative Lexicon, Semantic Web},
URL = {https://iris.cnr.it/handle/20.500.14243/65063},
ISBN = {3-540-74781-8},
CONFERENCE_NAME = {10th Congress of Italian Association for Artificial Intelligence-Senso Comune Workshop},
}
@INPROCEEDINGS{TORAL_2007_INPROCEEDINGS_TMM_65064,
AUTHOR = {Toral, A. and Monachini, M. and Muñoz, R.},
TITLE = {Automatically converting and enriching a computational lexicon Ontology for NLP semantic tasks},
YEAR = {2007},
ABSTRACT = {This paper describes the automatic transformation of a Generative Lexicon (GL) based Ontology into OWL, the Semantic Web ontology language. Furthermore, the OWL ontology is automatically enriched by means of a bottom-up procedure that extracts additional semantic information (relationships, features, predicates and quantifier restrictions) from the lexicon. The contribution of this research is two-fold. On one hand, we introduce a methodology for the formalisation of GL ontologies. On the other, we have developed automatic procedures that bring out a formalised, reasoning-capable, and semantically rich ontology, thus suitable for Natural Language Processing semantic tasks},
PAGES = {216-220},
URL = {https://iris.cnr.it/handle/20.500.14243/65064},
PUBLISHER = {Fundacja Uniwersytetu im A. Mickiewicza (Poznan, POL)},
ISBN = {978-83-7177-413-3},
CONFERENCE_NAME = {LTC07-3rd Language \& Technology Conference: Human Language Technologies as a Challenge for Computer Science and Linguistics},
CONFERENCE_PLACE = {Poznan},
}
@INPROCEEDINGS{CALDERONE_2007_INPROCEEDINGS_CQ_225689,
AUTHOR = {Calderone, B. and Quochi, V.},
TITLE = {Emergent Cognitive Functions of the Noun Phrase},
YEAR = {2007},
KEYWORDS = {noun phrase, emergence of language},
URL = {https://iris.cnr.it/handle/20.500.14243/225689},
CONFERENCE_NAME = {SLE 2007 Annual Meeting},
BOOKTITLE = {SLE 2007 Annual Meeting Book of Abstracts},
}
@TECHREPORT{AITMOKHTAR_2007_TECHREPORT_ABBDGGMSS_195934,
AUTHOR = {Aitmokhtar, S. and Barker, E. and Brunelli, R. and Demetriou, G. and Gaizauskas, R. and Giovannetti, E. and Montemagni, S. and Sándor, A. and Sun, H.},
TITLE = {Semantic Annotation Services for Virtual Information and Knowledge Environments},
YEAR = {2007},
URL = {https://iris.cnr.it/handle/20.500.14243/195934},
}
@TECHREPORT{BOUQUET_2007_TECHREPORT_BSMGSNSBCJ_195935,
AUTHOR = {Bouquet, P. and Stoermer, H. and Montemagni, S. and Giovannetti, E. and Semeraro, G. and Niederee, C. and Stecher, R. and Brunelli, R. and Chanod, J. P. and Jacquin, T.},
TITLE = {Semantic Representation and Management Report},
YEAR = {2007},
URL = {https://iris.cnr.it/handle/20.500.14243/195935},
}
@TECHREPORT{CALZOLARI_2007_TECHREPORT_CMQSGB_195954,
AUTHOR = {Calzolari, N. and Monachini, M. and Quochi, V. and Soria, C. and Goggi, S. and Baroni, P.},
TITLE = {FLaReNet: Fostering Language Resources Network. Grant Agreement n° 617001, eContentPlus},
YEAR = {2007},
URL = {https://iris.cnr.it/handle/20.500.14243/195954},
}
@TECHREPORT{CININI_2007_TECHREPORT_CS_457841,
AUTHOR = {Cinini, A. and Sassi, M.},
TITLE = {Archivio del Digesto Latino-Italiano},
YEAR = {2007},
URL = {https://iris.cnr.it/handle/20.500.14243/457841},
}
@TECHREPORT{CININI_2007_TECHREPORT_CS_195944,
AUTHOR = {Cinini, A. and Sassi, M.},
TITLE = {L'Informazione sanitaria. Analisi di tre quotidiani a tiratura nazionale},
YEAR = {2007},
URL = {https://iris.cnr.it/handle/20.500.14243/195944},
}
@TECHREPORT{DELGRATTA_2007_TECHREPORT_DBCEMQS_195953,
AUTHOR = {Del Gratta, R. and Bartolini, R. and Caselli, T. and Enea, A. and Monachini, M. and Quochi, V. and Sassolini, E.},
TITLE = {TimeML: An Ontological Mapping onto the UIMA Type Systems},
YEAR = {2007},
URL = {https://iris.cnr.it/handle/20.500.14243/195953},
}
@TECHREPORT{DELGRATTA_2007_TECHREPORT_DMQSC_195940,
AUTHOR = {Del Gratta, R. and Monachini, M. and Quochi, V. and Sassolini, E. and Calzolari, N.},
TITLE = {Bio-Lexicon DataBase: Architecture, Concepts and Loading Software},
YEAR = {2007},
URL = {https://iris.cnr.it/handle/20.500.14243/195940},
}
@TECHREPORT{DELGRATTA_2007_TECHREPORT_DTQM_195952,
AUTHOR = {Del Gratta, R. and Toral, A. and Quochi, V. and Monachini, M.},
TITLE = {LocalBioLex: A database framework for biolinguistic research on integrated databases},
YEAR = {2007},
URL = {https://iris.cnr.it/handle/20.500.14243/195952},
}
@TECHREPORT{DELLORLETTA_2007_TECHREPORT_DFGLMTP_195933,
AUTHOR = {Dell'Orletta, F. and Federico, M. and Giovannetti, E. and Lenci, A. and Marchi, S. and Trabucco, A. and Pirrelli, V.},
TITLE = {Specifiche di Named Entity Recognition per l'Italiano},
YEAR = {2007},
URL = {https://iris.cnr.it/handle/20.500.14243/195933},
}
@TECHREPORT{DELLORLETTA_2007_TECHREPORT_DFGLMTP_457838,
AUTHOR = {Dell'Orletta, F. and Federico, M. and Giovannetti, E. and Lenci, A. and Marchi, S. and Trabucco, A. and Pirrelli, V.},
TITLE = {Segmentazione di un Testo Inglese in Token},
YEAR = {2007},
URL = {https://iris.cnr.it/handle/20.500.14243/457838},
}
@TECHREPORT{DELLORLETTA_2007_TECHREPORT_DFGLMTP_195932,
AUTHOR = {Dell'Orletta, F. and Federico, M. and Giovannetti, E. and Lenci, A. and Marchi, S. and Trabucco, A. and Pirrelli, V.},
TITLE = {Specifiche di Chunking per l'Italiano},
YEAR = {2007},
URL = {https://iris.cnr.it/handle/20.500.14243/195932},
}
@TECHREPORT{DELLORLETTA_2007_TECHREPORT_DFGLMTP_195931,
AUTHOR = {Dell'Orletta, F. and Federico, M. and Giovannetti, E. and Lenci, A. and Marchi, S. and Trabucco, A. and Pirrelli, V.},
TITLE = {Analisi Morfosintattica per l'Italiano},
YEAR = {2007},
URL = {https://iris.cnr.it/handle/20.500.14243/195931},
}
@TECHREPORT{DELLORLETTA_2007_TECHREPORT_DFGLMTP_457837,
AUTHOR = {Dell'Orletta, F. and Federico, M. and Giovannetti, E. and Lenci, A. and Marchi, S. and Trabucco, A. and Pirrelli, V.},
TITLE = {Language Recognition Tool, Specifiche di Implementazione},
YEAR = {2007},
URL = {https://iris.cnr.it/handle/20.500.14243/457837},
}
@TECHREPORT{DELLORLETTA_2007_TECHREPORT_DFGLMTP_195930,
AUTHOR = {Dell'Orletta, F. and Federico, M. and Giovannetti, E. and Lenci, A. and Marchi, S. and Trabucco, A. and Pirrelli, V.},
TITLE = {Segmentazione di un Testo Italiano in Token},
YEAR = {2007},
URL = {https://iris.cnr.it/handle/20.500.14243/195930},
}
@TECHREPORT{ENEA_2007_TECHREPORT_E_195929,
AUTHOR = {Enea, A.},
TITLE = {Servizi di rete per il congresso LREC 2006},
YEAR = {2007},
URL = {https://iris.cnr.it/handle/20.500.14243/195929},
}
@TECHREPORT{FRANCOPOULO_2007_TECHREPORT_FMC_195947,
AUTHOR = {Francopoulo, G. and Monachini, M. and Calzolari, N.},
TITLE = {Lexical Standards for ISO ballot},
YEAR = {2007},
URL = {https://iris.cnr.it/handle/20.500.14243/195947},
}
@TECHREPORT{FRANCOPOULO_2007_TECHREPORT_FMC_195946,
AUTHOR = {Francopoulo, G. and Monachini, M. and Calzolari, N.},
TITLE = {Lexical Markup Framework: an ISO Standard for Semantic Information in NLP Lexicons},
YEAR = {2007},
URL = {https://iris.cnr.it/handle/20.500.14243/195946},
}
@TECHREPORT{MONACHINI_2007_TECHREPORT_M_457842,
AUTHOR = {Monachini, M.},
TITLE = {Test-suites of ISO conformant lexical entries},
YEAR = {2007},
URL = {https://iris.cnr.it/handle/20.500.14243/457842},
}
@TECHREPORT{MONTEMAGNI_2007_TECHREPORT_MMVBBRPT_195951,
AUTHOR = {Montemagni, S. and Marchi, S. and Venturi, G. and Bartolini, R. and Bertagna, F. and Ruffolo, P. and Peters, W. and Tiscornia, D.},
TITLE = {Report on Ontology learning tool and testing},
YEAR = {2007},
ABSTRACT = {This deliverable documents the work done within the DALOS EU project for what concerns the definition and implementation of methodologies and techniques to bootstrap terminological and ontological knowledge from domain corpora. Starting from a corpus of legacy legislative texts in different languages, linguistic technologies combined with statistical techniques have been used to extract significant terms as well as to structure them in conceptual structures for the different languages dealt with within the project, namely Italian, English, Spanish and Dutch},
KEYWORDS = {Ontology Learning, Term Extraction, Natural Language Processing, Conceptual Indexing},
URL = {https://iris.cnr.it/handle/20.500.14243/195951},
}
@TECHREPORT{MONTEMAGNI_2007_TECHREPORT_MS_195936,
AUTHOR = {Montemagni, S. and Simi, M.},
TITLE = {The Italian dependency annotated corpus developed for the CoNLL-2007 Shared Task},
YEAR = {2007},
URL = {https://iris.cnr.it/handle/20.500.14243/195936},
}
@TECHREPORT{MONTEMAGNI_2007_TECHREPORT_MTV_195937,
AUTHOR = {Montemagni, S. and Trabucco, A. and Venturi, G.},
TITLE = {Bio-Event Linguistic Annotation Tool. User Manual},
YEAR = {2007},
URL = {https://iris.cnr.it/handle/20.500.14243/195937},
}
@TECHREPORT{MONTEMAGNI_2007_TECHREPORT_MTVTCAMKRP_457839,
AUTHOR = {Montemagni, S. and Trabucco, A. and Venturi, G. and Thompson, P. and Cotter, P. and Ananiadou, S. and McNaught, J. and Kim, J. and Rebholz, D. and Pezik, P.},
TITLE = {Event annotation of domain corpora},
YEAR = {2007},
URL = {https://iris.cnr.it/handle/20.500.14243/457839},
}
@TECHREPORT{PICCHI_2007_TECHREPORT_P_195939,
AUTHOR = {Picchi, E.},
TITLE = {Analisi di corpora di documenti: strumenti e risorse linguistiche verso un'integrazione con ontologie},
YEAR = {2007},
URL = {https://iris.cnr.it/handle/20.500.14243/195939},
}
@TECHREPORT{PICCHI_2007_TECHREPORT_PSC_195941,
AUTHOR = {Picchi, E. and Sassolini, E. and Cucurullo, S.},
TITLE = {Implementazione di procedure di Clustering},
YEAR = {2007},
URL = {https://iris.cnr.it/handle/20.500.14243/195941},
}
@TECHREPORT{PICCHI_2007_TECHREPORT_PSC_457840,
AUTHOR = {Picchi, E. and Sassolini, E. and Cucurullo, S.},
TITLE = {Implementazione di procedure per la Named Entity Recognition},
YEAR = {2007},
URL = {https://iris.cnr.it/handle/20.500.14243/457840},
}
@TECHREPORT{PICCHI_2007_TECHREPORT_PSC_195942,
AUTHOR = {Picchi, E. and Sassolini, E. and Cucurullo, S.},
TITLE = {Implementazione di procedure di Spidering per sistemi di Alerting},
YEAR = {2007},
URL = {https://iris.cnr.it/handle/20.500.14243/195942},
}
@TECHREPORT{ROMARY_2007_TECHREPORT_RFMDBWFG_195950,
AUTHOR = {Romary, L. and Francopoulo, G. and Monachini, M. and Declerck, T. and Bunt, H. and Wittenburg, P. and Funk, A. and Gillam, L.},
TITLE = {LIRICS-Final Public Report},
YEAR = {2007},
URL = {https://iris.cnr.it/handle/20.500.14243/195950},
}
@TECHREPORT{SABA_2007_TECHREPORT_S_457843,
AUTHOR = {Saba, A.},
TITLE = {Arte della verdadera Navegación de Pedro de Siria},
YEAR = {2007},
URL = {https://iris.cnr.it/handle/20.500.14243/457843},
}
@TECHREPORT{SASAKI_2007_TECHREPORT_SMAPMMP_195938,
AUTHOR = {Sasaki, Y. and McNaught, J. and Ananiadou, S. and Pezik, P. and McGillivray, B. and Montemagni, S. and Pirrelli, V.},
TITLE = {Augmented Version of Bio-Lexicon},
YEAR = {2007},
URL = {https://iris.cnr.it/handle/20.500.14243/195938},
}
@TECHREPORT{SASSI_2007_TECHREPORT_SC_195945,
AUTHOR = {Sassi, M. and Cinini, A.},
TITLE = {Content analysis dei provvedimenti della sezione disciplinare del C. S. M},
YEAR = {2007},
URL = {https://iris.cnr.it/handle/20.500.14243/195945},
}
@TECHREPORT{SORIA_2007_TECHREPORT_ST_195949,
AUTHOR = {Soria, C. and Thorleifsdottir, A. E.},
TITLE = {eParticipation: the potential of new and emerging technologies},
YEAR = {2007},
URL = {https://iris.cnr.it/handle/20.500.14243/195949},
}
@THESIS{QUOCHI_2007_THESIS_Q_479321,
AUTHOR = {Quochi, V.},
TITLE = {A Usage-Based Approach to Light Verb Constructions in Italian: Development and Use},
YEAR = {2007},
ABSTRACT = {Oggetto di studio della ricerca è la costruzione a verbo supporto con verbo fare in ottica cognitiva e di apprendimento della prima lingua. L’ambito teorico di lavoro prescelto è la Linguistica Cognitiva e in particolar modo la Construction Grammar. La tesi che ha guidato questa ricerca è la convinzione che la Costruzione a Verbo Supporto (o leggero) costituisca un modello sintattico-semantico con funzione etichettante e che tale modello sia sfruttato dai bambini per nominare eventi per i quali non possiedono ancora un’etichetta. La costruzione a verbo supporto inoltre viene considerata come una struttura prototipica, una categoria radiale i cui confini non sono delineabili in maniera netta. Il primo capitolo presenta gli studi più importanti sul fenomeno delle costruzioni a verbo supporto e il background teorico sul quale si fonda la ricerca. Nel secondo capitolo si descrivono tre studi empirici volti a verificare per l’Italiano l’ipotesi di realtà psicologica delle Costruzioni (quali oggetti simbolici, coppie di forma e significato). Il terzo e quarto capitolo costituiscono il cuore della ricerca e sono dedicati allo studio empirico dei costrutti con verbo fare in un corpus di Italiano parlato L1 derivato dal database CHILDES. Da una parte si è analizzata la lingua degli adulti per determinare le tipologie di costrutti rilevanti per il bambino e il ruolo della lingua di input nello sviluppo di questi costrutti nel bambino. Dall’altra si è studiato lo sviluppo dei costrutti fare Nome nella lingua del bambino per studiarne lo sviluppo e l’uso. I dati hanno confermato la tesi iniziale. Il bambino sfrutta lo schema della costruzione a verbo supporto per riferirsi ad azioni o eventi. Si sono individuate almeno due costruzioni per le quali il bambino mostra produttività. 
Il quinto, infine, è il capitolo conclusivo nel quale si dà una rappresentazione delle costruzioni identificate nel corpus nei termini di una famiglia di costruzioni al fine di mostrare come tale rappresentazione renda conto della vicinanza tra Costruzioni a Verbo Supporto e Costruzione Transitiva, e fornisca un buon modello esplicativo dei dati acquisizionali. Il capitolo si conclude con un riepilogo dei risultati ottenuti e un’indicazione degli sviluppi futuri},
URL = {https://iris.cnr.it/handle/20.500.14243/479321},
}
@MISC{_2007_MISC_S_17708,
AUTHOR = {Sassi, M. and Pardelli, G.},
TITLE = {Digital Bibliography of Professor Antonio Zampolli},
YEAR = {2007},
ABSTRACT = {Antonio Zampolli: Director of Research and Assistant to the Director of CAAL (Centre for the Automatic Linguistic Annotations), Gallarate and Pisa (1960-1966). Research (Senior Engineer) at the Pisa Scientific Centre of IBM, Responsible for Computational Linguistics (1967-1975). Full Professor of Computational Linguistics at the University of Pisa, and founder (1968) and Director of the Linguistic Division of CNUCE, transformed in 1978 into the Institute of Computational Linguistics [Istituto di Linguistica Computazionale-ILC] of the National Research Council [Consiglio Nazionale delle Ricerche-CNR], Pisa. His main research interests were computational lexicology and lexicography, computer-assisted language teaching, formal grammars and parsers, literary and linguistic text analysis, machine translation, multimodality, multilinguality, quantitative linguistics, reusability of lexical resources, standards for literary and linguistic data processing, text processing},
URL = {https://iris.cnr.it/handle/20.500.14243/17708},
}
@MISC{AIELLO_2007_MISC_APC_450,
AUTHOR = {Aiello, M. and Papaleo, G. and Chiarella, D.},
TITLE = {LMA-Log Mail Analyzer},
YEAR = {2007},
ABSTRACT = {Network and system administrator should monitor log files for maintaining control over services he/she offers to users. This is a difficult task since it is necessary to completely understand log file format; moreover information on a single transaction is often spread on different lines. Another problem commonly found is represented by data mining operation which should be performed to extract important data from the whole (noise). All above problems are found when dealing with mail servers: we analyzed postfix and sendmail log file and created a tool, log mail analyzer aka LMA, for comprehensive analysis. LMA parses mail-log files, extracts information on each transaction and dumps records using BerkeleyDB or a different DataBase Management System like Mysql. Various type of query, both on BerkeleyDB and sql language are supported: through these queries it is possible to adopt an anomaly based approach for intrusion detection purposes. In fact it is well known that viruses and worms propagate also using e-mails. Having a tool for clear understanding and monitoring smtp transaction may help in manager security tasks. LMA is written in Perl for portability reason and is available at http://sourceforge.net/projects/lma/},
URL = {https://iris.cnr.it/handle/20.500.14243/450},
}
@MISC{FRANCOPOULO_2007_MISC_FM_129317,
AUTHOR = {Francopoulo, G. and Monachini, M.},
TITLE = {Lexical Markup Framework},
YEAR = {2007},
URL = {https://iris.cnr.it/handle/20.500.14243/129317},
}
@MISC{GIOVANNETTI_2007_MISC_G_244998,
AUTHOR = {Giovannetti, E.},
TITLE = {Creating and exploiting ontologies for semantic annotation of text},
YEAR = {2007},
ABSTRACT = {An ontology is a description of conceptual knowledge organized in a computer based representation. Semantic annotation of text is the process of making semantic information (e.g. about entities and relations) formally explicit. Semantic annotation and ontologies are involved in two main and related tasks: an ontology can be used for semantic annotation, this latter requiring a formal representation of the domain of interest during the process of natural language understanding. On the contrary, texts can be useful sources of knowledge for populating and enhancing ontologies. These two tasks can be combined in a cyclic process: ontologies are used as the "world knowledge" for interpreting the text and assigning the correct meanings to linguistic structures, while semantic annotation provides new knowledge to be exploited for the enrichment and refinement of the ontology itself. This (apparent) vicious circle (between the need of having the domain represented in the ontology for the semantic annotation process and the enrichment of the ontology based on the results obtained from the annotation) can be turned to a virtuous circle if the necessary conditions are set to let the evolving ontology and the annotation process interact in a synergetic way. The construction and maintenance of an ontology can be a very costly engineering process: in order to alleviate the costs several proposals for automatically learning ontologies from data have emerged. In particular "ontology learning from text" has recently become quite popular since textual resources are still the main means for knowledge encoding and transfer used by people. Semantic annotation of text requires the application of natural language processing techniques to reconstruct the syntactic structure of sentences, going through tokenization, morphological analysis and part-of-speech tagging. 
Once syntax has been made explicit, the ontology can be used to drive the attribution of meaning to the syntactical analysed text. In this work we present the state of the art of ontology learning from text and semantic annotation and the techniques necessary to make optimum use of their symbiosis},
URL = {https://iris.cnr.it/handle/20.500.14243/244998},
}
@COMMENT{NOTE(review): AUTHOR was exported as "Maiello and Gpapaleo and Chiarella, D." (initials fused into the surnames). Names restored to match AIELLO_2006_INPROCEEDINGS_AACP_104535, which carries the same abstract -- confirm against the IRIS record.}
@MISC{MAIELLO_2007_MISC_MGC_446,
AUTHOR = {Aiello, M. and Papaleo, G. and Chiarella, D.},
TITLE = {Worm Poacher},
YEAR = {2007},
ABSTRACT = {We propose a new technique to detect internet worm. We base our research on the fact that an indirect worm (a worm spreading by e-mail) needs to spread quickly and so it sends a lot of e-mail in a short while, producing an anomalous behaviour. Moreover we found stealthy worms through detecting traffic anomalies. We worked on a mail-server log of a real network and the results obtained drove us to detect indirect worm with different approaches based on various parameters (global e-mail flow, single host e-mail flow, reject, sender field analysis)},
URL = {https://iris.cnr.it/handle/20.500.14243/446},
}
@MISC{PICCHI_2007_MISC_PMCSP_195948,
AUTHOR = {Picchi, E. and Montemagni, S. and Cucurullo, S. and Sassolini, E. and Paoli, M.},
TITLE = {ALT-Web. Sito dell'Atlante Lessicale Toscano (ALT) in rete},
YEAR = {2007},
URL = {https://iris.cnr.it/handle/20.500.14243/195948},
}
@COMMENT{NOTE(review): the third author was exported as "Cucurullo S, C. D.", which BibTeX parses as surname "Cucurullo S". Normalised to "Cucurullo, S." as in PICCHI_2007_MISC_PMCSP_195948; the trailing "C. D." was dropped as unparseable -- confirm whether it denotes a further contributor.}
@MISC{PICCHI_2007_MISC_PSC_195943,
AUTHOR = {Picchi, E. and Sassolini, E. and Cucurullo, S.},
TITLE = {Legislazione Toscana raccolta e illustrata da Lorenzo Cantini},
YEAR = {2007},
URL = {https://iris.cnr.it/handle/20.500.14243/195943},
}
@MISC{QUOCHI_2007_MISC_QDMC_129309,
AUTHOR = {Quochi, V. and Del Gratta, R. and Monachini, M. and Calzolari, N.},
TITLE = {BioLexicon Model and Implementation},
YEAR = {2007},
URL = {https://iris.cnr.it/handle/20.500.14243/129309},
}
@MISC{SABA_2007_MISC_S_195928,
AUTHOR = {Saba, A.},
TITLE = {La Instrución de Mercaderes di Saravia de la Calle e la Institutione de mercanti di Alfonso de Ulloa. Trattamento dati},
YEAR = {2007},
URL = {https://iris.cnr.it/handle/20.500.14243/195928},
}
@MISC{SASSI_2007_MISC_SC_106742,
AUTHOR = {Sassi, M. and Cinini, A.},
TITLE = {Il monitoraggio dell'amministrazione della giustizia},
YEAR = {2007},
URL = {https://iris.cnr.it/handle/20.500.14243/106742},
CONFERENCE_NAME = {Tecnologia dell'informazione e della comunicazione per la giustizia},
}
@MISC{TESCONI_2007_MISC_TMBMSC_457836,
AUTHOR = {Tesconi, M. and Marchetti, A. and Bertagna, F. and Monachini, M. and Soria, C. and Calzolari, N.},
TITLE = {LeXFlow: a Prototype Supporting Collaborative Lexicon Development and Cross-fertilization},
YEAR = {2007},
URL = {https://iris.cnr.it/handle/20.500.14243/457836},
}
@ARTICLE{BOZZI_2006_ARTICLE_B_37698,
AUTHOR = {Bozzi, A.},
TITLE = {Electronic Publishing and Computational Philology},
YEAR = {2006},
ABSTRACT = {This paper is concerned with the relationship between electronic publishing and digital scholarly textual criticism. Hypertextual techniques and computational tools are compared. These two different methodologies applied to modern and contemporary texts with respect to ancient manuscript tradition are highlighted. Particular attention is focussed on the general criteria employed in the development of a computer-assisted workstation for digital editions of Greek papyri and medieval manuscripts},
KEYWORDS = {Electronic publishing, Computational philology, Digital libraries, Textual criticism},
PAGES = {3-24},
URL = {https://iris.cnr.it/handle/20.500.14243/37698},
VOLUME = {24-25},
ISSN = {0392-6907},
JOURNAL = {LINGUISTICA COMPUTAZIONALE},
}
@ARTICLE{BURGASSI_2006_ARTICLE_B_269604,
AUTHOR = {Burgassi, C.},
TITLE = {Tessere jacoponiche},
YEAR = {2006},
ABSTRACT = {Il contributo esamina alcuni aspetti della lingua di Jacopone da Todi. Attenzione particolare è dedicata ai contatti con la tradizione letteraria dei Padri della Chiesa e dell'esegesi biblica medievale},
KEYWORDS = {Filologia Italiana, Jacopone da Todi},
PAGES = {5-19},
URL = {https://iris.cnr.it/handle/20.500.14243/269604},
VOLUME = {64},
ISSN = {0392-5110},
JOURNAL = {STUDI DI FILOLOGIA ITALIANA},
}
@ARTICLE{DELRIO_2006_ARTICLE_DDT_37700,
AUTHOR = {Del Rio, N. and Durán, J. I. and Turrini, G.},
TITLE = {Addizionario: a Tool for the Emergence of Indigenous Language as a House of Being},
YEAR = {2006},
ABSTRACT = {This paper reports the preliminary findings of a study about the use of an interactive multimedia and multilingual software application (Addizionario) in an intercultural setting and the role of language in education. The study involved nine primary schools of very small P'urhepecha indigenous communities in the state of Michoacan, Mexico. In an attempt to evaluate the impact of the software as a tool for opening up a space for written language production in the maternal tongue, emphasis will be placed not only on products and results, but also on the process and difficulties of using the software in contexts characterized by strong digital divide, significant educational lag, and gradual loss of the indigenous languages},
PAGES = {263-282},
URL = {https://iris.cnr.it/handle/20.500.14243/37700},
VOLUME = {XXVI},
}
@ARTICLE{GUADAGNINI_2006_ARTICLE_G_75403,
AUTHOR = {Guadagnini, E.},
TITLE = {Scelta di voci del Tesoro della Lingua Italiana delle Origini (decima serie)},
YEAR = {2006},
ABSTRACT = {Voce diritto agg./avv./prep./s.m.},
KEYWORDS = {Lessicografia italiana, Italiano antico},
PAGES = {11-248},
URL = {https://iris.cnr.it/handle/20.500.14243/75403},
VOLUME = {11},
ISSN = {1591-8254},
JOURNAL = {BOLLETTINO-OPERA DEL VOCABOLARIO ITALIANO},
}
@ARTICLE{MAC_2006_ARTICLE_MBBC_433724,
AUTHOR = {Macé, C. and Baret, P. and Bozzi, A. and Cignoni, L.},
TITLE = {Preface},
YEAR = {2006},
ABSTRACT = {Many scientific ventures start from haphazard meetings and this is also true for the history of this volume. During an informal meeting, Philippe Baret, Caroline Macé, Barbara Bordalejo and Peter Robinson put forward the idea of organizing a workshop together; only a few months later what had first appeared to be a simple hypothesis became a real event, also made possible thanks to the collaboration of many people and to the financial support of the Unit of Genetics of the University of Louvain (Louvain-la-Neuve, Faculty of Bioengineering, Agricultural and Environmental Sciences). We need to thank people who morally supported our initiative from the very beginning: besides Peter Robinson and Barbara Bordalejo, we would like to thank Peter Van Deun and Bram Roosen (Instituut voor Vroegchristelijke en Byzantijnse studies, K. U. Leuven), Carlos Steel (De Wulf-Mansioncentrum, K. U. Leuven), Dirk Van Hulle (Antwerp James Joyce Centre, Universiteit Antwerpen) and Andrea Schmidt (Centre for the Study of Gregory of Nazianzus, U. C. L.). Above all, we wish to thank the people who helped us make this workshop not only a scientific achievement but also a pleasant moment of friendship and conviviality: Anne-Catherine Lantin, Steve Ferrière and Isabelle Caignet. We would not have been able to present the results of this international conference to the public without the support of the Institute for Computational Linguistics in Pisa. Although the conference was held in English, we did not want the publication to be exclusively in this language. Therefore, we are grateful to Richard Goulet, who could not participate in the workshop, but accepted to contribute to this volume. Richard Goulet, like Peter Robinson and Andrea Bozzi, is a pioneer in the use of the computer in philology. 
Finally, Laura Cignoni should be thanked for her precious contribution in all those cases in which it was necessary to perform translations from Italian into English and for the general editing of the text to be handed to the publisher in camera-ready format},
PAGES = {xi-xv},
URL = {https://iris.cnr.it/handle/20.500.14243/433724},
VOLUME = {24-25},
}
@ARTICLE{MIAZZA_2006_ARTICLE_MZTCTM_37701,
AUTHOR = {Miazza, D. and Zanetti, M. and Turrini, G. and Cerri, R. and Torti, R. and Muriana, M.},
TITLE = {Creating Worlds with Addizionario: an Integrated Teaching Approach},
YEAR = {2006},
ABSTRACT = {This paper presents an experience with 10-year-old children in the use of conceptual maps to build and comprehend descriptive texts. This was part of a multidisciplinary project aimed at increasing the pupils' knowledge of their own town. The aim of the project was twofold: to develop the general knowledge of the children and to promote the creation of linkages among different areas of knowledge by using Addizionario. The children built personal knowledge paths. This proved to be a motivating task, as each child enriched the given materials with self-made ones (pictures, drawings, photos, texts). This teaching method helped the children achieve significant learning goals, and promoted self-efficacy and empowerment. Moreover, it supported and favored an atmosphere of 'knowledge sharing' in the classroom, which considerably improved individual productions. Throughout the school year, the topic of the research project-Pavia as a world-was developed in relation to four school subjects: history, geography, science, and visual arts},
PAGES = {217-232},
URL = {https://iris.cnr.it/handle/20.500.14243/37701},
VOLUME = {XXVI},
}
@ARTICLE{PASSAROTTI_2006_ARTICLE_PB_37699,
AUTHOR = {Passarotti, M. and Bozzi, A.},
TITLE = {Towards Textual Drift Modelling in Computational Philology},
YEAR = {2006},
ABSTRACT = {The article highlights the need to fix the methodological basis of computational philology. Formalization and modelling of the textual drift phenomenon, intended as a set of modifications to which each text is submitted in the course of its production and/or transmission, are the necessary grounds for a formal and shared definition of the research methods of computational philology. A methodological interdisciplinary solution to these problems is proposed, which consists in merging the individual experiences achieved in the field of philology with the results obtained by evolutionary biology. Two important strands have been identified concerning philology (not only computational), independent of whether they are dealing with authorial, or non-authorial variants. Textual drift modelling should be conducted so that it can be applied to the greatest extent to both strands},
KEYWORDS = {philology, philogenetics, computational textual criticism},
PAGES = {63-86},
URL = {https://iris.cnr.it/handle/20.500.14243/37699},
VOLUME = {24-25},
}
@ARTICLE{PIOGGIA_2006_ARTICLE_PFDD_999,
AUTHOR = {Pioggia, G. and Ferro, M. and Di Francesco, F. and De Rossi, D.},
TITLE = {A processing architecture for associative short-term memory in electronic noses},
YEAR = {2006},
ABSTRACT = {Electronic nose (e-nose) architectures usually consist of several modules that process various tasks such as control, data acquisition, data filtering, feature selection and pattern analysis. Heterogeneous techniques derived from chemometrics, neural networks, and fuzzy rules used to implement such tasks may lead to issues concerning module interconnection and cooperation. Moreover, a new learning phase is mandatory once new measurements have been added to the dataset, thus causing changes in the previously derived model. Consequently, if a loss in the previous learning occurs (catastrophic interference), real-time applications of e-noses are limited. To overcome these problems this paper presents an architecture for dynamic and efficient management of multi-transducer data processing techniques and for saving an associative short-term memory of the previously learned model. The architecture implements an artificial model of a hippocampus-based working memory, enabling the system to be ready for real-time applications. Starting from the base models available in the architecture core, dedicated models for neurons, maps and connections were tailored to an artificial olfactory system devoted to analysing olive oil. In order to verify the ability of the processing architecture in associative and short-term memory, a paired-associate learning test was applied. The avoidance of catastrophic interference was observed},
KEYWORDS = {Associative short-term memory, Catastrophic interference, Electronic noses, Multi-transducer data processing},
PAGES = {3066-3072},
URL = {https://iris.cnr.it/handle/20.500.14243/999},
VOLUME = {17},
NUMBER = {11},
DOI = {10.1088/0957-0233/17/11/027},
ISSN = {0957-0233},
JOURNAL = {MEASUREMENT SCIENCE \& TECHNOLOGY (PRINT)},
}
@ARTICLE{TURRINI_2006_ARTICLE_TBBP_37702,
AUTHOR = {Turrini, G. and Baroni, P. and Bianchi, F. and Paccosi, A.},
TITLE = {Addizionario-Plus},
YEAR = {2006},
ABSTRACT = {The present paper describes Addizionario-Plus, the updated and extended version of Addizionario. The main changes that have been introduced into the software (some of which were requested or suggested by users) concern: a) the system architecture; b) the graphics of the user interface; c) the programming language; d) the number and types of activities that it is possible to carry out; e) the creation of the Teacher Module; f) the development of a wide, detailed range of online helps; and g) while performing the activities, the possibility of accessing a large quantity of ready-to-use material, arranged into a number of teaching paths already traced out},
KEYWORDS = {multimedia tools, language teaching/learning, intercultural education},
PAGES = {283-293},
URL = {http://www.libraweb.net/articoli.php?chiave=200601502\&rivista=15},
VOLUME = {XXVI},
ISSN = {0392-6907},
JOURNAL = {LINGUISTICA COMPUTAZIONALE},
}
@ARTICLE{TURRINI_2006_ARTICLE_TBP_37705,
AUTHOR = {Turrini, G. and Baroni, P. and Paccosi, A.},
TITLE = {AddizionarioPLUS: a Creative Approach to Linguistic and Intercultural Education},
YEAR = {2006},
ABSTRACT = {This paper describes AddizionarioPLUS, the updated and extended version of Addizionario. Addizionario-a hypermedia linguistic laboratory in which children being from 5 to 12 years old can study Italian as their native or second language at various levels of difficulty and from different points of view-was developed by the Institute for Computational Linguistics of the National Research Council (ILC-CNR), in collaboration with the Department of Computer Science of the University of Turin, and was successfully tested in Italy and abroad. The main changes that have been introduced into the software concern: a) the graphic interface with the user, b) the programming language, c) the system architecture, d) the possible activities, e) the organization of the working environments, f) a module for the teacher, g) the available ready-to-use material and learning paths, h) the possible helps for both pupils and the teacher},
KEYWORDS = {multimedia, dictionary, language, culture, education},
PAGES = {407-412},
URL = {http://www.informatica.si/vols/vol30.html#No4},
VOLUME = {30},
NUMBER = {4},
ISSN = {0350-5596},
JOURNAL = {INFORMATICA},
}
@ARTICLE{TURRINI_2006_ARTICLE_TB_433725,
AUTHOR = {Turrini, G. and Bianchi, F.},
TITLE = {Preface},
YEAR = {2006},
PAGES = {xi-xviii},
URL = {https://iris.cnr.it/handle/20.500.14243/433725},
VOLUME = {XXVI},
}
@ARTICLE{TURRINI_2006_ARTICLE_TB_37703,
AUTHOR = {Turrini, G. and Bianchi, F.},
TITLE = {Addizionario: A Child-Centered Approach to Linguistic Education},
YEAR = {2006},
ABSTRACT = {Addizionario is an innovative learning tool which supports the child's cognitive and linguistic development. In the form of a hypermedia laboratory, it encourages children to study language at various levels of difficulty and from different points of view, with particular emphasis on lexical competence and language reflection. This paper describes Addizionario and its two strictly interrelated, but at the same time independent, components: (i) the Core Dictionary, a dictionary for children written and illustrated by children; and (ii) the Activity Book, a multimedia creative environment which allows the children to construct their own personal dictionaries and to play with language. Furthermore, some teaching ideas are offered to help teachers take advantage of the features of the software},
PAGES = {3-22},
URL = {https://iris.cnr.it/handle/20.500.14243/37703},
VOLUME = {XXVI},
}
@ARTICLE{ZANETTI_2006_ARTICLE_ZMT_433726,
AUTHOR = {Zanetti, M. A. and Miazza, D. and Turrini, G.},
TITLE = {Between Metacognition and Creativity},
YEAR = {2006},
PAGES = {399-405},
URL = {https://iris.cnr.it/handle/20.500.14243/433726},
VOLUME = {30},
NUMBER = {4},
}
@ARTICLE{ZANETTI_2006_ARTICLE_ZMT_37704,
AUTHOR = {Zanetti, M. and Miazza, D. and Turrini, G.},
TITLE = {Addizionario: in between Cognition and Metacognition},
YEAR = {2006},
ABSTRACT = {Metacognitive theory considers learning as the result of the activation of several conscious processes. Our project aimed to support reading comprehension and meaningful learning by the use of conceptual maps and to investigate the processes involved in motivated learning when the pupil's attention is turned to learning objectives and suitable strategies are made explicit and shared. The project saw a group of children attending year four in an Italian primary school tackle a scientific subject matter from a multidisciplinary perspective. Each pupil created an initial conceptual map in pen-and-paper format and then a final one with Addizionario. Qualitative and quantitative comparison between the two outputs showed development in the learning processes, awareness of the logical reasoning used in creating the map, and ability to self-monitor the progressive mastering of knowledge. Active re-elaboration of the material helped the children understand the learning objectives, and find suitable strategies},
PAGES = {233-252},
URL = {https://iris.cnr.it/handle/20.500.14243/37704},
VOLUME = {XXVI},
}
@BOOK{CININI_2006_BOOK_CS_138512,
AUTHOR = {Cinini, A. and Sassi, M.},
TITLE = {Content analysis dei provvedimenti della sezione disciplinare del C.S.M.},
YEAR = {2006},
ABSTRACT = {Nell'ambito del progetto di ricerca denominato "Tecnologie dell'informazione e della comunicazione per la giustizia" coordinato dall'Istituto di Ricerca sui Sistemi Giudiziari (IRSIG-CNR di Bologna) e co-finanziato dai Fondi Integrativi Ricerca di Base (FIRB) del Ministero dell'Università e della Ricerca, l'Istituto di Linguistica Computazionale (ILC-CNR di Pisa) ha collaborato con l'IRSIG e con il Centro Studi e Ricerche sull'Ordinamento Giudiziario dell'Università di Bologna per la realizzazione di una base dati elettronica per l'analisi dei provvedimenti della sezione disciplinare del Consiglio Superiore della Magistratura},
KEYWORDS = {Informatica giuridica documentale, Knowledge extraction from texts, DBT},
PAGES = {1-68},
URL = {https://iris.cnr.it/handle/20.500.14243/138512},
PUBLISHER = {S. T. A. R. Servizio Tecnografico Area Ricerca CNR (Pisa, ITA)},
CONFERENCE_PLACE = {Pisa},
}
@COMMENT{NOTE(review): the last name was exported as "Cignoni, L. E."; the trailing "E." looks like residue of an "(Eds)" marker (MAC_2006_ARTICLE_MBBC_433724 has "Cignoni Eds, L."), so it is normalised to "Cignoni, L." as in TURRINI_2006_INCOLLECTION_TCP_134799 -- confirm against the IRIS record.}
@BOOK{MAC_2006_BOOK_MBBC_134798,
AUTHOR = {Macé, C. and Baret, P. and Bozzi, A. and Cignoni, L.},
TITLE = {The Evolution of Texts: Confronting Stemmatological and Genetical Methods},
YEAR = {2006},
URL = {https://iris.cnr.it/handle/20.500.14243/134798},
}
@COMMENT{NOTE(review): the second name was exported as "Bianchi, F. E."; every other entry by this author in the file has "Bianchi, F." (e.g. TURRINI_2006_ARTICLE_TB_37703), so the trailing "E." is treated as residue of an "(Eds)" marker -- confirm against the IRIS record.}
@BOOK{TURRINI_2006_BOOK_TB_134800,
AUTHOR = {Turrini, G. and Bianchi, F.},
TITLE = {Hypermedia for Education and Research},
YEAR = {2006},
URL = {https://iris.cnr.it/handle/20.500.14243/134800},
}
@INCOLLECTION{BOZZI_2006_INCOLLECTION_B_134801,
AUTHOR = {Bozzi, A.},
TITLE = {Edizione elettronica dei testi e filologia computazionale},
YEAR = {2006},
PAGES = {207-232},
URL = {https://iris.cnr.it/handle/20.500.14243/134801},
PUBLISHER = {Il Mulino (Bologna, ITA)},
ISBN = {8815107193},
CONFERENCE_PLACE = {Bologna},
BOOKTITLE = {Fondamenti di critica testuale},
EDITOR = {Stussi, A.},
}
@INCOLLECTION{CALZOLARI_2006_INCOLLECTION_C_134803,
AUTHOR = {Calzolari, N.},
TITLE = {Language Resources and Content Interoperability: technical, strategic and political issues for a new generation of Language Resources},
YEAR = {2006},
URL = {https://iris.cnr.it/handle/20.500.14243/134803},
}
@INCOLLECTION{MARINELLI_2006_INCOLLECTION_MBR_134806,
AUTHOR = {Marinelli, R. and Bindi, R. and Roventini, A.},
TITLE = {Metonymic and Metaphorical Uses of Proper Names},
YEAR = {2006},
ABSTRACT = {In this paper we describe a research we are carrying out in the framework of ItalWordNet, a large lexical-semantic database containing semantic information for about 50,000 synsets of nouns, verbs, adjectives, adverbs, and a subset of proper names, which is continuously enriched and updated at the Institute for Computational Linguistics in Pisa. The research concerns the proper names considered from a twofold aspect: their coding in the lexical semantic database and their concrete use, as it is evidenced within a large corpus of the contemporary written Italian language. In particular the semantic relations involving the proper names and their senses (literal, derived and extended) are taken into consideration. Many proper names turn out to be the basis for many extensions of meaning, so in the paper we analyse in the corpus a set of them showing many types of derivates and sense extensions generated by means of lexical rules that operate as "generative factors" (Pustejovsky, 2001). The many contexts of use, analyzed in the corpus, confirm a rich regular polysemy regarding this category of nouns, so, for a set of cases, we propose to represent this phenomenon by introducing specific semantic relations in the database},
KEYWORDS = {Lexical semantic databases, Proper Names, Corpora},
PAGES = {69-78},
URL = {http://www.c-s-p.org/Flyers/Linguistics-in-the-Twenty-First-Century.htm},
PUBLISHER = {Centro de linguística aplicada, Ministerio de ciencia, tecnología y medio ambiente (Newcastle, GBR)},
ISBN = {1904303862},
CONFERENCE_PLACE = {Santiago de Cuba},
BOOKTITLE = {Linguistics in the Twenty First Century},
EDITOR = {Bermúdez, E. M. and Miyares, L. R.},
}
@INCOLLECTION{MARINELLI_2006_INCOLLECTION_MR_134807,
AUTHOR = {Marinelli, R. and Roventini, A.},
TITLE = {The Italian Maritime Lexicon and the ItalWordNet Semantic Database},
YEAR = {2006},
ABSTRACT = {The paper reports on the creation of a terminological subset belonging to the maritime lexical domain; this set of terms is structured according to the design principles of the generic Italian lexical semantic database ItalWordNet, i.e. applying the same semantic relations model and using the possibility of linking the specialised terms to the corresponding closest concepts in WordNet. The main characteristics of the lexical semantic database are also described and, in particular: i) the construction of the terminological wordnet; ii) the approach adopted to connect the terminological database to the generic one; iii) some issues about the mapping between the Italian terms and the Princeton WordNet; iv) a first outline of a specific maritime domain ontology},
KEYWORDS = {Lexical databases, Terminology, Ontology},
PAGES = {173-182},
URL = {http://www.c-s-p.org/Flyers/Linguistics-in-the-Twenty-First-Century.htm},
PUBLISHER = {Centro de linguística aplicada, Ministerio de ciencia, tecnología y medio ambiente (Newcastle, GBR)},
ISBN = {1904303862},
CONFERENCE_PLACE = {Santiago de Cuba},
BOOKTITLE = {Linguistics in the Twenty First Century},
EDITOR = {Bermúdez, E. M. and Miyares, L. R.},
}
@INCOLLECTION{TURRINI_2006_INCOLLECTION_TCP_134799,
AUTHOR = {Turrini, G. and Cignoni, L. and Paccosi, A.},
TITLE = {Addizionario: il dizionario visto dalla parte dei bambini},
YEAR = {2006},
URL = {https://iris.cnr.it/handle/20.500.14243/134799},
}
@EDITORIAL{_2006_EDITORIAL__453614,
TITLE = {Proceedings of LREC 2006: 5th International Conference on Language Resources and Evaluation},
YEAR = {2006},
URL = {https://iris.cnr.it/handle/20.500.14243/453614},
}
@EDITORIAL{_2006_EDITORIAL__181025,
TITLE = {The Evolution of Texts: Confronting Stemmatological and Genetical Methods},
YEAR = {2006},
URL = {https://iris.cnr.it/handle/20.500.14243/181025},
}
@EDITORIAL{_2006_EDITORIAL__181027,
TITLE = {Language Resources and Evaluation},
YEAR = {2006},
URL = {https://iris.cnr.it/handle/20.500.14243/181027},
}
@INPROCEEDINGS{AIELLO_2006_INPROCEEDINGS_AACP_104535,
AUTHOR = {Aiello, M. and Avanzini, D. A. and Chiarella, D. and Papaleo, G.},
TITLE = {Worm detection using e-mail data mining},
YEAR = {2006},
ABSTRACT = {We propose a new technique to detect internet worm. We base our research on the fact that an indirect worm (a worm spreading by e-mail) needs to spread quickly and so it sends a lot of e-mail in a short while, producing an anomalous behaviour. Moreover we found stealthy worms through detecting traffic anomalies. We worked on a mail-server log of a real network and the results obtained drove us to detect indirect worm with different approaches based on various parameters (global email flow, single host e-mail flow, reject, sender field analysis)},
KEYWORDS = {Data Mining, E-mail, Early Detection, Worm},
URL = {https://iris.cnr.it/handle/20.500.14243/104535},
CONFERENCE_NAME = {PRISE},
}
@INPROCEEDINGS{AIELLO_2006_INPROCEEDINGS_AACP_67262,
AUTHOR = {Aiello, M. and Avanzini, D. A. and Chiarella, D. and Papaleo, G.},
TITLE = {Worm detection using e-mail data mining},
YEAR = {2006},
URL = {https://iris.cnr.it/handle/20.500.14243/67262},
CONFERENCE_NAME = {Primo Workshop italiano su Privacy e Security},
}
@INPROCEEDINGS{AIELLO_2006_INPROCEEDINGS_AACP_434409,
AUTHOR = {Aiello, M. and Avanzini, D. A. and Chiarella, D. and Papaleo, G.},
TITLE = {A tool for complete log mail analysis: LMA},
YEAR = {2006},
URL = {https://iris.cnr.it/handle/20.500.14243/434409},
CONFERENCE_NAME = {Trans European Research and Education Networking Association},
}
@INPROCEEDINGS{BARBERA_2006_INPROCEEDINGS_BD_384176,
AUTHOR = {Barbera, M. and Di Donato, F.},
TITLE = {Weaving the Web of Science. HyperJournal and the impact of the Semantic Web on scientific publishing},
YEAR = {2006},
ABSTRACT = {In this paper we present HyperJournal, an Open Source web application for publishing on-line Open Access scholarly journals. In the first part (sections 1, 2 and 3) we briefly describe the project and the software. In sections 4 and 5, we discuss the weaknesses of the current publishing model and the benefits deriving from the adoption of Semantic Web technologies, outlining how the Semantic Web vision can help to overcome the inefficiencies of the current model. In the last two sections (6 and 7), we present two experimental applications, developed on top of HyperJournal, with the purpose of demonstrating how the technologies can affect the daily work of scholars. The first application is a tool for graphically visualizing the network of citations existing between articles and their authors, and for performing bibliometric measurements alternative to the ISI Impact Factor. The second is a tool for automatically extracting references from non-structured textual documents, which is part of a tool-chain for the extraction of hidden semantics},
URL = {https://iris.cnr.it/handle/20.500.14243/384176},
}
@INPROCEEDINGS{BARTOLINI_2006_INPROCEEDINGS_BCGLMPRS_61476,
AUTHOR = {Bartolini, R. and Caracciolo, C. and Giovannetti, E. and Lenci, A. and Marchi, S. and Pirrelli, V. and Renso, C. and Spinsanti, L.},
TITLE = {Creation and use of lexicons and ontologies for natural language interface to databases},
YEAR = {2006},
ABSTRACT = {In this paper we present an original approach to natural language query interpretation which has been implemented within the FuLL (Fuzzy Logic and Language) Italian project of BC S.r.l. In particular, we discuss here the creation of linguistic and ontological resources, together with the exploitation of existing ones, for natural language-driven database access and retrieval. Both the database and the queries we experiment with are Italian, but the methodology we broach naturally extends to other languages},
KEYWORDS = {Natural language processing, ontologies, gis, databases},
PAGES = {6},
URL = {https://iris.cnr.it/handle/20.500.14243/61476},
CONFERENCE_NAME = {LREC Conference},
BOOKTITLE = {LREC 2006},
}
@INPROCEEDINGS{BARTOLINI_2006_INPROCEEDINGS_BGMMABSB_65047,
AUTHOR = {Bartolini, R. and Giovannetti, E. and Marchi, S. and Montemagni, S. and Andreatta, C. and Brunelli, R. and Stecher, R. and Bouquet, P.},
TITLE = {Multimedia Information Extraction in Ontology-based Semantic Annotation of Product Catalogues},
YEAR = {2006},
ABSTRACT = {The demand for efficient methods for extracting knowledge from multimedia content has led to a growing research community investigating the convergence of multimedia and knowledge technologies. In this paper we describe a methodology for extracting multimedia information from product catalogues empowered by the synergetic use and extension of a domain ontology. The methodology was implemented in the Trade Fair Advanced Semantic Annotation Pipeline of the VIKE-framework},
KEYWORDS = {Semantic Web Technologies, ontology creation, ontology extraction, ontology evolution, semantic annotation of multimedia content},
URL = {https://iris.cnr.it/handle/20.500.14243/65047},
CONFERENCE_NAME = {SWAP 2006},
}
@INPROCEEDINGS{BOMBARA_2006_INPROCEEDINGS_BCCGMRST_62247,
AUTHOR = {Bombara, M. and Calì, D. and Calì, I. and Giovannetti, E. and Masserotti, M. V. and Renso, C. and Spinsanti, L. and Tropea, G.},
TITLE = {Interrogazioni in linguaggio naturale a basi dati eterogenee: l'ontologia nel sistema "FuLL" nei GIS},
YEAR = {2006},
ABSTRACT = {The interaction between users and GIS software is a known and critical issue. The importance of giving those users a natural language interface to the system is thus strategic. Moving such a NL interface between heterogeneous DBs is an even more challenging task. We accomplish this by using a domain ontology as a knowledge repository and interface between raw data and language semantics. Successful tests of FuLL's (Fuzzy Logic and Language) technology are reported, where we have used the same ontology structure and connected it to Bologna's and Catania's district geo-databases},
KEYWORDS = {Natural Language Processing, Query in linguaggio naturale},
PAGES = {6},
URL = {https://iris.cnr.it/handle/20.500.14243/62247},
CONFERENCE_NAME = {AMFM 2006-Informazione Geografica: data harmonisation, interoperabilità e standard, reti e facilities management, ubiquitous GIS},
BOOKTITLE = {Informazione Geografica: data harmonisation, interoperabilità e standard, reti e facilities management, ubiquitous GIS. Atti},
}
@INPROCEEDINGS{CALZOLARI_2006_INPROCEEDINGS_CSSCPBEMSC_64246,
AUTHOR = {Calzolari, F. and Sassolini, E. and Sassi, M. and Cucurullo, S. and Picchi, E. and Bertagna, F. and Enea, A. and Monachini, M. and Soria, C. and Calzolari, N.},
TITLE = {Next Generation Language Resources using Grid},
YEAR = {2006},
ABSTRACT = {This paper presents a case study concerning the challenges and requirements posed by next generation language resources, realized as an overall model of open, distributed and collaborative language infrastructure. If a sort of "new paradigm" for language resource sharing is required, we think that the emerging and still evolving technology connected to Grid computing is a very interesting and suitable one for a concrete realization of this vision. Given the current limitations of Grid computing, it is very important to test the new environment on basic language analysis tools, in order to get the feeling of what are the potentialities and possible limitations connected to its use in NLP. For this reason, we have done some experiments on a module of the Linguistic Miner, i. e. the extraction of linguistic patterns from restricted domain corpora. The Grid environment has produced the expected results (reduction of the processing time, huge storage capacity, data redundancy) without any additional cost for the final user},
KEYWORDS = {grid, acquisition, topic classification},
PAGES = {1858-1861},
URL = {https://iris.cnr.it/handle/20.500.14243/64246},
ISBN = {2-9517408-2-4},
CONFERENCE_NAME = {LREC 2006: 5th International Conference on Language Resources and Evaluation},
}
@INPROCEEDINGS{CALZOLARI_2006_INPROCEEDINGS_C_65032,
AUTHOR = {Calzolari, N.},
TITLE = {International Standards for Computational Lexicons: their relation to terminology},
YEAR = {2006},
URL = {https://iris.cnr.it/handle/20.500.14243/65032},
}
@INPROCEEDINGS{CASELLI_2006_INPROCEEDINGS_CP_65013,
AUTHOR = {Caselli, T. and Prodanof, I.},
TITLE = {Annotating Bridging Anaphors in Italian: in Search of Reliability},
YEAR = {2006},
URL = {https://iris.cnr.it/handle/20.500.14243/65013},
CONFERENCE_NAME = {LREC 2006: 5th International Conference on Language Resources and Evaluation},
}
@INPROCEEDINGS{CUCURULLO_2006_INPROCEEDINGS_CMPPS_65044,
AUTHOR = {Cucurullo, S. and Montemagni, S. and Paoli, M. and Picchi, E. and Sassolini, E.},
TITLE = {Atlante Dialettale in rete: ALT-Web},
YEAR = {2006},
ABSTRACT = {The paper presents an on-line dialectal resource, ALT-Web, which gives access to the linguistic data of the Lexical Atlas of Tuscany or Atlante Lessicale Toscano, a specially designed linguistic atlas in which lexical data have both a diatopic and diastratic characterisation. The paper illustrates ALT-Web with particular emphasis on: 1) the dialectal data representation model; 2) the access modalities to the ALT dialectal corpus designed to produce an output tailored to the specific needs of the different classes of users (both professionals and common citizens); 3) ontology-based search. These represent three main features which differentiate ALT-Web both from the previous digitalised ALT version and, most interestingly, from other on-line dialectal resources. At the time of writing, this is the first resource of this type in Italy, and one of the few at the international level},
KEYWORDS = {dialectal resources, information retrieval},
PAGES = {661-672},
URL = {http://www.euralex.org/publications/},
PUBLISHER = {Edizioni dell'ORSO (Alessandria, ITA)},
ISBN = {8876949186},
CONFERENCE_NAME = {12° EURALEX International Congress},
CONFERENCE_PLACE = {Torino},
BOOKTITLE = {Proceedings in 12° EURALEX International Congress, Congresso internazionale di lessicografia},
EDITOR = {Corino, E. and Marello, C. and Onesti, C.},
}
@INPROCEEDINGS{CUCURULLO_2006_INPROCEEDINGS_CMPPS_65014,
AUTHOR = {Cucurullo, S. and Montemagni, S. and Paoli, M. and Picchi, E. and Sassolini, E.},
TITLE = {Dialectal resources on-line: the ALT-Web experience},
YEAR = {2006},
ABSTRACT = {The paper presents an on-line dialectal resource, ALT-Web, which gives access to the linguistic data of the Atlante Lessicale Toscano, a specially designed linguistic atlas in which lexical data have both a diatopic and diastratic characterisation. The paper focuses on: the dialectal data representation model; the access modalities to the ALT dialectal corpus; ontology-based search},
KEYWORDS = {Computational dialectology, Dialectal databases, Construction of lexical resources},
PAGES = {1846-1851},
URL = {http://www.lrec-conf.org/lrec2006/},
ISBN = {2-9517408-2-4},
CONFERENCE_NAME = {LREC 2006: 5th International Conference on Language Resources and Evaluation},
BOOKTITLE = {Proceedings of the 5th International Conference on Language Resources and Evaluation (LREC 2006)},
}
@INPROCEEDINGS{DELLORLETTA_2006_INPROCEEDINGS_DLMP_65043,
AUTHOR = {Dell'Orletta, F. and Lenci, A. and Montemagni, S. and Pirrelli, V.},
TITLE = {Probing the space of grammatical variation: induction of cross-lingual grammatical constraints from treebanks},
YEAR = {2006},
ABSTRACT = {The paper reports on a detailed quantitative analysis of distributional language data of both Italian and Czech, highlighting the relative contribution of a number of distributed grammatical factors to sentence-based identification of subjects and direct objects. The work uses a Maximum Entropy model of stochastic resolution of conflicting grammatical constraints and is demonstrably capable of putting explanatory theoretical accounts to the test of usage-based empirical verification},
PAGES = {21-28},
URL = {https://iris.cnr.it/handle/20.500.14243/65043},
PUBLISHER = {Association for Computational Linguistics (Stroudsburg, USA)},
ISBN = {1-932432-78-7},
CONFERENCE_NAME = {Coling/ACL 2006},
CONFERENCE_PLACE = {Sydney},
BOOKTITLE = {Proceedings of the Workshop on Frontiers in Linguistically Annotated Corpora 2006 (LAC 06)},
}
@INPROCEEDINGS{DELLORLETTA_2006_INPROCEEDINGS_DLMP_65015,
AUTHOR = {Dell'Orletta, F. and Lenci, A. and Montemagni, S. and Pirrelli, V.},
TITLE = {Searching treebanks for functional constraints: cross-lingual experiments in grammatical relation assignment},
YEAR = {2006},
URL = {https://iris.cnr.it/handle/20.500.14243/65015},
CONFERENCE_NAME = {LREC 2006: 5th International Conference on Language Resources and Evaluation},
}
@INPROCEEDINGS{FRANCOPOULO_2006_INPROCEEDINGS_FBGCMPS_65033,
AUTHOR = {Francopoulo, G. and Bel, N. and George, M. and Calzolari, N. and Monachini, M. and Pet, M. and Soria, C.},
TITLE = {Lexical markup framework (LMF) for NLP multilingual resources},
YEAR = {2006},
ABSTRACT = {Optimizing the production, maintenance and extension of lexical resources is one of the crucial aspects impacting Natural Language Processing (NLP). A second aspect involves optimizing the process leading to their integration into applications. In this respect, we believe that the production of a consensual specification on multilingual lexicons can be a useful aid for the various NLP actors. Within ISO, one purpose of LMF (ISO-24613) is to define a standard for lexicons that covers multilingual data},
PAGES = {1-8},
URL = {https://iris.cnr.it/handle/20.500.14243/65033},
ISBN = {1-932432-69-8},
CONFERENCE_NAME = {COLING-ACL Workshop on Multilingual Lexical Resources and Interoperability},
BOOKTITLE = {Proceedings of the Workshop on Multilingual Language Resources and Interoperability},
}
@INPROCEEDINGS{FRANCOPOULO_2006_INPROCEEDINGS_FDMR_65016,
AUTHOR = {Francopoulo, G. and Declerck, T. and Monachini, M. and Romary, L.},
TITLE = {The relevance of standards for research infrastructures},
YEAR = {2006},
URL = {https://iris.cnr.it/handle/20.500.14243/65016},
CONFERENCE_NAME = {LREC 2006: 5th International Conference on Language Resources and Evaluation},
}
@INPROCEEDINGS{FRANCOPOULO_2006_INPROCEEDINGS_FGCMBPS_65018,
AUTHOR = {Francopoulo, G. and George, M. and Calzolari, N. and Monachini, M. and Bel, N. and Pet, M. and Soria, C.},
TITLE = {Lexical Markup Framework (LMF)},
YEAR = {2006},
ABSTRACT = {Optimizing the production, maintenance and extension of lexical resources is one of the crucial aspects impacting Natural Language Processing (NLP). A second aspect involves optimizing the process leading to their integration in applications. With this respect, we believe that the production of a consensual specification on lexicons can be a useful aid for the various NLP actors. Within ISO, the purpose of LMF is to define a standard for lexicons. LMF is a model that provides a common standardized framework for the construction of NLP lexicons. The goals of LMF are to provide a common model for the creation and use of lexical resources, to manage the exchange of data between and among these resources, and to enable the merging of a large number of individual electronic resources to form extensive global electronic resources. In this paper, we describe the work in progress within the sub-group ISO-TC37/SC4/WG4. Various experts from a lot of countries have been consulted in order to take into account best practices in a lot of languages for (we hope) all kinds of NLP lexicons},
PAGES = {233-236},
URL = {https://iris.cnr.it/handle/20.500.14243/65018},
PUBLISHER = {European Language Resources Association (ELRA)-Evaluations and Language resources Distribution Agency (ELDA) (Paris, FRA)},
ISBN = {2-9517408-2-4},
CONFERENCE_NAME = {LREC 2006: 5th International Conference on Language Resources and Evaluation},
CONFERENCE_PLACE = {Genoa},
}
@INPROCEEDINGS{FRANCOPOULO_2006_INPROCEEDINGS_FGCMBPS_65017,
AUTHOR = {Francopoulo, G. and George, M. and Calzolari, N. and Monachini, M. and Bel, N. and Pet, M. and Soria, C.},
TITLE = {LMF for multilingual, specialized lexicons},
YEAR = {2006},
PAGES = {27-32},
URL = {https://iris.cnr.it/handle/20.500.14243/65017},
ISBN = {2-9517408-2-4},
CONFERENCE_NAME = {LREC 2006: 5th International Conference on Language Resources and Evaluation},
}
@INPROCEEDINGS{FRANCOPOULO_2006_INPROCEEDINGS_FMRS_65034,
AUTHOR = {Francopoulo, G. and Monachini, M. and Romary, L. and Salmon-Alt, S.},
TITLE = {Lexical Markup Framework: Working to Reach a Consensual ISO Standard on Lexicons},
YEAR = {2006},
URL = {https://iris.cnr.it/handle/20.500.14243/65034},
CONFERENCE_NAME = {LREC 2006: 5th International Conference on Language Resources and Evaluation},
BOOKTITLE = {Lexical Markup Framework: Working to Reach a Consensual ISO Standard on Lexicons-Tutorial},
}
@INPROCEEDINGS{GIOULI_2006_INPROCEEDINGS_GLGPMSCC_65019,
AUTHOR = {Giouli, V. and Labropoulou, P. and Gavrilidou, M. and Piperidis, S. and Monachini, M. and Soria, C. and Calzolari, N. and Choukri, K.},
TITLE = {Language Resources Production Models: the Case of the INTERA Multilingual Corpus and Terminology},
YEAR = {2006},
ABSTRACT = {This paper reports on the multilingual Language Resources (MLRs), i. e. parallel corpora and terminological lexicons for less widely digitally available languages, that have been developed in the INTERA project and the methodology adopted for their production. Special emphasis is given to the reality factors that have influenced the MLRs development approach and their final constitution. Building on the experience gained in the project, a production model has been elaborated, suggesting ways and techniques that can be exploited in order to improve LRs production taking into account realistic issues},
KEYWORDS = {multilingual parallel corpora, language resources production models, less widely digitally available languages},
PAGES = {609-614},
URL = {https://iris.cnr.it/handle/20.500.14243/65019},
ISBN = {2-9517408-2-4},
CONFERENCE_NAME = {LREC 2006: 5th International Conference on Language Resources and Evaluation},
}
@INPROCEEDINGS{GOLA_2006_INPROCEEDINGS_GR_65035,
AUTHOR = {Gola, E. and Ruimy, N.},
TITLE = {Traduzione automatica e processi di comprensione: il lessico},
YEAR = {2006},
PAGES = {291-306},
URL = {https://iris.cnr.it/handle/20.500.14243/65035},
VOLUME = {03},
PUBLISHER = {Aracne (Roma, ITA)},
ISBN = {88-548-0733-8},
CONFERENCE_NAME = {Tradurre e comprendere. Pluralità dei linguaggi e delle culture},
CONFERENCE_PLACE = {Roma},
BOOKTITLE = {Tradurre e comprendere-pluralità dei linguaggi e delle culture},
EDITOR = {Pititto, R. and Venezia, S.},
}
@INPROCEEDINGS{MARCHETTI_2006_INPROCEEDINGS_MTRRBMSCHH_65036,
AUTHOR = {Marchetti, A. and Tesconi, M. and Ronzano, F. and Rosella, M. and Bertagna, F. and Monachini, M. and Soria, C. and Calzolari, N. and Huang, C. R. and Hsieh, S. K.},
TITLE = {Towards an Architecture for the GlobalWordNet Initiative},
YEAR = {2006},
URL = {https://iris.cnr.it/handle/20.500.14243/65036},
CONFERENCE_NAME = {SWAP-06, the 3rd Italian Semantic Web Workshop},
}
@INPROCEEDINGS{MARCHETTI_2006_INPROCEEDINGS_MTRRBMSCHH_221102,
AUTHOR = {Marchetti, A. and Tesconi, M. and Ronzano, F. and Rosella, M. and Bertagna, F. and Monachini, M. and Soria, C. and Calzolari, N. and Huang, C. and Hsieh, S.},
TITLE = {Toward an Architecture for the Global Wordnet Initiative},
YEAR = {2006},
ABSTRACT = {Enhancing the development of multilingual lexicons is of foremost importance for intercultural collaboration to take place, as multilingual lexicons are the cornerstone of several multilingual applications. However, the development and maintenance of large-scale, robust multilingual dictionaries is a tantalizing task. Moreover, Semantic Web's growing interest towards the availability of high-quality lexical resources and their multilingual interoperability, is focusing more and more attention on this topic. In this paper we present a tool, based on a web service architecture, enabling semi-automatic generation of bilingual lexicons through linking of distributed monolingual lexical resources. In addition to lexicon development, the architecture also allows enrichment of monolingual source lexicons through exploitation of the semantic information encoded in corresponding entries. In the paper we describe our case study applied to the Italian and Chinese wordnets, and we illustrate how the architecture can be extended to access distributed multilingual WordNets over the Internet, paving the way to exploitation in a cross-lingual framework of the wealth of information built over the last decade},
KEYWORDS = {Lexical resource, wordnet, multilingual interoperability, semantic web},
PAGES = {7-35},
URL = {http://ceur-ws.org/Vol-201/35.pdf},
CONFERENCE_NAME = {SWAP 2006-Semantic Web Applications and Perspectives},
}
@INPROCEEDINGS{MARCONI_2006_INPROCEEDINGS_M_65020,
AUTHOR = {Marconi, L.},
TITLE = {Message of the Chair of the Local Organising Committee},
YEAR = {2006},
URL = {https://iris.cnr.it/handle/20.500.14243/65020},
CONFERENCE_NAME = {LREC 2006: Book of Abstracts 5th International Conference on Language Resources and Evaluation},
}
@INPROCEEDINGS{MARINELLI_2006_INPROCEEDINGS_M_65038,
AUTHOR = {Marinelli, R.},
TITLE = {Computational Resources and Electronic Corpora in Metaphors Evaluation},
YEAR = {2006},
URL = {https://iris.cnr.it/handle/20.500.14243/65038},
CONFERENCE_NAME = {Second International Conference of the German Cognitive Linguistics Association},
}
@INPROCEEDINGS{MARINELLI_2006_INPROCEEDINGS_MB_65021,
AUTHOR = {Marinelli, R. and Bindi, R.},
TITLE = {Proper Names and Linguistic Dynamics},
YEAR = {2006},
URL = {https://iris.cnr.it/handle/20.500.14243/65021},
CONFERENCE_NAME = {LREC 2006: 5th International Conference on Language Resources and Evaluation},
}
@INPROCEEDINGS{MARINELLI_2006_INPROCEEDINGS_MRS_65022,
AUTHOR = {Marinelli, R. and Roventini, A. and Spadoni, G.},
TITLE = {Using Core Ontology for Domain Lexicon Structuring},
YEAR = {2006},
URL = {https://iris.cnr.it/handle/20.500.14243/65022},
CONFERENCE_NAME = {LREC 2006: 5th International Conference on Language Resources and Evaluation},
}
@INPROCEEDINGS{MARINELLI_2006_INPROCEEDINGS_MS_64242,
AUTHOR = {Marinelli, R. and Spadoni, G.},
TITLE = {Some Considerations in Structuring a Terminological Knowledge Base},
YEAR = {2006},
URL = {https://iris.cnr.it/handle/20.500.14243/64242},
CONFERENCE_NAME = {Third International WordNet Conference},
}
@INPROCEEDINGS{MARINELLI_2006_INPROCEEDINGS_MS_65037,
AUTHOR = {Marinelli, R. and Spadoni, G.},
TITLE = {From Dictionary to Knowledge Base System},
YEAR = {2006},
URL = {https://iris.cnr.it/handle/20.500.14243/65037},
CONFERENCE_NAME = {MACL (Multilingualism \& Applied Comparative Linguistics)},
}
@INPROCEEDINGS{MONACHINI_2006_INPROCEEDINGS_M_65023,
AUTHOR = {Monachini, M.},
TITLE = {LMF semantic package and mapping of existing semantic lexicons},
YEAR = {2006},
ABSTRACT = {The definition of a standard for the representation of lexical data has progressively become mandatory in the linguistic and computational linguistic community to cope with the ever increasing number of digital lexical data that are gathered and disseminated worldwide. LMF should be seen by the community as a tool for modelling one's own lexical data, with the possible result that people will provide useful feedback on the usability and needed evolution of the standard project},
PAGES = {29},
URL = {https://iris.cnr.it/handle/20.500.14243/65023},
ISBN = {2-9517408-2-4},
CONFERENCE_NAME = {LREC 2006: 5th International Conference on Language Resources and Evaluation},
BOOKTITLE = {Lexical Markup Framework: Working to Reach a Consensual ISO Standard on Lexicons-Tutorial},
EDITOR = {Francopoulo, G. and Monachini, M. and Romary, L. and Salmon-Alt, S.},
}
@INPROCEEDINGS{MONACHINI_2006_INPROCEEDINGS_MCCFMMOU_65024,
AUTHOR = {Monachini, M. and Calzolari, N. and Choukri, K. and Friedrich, J. and Maltese, G. and Mammini, M. and Odijk, J. and Ulivieri, M.},
TITLE = {Unified Lexicon and Unified Morphosyntactic Specifications for Written and Spoken Italian},
YEAR = {2006},
URL = {https://iris.cnr.it/handle/20.500.14243/65024},
CONFERENCE_NAME = {LREC 2006: 5th International Conference on Language Resources and Evaluation},
}
@INPROCEEDINGS{MONTEMAGNI_2006_INPROCEEDINGS_MPP_65042,
AUTHOR = {Montemagni, S. and Paoli, M. and Picchi, E.},
TITLE = {ALT-WEB: l'Atlante Lessicale Toscano in rete},
YEAR = {2006},
ABSTRACT = {Scopo dell'articolo è la presentazione di ALT-Web, ovvero l'Atlante Lessicale Toscano in rete. ALT-Web è stato ideato per rendere il patrimonio linguistico-culturale testimoniato dall'Atlante Lessicale Toscano una risorsa educativa realmente disponibile in modo che possa fornire un contributo alla conservazione della memoria dell'identità culturale toscana e al contempo costituisca un prezioso punto di riferimento per lo studio di dinamiche linguistiche sia a livello areale sia a livello socio-culturale. La sua collocazione in rete porta inevitabilmente ALT-Web a rivolgersi a una vasta gamma di utenti non più circoscritta agli addetti ai lavori (ovvero dialettologi, linguisti, etno-linguisti), ma che include anche insegnanti, operatori culturali (ad esempio, personale di musei e di istituzioni culturali pubbliche e private) fino al cittadino navigatore di Internet che voglia capire di più della propria identità linguistica e culturale. Il vasto e variegato bacino di utenza a cui intende rivolgersi ALT-Web ha portato alla trasformazione della versione informatizzata dell'Atlante Lessicale Toscano (conosciuta come DBT-ALT) in una rete ipertestuale con modalità e funzionalità di accesso differenziate in relazione alle diverse classi di utenza; a questo aspetto, è legata l'altra interpretazione dell'acronimo ALT-Web, ovvero quella di "ALT come rete". L'articolo illustra aspetti del processo di progettazione e realizzazione dell'opera che rivestono un qualche interesse per il linguista e il dialettologo. In particolare, dopo un breve excursus che riepiloga le caratteristiche principali della risorsa di partenza, l'articolo illustra la progettazione e realizzazione di ALT-Web, partendo dall'analisi dei requisiti e la definizione delle caratteristiche generali per arrivare ad aspetti più specifici che riguardano le modalità di accesso ai materiali e la normalizzazione dei materiali dialettali in trascrizione fonetica},
KEYWORDS = {Dialettologia Computazionale, Risorse dialettali in rete, Atlante lessicale},
PAGES = {209-241},
URL = {https://iris.cnr.it/handle/20.500.14243/65042},
PUBLISHER = {Antenore (Roma, ITA)},
ISBN = {88-8455-606-6},
CONFERENCE_NAME = {Lessicografia Dialettale. Ricordando Paolo Zolli. Atti del Convegno di Studi},
CONFERENCE_PLACE = {Venezia},
BOOKTITLE = {Lessicografia dialettale: ricordando Paolo Zolli-Atti del convegno di studi, Venezia, 9-11 dicembre 2004},
EDITOR = {Bruni, F. and Marcato, C.},
}
@INPROCEEDINGS{PARDELLI_2006_INPROCEEDINGS_PSGO_65025,
AUTHOR = {Pardelli, G. and Sassi, M. and Goggi, S. and Orsolini, P.},
TITLE = {Natural Language Processing: A Terminological and Statistical Approach},
YEAR = {2006},
ABSTRACT = {The aim of this article is to provide a statistical representation of significant terms used in the field of Natural Language Processing from the 1960s till nowadays, in order to draft a survey on the most significant research trends in that period. By retrieving these keywords it should be possible to highlight the ebb and flow of some thematic topics. The NLP terminological sample derives from a database created for this purpose using the DBT software (Textual Data Base, ILC patent)},
KEYWORDS = {Natural Language Processing, Terminology},
PAGES = {2395-2398},
URL = {https://iris.cnr.it/handle/20.500.14243/65025},
PUBLISHER = {European Language Resources Association (ELRA)-Evaluations and Language resources Distribution Agency (ELDA) (Paris, FRA)},
ISBN = {2-9517408-2-4},
CONFERENCE_NAME = {LREC 2006: 5th International Conference on Language Resources and Evaluation},
CONFERENCE_PLACE = {Genoa},
}
@INPROCEEDINGS{ROVENTINI_2006_INPROCEEDINGS_R_65026,
AUTHOR = {Roventini, A.},
TITLE = {Linking Verbal Entries of Different Lexical Resources},
YEAR = {2006},
URL = {https://iris.cnr.it/handle/20.500.14243/65026},
CONFERENCE_NAME = {LREC 2006: 5th International Conference on Language Resources and Evaluation},
}
@INPROCEEDINGS{ROVENTINI_2006_INPROCEEDINGS_RR_65041,
AUTHOR = {Roventini, A. and Ruimy, N.},
TITLE = {Linking and harmonizing different lexical resources: a comparison of verbal entries},
YEAR = {2006},
URL = {https://iris.cnr.it/handle/20.500.14243/65041},
CONFERENCE_NAME = {GWC 2006},
}
@INPROCEEDINGS{RUIMY_2006_INPROCEEDINGS_R_65028,
AUTHOR = {Ruimy, N.},
TITLE = {Structuring a Domain Vocabulary in a General Knowledge Environment},
YEAR = {2006},
ABSTRACT = {The study which is reported here aims at investigating the extent to which the conceptual and representational tools provided by a lexical model designed for the semantic representation of general language may suit the requirements of knowledge modelling in a domain-specific perspective. A general linguistic ontology and a set of semantic links, which allow classifying, describing and interconnecting word senses, play a central role in structuring and representing such knowledge. The health and medicine vocabulary has been taken as a case study for this investigation},
KEYWORDS = {Lexical resource, ontology, semantic relations, semantic network, domain specific knowledge},
PAGES = {2407-2411},
URL = {https://iris.cnr.it/handle/20.500.14243/65028},
PUBLISHER = {European Language Resources Association (ELRA)-Evaluations and Language resources Distribution Agency (ELDA) (Paris, FRA)},
ISBN = {2-9517408-2-4},
CONFERENCE_NAME = {LREC 2006: 5th International Conference on Language Resources and Evaluation},
CONFERENCE_PLACE = {Genoa},
}
@INPROCEEDINGS{RUIMY_2006_INPROCEEDINGS_R_65027,
AUTHOR = {Ruimy, N.},
TITLE = {Merging two Ontology-based Lexical Resources},
YEAR = {2006},
ABSTRACT = {ItalWordNet (IWN) and PAROLE/SIMPLE/CLIPS (PSC), the two largest electronic, general-purpose lexical resources of Italian language present many compatible aspects although they are based on two different lexical models having their own underlying principles and peculiarities. Such compatibility prompted us to study the feasibility of semi-automatically linking and eventually merging the two lexicons. To this purpose, the mapping of the ontologies on which basis both lexicons are structured was performed and the sets of semantic relations enabling to relate lexical units were compared. An overview of this preliminary phase is provided in this paper. The linking methodology and related problematic issues are described. Beyond the advantage for the end user to dispose of a more exhaustive and in-depth lexical information combining the potentialities and most outstanding features offered by the two lexical models, resulting benefits and enhancements for the two resources are illustrated that definitely legitimize the soundness of this linking and merging initiative},
KEYWORDS = {Lexical resource, semantic information, ontology mapping, linking},
PAGES = {1716-1721},
URL = {https://iris.cnr.it/handle/20.500.14243/65027},
PUBLISHER = {European Language Resources Association (ELRA)-Evaluations and Language resources Distribution Agency (ELDA) (Paris, FRA)},
ISBN = {2-9517408-2-4},
CONFERENCE_NAME = {LREC 2006: 5th International Conference on Language Resources and Evaluation},
CONFERENCE_PLACE = {Genoa},
}
@INPROCEEDINGS{SASSI_2006_INPROCEEDINGS_S_65045,
AUTHOR = {Sassi, M.},
TITLE = {Martí y Carpentier, voces de la América},
YEAR = {2006},
URL = {https://iris.cnr.it/handle/20.500.14243/65045},
CONFERENCE_NAME = {XXVIII Convegno Internazionale di Americanistica},
}
@INPROCEEDINGS{SORIA_2006_INPROCEEDINGS_STBCMM_144244,
AUTHOR = {Soria, C. and Tesconi, M. and Bertagna, F. and Calzolari, N. and Marchetti, A. and Monachini, M.},
TITLE = {Moving to dynamic computational lexicons with LeXFlow},
YEAR = {2006},
ABSTRACT = {LeXFlow is a framework for semi-automatic integration of lexicons, already expressed in standardized format. LeXFlow is intended as a tool for, on the one hand, paving the way to the development of dynamic multi-source lexicons; and on the other, for fostering the adoption of standards. Borrowing from techniques used in the domain of document workflows, we model the activity of lexicon management as a particular case of workflow instance, where lexical entries move across agents and become dynamically updated. To this end, we have designed a lexical flow (LF) corresponding to the scenario where an entry of a lexicon A becomes enriched via basically two steps. First, by virtue of being mapped onto a corresponding entry belonging to a lexicon B, the entry(LA) inherits the semantic relations available in B. Second, by resorting to an automatic application that acquires information about semantic relations from corpora, the relations acquired are integrated into the entry and proposed to the human encoder. As a result of the lexical flow, in addition, for each starting lexical entry(LA) mapped onto a corresponding entry(LB) the flow produces a new entry representing the merging of the original two entries},
KEYWORDS = {computational lexicons, collaborative authoring},
PAGES = {12},
URL = {https://iris.cnr.it/handle/20.500.14243/144244},
ISBN = {2-9517408-2-4},
CONFERENCE_NAME = {LREC 2006: 5th International Conference on Language Resources and Evaluation},
}
@INPROCEEDINGS{TESCONI_2006_INPROCEEDINGS_TMBMHCS_151954,
AUTHOR = {Tesconi, M. and Marchetti, A. and Bertagna, F. and Monachini, M. and Huang, C. and Calzolari, N. and Soria, C.},
TITLE = {Towards agent-based cross-lingual interoperability of distributed lexical resources},
YEAR = {2006},
ABSTRACT = {In this paper we present an application fostering the integration and interoperability of computational lexicons, focusing on the particular case of mutual linking and cross-lingual enrichment of two wordnets, ItalWordNet and Sinica-BOW lexicons. This is intended as a case-study investigating the needs and requirements of semi-automatic integration and interoperability of lexical resources},
KEYWORDS = {wordnet, multilingual computational lexicons, collaborative authoring},
PAGES = {17-24},
URL = {https://iris.cnr.it/handle/20.500.14243/151954},
ISBN = {1-932432-69-8},
CONFERENCE_NAME = {ACL Workshop on Multilingual Lexical Resources and Interoperability},
BOOKTITLE = {Proceedings of the Workshop on Multilingual Language Resources and Interoperability},
}
@INPROCEEDINGS{TESCONI_2006_INPROCEEDINGS_TMBMSC_75853,
AUTHOR = {Tesconi, M. and Marchetti, A. and Bertagna, F. and Monachini, M. and Soria, C. and Calzolari, N.},
TITLE = {LeXFlow: a system for cross-fertilization of computational lexicons},
YEAR = {2006},
ABSTRACT = {This demo presents LeXFlow, a workflow management system for cross-fertilization of computational lexicons. Borrowing from techniques used in the domain of document workflows, we model the activity of lexicon management as a set of workflow types, where lexical entries move across agents in the process of being dynamically updated. A prototype of LeXFlow has been implemented with extensive use of XML technologies (XSLT, XPath, XForms, SVG) and open-source tools (Cocoon, Tomcat, MySQL). LeXFlow is a web-based application that enables the cooperative and distributed management of computational lexicons},
KEYWORDS = {computational lexicons, collaborative authoring},
URL = {https://iris.cnr.it/handle/20.500.14243/75853},
DOI = {10.3115/1225403.1225406},
CONFERENCE_NAME = {COLING-ACL '06 Proceedings of the COLING/ACL on Interactive presentation sessions},
}
@INPROCEEDINGS{TESCONI_2006_INPROCEEDINGS_TMBMSC_65039,
AUTHOR = {Tesconi, M. and Marchetti, A. and Bertagna, F. and Monachini, M. and Soria, C. and Calzolari, N.},
TITLE = {LeXFlow: a framework for cross-fertilization of computational lexicons},
YEAR = {2006},
ABSTRACT = {This demo presents LeXFlow, a workflow management system for cross-fertilization of computational lexicons. Borrowing from techniques used in the domain of document workflows, we model the activity of lexicon management as a set of workflow types, where lexical entries move across agents in the process of being dynamically updated. A prototype of LeXFlow has been implemented with extensive use of XML technologies (XSLT, XPath, XForms, SVG) and open-source tools (Cocoon, Tomcat, MySQL). LeXFlow is a web-based application that enables the cooperative and distributed management of computational lexicons},
PAGES = {9-12},
URL = {https://iris.cnr.it/handle/20.500.14243/65039},
ISBN = {1-932432-69-8},
CONFERENCE_NAME = {COLING/ACL 2006},
BOOKTITLE = {Proceedings of the COLING/ACL 2006 Interactive Presentation Sessions},
}
@INPROCEEDINGS{TOKUNAGA_2006_INPROCEEDINGS_TSCCMSHPXYK_65040,
AUTHOR = {Tokunaga, T. and Sornlertlamvanich, V. and Charoenporn, T. and Calzolari, N. and Monachini, M. and Soria, C. and Huang, C. and Prevot, L. and Xia, Y. and Yu, H. and Shirai, K.},
TITLE = {Infrastructure for standardization of Asian language resources},
YEAR = {2006},
ABSTRACT = {As an area of great linguistic and cultural diversity, Asian language resources have received much less attention than their western counterparts. Creating a common standard for Asian language resources that is compatible with an international standard has at least three strong advantages: to increase the competitive edge of Asian countries, to bring Asian countries closer to their western counterparts, and to bring more cohesion among Asian countries. To achieve this goal, we have launched a two year project to create a common standard for Asian language resources. The project is comprised of four research items, (1) building a description framework of lexical entries, (2) building sample lexicons, (3) building an upper-layer ontology and (4) evaluating the proposed framework through an application. This paper outlines the project in terms of its aim and approach},
PAGES = {827-834},
URL = {https://iris.cnr.it/handle/20.500.14243/65040},
ISBN = {1-932432-69-8},
CONFERENCE_NAME = {COLING/ACL 2006},
BOOKTITLE = {Proceedings of the COLING/ACL 2006 Main Conference Poster Sessions},
}
@INPROCEEDINGS{TURRINI_2006_INPROCEEDINGS_TBP_65029,
AUTHOR = {Turrini, G. and Baroni, P. and Paccosi, A.},
TITLE = {AddizionarioPLUS: uno strumento interattivo per l'educazione interculturale},
YEAR = {2006},
ABSTRACT = {Il lavoro descrive AddizionarioPLUS, versione rinnovata e ampliata di Addizionario, software per lo sviluppo linguistico e cognitivo dei bambini della scuola primaria. I principali cambiamenti introdotti nella nuova versione riguardano a) l'interfaccia grafica, b) il linguaggio di programmazione utilizzato, c) una nuova architettura che renderà possibili attività collaborative, d) un modulo destinato al maestro, e) l'ampliamento del numero e della tipologia degli esercizi, f) la realizzazione di un ricco apparato di aiuti in linea. L'implementazione del prototipo di AddizionarioPLUS, ormai in fase avanzata, procede, come già fu per Addizionario, in stretto contatto con bambini e insegnanti},
KEYWORDS = {strumenti multimediali interattivi, sviluppo linguistico e cognitivo, educazione interculturale},
PAGES = {483-488},
URL = {https://iris.cnr.it/handle/20.500.14243/65029},
CONFERENCE_NAME = {Didamatica 2006},
}
@INPROCEEDINGS{BARTOLINI_2006_INPROCEEDINGS_BGMMABSNBB_65046,
AUTHOR = {Bartolini, R. and Giovannetti, E. and Marchi, S. and Montemagni, S. and Andreatta, C. and Brunelli, R. and Stecher, R. and Niederée, C. and Bouquet, P. and Bortoli, S.},
TITLE = {Ontology Learning in Multimedia Information Extraction from Product Catalogues},
YEAR = {2006},
ABSTRACT = {We propose a methodology for extracting multimedia information from product catalogues empowered by the synergetic use and extension of a domain ontology. The use of domain ontologies in this context additionally opens up innovative ways of catalogue use. The method is characterized by incrementally feeding and exploiting the ontology during an information extraction process, implemented by the semantic annotation of the analysed document, and by providing support for detecting existing similar ontologies to enable reuse of (parts of) them},
KEYWORDS = {knowledge-driven multimedia analysis, ontology learning, semi-automatic content annotation tools},
URL = {https://iris.cnr.it/handle/20.500.14243/65046},
CONFERENCE_NAME = {BOEMIE 2006},
}
@TECHREPORT{CALZOLARI_2006_TECHREPORT_C_195918,
AUTHOR = {Calzolari, N.},
TITLE = {Language Technologies (LT)},
YEAR = {2006},
URL = {https://iris.cnr.it/handle/20.500.14243/195918},
}
@TECHREPORT{CIGNONI_2006_TECHREPORT_C_195920,
AUTHOR = {Cignoni, L.},
TITLE = {Regole Editoriali},
YEAR = {2006},
URL = {https://iris.cnr.it/handle/20.500.14243/195920},
}
@TECHREPORT{CIGNONI_2006_TECHREPORT_C_195919,
AUTHOR = {Cignoni, L.},
TITLE = {Filastrocche in inglese per la scuola materna ed elementare},
YEAR = {2006},
URL = {https://iris.cnr.it/handle/20.500.14243/195919},
}
@TECHREPORT{MARINELLI_2006_TECHREPORT_M_195921,
AUTHOR = {Marinelli, R.},
TITLE = {La terminologia Marittima-un database semantico-lessicale},
YEAR = {2006},
URL = {https://iris.cnr.it/handle/20.500.14243/195921},
}
@TECHREPORT{MONACHINI_2006_TECHREPORT_MSCFB_195922,
AUTHOR = {Monachini, M. and Soria, C. and Calzolari, N. and Francopoulo, G. and Bel, N.},
TITLE = {WD of Lexica standard for CD ballot},
YEAR = {2006},
URL = {https://iris.cnr.it/handle/20.500.14243/195922},
}
@TECHREPORT{QUOCHI_2006_TECHREPORT_QMCDS_195923,
AUTHOR = {Quochi, V. and Monachini, M. and Calzolari, N. and Del Gratta, R. and Sassolini, E.},
TITLE = {Bio-Lexicon Model and Preliminary ISO Conformant Data Categories},
YEAR = {2006},
URL = {https://iris.cnr.it/handle/20.500.14243/195923},
}
@TECHREPORT{RUIMY_2006_TECHREPORT_RMC_195924,
AUTHOR = {Ruimy, N. and Monachini, M. and Calzolari, N.},
TITLE = {Lessico Computazionale Multilivello dell'Italiano PAROLE-SIMPLE-CLIPS},
YEAR = {2006},
URL = {https://iris.cnr.it/handle/20.500.14243/195924},
}
@TECHREPORT{SABA_2006_TECHREPORT_S_195926,
AUTHOR = {Saba, A.},
TITLE = {Il lessico del Tractado de la Sphera de Iohannes de Sacrobusto},
YEAR = {2006},
URL = {https://iris.cnr.it/handle/20.500.14243/195926},
}
@TECHREPORT{SABA_2006_TECHREPORT_S_195927,
AUTHOR = {Saba, A.},
TITLE = {Il lessico del Arte de marear de Juan de Moya. Ed. 1564},
YEAR = {2006},
URL = {https://iris.cnr.it/handle/20.500.14243/195927},
}
@TECHREPORT{SASSI_2006_TECHREPORT_SC_195925,
AUTHOR = {Sassi, M. and Cinini, A.},
TITLE = {Content-analysis dei provvedimenti della sezione disciplinare del C. S. M},
YEAR = {2006},
URL = {https://iris.cnr.it/handle/20.500.14243/195925},
}
@MISC{AIELLO_2006_MISC_AC_4973,
AUTHOR = {Aiello, M. and Chiarella, D.},
TITLE = {Worm Poacher},
YEAR = {2006},
URL = {https://iris.cnr.it/handle/20.500.14243/4973},
}
@MISC{BARBERA_2006_MISC_BD_384181,
AUTHOR = {Barbera, M. and Di Donato, F.},
TITLE = {HyperJournal HowTo (versione italiana). HyperJournal 0.4: guida per principianti},
YEAR = {2006},
ABSTRACT = {Manuale del software HyperJournal (in italiano)},
URL = {https://iris.cnr.it/handle/20.500.14243/384181},
}
@MISC{BARBERA_2006_MISC_BDDPT_384183,
AUTHOR = {Barbera, M. and Di Donato, F. and D'Ercole, N. and Pirro, P. and Tolu, A.},
TITLE = {HyperJournal},
YEAR = {2006},
ABSTRACT = {HyperJournal (2005-2006) è un software per creare e gestire riviste digitali e ad accesso aperto},
URL = {https://iris.cnr.it/handle/20.500.14243/384183},
}
@MISC{BARTOLINI_2006_MISC_BDLMMP_192748,
AUTHOR = {Bartolini, R. and Dell'Orletta, F. and Lenci, A. and Marchi, S. and Montemagni, S. and Pirrelli, V.},
TITLE = {Text-to-Knowledge (T2K) Versione 2},
YEAR = {2006},
ABSTRACT = {Versione 2. Text-to-Knowledge (T2K) è una piattaforma software di supporto avanzato alla gestione documentale per la creazione dinamica di repertori terminologici e ontologie di dominio a partire da testi e per l'indicizzazione concettuale di documenti. Il sistema T2K si propone di offrire una batteria integrata di strumenti avanzati di analisi linguistica del testo, analisi statistica e apprendimento automatico del linguaggio, destinati a offrire una rappresentazione accurata del contenuto di una base documentale non strutturata, per scopi di indicizzazione avanzata e navigazione intelligente. I risultati di questo processo di acquisizione sono annotati in forma di metadati XML, offrendo in tal modo la prospettiva di una sempre crescente e diretta interoperabilità con sistemi automatici per la produzione di contenuti digitali selezionati e strutturati dinamicamente su misura, per diversi profili di utenza. Versioni prototipali di T2K sono già operative su alcuni portali della pubblica amministrazione e sono state applicate per l'indicizzazione di contenuti didattici multimediali. E' in corso l'integrazione della tecnologia T2K nel sistema di gestione informatica di documentazione scientifica del CNR},
KEYWORDS = {text to knowledge, nlp, estrazione terminologica, ontology learning, indicizzazione terminologica},
URL = {https://iris.cnr.it/handle/20.500.14243/192748},
}
@MISC{BINDI_2006_MISC_B_192743,
AUTHOR = {Bindi, R.},
TITLE = {CLIC},
YEAR = {2006},
URL = {https://iris.cnr.it/handle/20.500.14243/192743},
}
@MISC{BINDI_2006_MISC_BMBGPR_457835,
AUTHOR = {Bindi, R. and Marinelli, R. and Biagini, L. and Goggi, S. and Picchi, E. and Rossi, S.},
TITLE = {LE-PAROLE, Italian Corpus Description, Part Available for Distribution},
YEAR = {2006},
}
@MISC{CAPPELLI_2006_MISC_CBRPNAPF_192742,
AUTHOR = {Cappelli, G. and Bozzi, A. and Ruffolo, P. and Passarotti, M. and Nascimento, A. and Alberto, P. and Pena, A. and Frade, S.},
TITLE = {LECTIO (Latim em Exercício Contínuo através de Tecnologia Informática Orientada)},
YEAR = {2006},
URL = {https://iris.cnr.it/handle/20.500.14243/192742},
}
@MISC{CECCOTTI_2006_MISC_CS_192745,
AUTHOR = {Ceccotti, M. and Sassi, M.},
TITLE = {Dall'Archivio Elettronico delle Opere di Carlo Emilio Gadda. Studi e ricerche con strumenti computazionali dell'opera dell'ingegnere-scrittore},
YEAR = {2006},
URL = {https://iris.cnr.it/handle/20.500.14243/192745},
}
@MISC{DIDONATO_2006_MISC_D_406240,
AUTHOR = {Di Donato, F.},
TITLE = {Una scienza ad accesso libero: storia, filosofia e prospettive del movimento open access},
YEAR = {2006},
ABSTRACT = {Introduzione all'open access},
URL = {https://iris.cnr.it/handle/20.500.14243/406240},
}
@MISC{DIDONATO_2006_MISC_D_406239,
AUTHOR = {Di Donato, F.},
TITLE = {HyperJournal. Un software open source per l'Open Publishing},
YEAR = {2006},
ABSTRACT = {Presentazione di Hyperjournal},
URL = {https://iris.cnr.it/handle/20.500.14243/406239},
}
@MISC{DIDONATO_2006_MISC_D_406241,
AUTHOR = {Di Donato, F.},
TITLE = {Dalla parte dei ricercatori: strumenti Open Access per la ricerca scientifica},
YEAR = {2006},
ABSTRACT = {Aim of this presentation is to show the benefits deriving from the use of open archives and open access journals for researchers' everyday work. A practical illustration will be given about using those tools (in particular the disciplinary archive E-LIS) showing their usefulness for the entire research process, considering both the point of view of the scholar as a reader and the perspective of the scholar as an author},
URL = {https://iris.cnr.it/handle/20.500.14243/406241},
}
@MISC{DIDONATO_2006_MISC_D_384179,
AUTHOR = {Di Donato, F.},
TITLE = {Kant I., Risposta alla domanda: che cos'è l'illuminismo?},
YEAR = {2006},
ABSTRACT = {Traduzione dall'originale tedesco},
URL = {https://iris.cnr.it/handle/20.500.14243/384179},
ISSN = {1591-4305},
}
@MISC{DIDONATO_2006_MISC_D_406242,
AUTHOR = {Di Donato, F.},
TITLE = {L'esperienza degli umanisti. HyperJournal e il modello Open Access},
YEAR = {2006},
ABSTRACT = {A presentation on HyperJournal (an open source software for open access publishing) and on the Bollettino Telematico di Filosofia Politica, an on-line journal on Political Philosophy},
URL = {https://iris.cnr.it/handle/20.500.14243/406242},
}
@MISC{FABRI_2006_MISC_FCC_97505,
AUTHOR = {Fabri, M. and Cavallini, D. and Cinini, A.},
TITLE = {Il progetto di banca dati informatizzata delle sentenze della sezione disciplinare del CSM},
YEAR = {2006},
URL = {https://iris.cnr.it/handle/20.500.14243/97505},
CONFERENCE_NAME = {Presentazione del programma di informatizzazione realizzato in ambito IRSIG-CNR, ILC-CNR, CESROG-Università di Bologna},
}
@MISC{GUADAGNINI_2006_MISC_G_265600,
AUTHOR = {Guadagnini, E.},
TITLE = {Sordello, Per re no·m puesc d'amor cuydar (BdT 437.23)},
YEAR = {2006},
URL = {http://www.rialto.unina.it/Sordel/437.23(Boni).htm},
ISSN = {1973-381X},
}
@MISC{GUADAGNINI_2006_MISC_G_265611,
AUTHOR = {Guadagnini, E.},
TITLE = {Sordello, Si co·l malaus qe no se sap gardar (BdT 437.31)},
YEAR = {2006},
URL = {http://www.rialto.unina.it/Sordel/437.31(Boni).htm},
ISSN = {1973-381X},
}
@MISC{GUADAGNINI_2006_MISC_G_265599,
AUTHOR = {Guadagnini, E.},
TITLE = {Sordello, Non pueis mudar, qan luecs es (BdT 437.21)},
YEAR = {2006},
URL = {http://www.rialto.unina.it/Sordel/437.21(Asperti).htm},
ISSN = {1973-381X},
}
@MISC{GUADAGNINI_2006_MISC_G_265612,
AUTHOR = {Guadagnini, E.},
TITLE = {Sordello, Tant m'abellis lo terminis novels (BdT 437.35)},
YEAR = {2006},
URL = {http://www.rialto.unina.it/Sordel/437.35(Boni).htm},
ISSN = {1973-381X},
}
@MISC{GUADAGNINI_2006_MISC_G_265613,
AUTHOR = {Guadagnini, E.},
TITLE = {Sordello, Tos temps serai ves amor (BdT 437.36)},
YEAR = {2006},
URL = {http://www.rialto.unina.it/Sordel/437.36(Boni).htm},
ISSN = {1973-381X},
}
@MISC{GUADAGNINI_2006_MISC_G_265603,
AUTHOR = {Guadagnini, E.},
TITLE = {Sordello, Puois no·m tenc per pajat d'amor (BdT 437.25)},
YEAR = {2006},
URL = {http://www.rialto.unina.it/Sordel/437.25(Boni).htm},
ISSN = {1973-381X},
}
@MISC{GUADAGNINI_2006_MISC_G_265605,
AUTHOR = {Guadagnini, E.},
TITLE = {Sordello, Puois trobat ai qi conois et enten (BdT 437.26)},
YEAR = {2006},
URL = {http://www.rialto.unina.it/Sordel/437.26(Boni).htm},
ISSN = {1973-381X},
}
@MISC{GUADAGNINI_2006_MISC_G_265624,
AUTHOR = {Guadagnini, E.},
TITLE = {Peire Cardenal, Ar mi puesc yeu lauzar d'amor (BdT 335.7)},
YEAR = {2006},
URL = {http://www.rialto.unina.it/PCard/335.7(Vatteroni).htm},
ISSN = {1973-381X},
}
@MISC{GUADAGNINI_2006_MISC_G_265601,
AUTHOR = {Guadagnini, E.},
TITLE = {Sordello, Planher vuelh en Blacatz en aquest leugier so (BdT 437.24)},
YEAR = {2006},
URL = {http://www.rialto.unina.it/Sordel/437.24(Boni).htm},
ISSN = {1973-381X},
}
@MISC{GUADAGNINI_2006_MISC_G_265607,
AUTHOR = {Guadagnini, E.},
TITLE = {Sordello, Qan plus creis, dompna,·l desiriers (BdT 437.27)},
YEAR = {2006},
URL = {http://www.rialto.unina.it/Sordel/437.27(Boni).htm},
ISSN = {1973-381X},
}
@MISC{GUADAGNINI_2006_MISC_G_265608,
AUTHOR = {Guadagnini, E.},
TITLE = {Sordello, Qui be·is membra del segle qu'es passatz (BdT 437.29)},
YEAR = {2006},
URL = {http://www.rialto.unina.it/Sordel/437.29(Boni).htm},
ISSN = {1973-381X},
}
@MISC{MARCHI_2006_MISC_ME_458598,
AUTHOR = {Marchi, S. and Emiliano, G.},
TITLE = {The Product catalogues Terminology Processor (PTP) and the Product catalogue Italian Semantic Annotator (PISA) for the VIKE-framework},
YEAR = {2006},
ABSTRACT = {Moduli software sviluppati in seno al progetto VIKEF},
URL = {https://iris.cnr.it/handle/20.500.14243/458598},
}
@MISC{MARINELLI_2006_MISC_M_106741,
AUTHOR = {Marinelli, R.},
TITLE = {Proposta di contributo da parte dell'ILC alla REI (Rete di eccellenza dell'italiano istituzionale) con un database di terminologia marittima},
YEAR = {2006},
URL = {https://iris.cnr.it/handle/20.500.14243/106741},
CONFERENCE_NAME = {Secondo incontro della Rete di eccellenza dell'italiano istituzionale},
}
@MISC{MARINELLI_2006_MISC_MS_464693,
AUTHOR = {Marinelli, R. and Spadoni, G.},
TITLE = {MARITERM Database di terminologia marittima},
YEAR = {2006},
URL = {https://iris.cnr.it/handle/20.500.14243/464693},
}
@MISC{MONTEMAGNI_2006_MISC_M_464692,
AUTHOR = {Montemagni, S.},
TITLE = {La Treebank Sintattico Semantica dell'Italiano del progetto SI-TAL},
YEAR = {2006},
URL = {https://iris.cnr.it/handle/20.500.14243/464692},
}
@MISC{PICCHI_2006_MISC_PMSCP_192744,
AUTHOR = {Picchi, E. and Montemagni, S. and Sassolini, E. and Cucurullo, S. and Paoli, M.},
TITLE = {ALTWEB},
YEAR = {2006},
URL = {https://iris.cnr.it/handle/20.500.14243/192744},
}
@MISC{PICCHI_2006_MISC_PSCSC_192747,
AUTHOR = {Picchi, E. and Sassi, M. and Ceccotti, M. L. and Sassolini, E. and Cucurullo, S.},
TITLE = {Linguistic Miner},
YEAR = {2006},
URL = {https://iris.cnr.it/handle/20.500.14243/192747},
}
@MISC{PIRRELLI_2006_MISC_P_106730,
AUTHOR = {Pirrelli, V.},
TITLE = {Parlare per sapere: la lingua come accesso alla conoscenza},
YEAR = {2006},
URL = {https://iris.cnr.it/handle/20.500.14243/106730},
CONFERENCE_NAME = {Conferenza TAL 2006: Uomini e macchine, un colloquio possibile},
}
@MISC{PIRRELLI_2006_MISC_PLM_435674,
AUTHOR = {Pirrelli, V. and Lenci, A. and Montemagni, S.},
TITLE = {Probing the space of grammatical variation: induction of cross-lingual grammatical constraints from treebanks},
YEAR = {2006},
URL = {https://iris.cnr.it/handle/20.500.14243/435674},
CONFERENCE_NAME = {Language resources and language research: typology, second language acquisition, English Linguistics},
}
@MISC{ROVENTINI_2006_MISC_RABCM_192746,
AUTHOR = {Roventini, A. and Alonge, A. and Bertagna, F. and Calzolari, N. and Marinelli, R.},
TITLE = {ItalWordNet database semantico-lessicale dell'italiano},
YEAR = {2006},
URL = {https://iris.cnr.it/handle/20.500.14243/192746},
}
@MISC{RUIMY_2006_MISC_R_435669,
AUTHOR = {Ruimy, N.},
TITLE = {Il modello lessicale SIMPLE: dal monolingue al bilingue},
YEAR = {2006},
ABSTRACT = {Il modello lessicale PAROLE-SIMPLE ha permesso la realizzazione di lessici elettronici multilivelli armonizzati per le 12 lingue della CE. Successivamente, nell'ambito del progetto nazionale italiano 'Corpora e Lessici dell'Italiano Parlato e Scritto', è stato sviluppato il lessico CLIPS utilizzando sia il modello che i dati del lessico italiano PAROLE-SIMPLE. CLIPS, la cui costruzione si è appena conclusa, rappresenta attualmente la più vasta risorsa lessicale elettronica dell'italiano. E' adesso allo studio un progetto di utilizzo di questo lessico come input per la creazione di una risorsa lessicale elettronica bilingue italiano-francese. Due scenari alternativi sono al momento in corso di valutazione: 1) il collegamento semi-automatizzato di due lessici elettronici monolingui basati sullo stesso modello, i. e. CLIPS ed il lessico francese PAROLE-SIMPLE; 2) la derivazione di un database lessicale bilingue a partire dal lessico CLIPS e da coppie di sensi corrispondenti IT-FR estratti da un dizionario bilingue. Questa seconda ipotesi si basa sulla ricerca di correlazioni tra l'informazione fornita dagli indicatori di senso nelle entrate bilingui e i vari elementi descrittivi contenuti nel lessico CLIPS},
PAGES = {279-290},
URL = {https://iris.cnr.it/handle/20.500.14243/435669},
ISBN = {84-935340-4-8},
CONFERENCE_NAME = {Tercero Seminario de la Escuela Interlatina de Altos Estudios en Lingüística Aplicada},
}
@ARTICLE{CALZOLARI_2005_ARTICLE_CE_150883,
AUTHOR = {Calzolari, N. and Ide, N.},
TITLE = {Language Resources and Evaluation},
YEAR = {2005},
URL = {https://iris.cnr.it/handle/20.500.14243/150883},
ISSN = {0010-4817},
JOURNAL = {COMPUTERS AND THE HUMANITIES},
}
@ARTICLE{DIDONATO_2005_ARTICLE_D_384168,
AUTHOR = {Di Donato, F.},
TITLE = {I media telematici come strumento per la comunicazione scientifica},
YEAR = {2005},
ABSTRACT = {Che cosa sono i media telematici? In che misura sono e possono diventare strumenti per lo studio universitario e la ricerca scientifica? Costruire una risposta a tali questioni necessita di alcune definizioni preliminari. Il termine telematica oggi ha assunto un significato particolare e suona un po' desueto, se usato per intendere ciò a cui ci riferiremo nelle pagine che seguono. Oggetto di questa analisi è infatti la produzione di informazione in formati digitali (tramite computer) e la condivisione del sapere attraverso la rete Internet e il World Wide Web. Il problema della comunicazione del sapere sarà dunque affrontato da un punto di vista filosofico e politico, considerando in che modo le tecnologie della parola agiscono sulla struttura del discorso scientifico a partire da un'introduzione teorica (dunque astratta, ma il meno possibile tecnica) e storica al computer, a Internet e al Web; ricostruiremo poi, brevemente, cosa si intende con "scienza", come vi si accede e come si produce all'interno dei limiti imposti dalle nuove tecnologie, esplorandone le possibilità-esplicite e solo accennate; per indicare, infine, alcuni strumenti utili alla pratica della ricerca scientifica in rete},
URL = {https://iris.cnr.it/handle/20.500.14243/384168},
ISSN = {1591-4305},
JOURNAL = {BOLLETTINO TELEMATICO DI FILOSOFIA POLITICA},
}
@ARTICLE{DIDONATO_2005_ARTICLE_D_384170,
AUTHOR = {Di Donato, F.},
TITLE = {I Greci tra oralità e scrittura},
YEAR = {2005},
ABSTRACT = {Un'introduzione al tema del passaggio dalle culture a oralità primaria a quelle basate sulla scritta nella Grecia antica},
URL = {https://iris.cnr.it/handle/20.500.14243/384170},
ISSN = {1591-4305},
JOURNAL = {BOLLETTINO TELEMATICO DI FILOSOFIA POLITICA},
}
@ARTICLE{DIDONATO_2005_ARTICLE_D_384163,
AUTHOR = {Di Donato, F.},
TITLE = {Conoscenza e pubblicità del sapere. Le condizioni della repubblica scientifica a partire dall'Architettonica della ragion pura di Kant},
YEAR = {2005},
ABSTRACT = {La prima Critica di Kant, pubblicata nel 1781 e rivista nel 1787, ha al centro il problema dell'esame delle possibilità e dei limiti della ragion pura, cioè della facoltà di conoscere a priori; per rispondere alla domanda "che cosa posso sapere?", essa indaga sui fondamenti, le condizioni e i limiti della conoscenza. Kant affronta, nell'ultimo quarto del Settecento, un tema fondamentale nella storia del pensiero filosofico, di cui si occupa, tra gli altri, già Platone nel Menone. Nel discorso del filosofo tedesco, tuttavia, i termini di confronto privilegiati sono i dogmatici (Leibniz e Wolff) e gli scettici (Hume), da cui la filosofia critica intende esplicitamente prendere le distanze. La metafisica tradizionale, divisa tra empirismo e razionalismo, è caduta in un abisso senza fondo: da una parte infatti, secondo Kant, il conoscere a posteriori, a partire cioè da fatti, non è mai universale e necessario ed è incapace di offrire un criterio discriminativo tra conoscenza e opinioni; dall'altra parte, però, non si può dedurre la realtà da meri princìpi e pertanto la ragione dogmatica è, inevitabilmente, dispotica. Per questo è necessario attuare una rivoluzione copernicana; per questo, inoltre, la repubblica della scienza dev'essere presupposta e, assieme, fondata sui princìpi della ragione. Le pagine che seguono sono un commento al terzo capitolo della Dottrina trascendentale del metodo, L'architettonica della ragion pura, e in particolare affrontano la lettura dell'Architettonica indagando sulle condizioni di possibilità del logos scientifico},
URL = {https://iris.cnr.it/handle/20.500.14243/384163},
ISSN = {1591-4305},
JOURNAL = {BOLLETTINO TELEMATICO DI FILOSOFIA POLITICA},
}
@ARTICLE{DIDONATO_2005_ARTICLE_D_384169,
AUTHOR = {Di Donato, F.},
TITLE = {Usare la rete per fare ricerca: esperienze open access alla facoltà di Scienze politiche di Pisa},
YEAR = {2005},
ABSTRACT = {Text of the presentation-about the journal 'Bollettino telematico di filosofia politica', HyperJournal software and disciplinary open archive "Giuliano Marini"-held at the workshop "Conoscenza e proprietà: problematiche ed esperienze a confronto sull'open access", Pisa University, 20/09/2005},
URL = {https://iris.cnr.it/handle/20.500.14243/384169},
ISSN = {1591-4305},
JOURNAL = {BOLLETTINO TELEMATICO DI FILOSOFIA POLITICA},
}
@ARTICLE{GUADAGNINI_2005_ARTICLE_G_272360,
AUTHOR = {Guadagnini, E.},
TITLE = {La crociata di Federico II e la «cerchia di Blacatz»},
YEAR = {2005},
ABSTRACT = {La crociata di Federico II e la «cerchia di Blacatz»},
KEYWORDS = {Provenzalistica, Storia medievale, Federico II},
PAGES = {309-331},
URL = {https://iris.cnr.it/handle/20.500.14243/272360},
VOLUME = {46},
ISSN = {0391-8467},
JOURNAL = {STUDI MEDIEVALI},
}
@ARTICLE{GUADAGNINI_2005_ARTICLE_G_75405,
AUTHOR = {Guadagnini, E.},
TITLE = {Scelta di voci del Tesoro della Lingua Italiana delle Origini (nona serie)},
YEAR = {2005},
ABSTRACT = {Voci disonestà s. f., disonestamente avv., disonestanza s. f., disonestare v., disonestezza s. f., disonestità s. f., disonesto agg. /avv. /s. m. del Tesoro della Lingua Italiana delle Origini (pp. 117-130)},
KEYWORDS = {Lessicografia italiana, Italiano antico},
PAGES = {13-176},
URL = {https://iris.cnr.it/handle/20.500.14243/75405},
VOLUME = {10},
ISSN = {1591-8254},
JOURNAL = {BOLLETTINO-OPERA DEL VOCABOLARIO ITALIANO},
}
@ARTICLE{LENCI_2005_ARTICLE_LMP_433719,
AUTHOR = {Lenci, A. and Montemagni, S. and Pirrelli, V.},
TITLE = {Acquiring and Representing Meaning: Theoretical and Computational Perspectives},
YEAR = {2005},
PAGES = {19-66},
URL = {https://iris.cnr.it/handle/20.500.14243/433719},
VOLUME = {22-23},
}
@ARTICLE{MONACHINI_2005_ARTICLE_MS_37694,
AUTHOR = {Monachini, M. and Soria, C.},
TITLE = {Building Multilingual Terminological Lexicons for Less Widely Available Languages},
YEAR = {2005},
ABSTRACT = {Availability of Linguistic Resources for the development of Human Language Technology applications is nowadays recognized as a critical issue with both political and economic impact and implications on the sphere of cultural identity. This paper reports about the experience gained during the INTERA European project for the production of multilingual terminological lexicons for less widely available languages, i. e. those languages that suffer from poor representation over the net and from scarce computational resources, but yet are requested by the market. It discusses the procedure followed within the project, focuses on the problems faced which had an impact on the initial goals, presents the necessary modifications that resulted from these problems, evaluates the market needs as attested by various surveys, and describes the methodology that is proposed for the efficient production of Multilingual Terminological Lexicons},
PAGES = {251-261},
URL = {https://iris.cnr.it/handle/20.500.14243/37694},
VOLUME = {15},
ISSN = {1230-2384},
JOURNAL = {ARCHIVES OF CONTROL SCIENCES},
}
@ARTICLE{PAOLA_2005_ARTICLE_P_194933,
AUTHOR = {Paola, P. G.},
TITLE = {Bibliography of Antonio Zampolli (from 1962 to 2004)},
YEAR = {2005},
URL = {https://iris.cnr.it/handle/20.500.14243/194933},
ISSN = {1230-2384},
JOURNAL = {ARCHIVES OF CONTROL SCIENCES},
}
@BOOK{LENCI_2005_BOOK_LMP_134788,
AUTHOR = {Lenci, A. and Montemagni, S. and Pirrelli, V.},
TITLE = {Testo e computer-Elementi di linguistica computazionale},
YEAR = {2005},
ABSTRACT = {In che modo il computer può aiutarci a comprendere come funziona la nostra lingua? Cosa significa analizzare un testo con l'aiuto di un calcolatore? In che misura possiamo estendere le potenzialità del computer rendendolo capace di interagire con gli utenti umani nella loro lingua? Queste e altre domande sono l'oggetto di indagine della linguistica computazionale, una disciplina che ha al suo centro proprio il rapporto tra lingua e computer. Il libro fornisce gli elementi di base della linguistica computazionale partendo da un interesse primario per il testo, la sua struttura e il suo contenuto. Il volume propone una sintesi equilibrata e accessibile tra sapere e fare, nozioni di base e loro applicazione, ed è destinato in primo luogo agli studenti delle facoltà umanistiche e scientifiche interessati all'interazione tra scienze umane e informatica, ma anche agli studiosi che vogliano imparare a usare il computer come strumento di ricerca sul linguaggio},
KEYWORDS = {Linguistica Computazionale},
PAGES = {255},
URL = {https://iris.cnr.it/handle/20.500.14243/134788},
PUBLISHER = {Carocci (Roma, ITA)},
ISBN = {8843034251},
CONFERENCE_PLACE = {Roma},
}
@BOOK{LENCI_2005_BOOK_LMP_134787,
AUTHOR = {Lenci, A. and Montemagni, S. and Pirrelli, V.},
TITLE = {Acquiring and Representing Word Meaning: Computational perspectives},
YEAR = {2005},
URL = {https://iris.cnr.it/handle/20.500.14243/134787},
PUBLISHER = {Istituti Editoriali e Poligrafici Internazionali (Pisa-Roma, ITA)},
ISBN = {88-8147-413-1},
CONFERENCE_PLACE = {Pisa-Roma},
}
@INCOLLECTION{BERNDT_2005_INCOLLECTION_BBCT_134790,
AUTHOR = {Berndt, A. and Bianchi, F. and Cignoni, L. and Turrini, G.},
TITLE = {COME IN: Children On-line in Multimedia Environments and Intercultural Networks},
YEAR = {2005},
URL = {https://iris.cnr.it/handle/20.500.14243/134790},
PUBLISHER = {Wit Press (Southampton, GBR)},
CONFERENCE_PLACE = {Southampton},
}
@INCOLLECTION{QUOCHI_2005_INCOLLECTION_Q_134794,
AUTHOR = {Quochi, V.},
TITLE = {Issues on the acquisition of Italian complex nominals from text corpora: a computational approach combining syntactic and semantic information},
YEAR = {2005},
ABSTRACT = {The paper addressed the issue of Italian Complex Nominals from an (automatic) acquisition and representational perspective. Just like English noun compounds, ICNs blur the distinction between the syntactic and the lexical component because they are (at least) partially non-transparent but, nevertheless, show regularities both at the syntactic and at the semantic level. This contribution reports on an experiment conducted to identify the highest possible number of productive syntactic-semantic patterns of ICN formation, and to make explicit the particular semantic relation that exists between the head of the phrase and its modifier(s). I rely on a non-traditional generative theory of the lexicon, namely the Generative Lexicon, as a model for the representation/ interpretation of ICNs which provides us with a structured representation of the internal semantics of lexical items. The experiment explored the representational power of the qualia structure with respect to ICNs},
KEYWORDS = {complex nominals, multiword expressions, lexicon, lexical representation, generative lexicon},
PAGES = {153-174},
URL = {https://iris.cnr.it/handle/20.500.14243/134794},
PUBLISHER = {Edizioni Plus srl (Pisa, ITA)},
ISBN = {9788884922366},
CONFERENCE_PLACE = {Pisa},
BOOKTITLE = {Studies in the Semantics of Lexical Combinatory Patterns},
EDITOR = {Bertuccelli, M.},
}
@INCOLLECTION{ROVENTINI_2005_INCOLLECTION_RR_233145,
AUTHOR = {Roventini, A. and Ruimy, N.},
TITLE = {Linking and Harmonizing Different Lexical Resources: a Comparison of Verbal Entries in ItalWordNet and PAROLE-SIMPLE-CLIPS},
YEAR = {2005},
ABSTRACT = {During the last years, in the framework of Computational Linguistics, many lexical resources have been developed which aim at coding complex lexical semantic information according to different linguistic models (WordNet, Frame Semantics, Generative Lexicon, etc.). However, these resources are often not easily accessible nor available in their entirety. Yet, from the point of view of the continuous growth of the technology (Semantic Web), their visibility, availability, integration and harmonization are becoming of utmost importance. ItalWordNet and PAROLE/SIMPLE/CLIPS are two resources which, tackling lexical semantics from different perspectives and being at least partially complementary could profit from linking each other. In this paper we address the issue of linking these resources focusing on the most problematic part of the lexicon: the second order entities. In particular, after a brief description of the two resources, their different approaches to the verb semantics are described; an accurate comparison of a set of verbal entries is carried out, with a view to evaluating the possibilities and the advantages of a semiautomatic link; finally, the results and the future work are illustrated},
URL = {https://iris.cnr.it/handle/20.500.14243/233145},
ISBN = {978-80-210-3915-5},
}
@EDITORIAL{_2005_EDITORIAL__181022,
TITLE = {Acquisition and Representation of Word Meaning: Theoretical and computational perspectives},
YEAR = {2005},
URL = {https://iris.cnr.it/handle/20.500.14243/181022},
ISSN = {0392-6907},
ISBN = {88-8147-413-1},
}
@INPROCEEDINGS{BARBERA_2005_INPROCEEDINGS_BDTM_384165,
AUTHOR = {Barbera, M. and Di Donato, F. and Tummarello, G. and Morbidoni, C.},
TITLE = {HyperJournal, PHP scripting and Semantic Web technologies for Open Access},
YEAR = {2005},
ABSTRACT = {In this article we present an high level overview of the HyperJournal project, an effort to provide novel possibilities both in Scientific Publishing and in access to Scientific Contributions, according to the Open Access movement guidelines. All the work has been implemented using the PHP Web Script language and interfacing with Java modules such as Sesame and RDFGrowth. Such interfaces, here illustrated, are of general use for project with similar needs. While the HyperJournal project itself is in its infancy stage, a first release is already available for download and public use, thus representing one of the certainly not many real and deployable examples of Semantic Web applications},
URL = {https://iris.cnr.it/handle/20.500.14243/384165},
}
@INPROCEEDINGS{BARTOLINI_2005_INPROCEEDINGS_BGLMP_431279,
  AUTHOR          = {Bartolini, R. and Giorgetti, D. and Lenci, A. and Montemagni, S. and Pirrelli, V.},
  TITLE           = {Automatic Incremental Term Acquisition from Domain Corpora},
  YEAR            = {2005},
  ABSTRACT        = {We describe a technique for the acquisition of terms from Italian domain text corpora, which relies both on sophisticated linguistic analysis and on statistical measures applied to linguistically processed text rather than to raw text as it is usually the case. The main advantage of this technique is that minimal a priori knowledge of term structure is required, thus allowing to explore and discover terms in a given domain without imposing a strict pattern matching structure on them, and also to easily extend it to different domains. The approach we present in this paper is incremental as it may be iterated to discover terms of increasing complexity built on top of terms discovered in the previous iteration. The reason why it is convenient to adopt such an incremental approach is that it allows to "clean" data from noise in the first step, elicitating the constituent terms, and then to refine term acquisition on "skimmed" term data},
  PAGES           = {293--300},
  URL             = {https://iris.cnr.it/handle/20.500.14243/431279},
  CONFERENCE_NAME = {7th International conference on Terminology and Knowledge Engineering (TKE2005)},
  BOOKTITLE       = {Proceedings of TKE 2005-7th International Conference on Terminology and Knowledge Engineering},
}
@INPROCEEDINGS{BIAGIOLI_2005_INPROCEEDINGS_BFPMSS_155324,
  AUTHOR          = {Biagioli, C. and Francesconi, E. and Passerini, A. and Montemagni, S. and Soria, C.},
  TITLE           = {Automatic semantics extraction in law documents},
  YEAR            = {2005},
  URL             = {https://iris.cnr.it/handle/20.500.14243/155324},
  CONFERENCE_NAME = {Tenth International Conference on Artificial Intelligence and Law (ICAIL 2005)},
}
@INPROCEEDINGS{BIANCHI_2005_INPROCEEDINGS_BT_64215,
  AUTHOR          = {Bianchi, F. and Turrini, G.},
  TITLE           = {COME IN: un sito per l'insegnamento/apprendimento delle lingue straniere nella scuola primaria},
  YEAR            = {2005},
  URL             = {https://iris.cnr.it/handle/20.500.14243/64215},
  CONFERENCE_NAME = {Didamatica 2005},
}
@INPROCEEDINGS{CALZOLARI_2005_INPROCEEDINGS_C_64216,
  AUTHOR = {Calzolari, N.},
  TITLE  = {Antonio Zampolli-A life Computational Linguistics},
  YEAR   = {2005},
  URL    = {https://iris.cnr.it/handle/20.500.14243/64216},
}
@INPROCEEDINGS{CALZOLARI_2005_INPROCEEDINGS_C_77224,
  AUTHOR = {Calzolari, N.},
  TITLE  = {Language Resources and Content Interoperability. Technical, strategic and political issues for a new generation of Language Resources},
  YEAR   = {2005},
  URL    = {https://iris.cnr.it/handle/20.500.14243/77224},
}
@INPROCEEDINGS{CALZOLARI_2005_INPROCEEDINGS_CS_64217,
  AUTHOR          = {Calzolari, N. and Soria, C.},
  TITLE           = {A new paradigm for an Open Distributed Language Resource Infrastructure: the case of Computational Lexicons},
  YEAR            = {2005},
  URL             = {https://iris.cnr.it/handle/20.500.14243/64217},
  CONFERENCE_NAME = {Knowledge Collection from Volunteer Contributors. Papers from the 2005 AAAI Spring Symposium},
}
@INPROCEEDINGS{CAPPELLI_2005_INPROCEEDINGS_CGF_244999,
  AUTHOR   = {Cappelli, A. and Giovannetti, E. and Federico, M.},
  TITLE    = {The Role of Communication in Human-Robot Interaction},
  YEAR     = {2005},
  ABSTRACT = {This article focuses on the problem of Human-Robot Interaction (HRI) with particular emphasis on the problem of communication between humans and robots. In this perspective, we can talk about Human-Robot Communication (HRC) as a part of HRI. To allow a human and a so called "social robot" to work as partners, it is necessary to develop suitable spoken dialogue systems. In this work, after an overview about social robots, we will face the problem of Human-Robot Communication and the different possible dialogue management techniques},
  URL      = {https://iris.cnr.it/handle/20.500.14243/244999},
}
@INPROCEEDINGS{CASELLI_2005_INPROCEEDINGS_CP_64218,
  AUTHOR          = {Caselli, T. and Prodanof, I.},
  TITLE           = {A corpus-based model for bridging anaphora resolution in Italian},
  YEAR            = {2005},
  URL             = {https://iris.cnr.it/handle/20.500.14243/64218},
  CONFERENCE_NAME = {Conference RANLP 2005},
}
@INPROCEEDINGS{CUTUGNO_2005_INPROCEEDINGS_CMRR_144315,
  AUTHOR           = {Cutugno, P. and Marconi, L. and Ratti, D. and Rolando, C.},
  TITLE            = {Informaciones estadísticas en CALIS: Corpus y Archivo Léxical del Italiano Escrito},
  YEAR             = {2005},
  ABSTRACT         = {Informaciones estadísticas en CALIS: Corpus y Archivo Léxical del Italiano Escrito. CALIS es una base de datos de la lengua italiana escrita de 3.798.275 palabras y esta formada de textos escritos de varios generes pesados oportunamente y selecionados en tres distintos sectores: diaros, periodicos y libros. Este producto representa el italiano efectivamente leido mas bien que toda la lengua italiana escrita. Esta eleccion se justifica en cuanto se deseaba construir un corpus, y en consecuencia un lexico de frecuencia, que se acercara los mas posible al lexico mental de un hablante de media cultura y no a un diccionario de la lengua italiana. Los diarios con 1.836.119 palabras estan extraido de tres diarios que son los mas importantes y leidos en Italia: Il Corriere Della Sera, Repubblica, La Stampa. En cada diario se han elegidos textos de 9 diferentes subsectores: economia, cronica local, cronica mundana, cronica negra, politica exterior, politica interior, ciencia, espectaculo y deporte. El sector de los periodicos esta constituido por 1.306.653 palabras elejdas entre 12 differentes subsectores: arte-ciencia-tecnica, auto-nautica, ninos-muchachos, casa-hobby, feminil, fotonovelas, informacion general, cronica mundana, radio-television, deporte, viajes-ecologia y otro. El sector de los libros esta constituido por 655.503 palabras elejdas entre 13 generos literarios: arte, ninos, fantascienza, gialli espionaje, hobby y viajes, narrativa clasica, narrativa moderna, rosa, ensaystica, ciencias naturales y exactas, ciencias sociales y humanas, teatro y poesia. En este trabajo se analizan las informaciones extraidas del lexico de frecuencia del corpus lematizado de CALIS (Corpus e Archivio Lessicale Italiano Scritto) relativamente a las diferentes categorias gramaticales, a los datos de frecuencia y de dispercion de cada lemma y de cada forma en los distintos sectores y subsectores. 
Se efectuan por algunos sectores analisis sobre el acrecentamiento de las formas/lemas con el fin de efectuar una evaluacion sobre las posibles y corectas dimensiones de un corpus para ser representativo de la lengua analizada},
  KEYWORDS         = {Italiano, Analisi Statistica, Lessico di Frequenza},
  PAGES            = {361--365},
  URL              = {http://www.santiago.cu/hosting/linguistica/descargar.php?d=194},
  PUBLISHER        = {Centro de linguística aplicada, Ministerio de ciencia, tecnología y medio ambiente (Santiago de Cuba, CUB)},
  ISBN             = {959-7174-04-9},
  CONFERENCE_NAME  = {IX Simposio Internacional de Comunicación Social},
  CONFERENCE_PLACE = {Santiago de Cuba},
  BOOKTITLE        = {Actas-I IX Simposio Internacional Comunicación Social},
  EDITOR           = {Moreno, C. A. and Bolaños, J. P. and Rojas, L. H. and Miyares, L. R.},
}
@INPROCEEDINGS{DELLORLETTA_2005_INPROCEEDINGS_DLMP_77226,
  AUTHOR          = {Dell'Orletta, F. and Lenci, A. and Montemagni, S. and Pirrelli, V.},
  TITLE           = {Climbing the path to grammar: a maximum entropy model of subject/object learning},
  YEAR            = {2005},
  URL             = {https://iris.cnr.it/handle/20.500.14243/77226},
  CONFERENCE_NAME = {Psychocomputational Models of Human Language Acquisition (PsychoCompLA-2005)},
}
@INPROCEEDINGS{DIDONATO_2005_INPROCEEDINGS_D_383736,
  AUTHOR   = {Di Donato, F.},
  TITLE    = {Designing a Semantic Web path to e-science},
  YEAR     = {2005},
  ABSTRACT = {This paper aims at designing a possible path of convergence between the Open Access and the Semantic Web communities. In section 2, it focuses on the problems that the current Web has to face to become a fully effective research means, with particular regard to the question of selection according to subjective quality criteria. Section 3 exposes the main principles and standards which lie behind the Open Access movement, and tries to demonstrate that the Open Access community is a fertile ground where to experiment Semantic Web technologies. Finally, section 4 sketches a number of practical strategies and suggests the combination of existing tools for e-Science, in order to create a real Semantic Web of scientific knowledge},
  URL      = {https://iris.cnr.it/handle/20.500.14243/383736},
}
@INPROCEEDINGS{GAVRILIDOU_2005_INPROCEEDINGS_GLMPS_431280,
  AUTHOR          = {Gavrilidou, M. and Labropoulou, P. and Monachini, M. and Piperidis, S. and Soria, C.},
  TITLE           = {Building Multilingual Language Resources},
  YEAR            = {2005},
  URL             = {https://iris.cnr.it/handle/20.500.14243/431280},
  ISBN            = {954-91743-2-8},
  CONFERENCE_NAME = {Language and Speech Infrastructure for Information Access in the Balkan Countries},
}
@INPROCEEDINGS{MARCONI_2005_INPROCEEDINGS_MRRC_77227,
  AUTHOR           = {Marconi, L. and Ratti, D. and Rolando, C. and Cutugno, P.},
  TITLE            = {Hemeroteca telemática: instrumento para la organizacion y la circulación de la información},
  YEAR             = {2005},
  ABSTRACT         = {En estos últimos anos los progresos tecnológicos han aumentado, de forma exponencial, la capacidad de transmitir la información y han facilitado también la posibilidad de archivar los datos y recuperarlos. La hemeroteca telemática es una propuesta para el desarrollo y la realización de un archivo digital exhaustivo de todos los diarios italianos por medio de tecnologías adelantadas que faciliten el acceso, el recupero y la utilización de la información. La exhaustividad del archivo y la metodología de acceso a la informacion son las características principales del proyecto. La característica de la hemeroteca actual es de estar formada por un material muy deteriorable cual el papel, especialmente el papel usado para los diarios, muy sutil y sometido a usura en la sustancia y en el color. Las películas han resuelto el problema de la conservación de los datos pero solo parcialmente sea por los costes muy altos sea porque no representan un real auxilio a la búsqueda de la información. La realización de una hemeroteca digital podría ser además un ejemplo de prueba para el desarrollo de metodologías y instrumentos lingüísticos en sectores especializados de la información. De hecho los diarios representan un sector de la información bastante bien estructurado ya que están divididos en planas según el contenido, crónica, política del interior y del exterior, deporte, cultura, entretenimiento, etc.; además llevan informaciones de tipo no textual como fotos y viñitas satíricas que constituyen parte integrante de la información. De otro lado la mayor facilidad de acceso a enormes cantidades de información no significa que la información sea realmente utilizable por los expertos del sector o por el público. La explosión de la información en la red ha bien puesto en evidencia el problema de la saturación del canal por falta de instrumentos y estrategias aptos a la búsqueda y selección de la información pertinente. 
Una base de datos de la información periodística podría en fin constituir un archivo viviente, una testificación de la sociedad, un recurso esencial y altamente eficiente para nuestro país también desde un punto de vista económico, una empresa capaz de producir nuevos posibilidades trabajo y nuevas competencias, un instrumento en condiciones de contestar adecuadamente al desafió de la globalización. En nuestro estudio se analiza la metodología para la construcción de una hemeroteca italiana, se evidencian los problemas, se hace algunas hipótesis hacia las soluciones y se traza el camino para dar empuje a esta obra},
  KEYWORDS         = {Italiano, Quotidiani, Emeroteca},
  PAGES            = {601--604},
  URL              = {http://www.santiago.cu/hosting/linguistica/descargar.php?d=211},
  PUBLISHER        = {Centro de linguística aplicada, Ministerio de ciencia, tecnología y medio ambiente (Santiago de Cuba, CUB)},
  ISBN             = {959-7174-05-7},
  CONFERENCE_NAME  = {IX Simposio Internacional de Comunicación Social},
  CONFERENCE_PLACE = {Santiago de Cuba},
  BOOKTITLE        = {Actas-II IX Simposio Internacional Comunicación Social},
  EDITOR           = {Moreno, C. A. and Bolaños, J. P. and Rojas, L. H. and Miyares, L. R. and Gutiérrez, Y. C.},
}
@INPROCEEDINGS{MARINELLI_2005_INPROCEEDINGS_MBR_64205,
  AUTHOR          = {Marinelli, R. and Bindi, R. and Roventini, A.},
  TITLE           = {Metonymic and Metaphorical Uses of Proper Names},
  YEAR            = {2005},
  URL             = {https://iris.cnr.it/handle/20.500.14243/64205},
  CONFERENCE_NAME = {IX Simposio Internacional de Comunicación Social},
}
@INPROCEEDINGS{MARINELLI_2005_INPROCEEDINGS_MR_64206,
  AUTHOR          = {Marinelli, R. and Roventini, A.},
  TITLE           = {Some Considerations about the Italian Maritime Lexicon Structuring},
  YEAR            = {2005},
  URL             = {https://iris.cnr.it/handle/20.500.14243/64206},
  CONFERENCE_NAME = {IX Simposio Internacional de Comunicación Social},
}
@INPROCEEDINGS{MONACHINI_2005_INPROCEEDINGS_MC_64208,
  AUTHOR          = {Monachini, M. and Calzolari, N.},
  TITLE           = {Initiatives towards the integration of Lexicons: MILE is taking steps forward},
  YEAR            = {2005},
  URL             = {https://iris.cnr.it/handle/20.500.14243/64208},
  CONFERENCE_NAME = {Machine Translation},
}
@INPROCEEDINGS{MONACHINI_2005_INPROCEEDINGS_MS_64219,
  AUTHOR           = {Monachini, M. and Soria, C.},
  TITLE            = {Building Multilingual Terminological Lexicons for Less Widely Available Languages},
  YEAR             = {2005},
  ABSTRACT         = {Availability of Linguistic Resources for the development of Human Language Technology applications is nowadays recognized as a critical issue with both political and economic impact and implications on the sphere of cultural identity. This paper reports about the experience gained during the INTERA European project for the production of multilingual terminological lexicons for less widely available languages, i.e. those languages that suffer from poor representation over the net and from scarce computational resources, but yet are requested by the market. It discusses the procedure followed within the project, focuses on the problems faced which had an impact on the initial goals, presents the necessary modifications that resulted from these problems, evaluates the market needs as attested by various surveys, and describes the methodology that is proposed for the efficient production of Multilingual Terminological Lexicons},
  PAGES            = {129--133},
  URL              = {https://iris.cnr.it/handle/20.500.14243/64219},
  PUBLISHER        = {IMPRESJA Wydawnictwa Elektroniczne S. A (Poznan, POL)},
  ISBN             = {83-7111-341-2},
  CONFERENCE_NAME  = {2nd Language \& Technology Conference Human Language Technologies as a Challenge for Computer Science and Linguistics},
  CONFERENCE_PLACE = {Poznan},
  BOOKTITLE        = {2nd Language \& Technology Conference Human Language Technologies as a Challenge for Computer Science and Linguistics Poznan},
  EDITOR           = {Vetulani, Z.},
}
@INPROCEEDINGS{PARDELLI_2005_INPROCEEDINGS_PO_64220,
  AUTHOR          = {Pardelli, G. and Orsolini, P.},
  TITLE           = {"Special Session in Memory of Antonio Zampolli"},
  YEAR            = {2005},
  ABSTRACT        = {It is certain that this bibliography needs to be further updated but it is with pleasure that we present it during this Special Session dedicated to Antonio Zampolli, along with a short Curriculum vitae. A special thanks goes to Nicoletta Calzolari, Director of the Institute of Computational Linguistics, who always encouraged and supported our work with precious advices},
  PAGES           = {1--50},
  URL             = {https://iris.cnr.it/handle/20.500.14243/64220},
  CONFERENCE_NAME = {L\&T'05-2nd Language Technologies as a Challenge for Computer Science and Linguistics in Memory of Antonio Zampolli},
}
@INPROCEEDINGS{RUIMY_2005_INPROCEEDINGS_RBC_64221,
  AUTHOR          = {Ruimy, N. and Bouillon, P. and Cartoni, B.},
  TITLE           = {Inferring a Semantically Annotated Generative French Lexicon from an Italian Lexical Resource},
  YEAR            = {2005},
  URL             = {https://iris.cnr.it/handle/20.500.14243/64221},
  CONFERENCE_NAME = {GL 2005, Third International Workshop on Generative Approaches to the Lexicon},
}
@INPROCEEDINGS{RUIMY_2005_INPROCEEDINGS_RR_64222,
  AUTHOR          = {Ruimy, N. and Roventini, A.},
  TITLE           = {Towards the Linking of two Electronic Lexical Databases of Italian},
  YEAR            = {2005},
  ABSTRACT        = {In this paper we address the issue of the semiautomatic link of ItalWordNet and PAROLE/SIMPLE/CLIPS, two electronic lexical databases of Italian language, based on different lexical semantic models with their own underlying principles and peculiarities. Nevertheless, the two resources present many compatible aspects that led us to take their analysis further, convinced that a considerable gain could be achieved by their link. In this paper, an outline of the mapping of both their ontological frameworks and semantic relations is provided, the linking methodology and related problems are then described, finally the reciprocal benefits and enhancements the two lexicons would gain from their linking are illustrated},
  URL             = {https://iris.cnr.it/handle/20.500.14243/64222},
  CONFERENCE_NAME = {L\&T'05-2nd Language Technologies as a Challenge for Computer Science and Linguistics},
}
@INPROCEEDINGS{SORIA_2005_INPROCEEDINGS_S_64207,
  AUTHOR          = {Soria, C.},
  TITLE           = {Constraints on the use of connectives in discourse},
  YEAR            = {2005},
  URL             = {https://iris.cnr.it/handle/20.500.14243/64207},
  CONFERENCE_NAME = {First International Symposium on the Exploration and Modelling of Meaning},
}
@INPROCEEDINGS{SORIA_2005_INPROCEEDINGS_SM_64223,
  AUTHOR          = {Soria, C. and Monachini, M.},
  TITLE           = {Methods, Models and Standardization Issues for the Creation of Linguistic Resources: the Case of Under-Represented Languages},
  YEAR            = {2005},
  URL             = {https://iris.cnr.it/handle/20.500.14243/64223},
  CONFERENCE_NAME = {TALN \& RECITAL 2005: 12ème conférence annuelle sur le Traitement Automatique des Langues Naturelles},
}
@INPROCEEDINGS{BARBERA_2005_INPROCEEDINGS_BD_383738,
  AUTHOR   = {Barbera, M. and Di Donato, F.},
  TITLE    = {HyperJournal: Open Publishing Made Easy},
  YEAR     = {2005},
  ABSTRACT = {Poster of HyperJournal, an open source software for open access publishing of e-journals},
  URL      = {https://iris.cnr.it/handle/20.500.14243/383738},
}
@TECHREPORT{BALDI_2005_TECHREPORT_BBCP_195894,
  AUTHOR = {Baldi, M. and Bozzi, A. and Canziani, G. E. and Passarotti, M.},
  TITLE  = {I Contradicentium Medicorum Libri},
  YEAR   = {2005},
  URL    = {https://iris.cnr.it/handle/20.500.14243/195894},
}
@TECHREPORT{BARTOLINI_2005_TECHREPORT_BCLMP_457826,
  AUTHOR   = {Bartolini, R. and Caracciolo, C. and Lenci, A. and Marchi, S. and Pirrelli, V.},
  TITLE    = {Motore semantico. Documento di progettazione e sviluppo},
  YEAR     = {2005},
  ABSTRACT = {Il presente documento descrive architettura, funzionalità e algoritmo di un componente software dedicato, designato come "Motore Semantico", che ha lo scopo di produrre rappresentazioni logico-concettuali, ontologicamente interpretate, di interrogazioni in linguaggio naturale su una base di dati di tipo anche GIS},
  KEYWORDS = {NLP},
  PAGES    = {1--42},
  URL      = {https://iris.cnr.it/handle/20.500.14243/457826},
}
@TECHREPORT{BARTOLINI_2005_TECHREPORT_BGMM_195895,
  AUTHOR   = {Bartolini, R. and Giorgetti, D. and Marchi, S. and Montemagni, S.},
  TITLE    = {ILC-CNR Contribution to Deliverable 4.1},
  YEAR     = {2005},
  ABSTRACT = {The goal of the semantic annotation is the annotation of entities and relations starting from input documents conformant with the harmonisation output schema as defined within WP3. This harmonisation schema will focus on the structural and logical organisation of the documents, while WP4 will concentrate on the annotation of textual entities and image elements. The results of semantic annotation are intended to populate the domain ontology},
  KEYWORDS = {NLP},
  URL      = {https://iris.cnr.it/handle/20.500.14243/195895},
}
@TECHREPORT{BARTOLINI_2005_TECHREPORT_BLMMP_195896,
  AUTHOR   = {Bartolini, R. and Lenci, A. and Marchi, S. and Montemagni, S. and Pirrelli, V.},
  TITLE    = {Personalizzazione degli Italian NLP tools},
  YEAR     = {2005},
  ABSTRACT = {Il presente documento intende offrire criteri e risultati della fase di personalizzazione dei moduli per l'analisi automatica del testo (Italian NLP tools o "AnITA") all'interno dell'architettura prevista nell'ambito del progetto FuLL},
  KEYWORDS = {NLP},
  PAGES    = {13},
  URL      = {https://iris.cnr.it/handle/20.500.14243/195896},
}
@TECHREPORT{BARTOLINI_2005_TECHREPORT_BLMP_195898,
  AUTHOR = {Bartolini, R. and Lenci, A. and Montemagni, S. and Pirrelli, V.},
  TITLE  = {Modellazione del motore sintattico e delle strutture dati di supporto},
  YEAR   = {2005},
  URL    = {https://iris.cnr.it/handle/20.500.14243/195898},
}
@TECHREPORT{BARTOLINI_2005_TECHREPORT_BLMMP_457827,
  AUTHOR   = {Bartolini, R. and Lenci, A. and Marchi, S. and Montemagni, S. and Pirrelli, V.},
  TITLE    = {Text-2-Knowledge: Acquisizione semi-automatica di ontologie per l'indicizzazione semantica di documenti},
  YEAR     = {2005},
  ABSTRACT = {Text-2-Knowledge, Acquisizione semi-automatica di ontologie per l'indicizzazione semantica di documenti},
  KEYWORDS = {nlp, terminology extraction},
  URL      = {https://iris.cnr.it/handle/20.500.14243/457827},
}
@TECHREPORT{BOZZI_2005_TECHREPORT_B_195900,
  AUTHOR = {Bozzi, A.},
  TITLE  = {COMTOOCI project},
  YEAR   = {2005},
  URL    = {https://iris.cnr.it/handle/20.500.14243/195900},
}
@TECHREPORT{CININI_2005_TECHREPORT_C_157109,
  AUTHOR = {Cinini, A.},
  TITLE  = {Relazione sull'attività di Content-Analysis},
  YEAR   = {2005},
  URL    = {https://iris.cnr.it/handle/20.500.14243/157109},
}
@TECHREPORT{CUCURULLO_2005_TECHREPORT_CMPPS_195901,
  AUTHOR = {Cucurullo, S. and Montemagni, S. and Paoli, M. and Picchi, E. and Sassolini, E.},
  TITLE  = {Atlante Lessicale Toscano in rete (ALT-Web). Relazione finale},
  YEAR   = {2005},
  URL    = {https://iris.cnr.it/handle/20.500.14243/195901},
}
@TECHREPORT{DECLERCK_2005_TECHREPORT_DKBM_457828,
  AUTHOR = {Declerck, T. and Kessler, M. and Bel, N. and Monachini, M.},
  TITLE  = {Evaluation of initiatives for morpho-syntactic and syntactic annotation},
  YEAR   = {2005},
  URL    = {https://iris.cnr.it/handle/20.500.14243/457828},
}
@TECHREPORT{FRANCOPOULO_2005_TECHREPORT_FBBDMBSG_195904,
  AUTHOR = {Francopoulo, G. and Bontcheva, K. and Bunt, H. and Declerck, T. and Monachini, M. and Budin, G. and Schiffrin, A. and Gillam, L.},
  TITLE  = {Periodic Progress Report},
  YEAR   = {2005},
  URL    = {https://iris.cnr.it/handle/20.500.14243/195904},
}
@TECHREPORT{FRANCOPOULO_2005_TECHREPORT_FBBDMBSG_457829,
  AUTHOR = {Francopoulo, G. and Bontcheva, K. and Bunt, H. and Declerck, T. and Monachini, M. and Budin, G. and Schiffrin, A. and Gillam, L.},
  TITLE  = {Annual Progress Report},
  YEAR   = {2005},
  URL    = {https://iris.cnr.it/handle/20.500.14243/457829},
}
@TECHREPORT{FRANCOPOULO_2005_TECHREPORT_FBMN_195903,
  AUTHOR = {Francopoulo, G. and Bunt, H. and Monachini, M. and Nioche, J.},
  TITLE  = {Risk Management Plan},
  YEAR   = {2005},
  URL    = {https://iris.cnr.it/handle/20.500.14243/195903},
}
@TECHREPORT{FRANCOPOULO_2005_TECHREPORT_FGCMBPS_195905,
  AUTHOR = {Francopoulo, G. and George, M. and Calzolari, N. and Monachini, M. and Bel, N. and Pet, M. and Soria, C.},
  TITLE  = {Language Resource Management Lexical Markup Framework},
  YEAR   = {2005},
  URL    = {https://iris.cnr.it/handle/20.500.14243/195905},
}
@TECHREPORT{GIORGETTI_2005_TECHREPORT_GMM_195906,
  AUTHOR   = {Giorgetti, D. and Marchi, S. and Montemagni, S.},
  TITLE    = {ILC-CNR Contribution to Deliverable 5.1},
  YEAR     = {2005},
  ABSTRACT = {This document describes the high level infrastructure designed as part of the project VIKEF for creating a Virtual Information and Knowledge Environment (VIKE), namely an environment made up of explicit representation of the information and knowledge implicitly contained in one or more collections of Information-Content-Knowledge (ICK) resources, and of a collection of services operating on this explicit representation of information and knowledge; it is a virtual environment, as the representation and the services for accessing information and knowledge is almost completely independent from the physical properties of the original data},
  KEYWORDS = {NLP},
  URL      = {https://iris.cnr.it/handle/20.500.14243/195906},
}
@TECHREPORT{LENCI_2005_TECHREPORT_LMP_195907,
  AUTHOR   = {Lenci, A. and Marchi, S. and Pirrelli, V.},
  TITLE    = {Motore del dialogo. Documento di progettazione e sviluppo},
  YEAR     = {2005},
  ABSTRACT = {Il presente documento intende offrire i criteri generali e le funzionalità di base relativi alla progettazione del motore di dialogo nell'ambito del progetto FuLL},
  KEYWORDS = {NLP},
  URL      = {https://iris.cnr.it/handle/20.500.14243/195907},
}
@TECHREPORT{LENCI_2005_TECHREPORT_LPS_457830,
  AUTHOR = {Lenci, A. and Pirrelli, V. and Soria, C.},
  TITLE  = {Modellazione del motore di dialogo e delle strutture dati di supporto},
  YEAR   = {2005},
  URL    = {https://iris.cnr.it/handle/20.500.14243/457830},
}
@TECHREPORT{MAMMINI_2005_TECHREPORT_MUM_195908,
  AUTHOR = {Mammini, M. and Ulivieri, M. and Monachini, M.},
  TITLE  = {Unified Lexica: Common sample lexicon and harmonized morpho-syntactic specifications between PAROLE and LCStar},
  YEAR   = {2005},
  URL    = {https://iris.cnr.it/handle/20.500.14243/195908},
}
@TECHREPORT{MARCHI_2005_TECHREPORT_MM_195909,
  AUTHOR   = {Marchi, S. and Montemagni, S.},
  TITLE    = {ILC-CNR Contribution to Deliverable 3.1},
  YEAR     = {2005},
  ABSTRACT = {This document presents the first set of knowledge and content acquisition components. Starting from the Annotation Schema definition, it will then describe the Harmonization support and the Annotation components, as well as the various resources needed all along the current chain},
  KEYWORDS = {NLP},
  URL      = {https://iris.cnr.it/handle/20.500.14243/195909},
}
@TECHREPORT{MONACHINI_2005_TECHREPORT_MSCDW_195910,
  AUTHOR = {Monachini, M. and Soria, C. and Choukri, K. and Declerck, T. and Wittenburg, P.},
  TITLE  = {Final Evaluation Report},
  YEAR   = {2005},
  URL    = {https://iris.cnr.it/handle/20.500.14243/195910},
}
@TECHREPORT{MONACHINI_2005_TECHREPORT_MSUCDM_195911,
  AUTHOR = {Monachini, M. and Soria, C. and Ulivieri, M. and Calzolari, N. and Declerck, T. and Mammini, M.},
  TITLE  = {Evaluation of existing standards for NLP Lexica: Proposal for Candidate Data Categories},
  YEAR   = {2005},
  URL    = {https://iris.cnr.it/handle/20.500.14243/195911},
}
@TECHREPORT{SASSI_2005_TECHREPORT_SC_147585,
  AUTHOR = {Sassi, M. and Cinini, A.},
  TITLE  = {L'archivio della Disciplinare come deposito per la content-analysis},
  YEAR   = {2005},
  URL    = {https://iris.cnr.it/handle/20.500.14243/147585},
}
@TECHREPORT{SASSOLINI_2005_TECHREPORT_SE_334028,
  AUTHOR   = {Sassolini, E. and Evangelista, A.},
  TITLE    = {P8/L488-01: report tecnico di progetto},
  YEAR     = {2005},
  ABSTRACT = {Diffusione della cultura e valorizzazione del patrimonio letterario della lingua italiana e della lingua araba attraverso una diffusione telematica di banche dati letterarie},
  KEYWORDS = {trattamento della lingua araba, applicazione web},
  PAGES    = {12},
  URL      = {https://iris.cnr.it/handle/20.500.14243/334028},
}
@MISC{BARTOLINI_2005_MISC_BDGMLMP_192739,
  AUTHOR   = {Bartolini, R. and Dell'Orletta, F. and Giorgetti, D. and Marchi, S. and Lenci, A. and Montemagni, S. and Pirrelli, V.},
  TITLE    = {Text-to-Knowledge (T2K)},
  YEAR     = {2005},
  ABSTRACT = {Piattaforma di estrazione e indicizzazione terminologica},
  URL      = {https://iris.cnr.it/handle/20.500.14243/192739},
}
@MISC{BARTOLINI_2005_MISC_BMLMP_192740,
  AUTHOR = {Bartolini, R. and Marchi, S. and Lenci, A. and Montemagni, S. and Pirrelli, V.},
  TITLE  = {NLPtools},
  YEAR   = {2005},
  URL    = {https://iris.cnr.it/handle/20.500.14243/192740},
}
@MISC{BOZZI_2005_MISC_B_106740,
  AUTHOR          = {Bozzi, A.},
  TITLE           = {Digital libraries and scholarly editing: the SPWC System},
  YEAR            = {2005},
  URL             = {https://iris.cnr.it/handle/20.500.14243/106740},
  CONFERENCE_NAME = {Alte Archive Neue Technologien},
}
@MISC{BOZZI_2005_MISC_B_464686,
  AUTHOR = {Bozzi, A.},
  TITLE  = {SPWC-COMTOOCI},
  YEAR   = {2005},
  URL    = {https://iris.cnr.it/handle/20.500.14243/464686},
}
@MISC{BOZZI_2005_MISC_B_106739,
  AUTHOR          = {Bozzi, A.},
  TITLE           = {Electronic edition and digital textual criticism: methodological aspects},
  YEAR            = {2005},
  URL             = {https://iris.cnr.it/handle/20.500.14243/106739},
  CONFERENCE_NAME = {Edition critique/édition électronique: bases de données textuelles. Pratique et théorie},
}
@MISC{CALZOLARI_2005_MISC_C_435671,
  AUTHOR = {Calzolari, N.},
  TITLE  = {Building Blocks for Semantic Annotation: towards Content Interoperability},
  YEAR   = {2005},
  URL    = {https://iris.cnr.it/handle/20.500.14243/435671},
}
@MISC{CALZOLARI_2005_MISC_C_106727,
  AUTHOR = {Calzolari, N.},
  TITLE  = {An Infrastructure for Language Technology and more},
  YEAR   = {2005},
  URL    = {https://iris.cnr.it/handle/20.500.14243/106727},
}
@MISC{CALZOLARI_2005_MISC_C_106719,
  AUTHOR = {Calzolari, N.},
  TITLE  = {Language Resources and Content Interoperability Technical, strategic and political issues for a new generation of Language Resources},
  YEAR   = {2005},
  URL    = {https://iris.cnr.it/handle/20.500.14243/106719},
}
@MISC{CALZOLARI_2005_MISC_C_106728,
  AUTHOR = {Calzolari, N.},
  TITLE  = {Technical and Strategic Issues on Language Resources for a Research Infrastructure},
  YEAR   = {2005},
  URL    = {https://iris.cnr.it/handle/20.500.14243/106728},
}
@MISC{CALZOLARI_2005_MISC_C_106723,
  AUTHOR = {Calzolari, N.},
  TITLE  = {Language Technology and the Semantic Web},
  YEAR   = {2005},
  URL    = {https://iris.cnr.it/handle/20.500.14243/106723},
}
@MISC{CALZOLARI_2005_MISC_C_106725,
  AUTHOR = {Calzolari, N.},
  TITLE  = {Language resources: priorities and challenges},
  YEAR   = {2005},
  URL    = {https://iris.cnr.it/handle/20.500.14243/106725},
}
@MISC{CALZOLARI_2005_MISC_C_106721,
  AUTHOR = {Calzolari, N.},
  TITLE  = {Language Resources, Language Technology, Linguistics: isn't this too narrow?},
  YEAR   = {2005},
  URL    = {https://iris.cnr.it/handle/20.500.14243/106721},
}
@MISC{CALZOLARI_2005_MISC_C_106726,
  AUTHOR = {Calzolari, N.},
  TITLE  = {Linguistica Computazionale: che cosa ci dice della lingua?},
  YEAR   = {2005},
  URL    = {https://iris.cnr.it/handle/20.500.14243/106726},
}
@MISC{CALZOLARI_2005_MISC_CBLM_457831,
  AUTHOR          = {Calzolari, N. and Bertagna, F. and Lenci, A. and Monachini, M.},
  TITLE           = {Boosting Lexical Resources for the Semantic Web. Generative Lexicon and Lexicon Interoperability},
  YEAR            = {2005},
  URL             = {https://iris.cnr.it/handle/20.500.14243/457831},
  CONFERENCE_NAME = {GL2005-3rd International Workshop on Generative Approaches to the Lexicon},
}
@MISC{CECCOTTI_2005_MISC_CS_192725,
  AUTHOR = {Ceccotti, M. L. and Sassi, M.},
  TITLE  = {Dall'Archivio Elettronico delle Opere di Carlo Emilio Gadda. Studi e ricerche con strumenti computazionali dell'opera dell'ingegnere-scrittore},
  YEAR   = {2005},
  URL    = {https://iris.cnr.it/handle/20.500.14243/192725},
}
@MISC{DIDONATO_2005_MISC_D_406237,
  AUTHOR   = {Di Donato, F.},
  TITLE    = {Hyperjournal},
  YEAR     = {2005},
  ABSTRACT = {Presentazione di Hyperjournal},
  URL      = {https://iris.cnr.it/handle/20.500.14243/406237},
}
@MISC{DIDONATO_2005_MISC_D_384164,
  AUTHOR   = {Di Donato, F.},
  TITLE    = {Suber P., Promuovere l'"Open Access" nelle scienze umane},
  YEAR     = {2005},
  ABSTRACT = {Traduzione dall'originale inglese},
  URL      = {https://iris.cnr.it/handle/20.500.14243/384164},
  ISSN     = {1591-4305},
}
@MISC{DIFEDERICO_2005_MISC_DCSCF_188393,
  AUTHOR = {Di Federico, G. and Cinini, A. and Sassi, M. and Cavallini, D. and Fabri, M.},
  TITLE  = {Sviluppo della banca dati testuale delle sentenze della sezione disciplinare del CSM},
  YEAR   = {2005},
  URL    = {https://iris.cnr.it/handle/20.500.14243/188393},
}
@MISC{FRANCOPOULO_2005_MISC_FGCBPS_464689,
  AUTHOR = {Francopoulo, G. and George, M. and Calzolari, N. and Monachini, M. and Bel, N. and Pet, M. and Soria, C.},
  TITLE  = {Lexical Markup Framework},
  YEAR   = {2005},
  URL    = {https://iris.cnr.it/handle/20.500.14243/464689},
}
@MISC{GAVRILIDOU_2005_MISC_GLMPS_192735,
  AUTHOR = {Gavrilidou, M. and Labropoulou, P. and Monachini, M. and Piperidis, S. and Soria, C.},
  TITLE  = {INTERA Business model},
  YEAR   = {2005},
  URL    = {https://iris.cnr.it/handle/20.500.14243/192735},
}
@MISC{GIORGOLO_2005_MISC_GHP_464691,
AUTHOR = {Giorgolo, G. and Herreros, I. and Pirrelli, V.},
TITLE = {SOM-ware},
YEAR = {2005},
URL = {https://iris.cnr.it/handle/20.500.14243/464691},
}
@MISC{GUADAGNINI_2005_MISC_G_265592,
AUTHOR = {Guadagnini, E.},
TITLE = {Sordello, Er encontra·l temps de mai (BdT 437.4a)},
YEAR = {2005},
URL = {http://www.rialto.unina.it/Sordel/437.4a(Boni).htm},
ISSN = {1973-381X},
}
@MISC{GUADAGNINI_2005_MISC_G_265615,
AUTHOR = {Guadagnini, E.},
TITLE = {Peire Cardenal, Ab votz d'angel, lengu'esperta, non blesza (BdT 335.1)},
YEAR = {2005},
URL = {http://www.rialto.unina.it/PCard/335.1(Vatteroni).htm},
ISSN = {1973-381X},
}
@MISC{GUADAGNINI_2005_MISC_G_265621,
AUTHOR = {Guadagnini, E.},
TITLE = {Peire Cardenal, Anc non vi breton ni baivier (BdT 335.5)},
YEAR = {2005},
URL = {http://www.rialto.unina.it/PCard/335.5(Vatteroni).htm},
ISSN = {1973-381X},
}
@MISC{GUADAGNINI_2005_MISC_G_265588,
AUTHOR = {Guadagnini, E.},
TITLE = {Sordello, Ailas, e que·m fau miey huelh (BdT 437.1)},
YEAR = {2005},
URL = {http://www.rialto.unina.it/Sordel/437.1%28Boni%29.htm},
ISSN = {1973-381X},
}
@MISC{GUADAGNINI_2005_MISC_G_265619,
AUTHOR = {Guadagnini, E.},
TITLE = {Peire Cardenal, Anc mais tan gen no vi venir pascor (BdT 335.4)},
YEAR = {2005},
URL = {http://www.rialto.unina.it/PCard/335.4(Vatteroni).htm},
ISSN = {1973-381X},
}
@MISC{GUADAGNINI_2005_MISC_G_265625,
AUTHOR = {Guadagnini, E.},
TITLE = {Peire Cardenal, Lo sabers d'est segle es foledatz (BdT 335.34)},
YEAR = {2005},
URL = {http://www.rialto.unina.it/PCard/335.34(Vatteroni).htm},
ISSN = {1973-381X},
}
@MISC{GUADAGNINI_2005_MISC_G_265591,
AUTHOR = {Guadagnini, E.},
TITLE = {Sordello, Aitant ses plus viu hom quan viu jauzens (BdT 437.2)},
YEAR = {2005},
URL = {http://www.rialto.unina.it/Sordel/437.2%28Boni%29.htm},
ISSN = {1973-381X},
}
@MISC{GUADAGNINI_2005_MISC_G_265595,
AUTHOR = {Guadagnini, E.},
TITLE = {Sordello, Bel m'es ab motz leugiers a far (BdT 437.7)},
YEAR = {2005},
URL = {http://www.rialto.unina.it/Sordel/437.7(Boni).htm},
ISSN = {1973-381X},
}
@MISC{GUADAGNINI_2005_MISC_G_265598,
AUTHOR = {Guadagnini, E.},
TITLE = {Sordello, Lai al comte mon segnor voill pregar (BdT 437.18)},
YEAR = {2005},
URL = {http://www.rialto.unina.it/Sordel/437.18(Boni).htm},
ISSN = {1973-381X},
}
@MISC{GUADAGNINI_2005_MISC_G_265623,
AUTHOR = {Guadagnini, E.},
TITLE = {Peire Cardenal, Aquesta gens, quant son en lur guayeza (BdT 335.6)},
YEAR = {2005},
URL = {http://www.rialto.unina.it/PCard/335.6(Vatteroni).htm},
ISSN = {1973-381X},
}
@MISC{GUADAGNINI_2005_MISC_G_265616,
AUTHOR = {Guadagnini, E.},
TITLE = {Peire Cardenal, Aissi com hom planh son filh o son paire (BdT 335.2)},
YEAR = {2005},
URL = {http://www.rialto.unina.it/PCard/335.2(Vatteroni).htm},
ISSN = {1973-381X},
}
@MISC{GUADAGNINI_2005_MISC_G_265618,
AUTHOR = {Guadagnini, E.},
TITLE = {Peire Cardenal, Al nom del seingnor dreiturier (BdT 335.3)},
YEAR = {2005},
URL = {http://www.rialto.unina.it/PCard/335.3(Vatteroni).htm},
ISSN = {1973-381X},
}
@MISC{GUADAGNINI_2005_MISC_G_265594,
AUTHOR = {Guadagnini, E.},
TITLE = {Sordello, Atretan dei ben chantar finamen (BdT 437.5)},
YEAR = {2005},
URL = {http://www.rialto.unina.it/Sordel/437.5(Boni).htm},
ISSN = {1973-381X},
}
@MISC{MAMMINI_2005_MISC_MUM_192736,
AUTHOR = {Mammini, M. and Ulivieri, M. and Monachini, M.},
TITLE = {Lessici Unificati su richiesta},
YEAR = {2005},
URL = {https://iris.cnr.it/handle/20.500.14243/192736},
}
@MISC{MAMMINI_2005_MISC_MUM_192737,
AUTHOR = {Mammini, M. and Ulivieri, M. and Monachini, M.},
TITLE = {Lessico Unificato},
YEAR = {2005},
URL = {https://iris.cnr.it/handle/20.500.14243/192737},
}
@MISC{MAMMINI_2005_MISC_MUM_464690,
AUTHOR = {Mammini, M. and Ulivieri, M. and Monachini, M.},
TITLE = {Specifiche Lessicali Morfo-sintattiche Unificate},
YEAR = {2005},
URL = {https://iris.cnr.it/handle/20.500.14243/464690},
}
@MISC{MARCOBERTINETTO_2005_MISC_MBLMRRM_192733,
AUTHOR = {Marco Bertinetto, P. and Burani, C. and Laudanna, A. and Marconi, L. and Ratti, D. and Rolando, C. and Maria Thornton, A.},
TITLE = {CoLFIS: Corpus e Archivio Lessicale dell'Italiano Scritto contemporaneo},
YEAR = {2005},
ABSTRACT = {Dal progetto speciale, "Banca Dati Lessicali dell'Italiano Scritto Contemporaneo" del CNR, sviluppato in collaborazione con la Scuola Normale Superiore di Pisa e l'Istituto di Scienze e Tecnologie della Cognizione del CNR di Roma, è stato realizzato il "Corpus e Archivio Lessicale dell'Italiano Scritto contemporaneo" (CoLFIS), suddiviso in tre settori contenente, in maniera opportunamente bilanciata, testi appartenenti a vari generi di scrittura. I sottoinsiemi, o settori, individuati in CoLFIS sono: la "stampa quotidiana" suddivisa in tre testate giornalistiche: "Il Corriere Della Sera", "La Repubblica", "La Stampa", a loro volta in ogni testata le occorrenze sono poi suddivise in sette sottoinsiemi; le "Pubblicazioni Periodiche" sono ulteriormente suddivise in 12 sottosettori; i "libri" sono suddivisi in 13 generi letterari. Il corpus rappresenta soprattutto l'italiano effettivamente letto piuttosto che tutto l'italiano scritto dal momento che, nel definire gli insiemi di testi da includere, non si sono tenuti presenti tutti i possibili usi scritti dell'italiano, tutti i tipi di testi teoricamente producibili ed effettivamente prodotti, ma piuttosto i tipi di testi che, da una indagine sociologica e statistica, sono risultati essere i più letti. Tale scelta si giustifica in quanto si è voluto costruire un corpus e un lessico di frequenza che si avvicinassero il più possibile al lessico mentale di un parlante di media cultura e non a un dizionario esaustivo della lingua italiana. Il corpus di CoLFIS è stato totalmente lemmatizzato e sono stati sviluppati algoritmi software di analisi statistica per estrarre i lessici di frequenza nel corpus totale e nei diversi settori costituenti il corpus lemmatizzato, per ogni lemma e per le relative forme. 
CoLFIS ha dato luogo a diversi prodotti disponibili in formato digitale tra cui un formario, i lessici di frequenza per i diversi settori e un lessico di frequenza totale dotati di appropriati indici di frequenza. Il corpus esiste in versione testuale e in versione lemmatizzata. Si tratta dell'unico corpus di riferimento creato su base statistica e interamente lemmatizzato della lingua italiana},
URL = {http://www.ge.ilc.cnr.it/lessico.php},
}
@MISC{MARCOBERTINETTO_2005_MISC_MBLMRRM_145632,
AUTHOR = {Marco Bertinetto, P. and Burani, C. and Laudanna, A. and Marconi, L. and Ratti, D. and Rolando, C. and Maria Thornton, A.},
TITLE = {Corpus e lessico di frequenza dell'Italiano scritto (CoLFIS). [Corpus and Frequency Lexicon of Written Italian]},
YEAR = {2005},
ABSTRACT = {CoLFIS: sistemas de interrogación online. CoLFIS: sistemas de interrogación online CoLFIS es una base de datos de la lengua italiana escrita de 3.798.275 palabras, formada de textos escritos de varios generes pesados oportunamente y selecionados en tres distintos sectores: diarios, periodicos y libros. El producto realizado representa el italiano leido mas bien que toda la lengua italiana escrita. Esta eleccion se justifica en cuanto se deseaba construir un corpus, y en consecuencia un lexico de frecuencia, que se acercara los mas posible al lexico mental de un hablante de media cultura y no a un diccionario de la lengua italiana. Los diarios con 1.836.119 palabras se han extraido de los tres diarios mas importantes y leidos en Italia: Il Corriere Della Sera, Repubblica, La Stampa. En cada diario se han elegidos textos de 9 diferentes subsectores: economia, cronica local, cronica mundana, cronica negra, politica exterior, politica interior, ciencia, espectaculo y deporte. El sector de los periodicos es constituido por 1.306.653 palabras elejdas entre 12 differentes subsectores: arte-ciencia-tecnica, auto-nautica, ninos-muchachos, casa-hobby, femenino, fotonovelas, informacion general, cronica mundana, radio-television, deporte, viajes-ecologia y otro. El sector de los libros es constituido por 655.503 palabras elejdas entre 13 generos literarios: arte, ninos, ficcion, gialli espionaje, hobby y viajes, narrativa clasica, narrativa moderna, rosa, ensaystica, ciencias naturales y exactas, ciencias sociales y humanas, teatro y poesia. El corpus CoLFIS ha sido sometido a una lematizacion completa y se han desarrollado paquetes software de analisis estadistico para producir los lexicos de frecuencia relativos al corpus total y a los distintos sectores para cada lema y formas relativas. 
En este trabajo seran explicados los metodos de interogacion realizados para ayudar el usuario que quiere acercarse al corpus, puesto a disposicion en internet, y obtener informaciones del corpus, del corpus con lematizacion, de los lexicos de frecuencia. Ademas se ensenarà un estudio sobre los adverbios derivados, es decir los adverbios que terminan en-mente, como ejemplo de posibles investigaciones permitidas del material linguistico y del sistema de interogacion a disposicion. Se presenteran los porcentajes de las distintas tipologias adverbiales y se analizara la posicion del adverbio en la oracion buscando evaluar sus posibilidades combinatorias},
KEYWORDS = {Corpora, Lessico, Italiano, DataBase},
URL = {http://www.ge.ilc.cnr.it/strumenti.php},
}
@MISC{MARINELLI_2005_MISC_MS_192728,
AUTHOR = {Marinelli, R. and Spadoni, G.},
TITLE = {MARITERM Database di terminologia marittima},
YEAR = {2005},
URL = {https://iris.cnr.it/handle/20.500.14243/192728},
}
@MISC{MONACHINI_2005_MISC_MS_192724,
AUTHOR = {Monachini, M. and Soria, C.},
TITLE = {Terminologia Multilingue (inglese-greco-serbo-sloveno-bulgaro)},
YEAR = {2005},
URL = {https://iris.cnr.it/handle/20.500.14243/192724},
}
@MISC{MONACHINI_2005_MISC_MSPSR_192738,
AUTHOR = {Monachini, M. and Soria, C. and Picchi, E. and Sassolini, E. and Ruffolo, P.},
TITLE = {Procedure e tecniche di acquisizione semi-automatica di terminologie da testi paralleli},
YEAR = {2005},
URL = {https://iris.cnr.it/handle/20.500.14243/192738},
}
@MISC{MONACHINI_2005_MISC_MSUCDM_192734,
AUTHOR = {Monachini, M. and Soria, C. and Ulivieri, M. and Calzolari, N. and Declerck, T. and Mammini, M.},
TITLE = {Data Category Registry},
YEAR = {2005},
URL = {https://iris.cnr.it/handle/20.500.14243/192734},
}
@MISC{PARDELLI_2005_MISC_PSGO_192741,
AUTHOR = {Pardelli, G. and Sassi, M. and Goggi, S. and Orsolini, P.},
TITLE = {NLPterminology},
YEAR = {2005},
URL = {https://iris.cnr.it/handle/20.500.14243/192741},
}
@MISC{PECCHIA_2005_MISC_PCCS_192726,
AUTHOR = {Pecchia, L. and Caligaris, C. and Cappelli, G. and Saba, A.},
TITLE = {Corpus di Linguaggio Infantile},
YEAR = {2005},
URL = {https://iris.cnr.it/handle/20.500.14243/192726},
}
@MISC{PICCHI_2005_MISC_PMSCP_192727,
AUTHOR = {Picchi, E. and Montemagni, S. and Sassolini, E. and Cucurullo, S. and Paoli, M.},
TITLE = {ALTWEB},
YEAR = {2005},
URL = {https://iris.cnr.it/handle/20.500.14243/192727},
}
@MISC{PICCHI_2005_MISC_PSCSC_464687,
AUTHOR = {Picchi, E. and Sassi, M. and Ceccotti, M. L. and Sassolini, E. and Cucurullo, S.},
TITLE = {Linguistic Miner},
YEAR = {2005},
URL = {https://iris.cnr.it/handle/20.500.14243/464687},
}
@MISC{PIRRELLI_2005_MISC_P_106731,
AUTHOR = {Pirrelli, V.},
TITLE = {On the cognitive autonomy of morphological processing},
YEAR = {2005},
URL = {https://iris.cnr.it/handle/20.500.14243/106731},
CONFERENCE_NAME = {4èmes Décembrettes},
}
@MISC{PIRRELLI_2005_MISC_PH_106733,
AUTHOR = {Pirrelli, V. and Herreros, I.},
TITLE = {Learning Morphology by Itself},
YEAR = {2005},
URL = {https://iris.cnr.it/handle/20.500.14243/106733},
CONFERENCE_NAME = {5th Mediterranean Morphology Meeting},
}
@MISC{PIRRELLI_2005_MISC_PL_106734,
AUTHOR = {Pirrelli, V. and Lenci, A.},
TITLE = {Dalla raccolta dati alla diagnostica: prospettive per una},
YEAR = {2005},
URL = {https://iris.cnr.it/handle/20.500.14243/106734},
CONFERENCE_NAME = {XIII Congresso della Società Italiana di Psicofisiologia},
}
@MISC{ROVENTINI_2005_MISC_RABCM_192730,
AUTHOR = {Roventini, A. and Alonge, A. and Bertagna, F. and Calzolari, N. and Marinelli, R.},
TITLE = {ItalWordNet database semantico-lessicale dell'italiano},
YEAR = {2005},
URL = {https://iris.cnr.it/handle/20.500.14243/192730},
}
@MISC{RUIMY_2005_MISC_RMC_192729,
AUTHOR = {Ruimy, N. and Monachini, M. and Calzolari, N.},
TITLE = {Lessico elettronico multi-livello dell'italiano: PAROLE-SIMPLE-CLIPS},
YEAR = {2005},
URL = {https://iris.cnr.it/handle/20.500.14243/192729},
}
@MISC{SABA_2005_MISC_S_195913,
AUTHOR = {Saba, A.},
TITLE = {Lessico del testo Tractado de la Sphera de Iohannes de Sacrobusto},
YEAR = {2005},
URL = {https://iris.cnr.it/handle/20.500.14243/195913},
}
@MISC{SABA_2005_MISC_S_195912,
AUTHOR = {Saba, A.},
TITLE = {Lessico del testo Arte de marear de Juan de Moya},
YEAR = {2005},
URL = {https://iris.cnr.it/handle/20.500.14243/195912},
}
@MISC{SABA_2005_MISC_SSCPCG_464688,
AUTHOR = {Saba, A. and Sassi, M. and Carpi, E. and Periñán, B. and Calí, S. and García-Macho, M. L.},
TITLE = {Corpus del LéNESO (Léxico Náutico del Español del Siglo de Oro)},
YEAR = {2005},
URL = {https://iris.cnr.it/handle/20.500.14243/464688},
}
@MISC{SORIA_2005_MISC_SM_192731,
AUTHOR = {Soria, C. and Monachini, M.},
TITLE = {MILE-OWL},
YEAR = {2005},
URL = {https://iris.cnr.it/handle/20.500.14243/192731},
}
@ARTICLE{ALLEGRINI_2004_ARTICLE_AGGW_50338,
AUTHOR = {Allegrini, P. and Giuntoli, M. and Grigolini, P. and West, B. J.},
TITLE = {From knowledge, knowability and the search for objective randomness to a new vision of complexity},
YEAR = {2004},
ABSTRACT = {Herein we consider various concepts of entropy as measures of the complexity of phenomena and in so doing encounter a fundamental problem in physics that affects how we understand the nature of reality. In essence the difficulty has to do with our understanding of randomness, irreversibility and unpredictability using physical theory, and these in turn undermine our certainty regarding what we can and what we cannot know about complex phenomena in general. The sources of complexity examined herein appear to be channels for the amplification of naturally occurring randomness in the physical world. Our analysis suggests that when the conditions for the renormalization group apply, this spontaneous randomness, which is not a reflection of our limited knowledge, but a genuine property of nature, does not realize the conventional thermodynamic state, and a new condition, intermediate between the dynamic and the thermodynamic state, emerges. We argue that with this vision of complexity, life, which with ordinary statistical mechanics seems to be foreign to physics, becomes a natural consequence of dynamical processes},
PAGES = {11--32},
URL = {https://iris.cnr.it/handle/20.500.14243/50338},
VOLUME = {20},
ISSN = {0960-0779},
JOURNAL = {CHAOS, SOLITONS AND FRACTALS},
}
@ARTICLE{ALLEGRINI_2004_ARTICLE_AGP_50337,
AUTHOR = {Allegrini, P. and Grigolini, P. and Palatella, L.},
TITLE = {Intermittency and scale-free networks: a dynamical model for human language complexity},
YEAR = {2004},
ABSTRACT = {In this paper we try to model certain features of human language complexity by means of advanced concepts borrowed from statistical mechanics. We use a time series approach, the diffusion entropy (DE) method, to compute the complexity of an Italian corpus of newspapers and magazines. We find that the anomalous scaling index is compatible with a simple dynamical model, a random walk on a complex scale-free network, which is linguistically related to Saussure's paradigms. The network complexity is independently measured on the same corpus, looking at the co-occurrence of nouns and verbs. This connection of cognitive complexity with long-range time correlations also provides an explanation for the famous Zipf's law in terms of the generalized central limit theorem},
PAGES = {95--105},
URL = {https://iris.cnr.it/handle/20.500.14243/50337},
VOLUME = {20},
}
@ARTICLE{BOZZI_2004_ARTICLE_B_37690,
AUTHOR = {Bozzi, A.},
TITLE = {Postfazione a Zampolli Antonio, Filologia e informatica: le origini della filologia computazionale},
YEAR = {2004},
PAGES = {21--24},
URL = {https://iris.cnr.it/handle/20.500.14243/37690},
VOLUME = {32},
}
@ARTICLE{BOZZI_2004_ARTICLE_B_37689,
AUTHOR = {Bozzi, A.},
TITLE = {Verso una filologia computazionale: la prima Euroconferenza della European Science Foundation},
YEAR = {2004},
ABSTRACT = {Digital technology offers to the philological disciplines many new tools and techniques for the editorial work. These have been the topics discussed at the first Euroconference sponsored by the European Science Foundation, which was held in September 2003 near Pisa. More than 70 scholars and young researchers from many countries attended the conference. The following paper gives a brief description of the themes discussed and the future developments envisaged for the different sectors in which philological disciplines are subdivided},
KEYWORDS = {Filologia computazionale, digitalizzazione dei documenti, edizioni elettroniche},
PAGES = {128--138},
URL = {https://iris.cnr.it/handle/20.500.14243/37689},
VOLUME = {32},
ISSN = {0870-0133},
JOURNAL = {EUPHROSYNE},
}
@ARTICLE{BOZZI_2004_ARTICLE_B_37688,
AUTHOR = {Bozzi, A.},
TITLE = {Tecnologie e beni librari: il digitale in biblioteca e in archivio},
YEAR = {2004},
PAGES = {439--445},
URL = {https://iris.cnr.it/handle/20.500.14243/37688},
VOLUME = {2},
}
@ARTICLE{BOZZI_2004_ARTICLE_BCL_37687,
AUTHOR = {Bozzi, A. and Cignoni, L. and Lebrave, J.},
TITLE = {Introduction},
YEAR = {2004},
ABSTRACT = {This volume contains a number of contributions resulting from the scientific discussions held during the Euroconference "Philological Disciplines and Digital Technology" (Il Ciocco, Castelvecchio Pascoli, Italy, 7-11 September, 2003), sponsored by the European Science Foundation (ESF), the Conseil National de la Recherche Scientifique (CNRS) and the Regione Toscana (Tuscan Region). Therefore, the articles published here are not the Proceedings of that Conference but, more interestingly, they reflect the themes that were dealt with on that occasion. Owing to the different scientific experiences, the papers cover a wide range of issues but their authors share the same scope, which is to provide an accurate and precise state-of-the-art description of Digital Philology. In the light of the digital revolution, what is the position of philological disciplines? How are critical editors reacting to this? How do they perceive the functions of this technology? Is it seen only as a tool for teaching and for research, or does it assume a more innovative role from a methodological point-of-view? It is said, at least in Italy, that the critical-editor's profession is at a crisis: the publication or re-publication of texts, especially ancient ones, is carried out by an increasingly smaller number of specialists as well as students. The term 'philology', in reality, is more and more often used to define 'stylistics', 'literary critics', 'anthropology of literature', etc. If these considerations are true, how then can technological development and the creation of digital libraries have a positive influence on the editorial profession in order to help reverse the negative trend of a diminished interest by young researchers in the production of critical editions? 
At the end of the 1960's similar reflections were made already when the development of information technology (IT) for the literary and philological disciplines was still at its pioneering stage: for example on the occasion of the important seminar "La pratique des ordinateurs dans la critique des textes", organised by CNRS in Paris in 1968},
PAGES = {xi--xiii},
URL = {https://iris.cnr.it/handle/20.500.14243/37687},
VOLUME = {20-21},
ISSN = {0392-6907},
JOURNAL = {LINGUISTICA COMPUTAZIONALE},
}
@ARTICLE{BOZZI_2004_ARTICLE_BC_433720,
AUTHOR = {Bozzi, A. and Corradini, M.},
TITLE = {Aspects and methods of computer-aided textual criticism},
YEAR = {2004},
ABSTRACT = {The development of digital technology in libraries and archives fosters the development of computational tools for the study of sources in view of publication, in Internet or CD, of critical editions. This paper presents a system for computational philology developed at the Institute for Computational Linguistics (ILC) of the National Research Council (CNR), Pisa, for the management of images and texts, experimented on Greek papyri, medieval manuscripts and ancient printed books. The aspects concerning critical apparatus and stemmatics were carried out in collaboration with the Department of Romance Languages and Literatures of Pisa University},
KEYWORDS = {Philological workstation, Textual criticism, Stemmatology},
PAGES = {49--66},
URL = {https://iris.cnr.it/handle/20.500.14243/433720},
VOLUME = {20-21},
ISSN = {0392-6907},
JOURNAL = {LINGUISTICA COMPUTAZIONALE},
}
@ARTICLE{BRESCIANI_2004_ARTICLE_BMBF_433721,
AUTHOR = {Bresciani, E. and Menchetti, A. and Bozzi, A. and Fedeli, G.},
TITLE = {DiPhiloS: un sistema di filologia computazionale applicato a referti medici greci su papiro},
YEAR = {2004},
PAGES = {267--286},
URL = {https://iris.cnr.it/handle/20.500.14243/433721},
VOLUME = {15},
}
@ARTICLE{CALZOLARI_2004_ARTICLE_C_37691,
AUTHOR = {Calzolari, N.},
TITLE = {The Strategic Role of LRs: ENABLER and the Committee for Written LRs and Evaluation},
YEAR = {2004},
URL = {https://iris.cnr.it/handle/20.500.14243/37691},
}
@ARTICLE{CALZOLARI_2004_ARTICLE_CL_37692,
AUTHOR = {Calzolari, N. and Lenci, A.},
TITLE = {Linguistica Computazionale-Strumenti e risorse per il Trattamento Automatico della Lingua},
YEAR = {2004},
URL = {https://iris.cnr.it/handle/20.500.14243/37692},
}
@ARTICLE{CAPPELLI_2004_ARTICLE_CG_79605,
AUTHOR = {Cappelli, A. and Giovannetti, E.},
TITLE = {L'Interazione uomo-robot},
YEAR = {2004},
ABSTRACT = {L'Interazione Uomo-Robot (HRI, Human-Robot Interaction) è un'area di ricerca multidisciplinare in costante sviluppo ricca di spunti per ricerche avanzate e trasferimenti di tecnologia. Essa gioca un ruolo fondamentale nella realizzazione di robot che operano in ambienti aperti e cooperano con gli esseri umani. Compiti di questo tipo richiedono lo sviluppo di tecniche che permettano ad utenti inesperti di usare i loro robot in modo semplice e sicuro utilizzando interfacce intuitive e naturali. In questo lavoro, dopo un'introduzione riguardante le questioni fondamentali dell'HRI, saranno indagate le diverse classificazioni di robot e una particolare tassonomia dell'interazione uomo-robot, dopodiché saranno presentate le diverse modalità di interazione possibili tra un robot e un essere umano corredate da una serie di applicazioni di interfacce uomo-robot avanzate},
KEYWORDS = {Human-robot interaction},
PAGES = {18--36},
URL = {https://iris.cnr.it/handle/20.500.14243/79605},
VOLUME = {1 (2)},
ISSN = {1724-8035},
JOURNAL = {INTELLIGENZA ARTIFICIALE},
}
@ARTICLE{DIDONATO_2004_ARTICLE_D_383730,
AUTHOR = {Di Donato, F.},
TITLE = {Verso uno "European Citation Index for the Humanities". Che cosa possono fare i ricercatori per la comunicazione scientifica},
YEAR = {2004},
ABSTRACT = {As a matter of principle, to open publish is a tautology, because making a text public means to maximize the access to texts and documents; but in practice, the equivalence doesn't work. Why? The answer depends on a twofold tension: the first tension is the one between Science and Technology, that is, between on the one hand the research process and the needs of scientists, and on the other, technological possibilities and limits, depending on publishing media (printed paper, computers, the Internet and the Web). The second is the tension between cataloguing (classification) and selection, that means the tension between the need to archive the results of human research, and to make them accessible; and, when quantity grows and several restrictions come out, the need of selection. This article is a discussion of a recent initiative of the ESF, the "European Citation Index of the Humanities"; it aims at providing some elements for the authors to consider, seeking an answer to the first question},
URL = {https://iris.cnr.it/handle/20.500.14243/383730},
ISSN = {1591-4305},
JOURNAL = {BOLLETTINO TELEMATICO DI FILOSOFIA POLITICA},
}
@ARTICLE{FURFARI_2004_ARTICLE_FSPSB_170613,
AUTHOR = {Furfari, F. and Soria, C. and Pirrelli, V. and Signore, O. and Bianchi Bandinelli, R.},
TITLE = {NICHE: Natural Interaction in Computerised Home Environments},
YEAR = {2004},
ABSTRACT = {Future technologies will provide users with increasing control over surrounding devices embedded in a common home environment. Somewhat paradoxically, this could result in an increase rather than a reduction in complexity if support for high-level interfacing is not introduced. This concern prompted the launching of a medium-term project aimed at promoting natural user-home interaction along the lines of the Ambient Intelligence vision},
KEYWORDS = {HCI, Home Automation, Smart Home},
PAGES = {55--56},
URL = {http://www.ercim.org/publication/Ercim_News/enw58/furfari.html},
VOLUME = {58},
ISSN = {0926-4981},
JOURNAL = {ERCIM NEWS},
}
@ARTICLE{GUADAGNINI_2004_ARTICLE_G_265586,
AUTHOR = {Guadagnini, E.},
TITLE = {Scelta di voci del Tesoro della Lingua Italiana delle Origini (ottava serie)},
YEAR = {2004},
ABSTRACT = {Voci dialèttica s. f., dialèttico agg. /s. m., diàvola s. f., diavolerìa s. f., diavolettino s. m., diavoletto s. m., diàvolo agg., diàvolo s. m. del Tesoro della Lingua Italiana delle Origini (pp. 262-273)},
PAGES = {53--348},
URL = {https://iris.cnr.it/handle/20.500.14243/265586},
VOLUME = {9},
ISSN = {1591-8254},
JOURNAL = {BOLLETTINO-OPERA DEL VOCABOLARIO ITALIANO},
}
@ARTICLE{MAGNINI_2004_ARTICLE_MC_37685,
AUTHOR = {Magnini, B. and Calzolari, N.},
TITLE = {Temi e prospettive di ricerca per l'elaborazione del linguaggio naturale in Italia-Topics and Research Perspectives for Natural Language Processing in Italy},
YEAR = {2004},
URL = {https://iris.cnr.it/handle/20.500.14243/37685},
}
@ARTICLE{MELE_2004_ARTICLE_MARDMSCO_13240,
AUTHOR = {Mele, A. and Avena, M. and Roullet, P. and De Leonibus, E. and Mandillo, S. and Sargolini, F. and Coccurello, R. and Oliverio, A.},
TITLE = {Nucleus accumbens dopamine receptors in the consolidation of spatial memory},
YEAR = {2004},
ABSTRACT = {Nucleus accumbens dopamine is known to play an important role in motor activity and in behaviours governed by drugs and natural reinforcers, as well as in nonassociative forms of learning. At the same time, activation of D1 and D2 dopamine receptors has been suggested to promote intracellular events related to neural plasticity. Therefore, in this study we wished to investigate the role of the two classes of dopamine receptors within the nucleus accumbens on the consolidation of spatial information. On day 1, CD1 male mice were placed in an open field containing five different objects and, immediately after three sessions of habituation, the animals were focally injected within the nucleus accumbens with either the D1 antagonist SCH 23390 (12.5, 25 or 50 ng/side), or the D2 antagonist sulpiride (25, 50, 75 or 100 ng/side). Twenty-four hours later the ability of mice to discriminate an object displacement was assessed. Both the D1 and the D2 antagonists impaired the ability of mice to detect the spatial change. If the highest doses of the two antagonists were injected 2 h after the end of the last of the habituation sessions, no effect was observed in the reactivity to spatial change examined 24 h later. These data demonstrate that activation of both D1 and D2 receptors within the accumbens is necessary in the early stages of the consolidation of spatial information. The data are discussed in terms of involvement of nucleus accumbens dopamine in information processing in the absence of explicit reinforcers},
KEYWORDS = {dopamine, SCH 23390, sulpiride, plasticity, spatial learning},
PAGES = {423--431},
URL = {http://journals.lww.com/behaviouralpharm/pages/articleviewer.aspx?year=2004\&issue=09000\&article=00017\&type=abstract},
VOLUME = {15 (5-6)},
DOI = {10.1097/00008877-200409000-00017},
ISSN = {0955-8810},
JOURNAL = {BEHAVIOURAL PHARMACOLOGY},
}
@ARTICLE{NASCIMENTO_2004_ARTICLE_NAC_37686,
AUTHOR = {Nascimento, A. and Alberto, P. and Cappelli, G.},
TITLE = {OLISSIPO-entre filologia e informática: recursos para gerir o estudo do texto latino},
YEAR = {2004},
PAGES = {111--125},
URL = {https://iris.cnr.it/handle/20.500.14243/37686},
VOLUME = {32},
}
@BOOK{ALLEGRINI_2004_BOOK_AGP_134797,
AUTHOR = {Allegrini, P. and Grigolini, P. and Palatella, L.},
TITLE = {Cognitive scale-free networks as a model for intermittency in human language},
YEAR = {2004},
URL = {https://iris.cnr.it/handle/20.500.14243/134797},
PUBLISHER = {World Scientific Publ. Co (Singapore, SGP)},
CONFERENCE_PLACE = {Singapore},
}
@BOOK{BALDI_2004_BOOK_BBC_137727,
AUTHOR = {Baldi, M. and Bozzi, A. and Canziani, G.},
TITLE = {I Contradicentium medicorum libri di G. Cardano in DVD},
YEAR = {2004},
URL = {https://iris.cnr.it/handle/20.500.14243/137727},
}
@BOOK{BOZZI_2004_BOOK_BCL_134786,
AUTHOR = {Bozzi, A. and Cignoni, L. and Lebrave, J.-L.},
TITLE = {Digital Technology and Philological Disciplines},
YEAR = {2004},
URL = {https://iris.cnr.it/handle/20.500.14243/134786},
}
@BOOK{DIDONATO_2004_BOOK_D_383735,
AUTHOR = {Di Donato, F.},
TITLE = {Nei limiti della ragione. Il problema della famiglia in Kant},
YEAR = {2004},
ABSTRACT = {L'atto sessuale può essere visto come la strumentalizzazione di un altro per il piacere di uno solo; e i bambini vengono a far parte di una famiglia senza il loro consenso. Per questo, secondo Kant, i rapporti familiari non possono essere intesi come contrattuali. D'altra parte, dal momento che le persone non sono cose, non possono neppure essere compresi come una collezione di diritti reali o diritti sulle cose. Kant sentì la necessità di aggiungere un nuovo titolo ai diritti personali e ai diritti reali, allo scopo di rispondere a una domanda fondamentale, connessa ad alcuni momenti essenziali dell'esistenza umana (il rapporto sessuale e la nascita): a quali condizioni è possibile istituire una famiglia giusta? Il nuovo titolo fu molto criticato, e la teoria di Kant fu dimenticata. La Rechtslehre, tuttavia, riconosce il bambino come primo cittadino del mondo, tratta il diritto alla genitorialità come indistinto e congiunto e postula l'uguaglianza delle donne. Tale modello supera così la dicotomia tra pubblico e privato, e anticipa le teorie femministe che riconoscono la necessità di fondare la prima comunità umana su basi razionali. Nei limiti della ragione si propone di mostrare la forza innovativa del progetto di famiglia razionale kantiana grazie al confronto con Fichte e Mary Wollstonecraft, e attraverso il dialogo con il dibattito femminista di oggi. È infatti possibile progettare una famiglia giusta, che tuteli i soggetti più deboli, a partire da Kant},
URL = {https://iris.cnr.it/handle/20.500.14243/383735},
}
@BOOK{SABA_2004_BOOK_S_134796,
AUTHOR = {Saba, A.},
TITLE = {El léxico del Compendio de la arte de navegar de Rodrigo Zamorano},
YEAR = {2004},
ABSTRACT = {A dos años de distancia de la publicación del Léxico del Breve compendio de la Esfera y de la arte de navegar de Martín Cortés, aparece el Compendio de la arte de navegar de Rodrigo Zamorano, ambos a cargo de Antonina Saba*. Esta obra constituye una provechosa contribución al incremento de un corpus de textos españoles del siglo XVI, nacido con el intento de crear un Léxico náutico del Español del Siglo de Oro (LÉNESO**). Este proyecto se está llevando a cabo con la contribución del Istituto di Linguistica Computazionale del CNR e del Dipartimento di Lingue romanze dell'Università di Pisa, del Departamento de Lengua Española y Lingüística General y de la Sección de Medios Impresos de la UNED de Madrid. El objetivo final es contribuir a la realización del "Diccionario de la Navegación del Siglo de Oro", dirigido por María Lourdes Garcia-Macho, subvencionado por la Dirección General de Enseñanza Superior e Investigación Científica del Ministerio de la Educación y Cultura. El enorme desarrollo económico y cultural que tuvo España después del descubrimiento de América, debido principalmente al comercio y a los intercambios con el Nuevo Mundo, favoreció la expansión de disciplinas relacionadas con la cosmografía, la astronomía, la cartografía, la meteorología, dando un impulso notable a la técnica de la navegación. El mérito de Zamorano y de sus compañeros Cortés, Chaves, Guevara, Medina, Palacio, Poza, Siria y otros, fue el aliento que dieron al cultivo de estas disciplinas nuevas e innovadoras. Los libros náuticos y los manuales de navegación de la época son una fuente inestimable de neologismos y tecnicismos en varios campos científicos y sobre todo el relacionado con la navegación, sin olvidar el aporte de topónimos que surgieron de los derroteros y de las cartas náuticas. 
El volumen que presentamos contiene la concordancia lematizada, los índices de frecuencia de los lemas y de los nombres propios, el diccionario inverso del Compendio de la arte de navegar, y un sistema de consulta del texto contenido en un CD-ROM, que constituyen una novedad y un estímulo para toda investigación sobre la lengua de la navegación},
KEYWORDS = {analisi linguistica, lessicografia, lessico specializzato},
PAGES = {IX-XXIX},
URL = {https://iris.cnr.it/handle/20.500.14243/134796},
ISBN = {8436206894},
EDITOR = {Saba, A.},
}
@INCOLLECTION{AGOSTINIANI_2004_INCOLLECTION_AMPP_134789,
AUTHOR = {Agostiniani, L. and Montemagni, S. and Paoli, M. and Picchi, E.},
TITLE = {Lessicografia dialettale e computer: questioni di rappresentazione e recupero dei dati},
YEAR = {2004},
KEYWORDS = {Lessicografia computazionale, Lessicografia Dialettale},
URL = {https://iris.cnr.it/handle/20.500.14243/134789},
PUBLISHER = {Centro Interuniversitario di Studi Veneti (Venezia, ITA)},
CONFERENCE_PLACE = {Venezia},
}
@INCOLLECTION{BARTOLINI_2004_INCOLLECTION_BLMPS_436876,
AUTHOR = {Bartolini, R. and Lenci, A. and Montemagni, S. and Pirrelli, V. and Soria, C.},
TITLE = {Automatic Classification and Analysis of Provisions in Italian Legal Texts: A Case Study},
YEAR = {2004},
ABSTRACT = {In this paper we address the problem of automatically enriching legal texts with semantic annotation, an essential prerequisite to effective indexing and retrieval of legal documents. This is done through illustration of SALEM (Semantic Annotation for LEgal Management), a computational system developed for automated semantic annotation of (Italian) law texts. SALEM is an incremental system using Natural Language Processing techniques to perform two tasks: i) classify law paragraphs according to their regulatory content, and ii) extract relevant text fragments corresponding to specific semantic roles that are relevant for the different types of regulatory content. The paper sketches the overall architecture of SALEM and reports results of a preliminary case study on a sample of Italian law texts},
KEYWORDS = {Annotazione semantica, Classificazione automatica},
PAGES = {593-604},
URL = {https://rdcu.be/dftjm},
DOI = {10.1007/978-3-540-30470-8_72},
PUBLISHER = {Springer (Berlin, DEU)},
ISBN = {978-3-540-23664-1},
CONFERENCE_PLACE = {Berlin},
BOOKTITLE = {On the Move to Meaningful Internet Systems 2004: OTM 2004 Workshops. OTM 2004},
EDITOR = {Meersman, R. and Tari, Z. and Corsaro, A.},
}
@INCOLLECTION{CALZOLARI_2004_INCOLLECTION_CP_134791,
AUTHOR = {Calzolari, N. and Paoloni, A.},
TITLE = {Il Trattamento Automatico della Lingua: definizione e aree tecnologiche},
YEAR = {2004},
URL = {https://iris.cnr.it/handle/20.500.14243/134791},
}
@INCOLLECTION{PAOLI_2004_INCOLLECTION_PMP_134795,
AUTHOR = {Paoli, M. and Montemagni, S. and Picchi, E.},
TITLE = {ALT Web: l'Atlante Lessicale Toscano in rete},
YEAR = {2004},
URL = {https://iris.cnr.it/handle/20.500.14243/134795},
PUBLISHER = {Centro Interuniversitario di Studi Veneti (Venezia, ITA)},
CONFERENCE_PLACE = {Venezia},
}
@COMMENT{Stray PHP diagnostics from the export script were removed here (lib_pipol.php line 7034: "Undefined array key 0" and "strtoupper(): Passing null to parameter 1"). NOTE(review): presumably raised while building the key of the next record, whose AUTHOR is empty; confirm and supply the author.}
@EDITORIAL{_2004_EDITORIAL__181024,
AUTHOR = {},
TITLE = {Digital Technology and Philological Disciplines},
YEAR = {2004},
URL = {https://iris.cnr.it/handle/20.500.14243/181024},
}
@INPROCEEDINGS{ALBERTO_2004_INPROCEEDINGS_ACPP_64210,
AUTHOR = {Alberto, P. and Cappelli, G. and Passarotti, M. and Pena, A.},
TITLE = {Strumenti informatici per l'analisi dei testi latini},
YEAR = {2004},
URL = {https://iris.cnr.it/handle/20.500.14243/64210},
CONFERENCE_NAME = {Antiguidade Clássica: Que fazer com este património? Colóquio à memória de Victor Jabouille},
}
@INPROCEEDINGS{BAGLIONI_2004_INPROCEEDINGS_BNG_57545,
AUTHOR = {Baglioni, M. and Nanni, M. and Giovannetti, E.},
TITLE = {Mining literary texts using domain ontologies},
YEAR = {2004},
ABSTRACT = {This paper describes a query system on texts and literary material with advanced information retrieval tools. As a test bed we chose the electronic version of Dante's Inferno, manually tagged using XML, enriched with a domain ontology describing the historical, social and cultural context represented as a separate XML document},
KEYWORDS = {Ontology Engineering, Text Mining},
PAGES = {79-84},
URL = {https://iris.cnr.it/handle/20.500.14243/57545},
CONFERENCE_NAME = {Knowledge Discovery and Ontologies Workshop 2004},
BOOKTITLE = {Proceedings of the Knowledge Discovery and Ontologies Workshop 2004},
EDITOR = {Svátek, V.},
}
@INPROCEEDINGS{BARBERA_2004_INPROCEEDINGS_BD_383729,
AUTHOR = {Barbera, M. and Di Donato, F.},
TITLE = {Open Access and Semantic Web. SW Applications for Open Publishing},
YEAR = {2004},
ABSTRACT = {The Open Access movement, grown since the first Nineties and quickly developed in the last years, aims at enlarging the dissemination of scientific knowledge; based on the assumption that the Internet and the World Wide Web are able to offer "the chance to constitute a global and interactive representation of human knowledge, including cultural heritage and the guarantee of worldwide access", the signatories of the Berlin Declaration on Open Access (2003) pledged themselves to make the future Web sustainable, interactive, and transparent through the use of openly accessible compatible content and software tools. It is a well-known fact that one of the major applications of Semantic Web, the Dublin Core metadata set, is devoted to the connection of the scientific knowledge in a unique global network. Thanks to the metadata harvesting protocol of the Open Archives Initiative (OAI-PMH), this goal has yet become possible. Nevertheless, despite these developments are able to significantly modify the nature of scientific publishing as well as the existing system of quality assurance, nowadays the application of Web Semantic technology is limited to archiving and cataloguing; and the main issue of Semantic Web, selection by quality criteria, is lacking in application. This paper describes a set of applications conceived in order to fill the gap; HyperJournal, in particular, is a web application that facilitates the administration of academic journals on the Web; it is based on four major features that will be further described, and on the idea of a shared linkbase through a P2P technology, developed at the Università Politecnica delle Marche},
URL = {https://iris.cnr.it/handle/20.500.14243/383729},
}
@INPROCEEDINGS{BARTOLINI_2004_INPROCEEDINGS_BLMP_77220,
AUTHOR = {Bartolini, R. and Lenci, A. and Montemagni, S. and Pirrelli, V.},
TITLE = {Hybrid Constraints for Robust Parsing: First Experiments and Evaluation},
YEAR = {2004},
URL = {https://iris.cnr.it/handle/20.500.14243/77220},
CONFERENCE_NAME = {LREC 2004: Fourth International Conference on Language Resources and Evaluation},
}
@INPROCEEDINGS{BARTOLINI_2004_INPROCEEDINGS_BLMPS_431278,
AUTHOR = {Bartolini, R. and Lenci, A. and Montemagni, S. and Pirrelli, V. and Soria, C.},
TITLE = {Semantic Mark-up of Italian Legal Texts Through NLP-based Techniques},
YEAR = {2004},
URL = {https://iris.cnr.it/handle/20.500.14243/431278},
ISBN = {2-9517408-1-6},
CONFERENCE_NAME = {LREC 2004: Fourth International Conference on Language Resources and Evaluation},
}
@INPROCEEDINGS{BERTAGNA_2004_INPROCEEDINGS_BCMSU_77221,
AUTHOR = {Bertagna, F. and Calzolari, N. and Monachini, M. and Soria, C. and Ulivieri, M.},
TITLE = {Report on the interlingual annotation experience at ILC-CNR},
YEAR = {2004},
URL = {http://citeseerx.ist.psu.edu/viewdoc/download?doi=10.1.1.92.5078\&rep=rep1\&type=pdf},
CONFERENCE_NAME = {Seventh Interlingua Workshop on Determining Interlingua Utility for Machine Translation},
BOOKTITLE = {Biennial Conference of the AMTA-Determining Interlingua Utility for Machine Translation},
EDITOR = {Habash, N. and Dorr, B. and Hovy, E. and Reeder, F.},
}
@INPROCEEDINGS{BERTAGNA_2004_INPROCEEDINGS_BLMC_77223,
AUTHOR = {Bertagna, F. and Lenci, A. and Monachini, M. and Calzolari, N.},
TITLE = {Content Interoperability of Lexical Resources: Open Issues and MILE Perspectives},
YEAR = {2004},
ABSTRACT = {The paper tackles the issue of content interoperability among lexical resources, by presenting an experiment of mapping differently conceived lexicons, FrameNet and NOMLEX, onto MILE (Multilingual ISLE Lexical Entry), a meta-entry for the encoding of multilingual lexical information, acting as a general schema of shared and common lexical objects. The aim is to (i) raise problems and (ii) test the expressive potentialities of MILE as a standard environment for Computational Lexicons},
PAGES = {131-134},
URL = {https://iris.cnr.it/handle/20.500.14243/77223},
ISBN = {2-9517408-1-6},
CONFERENCE_NAME = {LREC 2004: Fourth International Conference on Language Resources and Evaluation, held in Memory of Antonio Zampolli. Lisbon, Portugal, Proceedings, Volume I, Paris, The European Language Resources Association (ELRA)},
}
@INPROCEEDINGS{BERTAGNA_2004_INPROCEEDINGS_BLMC_77222,
AUTHOR = {Bertagna, F. and Lenci, A. and Monachini, M. and Calzolari, N.},
TITLE = {The MILE Lexical Classes: Data Categories for Content Interoperability among Lexicons},
YEAR = {2004},
PAGES = {8},
URL = {https://iris.cnr.it/handle/20.500.14243/77222},
ISBN = {2-9517408-1-6},
CONFERENCE_NAME = {LREC 2004: Fourth International Conference on Language Resources and Evaluation-Workshop: A Registry of Linguistic Data Categories within an Integrated Language Resources Repository Area (INTERA)},
}
@INPROCEEDINGS{BOZZI_2004_INPROCEEDINGS_B_64243,
AUTHOR = {Bozzi, A.},
TITLE = {Electronic Publishing and Computational Philology},
YEAR = {2004},
ABSTRACT = {This paper is concerned with the relationship between electronic publishing and digital scholarly textual criticism. Hypertextual techniques and computational tools are compared. These two different methodologies applied to modern and contemporary texts with respect to ancient manuscript tradition are highlighted. Particular attention is focussed on the general criteria employed in the development of a computer-assisted workstation for digital editions of Greek papyri and medieval manuscripts},
KEYWORDS = {Electronic publishing, Computational philology, Digital Libraries, Textual criticism},
PAGES = {3-24},
URL = {https://iris.cnr.it/handle/20.500.14243/64243},
VOLUME = {XXIV-XXV},
PUBLISHER = {Istituti Editoriali e Poligrafici Internazionali (Pisa-Roma, ITA)},
ISSN = {0392-6907},
ISBN = {978-88-8147-435-6},
CONFERENCE_NAME = {The Evolution of Texts: Confronting Stemmatological and Genetical Methods},
CONFERENCE_PLACE = {Pisa-Roma},
BOOKTITLE = {LINGUISTICA COMPUTAZIONALE},
EDITOR = {Macé, C. and Baret, P. and Bozzi, A. and Cignoni, L.},
}
@INPROCEEDINGS{BOZZI_2004_INPROCEEDINGS_BR_77218,
AUTHOR = {Bozzi, A. and Raggioli, A.},
TITLE = {DiPhiloS: un sistema di filologia computazionale applicato a referti medici greci su papiro},
YEAR = {2004},
URL = {https://iris.cnr.it/handle/20.500.14243/77218},
CONFERENCE_NAME = {Seminario di Studi: Testi medici su papiro},
}
@INPROCEEDINGS{BUSEMANN_2004_INPROCEEDINGS_BCCKE_77219,
AUTHOR = {Busemann, S. and Calzolari, N. and Choukri, K. and Krauwer, S.},
TITLE = {Building the LR\&E Roadmap: Joint COCOSDA and ICCWLRE Meeting},
YEAR = {2004},
URL = {https://iris.cnr.it/handle/20.500.14243/77219},
}
@INPROCEEDINGS{CALZOLARI_2004_INPROCEEDINGS_C_64226,
AUTHOR = {Calzolari, N.},
TITLE = {European Initiatives to Promote Cooperation between Speech and Text Communities},
YEAR = {2004},
URL = {https://iris.cnr.it/handle/20.500.14243/64226},
}
@INPROCEEDINGS{CALZOLARI_2004_INPROCEEDINGS_C_64212,
AUTHOR = {Calzolari, N.},
TITLE = {Computational Lexicons-Open and Distributed Lexical Infrastructure},
YEAR = {2004},
URL = {https://iris.cnr.it/handle/20.500.14243/64212},
}
@INPROCEEDINGS{CALZOLARI_2004_INPROCEEDINGS_CCGMBFLMMP_64214,
AUTHOR = {Calzolari, N. and Choukri, K. and Gavrilidou, M. and Maegaard, B. and Baroni, P. and Fersøe, H. and Lenci, A. and Mapelli, V. and Monachini, M. and Piperidis, S.},
TITLE = {ENABLER Thematic Network of National Projects: Technical, Strategic and Political Issues of LRs},
YEAR = {2004},
ABSTRACT = {In this paper we present general strategies concerning Language Resources (LRs)-Written, Spoken and, recently, Multimodal-as developed within the ENABLER Thematic Network. LRs are a central component of the so-called "linguistic infrastructure" (the other key element being Evaluation), necessary for the development of any Human Language Technology (HLT) application. They play a critical role, as horizontal technology, in different emerging areas of FP6, and have been recognized as a priority within a number of national projects around Europe and world-wide. The availability of LRs is also a "sensitive" issue, touching directly the sphere of linguistic and cultural identity, but also with economical, societal and political implications. This is going to be even more true in the new Europe with 25 languages on a par},
KEYWORDS = {Language Resources, Strategic and Political Issues, Written and Spoken, Linguistic Infrastructure, Supranational Coordination},
PAGES = {937-940},
URL = {http://www.lrec-conf.org/proceedings/lrec2004/},
VOLUME = {III},
PUBLISHER = {European Language Resources Association (ELRA)-Evaluations and Language resources Distribution Agency (ELDA) (Paris, FRA)},
ISBN = {2-9517408-1-6},
CONFERENCE_NAME = {LREC 2004-Fourth International Conference on Language Resources and Evaluation},
CONFERENCE_PLACE = {Paris},
BOOKTITLE = {Proceedings of the Fourth International Conference on Language Resources and Evaluation},
EDITOR = {Lino, M. T. and Xavier, M. F. and Ferreira, F. and Costa, R. and Silva, R.},
}
@INPROCEEDINGS{CAPPELLI_2004_INPROCEEDINGS_CGM_57553,
AUTHOR = {Cappelli, A. and Giovannetti, E. and Michelassi, P.},
TITLE = {Ontological knowledge and language in modelling classical architectonic structures},
YEAR = {2004},
ABSTRACT = {This article will concern the specification of the conceptual and linguistic constraints for the construction of a knowledge base in classical architecture, an operation that involves the structuring of the concepts of the domain to which appropriate linguistic terms must be associated. Our approach will take into account models of conceptual dictionaries proposed in computational linguistics as well as knowledge representation and ontological formalisms proposed in artificial intelligence and ontological engineering},
KEYWORDS = {Ontological engineering, Knowledge Representation Formalisms and Methods},
PAGES = {85-89},
URL = {https://iris.cnr.it/handle/20.500.14243/57553},
CONFERENCE_NAME = {Ontologies and Lexical Resources in Distributed Environment Ontolex 2004},
BOOKTITLE = {Proceedings of OntoLex 2004-Ontologies and Lexical Resources in Distributed Environment},
}
@INPROCEEDINGS{CAPPELLI_2004_INPROCEEDINGS_CA_64227,
AUTHOR = {Cappelli, G. and Alberto, P.},
TITLE = {The OLISSIPO and LECTIO Projects},
YEAR = {2004},
URL = {https://iris.cnr.it/handle/20.500.14243/64227},
CONFERENCE_NAME = {LREC 2004: Fourth International Conference on Language Resources and Evaluation},
}
@INPROCEEDINGS{DECLERCK_2004_INPROCEEDINGS_DBCL_64228,
AUTHOR = {Declerck, T. and Buitelaar, P. and Calzolari, N. and Lenci, A.},
TITLE = {Towards a Language Infrastructure for the Semantic Web},
YEAR = {2004},
URL = {https://iris.cnr.it/handle/20.500.14243/64228},
}
@INPROCEEDINGS{FERDEGHINI_2004_INPROCEEDINGS_FMBPB_1865,
AUTHOR = {Ferdeghini, E. M. and Marcheschi, P. and Bozzi, A. and Prediletto, R. and Benassi, A.},
TITLE = {Radiologic image library for pathology related searches},
YEAR = {2004},
ABSTRACT = {The present study aims to apply to a medical information system, tools and methods, derived from computational linguistics, to allow the navigation, annotation and creative analysis of the stored data (in particular radiologic images of cardiological and pneumological patients) for longitudinal and transversal studies},
KEYWORDS = {information systems},
PAGES = {689-692},
URL = {https://iris.cnr.it/handle/20.500.14243/1865},
VOLUME = {31},
PUBLISHER = {IEEE Computer Society (Long Beach (Calif.), USA)},
ISBN = {0-7803-8927-1},
CONFERENCE_NAME = {Computers in Cardiology},
CONFERENCE_PLACE = {Long Beach (Calif.)},
BOOKTITLE = {Computers in Cardiology 2004},
EDITOR = {Murray, A.},
}
@INPROCEEDINGS{FERDEGHINI_2004_INPROCEEDINGS_FMBPB_64244,
AUTHOR = {Ferdeghini, E. and Marcheschi, P. and Bozzi, A. and Prediletto, R. and Benassi, A.},
TITLE = {Radiologic Image Library for Pathology Related Searches},
YEAR = {2004},
URL = {https://iris.cnr.it/handle/20.500.14243/64244},
CONFERENCE_NAME = {Computers in Cardiology},
}
@INPROCEEDINGS{FERSE_2004_INPROCEEDINGS_FM_64229,
AUTHOR = {Fersøe, H. and Monachini, M.},
TITLE = {ELRA Validation Methodology and Standard Promotion for Linguistic Resources},
YEAR = {2004},
ABSTRACT = {This paper describes the results of work made for ELRA during 2003-2004. It describes the methodology for validation of written language resources (WLRs), specifically lexica, which has been developed for ELRA and tested on a few resources in the ELRA catalogue. It discusses the importance of key issues in lexicon creation and validation such as the adoption of standards for the coding of linguistic content and the importance of documentation. It reports on the experience gained from applying the methodology to lexical resources in the ELRA catalogue arguing that the checks must be reasonable, informative, on a suitable level of detail, and generic. It proposes a set of basic elements to be included in future discussions on establishing standards for lexicon resources. In conclusion it sketches the work to be undertaken in 2004 to promote validation and the adoption of standards},
PAGES = {941-944},
URL = {https://iris.cnr.it/handle/20.500.14243/64229},
ISBN = {2-9517408-1-6},
CONFERENCE_NAME = {LREC 2004: Fourth International Conference on Language Resources and Evaluation},
}
@INPROCEEDINGS{HEPPLE_2004_INPROCEEDINGS_HNAMMG_64230,
AUTHOR = {Hepple, M. and Ireson, N. and Allegrini, P. and Marchi, S. and Montemagni, S. and Gómez Hidalgo, J.},
TITLE = {NLP-enhanced Content filtering within the POESIA Project},
YEAR = {2004},
ABSTRACT = {This paper introduces the POESIA internet filtering system, which is open-source, and which combines standard filtering methods, such as positive/negative URL lists, with more advanced techniques, such as image processing and NLP-enhanced text filtering. The description here focusses on components providing textual content filtering for three European languages (English, Italian and Spanish), employing NLP methods to enhance performance. We address also the acquisition of language data needed to develop these filters, and the evaluation of the system and its components},
KEYWORDS = {Image processing, Natural language processing systems, Open systems},
PAGES = {1967-1970},
URL = {https://www.aclweb.org/anthology/L04-1507/},
ISBN = {2-9517408-1-6},
CONFERENCE_NAME = {LREC 2004: Fourth International Conference on Language Resources and Evaluation},
BOOKTITLE = {Proceedings of the Fourth International Conference on Language Resources and Evaluation (LREC 2004)},
EDITOR = {Lino, M. T. and Xavier, M. F. and Ferreira, F. and Costa, R. and Silva, R.},
}
@INPROCEEDINGS{MARINELLI_2004_INPROCEEDINGS_M_64231,
AUTHOR = {Marinelli, R.},
TITLE = {Proper Names and Polysemy: From a Lexicographic Experience},
YEAR = {2004},
URL = {https://iris.cnr.it/handle/20.500.14243/64231},
CONFERENCE_NAME = {LREC 2004: Fourth International Conference on Language Resources and Evaluation},
}
@INPROCEEDINGS{MARINELLI_2004_INPROCEEDINGS_MRE_64232,
AUTHOR = {Marinelli, R. and Roventini, A. and Enea, A.},
TITLE = {Building a Maritime Domain Lexicon: a Few Considerations on the Database Structure and the Semantic Coding},
YEAR = {2004},
URL = {https://iris.cnr.it/handle/20.500.14243/64232},
CONFERENCE_NAME = {LREC 2004: Fourth International Conference on Language Resources and Evaluation},
}
@INPROCEEDINGS{MONACHINI_2004_INPROCEEDINGS_MCMRU_64233,
AUTHOR = {Monachini, M. and Calzolari, F. and Mammini, M. and Rossi, S. and Ulivieri, M.},
TITLE = {Unifying Lexicons in view of a Phonological and Morphological Lexical DB},
YEAR = {2004},
ABSTRACT = {The present work falls in the line of activities promoted by the European Language Resource Association (ELRA) Production Committee (PCom) and raises issues in methods, procedures and tools for the reusability, creation, and management of Language Resources. A two-fold purpose lies behind this experiment. The first aim is to investigate the feasibility, define methods and procedures for combining two Italian lexical resources that have incompatible formats and complementary information into a Unified Lexicon (UL). The adopted strategy and the procedures appointed are described together with the driving criterion of the merging task, where a balance between human and computational efforts is pursued. The coverage of the UL has been maximized, by making use of simple and fast matching procedures. The second aim is to exploit this newly obtained resource for implementing the phonological and morphological layers of the CLIPS lexical database. Implementing these new layers and linking them with the already existing syntactic and semantic layers is not a trivial task. The constraints imposed by the model, the impact at the architectural level and the solution adopted in order to make the whole database 'speak' efficiently are presented. Advantages vs. disadvantages are discussed},
PAGES = {1107-1110},
ISBN = {2-9517408-1-6},
CONFERENCE_NAME = {LREC 2004: Fourth International Conference on Language Resources and Evaluation},
}
@INPROCEEDINGS{PANUZZI_2004_INPROCEEDINGS_PPM_64234,
AUTHOR = {Panuzzi, A. and Picchi, E. and Moneglia, M.},
TITLE = {Using PiTagger for Lemmatization and PoS Tagging of a Spontaneous Speech Corpus: C-Oral-Rom Italian},
YEAR = {2004},
ABSTRACT = {The automatic lemmatization and morpho-syntactic annotation of spoken language is a quite recent and complex task for Natural Language Processing. The state of the art on written corpora don't provide us with a satisfactory level of analysis regarding spontaneous spoken language (Uchimoto et al., 2002; Moreno \& Guirao, 2003). The spontaneous speech corpus Italian C-ORALROM has been tagged with Part of Speech (Pos) and morpho-syntactic information, using and adapting an already existing tool trained on Italian written resources (PiTagger, developed by Eugenio Picchi, ILC-CNR Pisa). The incidence of spoken domain on the performance is within a 10\% of errors detected in the manual evaluation procedure. Some issues concerning spoken language emerged. The definition of significant contexts for PoS statistics is to be provided by utterance boundaries; moreover, the relevance of a series of phenomena related to the prosodic parsing has been highlighted: fragmentation phenomena, a relative lack of information for all word adjacent to utterance boundaries; under-specification of PoS for words in connection to secondary prosodic breaks and one word utterances},
KEYWORDS = {Lemmatization, Pos Tagging},
PAGES = {563-566},
URL = {http://www.lrec-conf.org/lrec2004/},
PUBLISHER = {European Language Resources Association (ELRA)-Evaluations and Language resources Distribution Agency (ELDA) (Paris, FRA)},
ISBN = {2-9517408-1-6},
CONFERENCE_NAME = {LREC 2004: Fourth International Conference on Language Resources and Evaluation},
CONFERENCE_PLACE = {Paris},
BOOKTITLE = {Proceedings: in LREC 2004: Fourth International Conference on Language Resources and Evaluation},
}
@INPROCEEDINGS{PARDELLI_2004_INPROCEEDINGS_PSG_64235,
AUTHOR = {Pardelli, G. and Sassi, M. and Goggi, S.},
TITLE = {From Weaver to the ALPAC Report},
YEAR = {2004},
ABSTRACT = {This paper presents a sample pertaining to the creation and the use of words in the field of Natural Language Processing (NLP) in the years 1949-1966. These words have been statistically sorted and the results could be taken as a proof that electronic processing of linguistic data leads to the diffusion of clear and concise words for describing a complex concept which would need a circumlocution to be described instead. The aim of this article is to provide an evolutionary overview of these new lexical forms in the various languages for the period taken into account and, whereas possible, a data register and a tabular representation have been prepared as well},
KEYWORDS = {Terminology, Natural Language Processing},
PAGES = {2005-2008},
URL = {https://iris.cnr.it/handle/20.500.14243/64235},
PUBLISHER = {European Language Resources Association (ELRA)-Evaluations and Language resources Distribution Agency (ELDA) (Paris, FRA)},
ISBN = {2-9517408-1-6},
CONFERENCE_NAME = {LREC 2004: Fourth International Conference on Language Resources and Evaluation},
CONFERENCE_PLACE = {Paris},
EDITOR = {Lino, M. T. and Xavier, M. F. and Ferreira, F. and Costa, R. and Silva, R.},
}
@INPROCEEDINGS{PICCHI_2004_INPROCEEDINGS_PCCSS_64236,
AUTHOR = {Picchi, E. and Ceccotti, M. L. and Cucurullo, S. and Sassi, M. and Sassolini, E.},
TITLE = {Linguistic Miner. An Italian Linguistic Knowledge System},
YEAR = {2004},
ABSTRACT = {Linguistic Miner is a project carried out at ILC whose objective is the development of an integrated system to build, organise and manage a corpus of Italian texts (of various origins and formats), and to design and constantly add new tools for the automatic extraction of tiered linguistic knowledge to be made available for many teaching, publishing, and other cultural purposes. The project is based on a notion that is preliminary to all the systems for corpus-based linguistic analysis: a language represented by the largest possible collection of heterogeneous texts is the best source of linguistic information at any level of analysis considered. The first goals of such a system are the semi-automated construction of an Italian data mine for the extraction of linguistic information, the validation of linguistic patterns, the installation of useful tools and resources for a range of different categories of Italian language users. The main feature of the project is its purpose of building large language reference corpora allowing for the creation and use of effective tools for the handling and processing, as well as the automatic linguistic synthesis, of such corpora},
KEYWORDS = {linguistic analysis, information extraction},
PAGES = {1811-1814},
URL = {http://www.lrec-conf.org/lrec2004/},
VOLUME = {V},
ISBN = {2-9517408-1-6},
CONFERENCE_NAME = {LREC 2004: Fourth International Conference on Language Resources and Evaluation},
BOOKTITLE = {Proceedings of the 4th International Conference on Language Resources and Evaluation},
}
@INPROCEEDINGS{PIRRELLI_2004_INPROCEEDINGS_PCHV_13247,
AUTHOR = {Pirrelli, V. and Calderone, B. and Herreros, I. and Virgilio, M.},
TITLE = {Non-locality all the way through: Emergent Global Constraints in the Italian Morphological Lexicon},
YEAR = {2004},
ABSTRACT = {The paper reports on the behaviour of a Kohonen map of the mental lexicon, monitored through different phases of acquisition of the Italian verb system. Reported experiments appear to consistently reproduce emergent global ordering constraints on memory traces of inflected verb forms, developed through principles of local interactions between parallel processing neurons},
URL = {https://iris.cnr.it/handle/20.500.14243/13247},
}
@INPROCEEDINGS{QUOCHI_2004_INPROCEEDINGS_Q_64237,
AUTHOR = {Quochi, V.},
TITLE = {Representing Italian Complex Nominals: A Pilot Study},
YEAR = {2004},
ABSTRACT = {A corpus-based investigation of Italian Complex Nominals (CNs), of the form N PP, which aims at clarifying their syntactic and semantic constitution, is presented. The main goal is to find out useful parameters for their representation in a computational lexicon. As a reference model we have taken an implementation of Pustejovsky's Generative Lexicon Theory (1995), the SIMPLE Italian Lexicon, and in particular the Extended Qualia Structure. Italian CN formation mainly exploits post-modification; of particular interest here are CNs of the kind N PP since this syntactic pattern is highly productive in Italian and such CNs very often translate compound nouns of other languages. One of the major problems posed by CNs for interpretation is the retrieval or identification of the semantic relation linking their components, which is (at least partially) implicit on the surface. Studying a small sample, we observed some interesting facts that could be useful when setting up a larger experiment to identify semantic relations and/or automatically learn the syntactic peculiarities of given semantic paradigms. Finally, a set of representational features exploiting the results from our corpus is proposed},
KEYWORDS = {Multiword expression, Complex Nominals, Italian language},
PAGES = {1863-1866},
URL = {https://iris.cnr.it/handle/20.500.14243/64237},
ISBN = {2-9517408-1-6},
CONFERENCE_NAME = {LREC 2004: Fourth International Conference on Language Resources and Evaluation},
BOOKTITLE = {Proceedings of the Fourth International Conference on Language Resources and Evaluation, LREC'04},
}
@INPROCEEDINGS{ROVENTINI_2004_INPROCEEDINGS_RM_64238,
AUTHOR = {Roventini, A. and Marinelli, R.},
TITLE = {Extending the Italian WordNet with the Specialized language of the Maritime Domain},
YEAR = {2004},
URL = {https://iris.cnr.it/handle/20.500.14243/64238},
CONFERENCE_NAME = {Second International WordNet Conference, GWC 2004},
}
@INPROCEEDINGS{RUIMY_2004_INPROCEEDINGS_RBC_64239,
AUTHOR = {Ruimy, N. and Bouillon, P. and Cartoni, B.},
TITLE = {Semi-Automatic Derivation of a French Lexicon from CLIPS},
YEAR = {2004},
ABSTRACT = {In this paper we describe the methodology developed in the framework of a feasibility study for the derivation of a semantically annotated French lexicon from a monolingual Italian lexical resource. Firstly, an outline of the source lexicon is provided. Then, the two different and complementary strategies that have been experimented for pairing off the relevant monolingual Italian entries and their translational equivalents are described. Finally, the results achieved through each of the illustrated methodologies are presented, their viability is evaluated and a general assessment of the experiment performed is provided},
KEYWORDS = {cognate, sense indicator, semantic lexicon, matching rules, multilingual morphology},
PAGES = {1099--1102},
URL = {https://iris.cnr.it/handle/20.500.14243/64239},
CONFERENCE_NAME = {LREC 2004: Fourth International Conference on Language Resources and Evaluation},
BOOKTITLE = {Proceedings of the Fourth International Conference on Language Resources and Evaluation, LREC'04},
}
@TECHREPORT{BARONI_2004_TECHREPORT_BCLQU_195897,
AUTHOR = {Baroni, P. and Calzolari, N. and Lenci, A. and Quochi, V. and Ulivieri, M.},
TITLE = {Final Resources Landscape},
YEAR = {2004},
ABSTRACT = {ELSNET-4 Deliverable D6.4},
KEYWORDS = {Language Resources, Landscapes},
PAGES = {11},
URL = {https://iris.cnr.it/handle/20.500.14243/195897},
}
@TECHREPORT{BARONI_2004_TECHREPORT_BCM_195899,
AUTHOR = {Baroni, P. and Calzolari, N. and Mammini, M.},
TITLE = {Final Resources Roadmap},
YEAR = {2004},
ABSTRACT = {ELSNET-4 Deliverable D6.3},
KEYWORDS = {Language Resources, Roadmaps},
URL = {https://iris.cnr.it/handle/20.500.14243/195899},
}
@techreport{BARTOLINI_2004_TECHREPORT_BGLMP_195902,
  author = {Bartolini, E. and Giorgetti, D. and Lenci, A. and Montemagni, S. and Pirrelli, V.},
  title  = {Text-2-Knowledge: Acquisizione automatica di ontologie per l'indicizzazione semantica di documenti},
  year   = {2004},
  url    = {https://iris.cnr.it/handle/20.500.14243/195902},
}
@techreport{CECCOTTI_2004_TECHREPORT_CS_195914,
  author = {Ceccotti, M. and Sassi, M.},
  title  = {Gadda in Abruzzo. Concordanze per lemma},
  year   = {2004},
  url    = {https://iris.cnr.it/handle/20.500.14243/195914},
}
@techreport{GAVRILIDOU_2004_TECHREPORT_GGDLMSPRS_457832,
  author = {Gavrilidou, M. and Giouli, V. and Desipri, E. and Labropoulou, P. and Monachini, M. and Soria, C. and Picchi, E. and Ruffolo, P. and Sassolini, E.},
  title  = {Report on the multilingual resources production},
  year   = {2004},
  url    = {https://iris.cnr.it/handle/20.500.14243/457832},
}
@techreport{GAVRILIDOU_2004_TECHREPORT_GGDMS_195915,
  author = {Gavrilidou, M. and Giouli, V. and Desipri, E. and Monachini, M. and Soria, C.},
  title  = {Report on the model of LRs production. INTERA},
  year   = {2004},
  url    = {https://iris.cnr.it/handle/20.500.14243/195915},
}
@TECHREPORT{SABA_2004_TECHREPORT_S_195892,
AUTHOR = {Saba, A.},
TITLE = {Lessico del testo ``Ytinerario de navegación de los mares y tierras occidentales''},
YEAR = {2004},
URL = {https://iris.cnr.it/handle/20.500.14243/195892},
}
@techreport{SABA_2004_TECHREPORT_S_195891,
  author = {Saba, A.},
  title  = {Lessico del testo Libro de las longitudes y manera que hasta agora se ha tenido en el arte de navegar, con sus demonstraciones y exemplos},
  year   = {2004},
  url    = {https://iris.cnr.it/handle/20.500.14243/195891},
}
@misc{ALLEGRINI_2004_MISC_AMM_458592,
  author   = {Allegrini, P. and Marchi, S. and Montemagni, S.},
  title    = {The Italian NLP Filter},
  year     = {2004},
  abstract = {Resoconto delle attività del gruppo di ricerca ILC-CNR nel contesto del progetto POESIA. Workshop Finale "Present and Future of Open-source Content-based Web Filtering"},
  url      = {https://iris.cnr.it/handle/20.500.14243/458592},
}
@MISC{BARBERA_2004_MISC_BD_384180,
AUTHOR = {Barbera, M. and Di Donato, F.},
TITLE = {HyperJournal Howto: a beginner's guide to HyperJournal 0.4},
YEAR = {2004},
ABSTRACT = {A beginner's guide to HyperJournal 0.4},
URL = {https://iris.cnr.it/handle/20.500.14243/384180},
}
@misc{BOZZI_2004_MISC_B_435677,
  author          = {Bozzi, A.},
  title           = {Analisi linguistica e documenti digitali: un servizio innovativo per la fruizione dei beni librari},
  year            = {2004},
  url             = {https://iris.cnr.it/handle/20.500.14243/435677},
  conference_name = {TAL in biblioteca. Conferenza a cura del Forum per il Trattamento Automatico della Lingua},
}
@misc{BOZZI_2004_MISC_B_106738,
  author          = {Bozzi, A.},
  title           = {The DIPHILOS workstation for critical apparatus management: some experiments on medieval provençal texts},
  year            = {2004},
  url             = {https://iris.cnr.it/handle/20.500.14243/106738},
  conference_name = {Textual Criticism and Genetics Confronting Methods},
}
@misc{BOZZI_2004_MISC_B_192723,
  author = {Bozzi, A.},
  title  = {CHLT-LEMLAT},
  year   = {2004},
  url    = {https://iris.cnr.it/handle/20.500.14243/192723},
}
@misc{BOZZI_2004_MISC_BC_106737,
  author          = {Bozzi, A. and Corradini, M. S.},
  title           = {Aspetti di critica testuale assistita da calcolatore},
  year            = {2004},
  url             = {https://iris.cnr.it/handle/20.500.14243/106737},
  conference_name = {XXIV Congrès International de Linguistique et de Philologie Romanes (CILPR 2004)},
}
@MISC{CASALINI_2004_MISC_CDP_383734,
AUTHOR = {Casalini, B. and Di Donato, F. and Pievatolo, M. C.},
TITLE = {Guédon J.-C., La lunga ombra di Oldenburg: i bibliotecari, i ricercatori, gli editori e il controllo della pubblicazione scientifica},
YEAR = {2004},
ABSTRACT = {In the last 50 years, publishers have managed to transform scholarly journals—traditionally, a secondary, unpromising publishing venture at best—into big business. How they have managed to create extremely high profit rates is a story that has not yet been clearly told. What is the real basis behind this astounding capability? What is the source of their power? How can it be subverted? This presentation will address these questions, but more research is clearly needed, and it is of such scope as to require a concerted, sustained effort. Recently, because of the advent of digitization and the Internet, the technical system of scientific communication has undergone a profound change that is still unfolding. The imposition of site licenses and the corresponding development of library consortia signal changes so deep that the very status of the "document" and the ways in which individuals may interact with it appear quite incommensurable with the past. The role of libraries is also deeply subverted, as we shall see. The consequences stemming from these developments are difficult to ascertain, but we can be sure that scientific communication is morphing. This presentation will endeavor to sketch out two scenarios that are presently unfolding on courses that, although relatively separate for the moment, will eventually collide. Each one of these scenarios corresponds to a different take on the paradigmatic shift. Which one will win is unclear; it may even be that these two scenarios will compete for quite some time. In any case, we need to acquire an image of the territory we are entering, however grained, and of the forces that are shaping its contours, if mapping out strategies is of the essence. 
In effect, this presentation asks whether the results of fundamental research in science, technology, and medicine—results that clearly stand at a pre-competitive stage if viewed in commercial terms, results that may even, in some cases, save lives—will remain part of humanity's knowledge commons, or whether they will be gradually confiscated for the benefit of smaller and smaller scientific and business elites},
URL = {https://iris.cnr.it/handle/20.500.14243/383734},
}
@MISC{DIDONATO_2004_MISC_D_406235,
AUTHOR = {Di Donato, F.},
TITLE = {Open Publishing in the Humanities},
YEAR = {2004},
ABSTRACT = {What does Open Publishing in the Humanities mean?},
URL = {https://iris.cnr.it/handle/20.500.14243/406235},
}
@misc{DIDONATO_2004_MISC_D_383727,
  author = {Di Donato, F.},
  title  = {H. Hohenegger, Kant filosofo dell'architettonica. Saggio sulla Critica della facoltà di giudizio, Quodlibet (coll. Estetica e critica), Macerata 2004},
  year   = {2004},
  url    = {https://iris.cnr.it/handle/20.500.14243/383727},
  issn   = {1126-4780},
}
@misc{ENEA_2004_MISC_E_123698,
  author   = {Enea, A.},
  title    = {Gli ARCHIVI FOTOGRAFICI degli Istituti per la storia della Resistenza e della società contemporanea in Italia},
  year     = {2004},
  abstract = {Sono consultabili le descrizioni di archivi fotografici dell'Istituto nazionale e degli Istituti di Novara, Pavia, Sesto San Giovanni, Torino, e Udine, dell'archivio Albe e Lica Steiner (Politecnico di Milano), del Centro Studi e ricerca Silvio Trentin di Jesolo e del Comune di Corbetta. Le descrizioni dei fondi sono a livello di serie, eccezion fatta per l'Istituto di Torino dove sono descritti i singoli documenti con la riproduzione delle immagini},
  keywords = {archivistica, beni culturali},
  url      = {http://www.reteparri.it/risorse-on-line/servizi-archivistici},
}
@MISC{ENEA_2004_MISC_E_106736,
AUTHOR = {Enea, A.},
TITLE = {Prove di integrazione fra due applicativi: Isis e Guarini},
YEAR = {2004},
URL = {https://iris.cnr.it/handle/20.500.14243/106736},
CONFERENCE_NAME = {Accesso agli archivi informatici dell'Istituto: risultati e prospettive},
}
@misc{ENEA_2004_MISC_E_435676,
  author          = {Enea, A.},
  title           = {La banca dati Guida in rete: wwwisis e strategie di ricerca},
  year            = {2004},
  url             = {https://iris.cnr.it/handle/20.500.14243/435676},
  conference_name = {La Guida agli archivi della Resistenza},
}
@misc{MARCHI_2004_MISC_MA_458599,
  author   = {Marchi, S. and Allegrini, P.},
  title    = {POESIA: the Italian Content Filter},
  year     = {2004},
  abstract = {Modulo per il content filtering di pagine web in italiano},
  url      = {https://iris.cnr.it/handle/20.500.14243/458599},
}
@misc{PIRRELLI_2004_MISC_PAM_435675,
  author          = {Pirrelli, V. and Allegrini, P. and Montemagni, S.},
  title           = {Classifying text through time: a complexity science approach to dynamic web page filtering},
  year            = {2004},
  url             = {https://iris.cnr.it/handle/20.500.14243/435675},
  conference_name = {International Conference on Text Mining (CIFT)},
}
@misc{PIRRELLI_2004_MISC_PLM_106735,
  author          = {Pirrelli, V. and Lenci, A. and Montemagni, S.},
  title           = {The lexicon in context: distributional evidence and representational issues},
  year            = {2004},
  url             = {https://iris.cnr.it/handle/20.500.14243/106735},
  conference_name = {International Colloquium: Word Structure and Lexical Systems: models and applications},
}
@misc{SABA_2004_MISC_S_195893,
  author = {Saba, A.},
  title  = {Ytinerario de navegación de los mares y tierras occidentales},
  year   = {2004},
  url    = {https://iris.cnr.it/handle/20.500.14243/195893},
}
@misc{SABA_2004_MISC_SC_195917,
  author = {Saba, A. and Carpi, E.},
  title  = {Suma de Geographía que trata de todas las partidas y provincias del mundo, en especial de las Indias},
  year   = {2004},
  url    = {https://iris.cnr.it/handle/20.500.14243/195917},
}
@misc{SASSI_2004_MISC_SC_97599,
  author          = {Sassi, M. and Cinini, A.},
  title           = {Prototipo di analisi testuale delle sentenze della Cassazione. Estrazione automatica di descrittori},
  year            = {2004},
  abstract        = {En el ámbito del proyecto "Tecnologías para la justicia", coordinado por el Istituto di Ricerca sui Sistemi Giudiziari del CNR di Bologna (IRSIG), el Istituto di Linguistica Computazionale del CNR (ILC), ha brindado instrumentos, ya experimentados en la investigación lingüística, para la extracción de informaciones lingüístico-conceptuales desde grandes cantidades de datos textuales},
  keywords        = {classificazione del testo},
  url             = {https://iris.cnr.it/handle/20.500.14243/97599},
  conference_name = {IV Congreso Mundial de Derecho Informatico Alfa-Redi},
}
@ARTICLE{ALLEGRINI_2003_ARTICLE_AAGPR_144503,
AUTHOR = {Allegrini, P. and Aquino, G. and Grigolini, P. and Palatella, L. and Rosa, A.},
TITLE = {Generalized master equation via aging continuous-time random walks},
YEAR = {2003},
ABSTRACT = {We discuss the problem of the equivalence between continuous-time random walk (CTRW) and generalized master equation (GME). The walker, making instantaneous jumps from one site of the lattice to another, resides in each site for extended times. The sojourn times have a distribution density ψ(t) that is assumed to be an inverse power law with the power index µ. We assume that the Onsager principle is fulfilled, and we use this assumption to establish a complete equivalence between GME and the Montroll-Weiss CTRW. We prove that this equivalence is confined to the case where ψ(t) is an exponential. We argue that is so because the Montroll-Weiss CTRW, as recently proved by Barkai [E. Barkai, Phys. Rev. Lett. 90, 104101 (2003)], is nonstationary, thereby implying aging, while the Onsager principle is valid only in the case of fully aged systems. The case of a Poisson distribution of sojourn times is the only one with no aging associated to it, and consequently with no need to establish special initial conditions to fulfill the Onsager principle. We consider the case of a dichotomous fluctuation, and we prove that the Onsager principle is fulfilled for any form of regression to equilibrium provided that the stationary condition holds true. We set the stationary condition on both the CTRW and the GME, thereby creating a condition of total equivalence, regardless of the nature of the waiting-time distribution. As a consequence of this procedure we create a GME that is a bona fide master equation, in spite of being non-Markov. We note that the memory kernel of the GME affords information on the interaction between system of interest and its bath. The Poisson case yields a bath with infinitely fast fluctuations. We argue that departing from the Poisson form has the effect of creating a condition of infinite memory and that these results might be useful to shed light on the problem of how to unravel non-Markov quantum master equations. 
©2003 The American Physical Society},
PAGES = {056123--056134},
URL = {https://iris.cnr.it/handle/20.500.14243/144503},
VOLUME = {68},
}
@ARTICLE{ALLEGRINI_2003_ARTICLE_ABGHIMPRSVY_152319,
AUTHOR = {Allegrini, P. and Benci, V. and Grigolini, P. and Hamilton, P. and Ignaccolo, M. and Menconi, G. and Palatella, L. and Raffaelli, G. and Scafetta, N. and Virgilio, M. and Yang, J.},
TITLE = {Compression and diffusion: a joint approach to detect complexity},
YEAR = {2003},
ABSTRACT = {The adoption of the Kolmogorov–Sinai entropy is becoming a popular research tool among physicists, especially when applied to a dynamical system fitting the conditions of validity of the Pesin theorem. The study of time series that are a manifestation of system dynamics whose rules are either unknown or too complex for a mathematical treatment, is still a challenge since the KS entropy is not computable, in general, in that case. Here we present a plan of action based on the joint action of two procedures, both related to the KS entropy, but compatible with computer implementation through fast and efficient programs. The former procedure, called compression algorithm sensitive to regularity (CASToRE), establishes the amount of order by the numerical evaluation of algorithmic compressibility. The latter, called complex analysis of sequences via scaling and randomness assessment (CASSANDRA), establishes the complexity degree through the numerical evaluation of the strength of an anomalous effect. This is the departure, of the diffusion process generated by the observed fluctuations, from ordinary Brownian motion. The CASSANDRA algorithm shares with CASToRE a connection with the Kolmogorov complexity. This makes both algorithms especially suitable to study the transition from dynamics to thermodynamics, and the case of non-stationary time series as well. The benefit of the joint action of these two methods is proven by the analysis of artificial sequences with the same main properties as the real time series to which the joint use of these two methods will be applied in future research work},
PAGES = {517--535},
URL = {https://iris.cnr.it/handle/20.500.14243/152319},
VOLUME = {15},
}
@ARTICLE{ALLEGRINI_2003_ARTICLE_AMP_37654,
AUTHOR = {Allegrini, P. and Montemagni, S. and Pirrelli, V.},
TITLE = {Example-based automatic induction of semantic classes through entropic scores},
YEAR = {2003},
ABSTRACT = {The paper deals in some detail with the application of example-based machine learning techniques to the task of automatically acquiring semantic information from functionally annotated texts. Special emphasis is placed on the use of analogical proportions as a means of structuring the knowledge embodied in attested examples, and weighing up their contribution to a variety of lexico-semantic classification tasks. Careful quantitative analysis of automatically acquired information proves to shed considerable light on the semantic inter-connectivity of input data, their structure and organising principles},
PAGES = {1--45},
URL = {https://iris.cnr.it/handle/20.500.14243/37654},
VOLUME = {16-17},
ISSN = {0392-6907},
JOURNAL = {LINGUISTICA COMPUTAZIONALE},
}
@ARTICLE{BOZZI_2003_ARTICLE_B_37653,
AUTHOR = {Bozzi, A.},
TITLE = {Aspetti e problemi di spoglio elettronico di un archivio testuale: il caso dei Grammatici Latini antichi},
YEAR = {2003},
KEYWORDS = {Latino, Linguistica, Base di Dati, Filologia, Grammatica},
PAGES = {533--550},
URL = {https://iris.cnr.it/handle/20.500.14243/37653},
VOLUME = {31},
}
@ARTICLE{BOZZI_2003_ARTICLE_BC_37659,
AUTHOR = {Bozzi, A. and Corradini, M. S.},
TITLE = {The Diphilos workstation: a computational system for digital philology},
YEAR = {2003},
ABSTRACT = {Digital technology development and the conversion of ancient source documents in digital format allows to design software tools for philological disciplines. The Philological Workstation is able to: 1) manage images and texts; 2) perform an automatic link between each word of the manually transcribed manuscripts and the image-zones where the words are located; 3) associate annotations and variants to the text or to the image; 4) prepare indexes and concordances. A special module is also available to record the critical apparatus information allowing the user to evaluate the different typology each variant is dealing with. A multidimensional scaling algorithm shows the dependence between the collated sources in a 3D space. With regard to the ancient printed books, the workstation is able to train a specific neural system for automatic interpretation and transcription of the text, which, for the Latin language, is verified and corrected by a linguistic spelling checker},
PAGES = {47--77},
URL = {https://iris.cnr.it/handle/20.500.14243/37659},
VOLUME = {16-17},
ISSN = {0392-6907},
JOURNAL = {LINGUISTICA COMPUTAZIONALE},
}
@ARTICLE{CALZOLARI_2003_ARTICLE_CB_37647,
AUTHOR = {Calzolari, N. and Bindi, R.},
TITLE = {Acquisition of lexical information from a large textual Italian corpus},
YEAR = {2003},
ABSTRACT = {information others than those usually found in machine readable dictionaries or manually encoded by lexicographers are urgently needed. Different sources must be exploited if we want to overcome the lexical bottleneck of Natural Language Processing. Very interesting data can be found by processing large textual corpora, where the actual usage of the language can be truly investigated. These data refer, typically, to various kinds of syntagmatic relations, which are particularly problematic in many NLP applications. The paper describes how this data can be at least partially extracted by processing and analysing large text corpora, with quantitative/statistic methods. We describe two types of quantitative analyses whose aim is to extract information on the strength of association between two words, and on fixed phrases and idioms. We observe how the measure of the association ratio provides quantitative evidence to a number of lexical, syntactic and semantic relationships between word-pairs. One of the claims is that the linguistic information embodied in all these quite different types of lexical collocations can be helpful for lexical disambiguation in analysis and crucial for lexical selection in generation. This is a step towards a more objective lexicography and a more data-based linguistics},
PAGES = {117--131},
URL = {https://iris.cnr.it/handle/20.500.14243/37647},
VOLUME = {16-17},
ISSN = {0392-6907},
JOURNAL = {LINGUISTICA COMPUTAZIONALE},
}
@ARTICLE{CAMUGLIA_2003_ARTICLE_CCR_37645,
AUTHOR = {Camuglia, G. and Camuglia Ribarov, M. and Ribarov, K.},
TITLE = {Computer processing of a Clopen language system: old-church Slavonic},
YEAR = {2003},
ABSTRACT = {The aim of this work is to explain and reveal the mutual benefits of computational processing of a dead language and a contemporary language. The dead language considered is Old-Church Slavonic. We shall try to point out that processing of a dead language is important not only for a diachronic study of the language material, and that annotation is not the straightforward process that it may seem to be. We also describe briefly two frameworks for the processing of Old-Church Slavonic: DBT and STIN-O-SANCT},
PAGES = {133--150},
URL = {http://www.torrossa.it/pages/ipplatform/itemDetails.faces},
VOLUME = {16-17},
DOI = {10.1400/18156},
ISSN = {0392-6907},
JOURNAL = {LINGUISTICA COMPUTAZIONALE},
}
@ARTICLE{CAPPELLI_2003_ARTICLE_CMCC_37668,
AUTHOR = {Cappelli, A. and Moretti, L. and Catarsi, M. N. and Caligaris, C.},
TITLE = {Strumenti per l'accesso multilingue al contenuto dell'informazione},
YEAR = {2003},
PAGES = {151--182},
URL = {https://iris.cnr.it/handle/20.500.14243/37668},
VOLUME = {16-17},
ISSN = {0392-6907},
JOURNAL = {LINGUISTICA COMPUTAZIONALE},
}
@ARTICLE{CAPPELLI_2003_ARTICLE_C_37655,
AUTHOR = {Cappelli, G.},
TITLE = {OLISSIPO: strumento per l'estrazione automatica del vocabolario di base},
YEAR = {2003},
PAGES = {183--200},
URL = {https://iris.cnr.it/handle/20.500.14243/37655},
VOLUME = {16-17},
ISSN = {0392-6907},
JOURNAL = {LINGUISTICA COMPUTAZIONALE},
}
@ARTICLE{CAPPELLI_2003_ARTICLE_CP_37679,
AUTHOR = {Cappelli, G. and Passarotti, M.},
TITLE = {LemLat: uno strumento computazionale per l'analisi linguistica del latino. Sviluppo e prospettive},
YEAR = {2003},
PAGES = {519--531},
URL = {https://iris.cnr.it/handle/20.500.14243/37679},
VOLUME = {31},
}
@ARTICLE{CAROTA_2003_ARTICLE_CP_37662,
AUTHOR = {Carota, F. and Prodanof, I.},
TITLE = {A corpus-based account of suffix productivity in Italian},
YEAR = {2003},
PAGES = {201--220},
URL = {https://iris.cnr.it/handle/20.500.14243/37662},
VOLUME = {16-17},
ISSN = {0392-6907},
JOURNAL = {LINGUISTICA COMPUTAZIONALE},
}
@ARTICLE{CECCOTTI_2003_ARTICLE_CS_37680,
AUTHOR = {Ceccotti, M. L. and Sassi, M.},
TITLE = {L'Archivio elettronico delle Opere di Carlo Emilio Gadda in DBT 2000: risultati e prospettive (The Electronic Archive of Carlo Emilio Gadda's Works: results and prospects)},
YEAR = {2003},
KEYWORDS = {Strumenti lessicali, Database gaddiano, Letteratura italiana, Informatica umanistica, Carlo Emilio Gadda},
URL = {https://iris.cnr.it/handle/20.500.14243/37680},
VOLUME = {SUPII},
}
@ARTICLE{CECCOTTI_2003_ARTICLE_CS_37648,
AUTHOR = {Ceccotti, M. and Sassi, M.},
TITLE = {L'archivio elettronico delle opere di Carlo Emilio Gadda. Da redattori a fruitori di un data base testuale},
YEAR = {2003},
PAGES = {221--250},
URL = {https://iris.cnr.it/handle/20.500.14243/37648},
VOLUME = {16-17},
ISSN = {0392-6907},
JOURNAL = {LINGUISTICA COMPUTAZIONALE},
}
@ARTICLE{CIGNONI_2003_ARTICLE_CC_37646,
AUTHOR = {Cignoni, L. and Coffey, S.},
TITLE = {At the interface of onomastics and phraseology. Multiword units as proper names, proper names as 'common' phrasal units},
YEAR = {2003},
PAGES = {251--262},
URL = {https://iris.cnr.it/handle/20.500.14243/37646},
VOLUME = {16-17},
ISSN = {0392-6907},
JOURNAL = {LINGUISTICA COMPUTAZIONALE},
}
@ARTICLE{CIGNONI_2003_ARTICLE_CC_37671,
AUTHOR = {Cignoni, L. and Coffey, S.},
TITLE = {Considerations emerging from a frequency study of multiword units in a corpus of contemporary written Italian},
YEAR = {2003},
PAGES = {263--283},
URL = {https://iris.cnr.it/handle/20.500.14243/37671},
VOLUME = {16-17},
ISSN = {0392-6907},
JOURNAL = {LINGUISTICA COMPUTAZIONALE},
}
@ARTICLE{FERRARI_2003_ARTICLE_FP_433716,
AUTHOR = {Ferrari, G. and Prodanof, I.},
TITLE = {Computational modelling of tutorial dialogue},
YEAR = {2003},
PAGES = {285--322},
URL = {https://iris.cnr.it/handle/20.500.14243/433716},
VOLUME = {16-17},
ISSN = {0392-6907},
JOURNAL = {LINGUISTICA COMPUTAZIONALE},
}
@ARTICLE{GIORGETTI_2003_ARTICLE_GS_154345,
AUTHOR = {Giorgetti, D. and Sebastiani, F.},
TITLE = {Automating survey coding by multiclass text categorization techniques},
YEAR = {2003},
ABSTRACT = {Survey coding is the task of assigning a symbolic code from a predefined set of such codes to the answer given in response to an open-ended question in a questionnaire (aka survey). This task is usually carried out to group respondents according to a predefined scheme based on their answers. Survey coding has several applications, especially in the social sciences, ranging from the simple classification of respondents to the extraction of statistics on political opinions, health and lifestyle habits, customer satisfaction, brand fidelity, and patient satisfaction. Survey coding is a difficult task, because the code that should be attributed to a respondent based on the answer she has given is a matter of subjective judgment, and thus requires expertise. It is thus unsurprising that this task has traditionally been performed manually, by trained coders. Some attempts have been made at automating this task, most of them based on detecting the similarity between the answer and textual descriptions of the meanings of the candidate codes. We take a radically new stand, and formulate the problem of automated survey coding as a text categorization problem, that is, as the problem of learning, by means of supervised machine learning techniques, a model of the association between answers and codes from a training set of precoded answers, and applying the resulting model to the classification of new answers. In this article we experiment with two different learning techniques: one based on naive Bayesian classification, and the other one based on multiclass support vector machines, and test the resulting framework on a corpus of social surveys. The results we have obtained significantly outperform the results achieved by previous automated survey coding approaches},
KEYWORDS = {survey coding, text classification, machine learning, information retrieval},
PAGES = {1269--1277},
URL = {https://iris.cnr.it/handle/20.500.14243/154345},
VOLUME = {54},
ISSN = {1532-2882},
JOURNAL = {JOURNAL OF THE AMERICAN SOCIETY FOR INFORMATION SCIENCE AND TECHNOLOGY},
}
@ARTICLE{GUADAGNINI_2003_ARTICLE_G_275946,
AUTHOR = {Guadagnini, E.},
TITLE = {Scelta di voci del Tesoro della Lingua Italiana delle Origini (settima serie)},
YEAR = {2003},
ABSTRACT = {Voce città s. f. del Tesoro della Lingua Italiana delle Origini (pp. 117-128)},
PAGES = {43--239},
URL = {https://iris.cnr.it/handle/20.500.14243/275946},
VOLUME = {8},
ISSN = {1591-8254},
JOURNAL = {BOLLETTINO-OPERA DEL VOCABOLARIO ITALIANO},
}
@ARTICLE{LENCI_2003_ARTICLE_LMP_37664,
AUTHOR = {Lenci, A. and Montemagni, S. and Pirrelli, V.},
TITLE = {Chunk-it. An Italian shallow parser for robust syntactic annotation},
YEAR = {2003},
PAGES = {353--386},
URL = {https://iris.cnr.it/handle/20.500.14243/37664},
VOLUME = {16-17},
ISSN = {0392-6907},
JOURNAL = {LINGUISTICA COMPUTAZIONALE},
}
@ARTICLE{MARINELLI_2003_ARTICLE_M_37649,
AUTHOR = {Marinelli, R.},
TITLE = {Per una storia dell'archivio testuale dell'Istituto di Linguistica Computazionale: dati e gestione del catalogo informatizzato},
YEAR = {2003},
ABSTRACT = {Over the last few years there has been much discussion about the relation between types of data, storage devices and system requirements for the preservation of data. This work carried out for the reorganization of the magnetic Archive of the Institute of Computational Linguistics (ILC), is an example of interaction between data management and recovery methods, as well as between data recording system development and evolution of storage devices. Data structure has also been affected by the technological evolution. It has been necessary to rely on an efficient, well-structured and tested data-base management system. Thus a computerized system was implemented for the joint management of normalized cataloguing files and bibliographic data, using the Information Retrieval System CDS/ISIS. A suitable description corresponding to standard criteria is necessary for a reliable tracing of the documents. The correct use of international standards like ISO to process traditional bibliographic information assures the accessibility, readability and consistency of the data},
KEYWORDS = {databases, information retrieval systems, textual archives},
PAGES = {387--399},
URL = {https://iris.cnr.it/handle/20.500.14243/37649},
VOLUME = {16-17 (1)},
ISSN = {0392-6907},
JOURNAL = {LINGUISTICA COMPUTAZIONALE},
}
@ARTICLE{MARINELLI_2003_ARTICLE_MBBGMOPRCZ_37656,
AUTHOR = {Marinelli, R. and Biagini, L. and Bindi, R. and Goggi, S. and Monachini, M. and Orsolini, P. and Picchi, E. and Rossi, S. and Calzolari, N. and Zampolli, A.},
TITLE = {The Italian PAROLE corpus: an overview},
YEAR = {2003},
PAGES = {401--421},
URL = {https://iris.cnr.it/handle/20.500.14243/37656},
VOLUME = {16-17},
ISSN = {0392-6907},
JOURNAL = {LINGUISTICA COMPUTAZIONALE},
}
@ARTICLE{MEGA_2003_ARTICLE_MAGLPRV_146772,
AUTHOR = {Mega, M. S. and Allegrini, P. and Grigolini, P. and Latora, V. and Palatella, L. and Rapisarda, A. and Vinciguerra, S.},
TITLE = {Power-Law Time Distribution of Large Earthquakes},
YEAR = {2003},
ABSTRACT = {We study the statistical properties of time distribution of seismicity in California by means of a new method of analysis, the diffusion entropy. We find that the distribution of time intervals between a large earthquake (the main shock of a given seismic sequence) and the next one does not obey Poisson statistics, as assumed by the current models. We prove that this distribution is an inverse power law with an exponent µ = 2.06±0.01. We propose the long-range model, reproducing the main properties of the diffusion entropy and describing the seismic triggering mechanisms induced by large earthquakes},
KEYWORDS = {Scaling detection, main-shocks, diffusion entropy},
URL = {https://iris.cnr.it/handle/20.500.14243/146772},
VOLUME = {90},
ISSN = {0031-9007},
JOURNAL = {PHYSICAL REVIEW LETTERS (PRINT)},
}
@ARTICLE{MONACHINI_2003_ARTICLE_MC_37676,
AUTHOR = {Monachini, M. and Calzolari, N.},
TITLE = {Methods for standardization: the case of morphosyntax within the EAGLES project},
YEAR = {2003},
PAGES = {423--460},
URL = {https://iris.cnr.it/handle/20.500.14243/37676},
VOLUME = {16-17 (1)},
ISSN = {0392-6907},
JOURNAL = {LINGUISTICA COMPUTAZIONALE},
}
@ARTICLE{MONTEMAGNI_2003_ARTICLE_MBBCCLPZFMRBPSZMPD_37665,
AUTHOR = {Montemagni, S. and Barsotti, F. and Battista, M. and Calzolari, N. and Corazzari, O. and Lenci, A. and Pirrelli, V. and Zampolli, A. and Fanciulli, F. and Massetani, M. and Raffaelli, R. and Basili, R. and Pazienza, M. T. and Saracino, D. and Zanzotto, F. and Mana, N. and Pianesi, F. and Delmonte, R.},
TITLE = {The syntactic-semantic Treebank of Italian. An Overview},
YEAR = {2003},
PAGES = {461--492},
URL = {https://iris.cnr.it/handle/20.500.14243/37665},
VOLUME = {16-17},
ISSN = {0392-6907},
JOURNAL = {LINGUISTICA COMPUTAZIONALE},
}
@ARTICLE{MONTEMAGNI_2003_ARTICLE_MPB_37666,
AUTHOR = {Montemagni, S. and Picchi, E. and Biagini, L.},
TITLE = {DBT-ALT: a system for storing and querying the data of the 'Atlante Linguistico Toscano'},
YEAR = {2003},
ABSTRACT = {Computers can help dialectologists to make full use of the information they have so laboriously and painstakingly acquired: the basic dimensions of dialectal research can be enlarged and its possible outcomes can become more sophisticated. In this paper, we describe a lexical database for dialectal data, DBT-ALT, which has been designed and constructed to contain linguistic data collected for the Atlante Lessicale Toscano (ALT), a lexical atlas of Tuscany. DBT-ALT is illustrated in detail, with particular emphasis on its search functions which allow for complex queries taking into account a wide range of parameters interactively defined by the user on the basis of his/her research interests},
PAGES = {493--517},
URL = {https://iris.cnr.it/handle/20.500.14243/37666},
VOLUME = {18-19},
ISSN = {0392-6907},
JOURNAL = {LINGUISTICA COMPUTAZIONALE},
}
@ARTICLE{PARDELLI_2003_ARTICLE_P_37677,
AUTHOR = {Pardelli, G.},
TITLE = {BIBLOS: historical, philosophical and philological digital library of the Italian National Research Council},
YEAR = {2003},
ABSTRACT = {The BIBLOS project was established in 1996 for the purpose of creating an Internet site which would combine and organise all the information gathered by the various branches of the National Research Council (CNR) relating to the Humanities. The browsing system is based on a subject catalogue which represents the main access to the file, and which includes information on three different research topics: linguistics, philosophy and antiquities. The Institutes have already made available the information collected from their research activity and the databases which have been developed, usually in the form of bibliographic catalogues and specialised bibliographies},
KEYWORDS = {IT for Library, Biblioteche virtuali, Documentazione, Catalogazione, CNR},
PAGES = {519--549},
URL = {https://iris.cnr.it/handle/20.500.14243/37677},
VOLUME = {18-19},
DOI = {10.1400/18171},
ISSN = {0392-6907},
JOURNAL = {LINGUISTICA COMPUTAZIONALE},
}
@ARTICLE{PECCHIA_2003_ARTICLE_PG_37661,
AUTHOR = {Pecchia, L. and Guazzini, E.},
TITLE = {An Italian children's corpus of spoken language},
YEAR = {2003},
ABSTRACT = {In this paper we describe the criteria adopted for the creation of a corpus of spoken language produced by six-to-eleven-year-old children in different communicative situations, the methodology used for the collection of the data, the transcription, coding and lemmatization phases. This work is to be included among the activities carried out within the framework of the Corpus di Linguaggio Infantile (CLI), a special project of the Italian National Research Council (CNR)},
PAGES = {547--572},
URL = {https://iris.cnr.it/handle/20.500.14243/37661},
VOLUME = {18-19},
ISSN = {0392-6907},
JOURNAL = {LINGUISTICA COMPUTAZIONALE},
}
@ARTICLE{PETERS_2003_ARTICLE_PP_150092,
AUTHOR = {Peters, C. and Picchi, E.},
TITLE = {Bilingual lexicons, parallel and comparable corpora: creating the basis for cross language information retrieval},
YEAR = {2003},
ABSTRACT = {We summarise our work over the last decade aimed at the design and development of a series of tools studied for use in applications such as language learning, translation studies and bilingual lexicography. The different components of an integrated system for bilingual lexical and textual database management are outlined. Our final goal has been the implementation of a web-based system for cross-language information retrieval},
KEYWORDS = {Cross-language information retrieval, Multilingual corpora, Bilingual lexicography, Translation studies, Second language learning},
PAGES = {573--596},
URL = {https://iris.cnr.it/handle/20.500.14243/150092},
VOLUME = {18-19},
ISSN = {0392-6907},
JOURNAL = {LINGUISTICA COMPUTAZIONALE},
}
@ARTICLE{PICCHI_2003_ARTICLE_P_37678,
AUTHOR = {Picchi, E.},
TITLE = {PiSystem: sistemi integrati per l'analisi testuale},
YEAR = {2003},
ABSTRACT = {This paper provides an overview of the textual and lexical analysis tools implemented at the Institute of Computational Linguistics, which reflect the development of the studies and applications of the Institute from the pioneer stage of lexicography to its current state of progress. The analysis procedures coordinated and integrated in a system called PiSystem are presented, starting from the base element, DBT (Database Testuale), an analysis query system of textual material, with its correlated base functions. The procedures include the following: a) analysis of entire textual corpora; b) new international coding; d) text classification/lemmatization; computer-assisted lemmatization; automatic lemmatization; analysis, navigation and retrieval of linguistic information for lemmatized texts. DBT-DIG, a system specifically designed to deal with Digital Libraries (textual material in character and/or image format), with particular regard to the collection of periodicals available in libraries, is also presented. Other components of the Pi-System are illustrated in detail in articles in this volume: handling of multilingual environments; treatment of bilingual (Italian-Arabic) material; processing, analysis and navigation within the dialectal ALT (Atlante Lessicale Toscano) archive},
PAGES = {597--627},
URL = {https://iris.cnr.it/handle/20.500.14243/37678},
VOLUME = {18-19},
ISSN = {0392-6907},
JOURNAL = {LINGUISTICA COMPUTAZIONALE},
}
@ARTICLE{PICCHI_2003_ARTICLE_PSNC_433717,
AUTHOR = {Picchi, E. and Sassolini, E. and Nahli, O. and Cucurullo, S.},
TITLE = {Risorse monolingui e multilingui. Corpus bilingue italiano-arabo},
YEAR = {2003},
ABSTRACT = {The objective of the project is twofold: on the one hand, the creation and elaboration of software procedures for the Arabic language and, on the other hand, the creation of linguistic resources for the management of large Arabic corpora. The linguistic resources are substantially the following: a) Morphological engine for the Arabic language. The engine is constituted by a number of modules: the algorithms and modules for generation and analysis, an appropriate encoding system for the representation of lexical data and of morphological characteristics of Arabic, the so-called lemmario, i.e. the archive of lemmas; b) The automatic alignment of parallel texts in Italian and Arabic language; c) Automatic tagging of Arabic texts, performed by using the above morphological engine; d) Systems for accessing and querying (raw and/or tagged) Arabic texts and parallel Italian-Arabic corpora},
KEYWORDS = {Morfologia araba, Corpora bilingui, Analisi testuale, Aligner, Tagger},
PAGES = {629--678},
URL = {https://iris.cnr.it/handle/20.500.14243/433717},
VOLUME = {18-19},
ISSN = {0392-6907},
JOURNAL = {LINGUISTICA COMPUTAZIONALE},
}
@ARTICLE{PIRRELLI_2003_ARTICLE_PB_37650,
AUTHOR = {Pirrelli, V. and Battista, M.},
TITLE = {Syntagmatic and paradigmatic issues in computational morphology},
YEAR = {2003},
ABSTRACT = {In this paper some germane theoretical issues in inflectional morphology will be addressed from a computational point of view. In particular we shall focus on the proper treatment of verb stem allomorphy in Italian conjugation and discuss several different formal solutions in some detail. To put our discussion on a more computational footing, all our examples are illustrated by using the DATR formalism as our metalanguage. This allows us to combine the advantages of the advanced expressive power and flexibility of DATR with the further bonus of offering a running piece of program code that actually works on the discussed examples. The upshot of the paper is that a computational treatment of Italian conjugation can considerably benefit from recent theoretical advances in word and paradigm morphology, as this level of description allows the rule writer to capture generalizations which would otherwise completely elude a purely syntagmatic approach to allomorphy},
PAGES = {679--701},
URL = {https://iris.cnr.it/handle/20.500.14243/37650},
VOLUME = {18-19},
ISSN = {0392-6907},
JOURNAL = {LINGUISTICA COMPUTAZIONALE},
}
@ARTICLE{PRODANOF_2003_ARTICLE_PCM_37672,
AUTHOR = {Prodanof, I. and Cappelli, A. and Moretti, L.},
TITLE = {Resources and tools: experiences in language engineering},
YEAR = {2003},
ABSTRACT = {In this paper notions such as resources, tools and reusability related to the design and implementation of NLP applications at low costs will be discussed through examples from projects carried out within the frame of European programmes. The components embedded (dictionary and parser) and the ways in which these are reused will be presented},
PAGES = {703--744},
URL = {https://iris.cnr.it/handle/20.500.14243/37672},
VOLUME = {18-19},
ISSN = {0392-6907},
JOURNAL = {LINGUISTICA COMPUTAZIONALE},
}
@ARTICLE{ROVENTINI_2003_ARTICLE_RABCCGMMSZ_37667,
AUTHOR = {Roventini, A. and Alonge, A. and Bertagna, F. and Calzolari, N. and Cancila, J. and Girardi, C. and Magnini, B. and Marinelli, R. and Speranza, M. and Zampolli, A.},
TITLE = {ItalWordNet: building a large semantic database for the automatic treatment of Italian},
YEAR = {2003},
ABSTRACT = {This paper describes the main characteristics of the ItalWordNet semantic database, built in the context of the SI-TAL Italian National Project, within which a set of integrated resources and tools for the automatic treatment of the Italian language was realized. The database was created by extending the Italian wordnet developed within the EuroWordNet project, by adding: i) adjectives, adverbs and proper nouns (not dealt with in EuroWordNet); ii) a terminological subset related to the economic-financial domain. The relevant changes involved by these extensions both in the linguistic model and in the data structure are also illustrated. In particular, we discuss: i) the overall architecture of the database; ii) the semantic relations used to encode information on synsets; iii) the changes made to the EuroWordNet Top Ontology structure; iv) the specific characteristics of the terminological subset and the solutions adopted to link it to the generic wordnet},
KEYWORDS = {Database lessicale, Rete semantica, Relazioni semantiche, Risorse linguistiche},
PAGES = {745--791},
URL = {https://iris.cnr.it/handle/20.500.14243/37667},
VOLUME = {18-19},
ISSN = {0392-6907},
JOURNAL = {LINGUISTICA COMPUTAZIONALE},
}
@ARTICLE{RUIMY_2003_ARTICLE_RCGSCZ_37657,
AUTHOR = {Ruimy, N. and Corazzari, O. and Gola, E. and Spanu, A. and Calzolari, N. and Zampolli, A.},
TITLE = {The PAROLE model and the Italian Syntactic lexicon},
YEAR = {2003},
ABSTRACT = {This paper presents an overview of a large scale Syntactic Computational Lexicon of Italian. This lexicon was elaborated in the framework of the EC funded LE-PAROLE project, which developed core, generic and re-usable written language resources in 12 EU languages. All monolingual lexica were built according to the same design principles, same linguistic specifications and representation format. The PAROLE Italian lexicon is representative of modern Italian language use. The entries were selected on a frequency basis from the ILC Corpus and the syntactic structures encoded were partly inferred from their contexts of occurrence. Both the general structure of a PAROLE lexicon and the specificity of its Italian instantiation are presented. Some language-specific linguistic and lexicographic options concerning crucial issues to a lexicon building process are illustrated. An overview of the syntactic structures encoded for verbs, nouns and adjectives allows lexicon syntactic coverage as well as description fine-grainedness to be estimated},
PAGES = {793--820},
URL = {https://iris.cnr.it/handle/20.500.14243/37657},
VOLUME = {18-19},
ISSN = {0392-6907},
JOURNAL = {LINGUISTICA COMPUTAZIONALE},
}
@ARTICLE{RUIMY_2003_ARTICLE_RMGCDUR_37673,
AUTHOR = {Ruimy, N. and Monachini, M. and Gola, E. and Calzolari, N. and Del Fiorentino, M. and Ulivieri, M. and Rossi, S.},
TITLE = {A computational semantic lexicon of Italian: SIMPLE},
YEAR = {2003},
ABSTRACT = {This paper describes the Italian Semantic Computational Lexicon elaborated in the framework of the European LE-SIMPLE Project. SIMPLE was aimed at adding a layer of semantic information to a subset of PAROLE lexica. The SIMPLE framework is based principally on the Generative Lexicon theory which allows to express the multidimensionality of meaning by means of qualia structure. Word senses are described according to their position within the SIMPLE ontology, which is based on the principle of orthogonal inheritance and consists of semantic types for characterizing simple nouns, event and property denoting lexical units. The encoding process is guided by templates, that are schematic structures containing clusters of structured information specific to each semantic type. Besides a high degree of granularity of meaning representation, the SIMPLE lexicon presents innovative aspects such as link between the syntactic and semantic levels of information, description of predicative representation and enforcement of selectional restrictions/preferences on arguments},
PAGES = {821--864},
VOLUME = {18-19},
ISSN = {0392-6907},
JOURNAL = {LINGUISTICA COMPUTAZIONALE},
}
@ARTICLE{SABA_2003_ARTICLE_SC_37651,
AUTHOR = {Saba, A. and Cappelli, G.},
TITLE = {Morfsin and AyDA: two systems for analyzing modern and old Spanish},
YEAR = {2003},
ABSTRACT = {In this work we shall present two software systems for automatic text analysis developed at the Institute of Computational Linguistics (ILC) in Pisa. Although originally designed for modern Spanish texts, both can be applied, with appropriate modifications, to Old Spanish. The first one, a mainframe application called Morfsin©, was released in its final version in 1986. The second, developed for the IBM-compatible PC platform, stems from the earlier work on Morfsin and is known by the acronym AyDA (Analyzer and Automatic Disambiguator). AyDA represents a useful tool for linguistics specialists in that it reduces the need to manually tag words morphologically. Moreover, it can provide quite a high degree of automatic disambiguation of functional homographs in a text. The final outcome depends on the number of words recognized, which depends, in turn, on the lexis included in the lookup dictionaries and the type of text being analyzed-modern or old, literary prose or specialized language, etc. This paper provides a description of the basic structure of the two systems, with particular emphasis on AyDA, and reports the results obtained in applying AyDA to texts in Old Spanish},
PAGES = {865--900},
URL = {https://iris.cnr.it/handle/20.500.14243/37651},
VOLUME = {18-19},
ISSN = {0392-6907},
JOURNAL = {LINGUISTICA COMPUTAZIONALE},
}
@ARTICLE{SASSI_2003_ARTICLE_SA_37652,
AUTHOR = {Sassi, M. and Amoroso, Y.},
TITLE = {Letteratura, diritto e linguistica computazionale. Panorama delle collaborazioni Italia-Cuba},
YEAR = {2003},
ABSTRACT = {These notes offer an outline of the collaborations started in 1995 by the Institute of Computational Linguistics (ILC) of Pisa, with some Cuban Scientific Institutions and expanded in several research sectors in the subsequent years. As regards Automatized Lexicography, we propose here a brief description of the results and prospects of work carried out with CEM (Centro de Estudios Martianos), FAC (Fundación Alejo Carpentier) and ILL (Instituto de Literatura y Lingüística). In 1996, as a result of the cooperation of ILC with CEM with regard to methodology and textual codification, we started the creation of an electronic archive of the complete works of Jose Martí (27 tomes). In 1997, in collaboration with FAC, ILC put to practical use the previous experiences for the creation of an electronic archive of the complete works of Alejo Carpentier. In 2002, the collaboration between ILL and SCDI (Sociedad Cubana de Derecho e Informática de la Unión di Juristas de Cuba), resulted in the creation of the Diccionario de Jurismática. As far as Legal Information Science is concerned, we propose a presentation of the objectives which have been reached as well as the projects for the future in the area, relating to the study of languages and legal documents as formulated by ILC and SCDI},
PAGES = {901--924},
URL = {https://iris.cnr.it/handle/20.500.14243/37652},
VOLUME = {18-19},
ISSN = {0392-6907},
JOURNAL = {LINGUISTICA COMPUTAZIONALE},
}
@ARTICLE{SORIA_2003_ARTICLE_SP_37658,
AUTHOR = {Soria, C. and Pirrelli, V.},
TITLE = {A multi-level annotation meta-scheme for dialogue acts},
YEAR = {2003},
ABSTRACT = {This article describes a new principled framework for comparison, design and standardization of annotation schemes for dialogue acts. Previous attempts at comparing existing schemes in order to identify a common core of generally agreed-upon dialogue acts share the assumption that tags belonging to different schemes and describing the same general phenomena can always be related through hypo- or hyperonymy relationships. Consequently, general-purpose schemes have often been the result of a merger of different tag sets. In this article, we show the extent to which comparability of different annotation schemes is prevented by the very limited tag inter-translatability. We thus describe an alternative approach to the comparison of dialogue act taxonomies based on a compositional analysis of tags according to independent classificatory dimensions. The framework takes a recognition-based approach to dialogue tagging and defines four independent taxonomies of tags, one for each orthogonal dimension of linguistic and contextual analysis assumed to have a bearing on identification of dialogue acts. We also show how the same framework can be used to design a general-purpose annotation scheme which combines the features of generality and expressivity by exploiting a modular structure. The advantages and limitations of this proposal over other previous attempts are discussed and concretely exemplified},
KEYWORDS = {dialogue acts, annotation scheme, pragmatics},
PAGES = {925--952},
URL = {https://iris.cnr.it/handle/20.500.14243/37658},
VOLUME = {18-19},
ISSN = {0392-6907},
JOURNAL = {LINGUISTICA COMPUTAZIONALE},
}
@ARTICLE{TURRINI_2003_ARTICLE_TCP_37669,
AUTHOR = {Turrini, G. and Cignoni, L. and Paccosi, A.},
TITLE = {From a children's dictionary to a hypermedia laboratory for language learning},
YEAR = {2003},
ABSTRACT = {This paper describes Addizionario, a software tool patented by the National Research Council (CNR) of Italy, addressed to pre- and primary school children for the study of Italian as native or second language. The different stages of development of the system are described which range from a preliminary phase of collection of children's data to the implementation of a multimedia Dictionary, to the final stage of a language laboratory in which an Activity Book interacting with the Dictionary has been added to the system. The multilingual version of Addizionario recently developed is used in European Socrates-Comenius projects to foster the learning of a native and foreign language. Furthermore, the particular features of the tool, which is child-centred, open, flexible and easy-to-use, make it suitable not only for normal users, but also for those presenting learning difficulties linked to physical or cognitive impairment},
PAGES = {953--969},
URL = {https://iris.cnr.it/handle/20.500.14243/37669},
VOLUME = {18-19},
ISSN = {0392-6907},
JOURNAL = {LINGUISTICA COMPUTAZIONALE},
}
@ARTICLE{ZAMPOLLI_2003_ARTICLE_ZCC_37681,
AUTHOR = {Zampolli, A. and Calzolari, N. and Cignoni, L.},
TITLE = {Foreword},
YEAR = {2003},
PAGES = {xiii--xv},
URL = {https://iris.cnr.it/handle/20.500.14243/37681},
VOLUME = {16-17},
ISSN = {0392-6907},
JOURNAL = {LINGUISTICA COMPUTAZIONALE},
}
@book{AMOROSO_2003_BOOK_AFFIMMPS_89053,
  author           = {Amoroso, Y. C. A. and Fameli, E. and Fameli, M. and Inghirami, B. and Mariani, P. and Marinai, E. and Parenti, L. and Sassi, M.},
  title            = {Diritto alla vita e Diritto all'ambiente nel lessico costituzionale e nella dottrina giuridica. Strumenti e metodi per l'analisi linguistico-concettuale},
  year             = {2003},
  abstract         = {La ricerca, all'interno di un progetto coordinato di Agenzia 2000, si è prefissata l'utilizzo di thesauri multilingue come strumenti per il reperimento di informazioni all'interno di banche dati consultabili in rete. Il contesto in cui la ricerca si è svolta, coincidendo con le problematiche relative ai diritti fondamentali (in specie: diritto alla vita e diritto all'ambiente), è stato fin dall'inizio concepito come fortemente interdisciplinare e a livello internazionale},
  keywords         = {Diritto alla vita, Diritto all'ambiente, Fonti costituzionali, Strumenti lessicali, Database settoriali},
  pages            = {160},
  url              = {https://iris.cnr.it/handle/20.500.14243/89053},
  publisher        = {CNR, ITTIG (Firenze, ITA)},
  conference_place = {Firenze},
}
@BOOK{CAMMELLI_2003_BOOK_CS_89037,
AUTHOR = {Cammelli, A. and Sassi, M.},
TITLE = {Strumenti e metodi per uno studio lessicale della Costituzione Bolivariana del Venezuela},
YEAR = {2003},
ABSTRACT = {Il testo della costituzione bolivariana della repubblica del Venezuela merita attenta considerazione perché nel suo lungo articolato racchiude un "sapere" costituzionale con valori e principi universali che è quasi impossibile recepire in un testo unico. Sicuramente la maturità e l'altezza dei principi enunciati si devono anche alla giovinezza del testo promulgato solennemente il 20 dicembre del 1999 dopoché il popolo venezuelano lo aveva approvato con un referendum il 15 dicembre dello stesso anno},
KEYWORDS = {Lessico Costituzionale, Bolivar, Repubblica bolivariana del Venezuela},
PAGES = {1--42},
URL = {http://www.ilc.cnr.it/CEG/LessicoBolivar.pdf},
}
@incollection{ALLEGRINI_2003_INCOLLECTION_ALMP_134779,
  author   = {Allegrini, P. and Lenci, A. and Montemagni, S. and Pirrelli, V.},
  title    = {Le forme del significato. Acquisizione e rappresentazione dell'informazione semantica},
  year     = {2003},
  keywords = {Acquisizione, Semantica Lessicale, Ontologia, Machine Learning},
  url      = {https://iris.cnr.it/handle/20.500.14243/134779},
}
@incollection{BOZZI_2003_INCOLLECTION_B_134772,
  author           = {Bozzi, A.},
  title            = {Digital documents and computational philology: the Digital Philology System DiPhiloS},
  year             = {2003},
  url              = {https://iris.cnr.it/handle/20.500.14243/134772},
  publisher        = {Olschki (Firenze, ITA)},
  conference_place = {Firenze},
}
@incollection{BOZZI_2003_INCOLLECTION_BR_134771,
  author = {Bozzi, A. and Raggioli, A.},
  title  = {Tecnologia digitale negli Istituti Culturali: un case study},
  year   = {2003},
  url    = {https://iris.cnr.it/handle/20.500.14243/134771},
}
@incollection{CALZOLARI_2003_INCOLLECTION_CZ_134783,
  author = {Calzolari, N. and Zampolli, A.},
  title  = {The EAGLES/ISLE Initiative for Setting Standards: the Computational Lexicon Working Group for Multilingual Lexicons},
  year   = {2003},
  url    = {https://iris.cnr.it/handle/20.500.14243/134783},
}
@incollection{CALZOLARI_2003_INCOLLECTION_CZL_134773,
  author = {Calzolari, N. and Zampolli, A. and Lenci, A.},
  title  = {Risorse linguistiche per un accesso al 'contenuto'},
  year   = {2003},
  url    = {https://iris.cnr.it/handle/20.500.14243/134773},
}
@incollection{MONTEMAGNI_2003_INCOLLECTION_MBBCCLZRPMD_134774,
  author   = {Montemagni, S. and Barsotti, F. and Battista, M. and Calzolari, N. and Corazzari, O. and Lenci, A. and Zampolli, A. and Raffaelli, R. and Pazienza, M. and Mana, N. and Delmonte, R.},
  title    = {Building the Italian Syntactic-Semantic Treebank},
  year     = {2003},
  keywords = {Corpora testuali, Annot. sintattica, Annot. semantica, Treebank},
  url      = {https://iris.cnr.it/handle/20.500.14243/134774},
}
@incollection{PICCHI_2003_INCOLLECTION_P_134775,
  author           = {Picchi, E.},
  title            = {Esperienze nel settore dell'analisi di corpora testuali: software e strumenti linguistici},
  year             = {2003},
  keywords         = {Analisi testuale, Digital Library, Disambiguazione, Corpora bilingui, Lemmatizzazione},
  url              = {https://iris.cnr.it/handle/20.500.14243/134775},
  publisher        = {Olschki (Firenze, ITA)},
  conference_place = {Firenze},
}
@incollection{PIRRELLI_2003_INCOLLECTION_P_134776,
  author           = {Pirrelli, V.},
  title            = {Machine language learning meets information technology},
  year             = {2003},
  keywords         = {Apprendimento, Sistemi integrati, Semantic web, Machine Learning},
  url              = {https://iris.cnr.it/handle/20.500.14243/134776},
  publisher        = {Angeli (Milano, ITA)},
  conference_place = {Milano},
}
@incollection{SASSI_2003_INCOLLECTION_S_134784,
  author           = {Sassi, M.},
  title            = {La consultazione dei corpora costituzionali con il DBT},
  year             = {2003},
  url              = {https://iris.cnr.it/handle/20.500.14243/134784},
  publisher        = {CNR, ITTIG (Firenze, ITA)},
  conference_place = {Firenze},
}
@editorial{AMOROSO_2003_EDITORIAL_ACFFIMMPS_197022,
  author = {Amoroso, Y. and Cammelli, A. and Fameli, E. and Fameli, M. and Inghirami, B. and Mariani, P. and Marinai, E. and Parenti, L. and Sassi, M.},
  title  = {Diritto alla vita e Diritto all'ambiente nel lessico costituzionale e nella dottrina giuridica. Strumenti e metodi per l'analisi linguistico-concettuale},
  year   = {2003},
  url    = {https://iris.cnr.it/handle/20.500.14243/197022},
}
@editorial{CECCOTTI_2003_EDITORIAL_CS_195195,
  author = {Ceccotti, M. and Sassi, M.},
  title  = {Sistema},
  year   = {2003},
  url    = {https://iris.cnr.it/handle/20.500.14243/195195},
}
@INPROCEEDINGS{CALZOLARI_2003_INPROCEEDINGS_CBLM_77210,
AUTHOR = {Calzolari, N. and Bertagna, F. and Lenci, A. and Monachini, M.},
TITLE = {New Perspectives for Lexical Resources in the Semantic Web Scenario},
YEAR = {2003},
PAGES = {10--19},
URL = {https://iris.cnr.it/handle/20.500.14243/77210},
CONFERENCE_NAME = {GL 2003-Second International Workshop on Generative Approaches to the Lexicon},
EDITOR = {Bouillon, P. and Kanzaki, K.},
}
@inproceedings{CALZOLARI_2003_INPROCEEDINGS_CLQ_77203,
  author          = {Calzolari, N. and Lenci, A. and Quochi, V.},
  title           = {Towards Multiword and Multilingual Lexicons: Between Theory and Practice},
  year            = {2003},
  url             = {https://iris.cnr.it/handle/20.500.14243/77203},
  conference_name = {Linguistics and Phonetics 2002 Conference},
}
@INPROCEEDINGS{CAPPELLI_2003_INPROCEEDINGS_CG_101362,
AUTHOR = {Cappelli, A. and Giovannetti, E.},
TITLE = {Human-Robot Interaction},
YEAR = {2003},
ABSTRACT = {Human-Robot Interaction (HRI) is a constantly growing multidisciplinary area rich of cues for advanced researches and technology transfers. It plays a fundamental role in the development of robots that operate in an open environment and cooperate with humans. This task requires the development of techniques that allow inexpert users to use their robots in an efficient and safe way, using an intuitive and natural interface. In this work, after an introduction to the fundamental issues concerning HRI, we will present the different possible interaction modalities between robot and man followed by a series of advanced interface applications for autonomous mobile robots},
KEYWORDS = {Human robot interaction, Natural language processing, Man-machine interaction, Robotics},
PAGES = {15--20},
URL = {https://iris.cnr.it/handle/20.500.14243/101362},
ISBN = {88-85059-15-5},
CONFERENCE_NAME = {1st RoboCare Workshop},
BOOKTITLE = {Proceedings of the First Robocare Workshop},
EDITOR = {Cesta, A.},
}
@INPROCEEDINGS{CUTUGNO_2003_INPROCEEDINGS_CMMRRR_77217,
AUTHOR = {Cutugno, P. and Marconi, L. and Miyares Bermúdez, E. and Ratti, D. and Rolando, C. and Ruiz Miyares, L.},
TITLE = {Thesaurus electrónico Italiano-Español: Instrumento hipertextual para la enseñanza y la traducción automatizada asistida en ambas lenguas},
YEAR = {2003},
PAGES = {585--587},
URL = {https://iris.cnr.it/handle/20.500.14243/77217},
CONFERENCE_NAME = {VIII Simposio Internacional de Comunicacion Social},
}
@inproceedings{CUTUGNO_2003_INPROCEEDINGS_CMRR_431275,
  author          = {Cutugno, P. and Marconi, L. and Ratti, D. and Rolando, C.},
  title           = {VI e-book: gramática del verbo italiano},
  year            = {2003},
  conference_name = {VIII Simposio Internacional de Comunicacion Social},
}
@inproceedings{CUTUGNO_2003_INPROCEEDINGS_CMRR_77216,
  author          = {Cutugno, P. and Marconi, L. and Ratti, D. and Rolando, C.},
  title           = {The usability of e-book technology for the treatment of linguistic data},
  year            = {2003},
  url             = {https://iris.cnr.it/handle/20.500.14243/77216},
  conference_name = {Advances in Technology-Based Education: Toward a Knowledge-Based Society II International Conference on Multimedia ICT's in Education},
}
@inproceedings{GIORGETTI_2003_INPROCEEDINGS_GPS_77212,
  author          = {Giorgetti, D. and Prodanof, I. and Sebastiani, F.},
  title           = {Open-ended survey coding using text categorization techniques},
  year            = {2003},
  url             = {https://iris.cnr.it/handle/20.500.14243/77212},
  conference_name = {Impact of Technology on the Survey Process},
}
@INPROCEEDINGS{GIORGETTI_2003_INPROCEEDINGS_GS_147456,
AUTHOR = {Giorgetti, D. and Sebastiani, F.},
TITLE = {Multiclass text categorization for automated survey coding},
YEAR = {2003},
ABSTRACT = {Survey coding is the task of assigning a symbolic code from a predefined set of such codes to the answer given in response to an open-ended question in a questionnaire (aka survey). We formulate the problem of automated survey coding as a text categorization problem, i.e. as the problem of learning, by means of supervised machine learning techniques, a model of the association between answers and codes from a training set of pre-coded answers, and applying the resulting model to the classification of new answers. In this paper we experiment with two different learning techniques, one based on naïve Bayesian classification and the other one based on multiclass support vector machines, and test the resulting framework on a corpus of social surveys. The results we have obtained significantly outperform the results achieved by previous automated survey coding approaches},
KEYWORDS = {Text categorization, Classifier Design and Evaluation, Learning, Information Search and Retrieval, Sociology},
PAGES = {798--802},
URL = {https://iris.cnr.it/handle/20.500.14243/147456},
PUBLISHER = {ACM Press (New York, USA)},
CONFERENCE_NAME = {SAC-03-18th ACM Symposium on Applied Computing},
CONFERENCE_PLACE = {New York},
BOOKTITLE = {Proceedings of the 2003 ACM Symposium on Applied Computing},
}
@INPROCEEDINGS{GIORGETTI_2003_INPROCEEDINGS_GSP_57593,
AUTHOR = {Giorgetti, D. and Sebastiani, F. and Prodanof, I.},
TITLE = {Automatic coding of open-ended surveys using text categorization techniques},
YEAR = {2003},
ABSTRACT = {Open-ended questions do not limit respondents' answers in terms of linguistic form and semantic content, but bring about severe problems in terms of cost and speed, since their coding requires trained professionals to manually identify and tag meaningful text segments. To overcome these problems, a few automatic approaches have been proposed in the past, some based on matching the answer with textual descriptions of the codes, others based on manually building rules that check the answer for the presence or absence of code-revealing words. While the former approach is scarcely effective, the major drawback of the latter approach is that the rules need to be developed manually, and before the actual observation of text data. We propose a new approach, inspired by work in information retrieval (IR), that overcomes these drawbacks. In this approach survey coding is viewed as a task of multiclass text categorization (MTC), and is tackled through techniques originally developed in the field of supervised machine learning. In MTC each text belonging to a given corpus has to be classified into exactly one from a set of predefined categories. In the supervised machine learning approach to MTC, a set of categorization rules is built automatically by learning the characteristics that a text should have in order to be classified under a given category. Such characteristics are automatically learnt from a set of training examples, i.e. a set of texts whose category is known. For survey coding, we equate the set of codes with categories, and all the collected answers to a given question with texts. Giorgetti and Sebastiani have carried out automatic coding experiments with two different supervised learning techniques, one based on a naïve Bayesian method and the other based on multiclass support vector machines. Experiments have been run on a corpus of social surveys carried out by the National Opinion Research Center, University of Chicago (NORC). These experiments show that our methods outperform, in terms of accuracy, previous automated methods tested on the same corpus},
KEYWORDS = {Automatic coding},
PAGES = {173--184},
URL = {https://iris.cnr.it/handle/20.500.14243/57593},
CONFERENCE_NAME = {The Impact of Technology on the Survey Process. Fourth International Conference on Survey and Statistical Computing},
}
@INPROCEEDINGS{GUADAGNINI_2003_INPROCEEDINGS_G_265241,
AUTHOR = {Guadagnini, E.},
TITLE = {«Sill, qu'es caps e guitz» (P.-C. 461, 67a): un "descort" provenzale del secondo quarto del Duecento},
YEAR = {2003},
PAGES = {395-405},
URL = {https://iris.cnr.it/handle/20.500.14243/265241},
PUBLISHER = {Viella (Roma, ITA)},
ISBN = {9788883341120},
CONFERENCE_NAME = {Septième Congrès International de l'Association Internationale d'Études Occitanes},
CONFERENCE_PLACE = {Roma},
BOOKTITLE = {Scène, évolution, sort de la langue et de la littérature d'oc. Actes du Septième Congrès International de l'Association Internationale d'Études Occitanes},
EDITOR = {Castano, R. and Guida, S. and Latella, F.},
}
@INPROCEEDINGS{MARINELLI_2003_INPROCEEDINGS_MRS_77214,
AUTHOR = {Marinelli, R. and Roventini, A. and Spadoni, G.},
TITLE = {Linking a subset of maritime terminology to the Italian Wordnet},
YEAR = {2003},
URL = {https://iris.cnr.it/handle/20.500.14243/77214},
CONFERENCE_NAME = {Third International Conference on Maritime Terminology},
}
@INPROCEEDINGS{PICCHI_2003_INPROCEEDINGS_PCCCFSST_77204,
AUTHOR = {Picchi, E. and Ceccotti, M. and Cignoni, L. and Cucurullo, N. and Fiorentini, G. and Sassi, M. and Sassolini, E. and Turrini, G.},
TITLE = {Linguistic Miner},
YEAR = {2003},
URL = {https://iris.cnr.it/handle/20.500.14243/77204},
CONFERENCE_NAME = {Congresso annuale AICA 2003: I costi dell'ignoranza e il valore della conoscenza nella società dell'informazione},
}
@INPROCEEDINGS{RUIMY_2003_INPROCEEDINGS_RMC_431276,
AUTHOR = {Ruimy, N. and Monachini, M. and Calzolari, N.},
TITLE = {Un lexique électronique multi-niveaux de l'italien},
YEAR = {2003},
ABSTRACT = {CLIPS est la plus vaste ressource lexicale électronique de l'italien. Elle comprend 55.000 mots codés à 4 niveaux de description linguistique. La représentation lexicale est basée sur des standards internationaux: CLIPS utilise en effet le même modèle, le même langage de représentation et la même méthodologie que 11 autres lexiques développés au cours des projets européens PAROLE et SIMPLE. Les informations fournies, particulièrement utiles pour des applications de TLH, sont très structurées, granulaires et innovatrices, avec entre autres au niveau sémantique la Extended Qualia Structure, basée sur la théorie du Lexique Génératif, et la représentation prédicative. La description d'une unité lexicale est un continuum à travers les différents niveaux d'information. Les propriétés phonologiques, morphologiques et syntaxiques d'un lemme, ainsi que son/ses schéma(s) d'arguments sont décrits. Au niveau sémantique, chaque lexème/sens est associé à un vaste ensemble structuré d'informations, parmi lesquelles son type ontologique et l'expression – au moyen des relations qualia – des différentes facettes de sa sémantique. La représentation prédicative décrit, quant à elle, le scénario sémantique (dans lequel le mot s'insère) et ses participants auxquels sont attribués rôle thématique et contraintes sémantiques. La relation des niveaux syntaxique et sémantique est assurée par des liens permettant de projeter les structures argumentales sur leur(s) réalisation(s) syntaxique(s).
Une telle richesse d'information, et en particulier celle fournie par la Extended Qualia, permet notamment 1) de constituer des réseaux sémantiques, en formulant une requête sur l'ensemble des relations qualia contenant un mot-clé; 2) d'extraire des noyaux de vocabulaire de domaines spécifiques, en alternant requêtes sur qualia et sens; 3) d'acquérir des collocations lexicales, en exploitant les liens syntagmatiques évènements/entités exprimés par les qualia; 4) de désambiguïser la contribution sémantique du modificateur dans certains groupes nominaux complexes, en analysant la structure qualia de la tête},
PAGES = {1-10},
URL = {https://iris.cnr.it/handle/20.500.14243/431276},
ISBN = {80-86732-21-5},
CONFERENCE_NAME = {CIL XVII International Congress of Linguists},
}
@INPROCEEDINGS{SORIA_2003_INPROCEEDINGS_SBC_77215,
AUTHOR = {Soria, C. and Bertagna, F. and Calzolari, N.},
TITLE = {ItalWordNet in an annotation task: a chance for discussion},
YEAR = {2003},
URL = {https://iris.cnr.it/handle/20.500.14243/77215},
}
@TECHREPORT{ALLEGRINI_2003_TECHREPORT_ACMMHICDP_195189,
AUTHOR = {Allegrini, P. and Calzolari, N. and Marchi, S. and Montemagni, S. and Hepple, M. and Ireson, N. G. H. J. M. and Carrero, G. F. and De Buenaga, R. M. and Puera, S. E.},
TITLE = {POESIA Lexical Resources and Tools for Each Language},
YEAR = {2003},
ABSTRACT = {The aim of this report is to review the various resources that the different language processing sites expect to use in the development of their language-specific text filtering components. Some of the required resources are ones that were developed before Poesia, possibly by one of the Poesia partners, or possibly elsewhere but being now in the public domain. Such resources may require adaptation to the Poesia task. Other resources required for Poesia will be developed as part of the project. In some cases, this development has already been done or is in progress, whilst in others, it is yet to be undertaken. In what follows, the status of each of the resources described will be made clear in terms of these alternatives},
KEYWORDS = {Lexical Resources, nlp},
PAGES = {30},
URL = {https://iris.cnr.it/handle/20.500.14243/195189},
}
@TECHREPORT{AMOROSO_2003_TECHREPORT_ACFFIMMPS_195153,
AUTHOR = {Amoroso, Y. and Cammelli, A. and Fameli, E. and Fameli, M. and Inghirami, B. and Mariani, P. and Marinai, M. and Parenti, L. and Sassi, M.},
TITLE = {Diritto alla vita e Diritto all'ambiente nel lessico costituzionale e nella dottrina giuridica. Strumenti e metodi per l'analisi linguistico-concettuale},
YEAR = {2003},
URL = {https://iris.cnr.it/handle/20.500.14243/195153},
}
@TECHREPORT{BARONI_2003_TECHREPORT_BCF_288269,
AUTHOR = {Baroni, P. and Calzolari, N. and Fiorentini, G.},
TITLE = {Resources Roadmap (First Release)},
YEAR = {2003},
ABSTRACT = {ELSNET-4 Deliverable D6.1},
KEYWORDS = {Language Resources, Roadmaps},
URL = {https://iris.cnr.it/handle/20.500.14243/288269},
}
@TECHREPORT{BARONI_2003_TECHREPORT_BCFLM_288896,
AUTHOR = {Baroni, P. and Calzolari, N. and Fiorentini, G. and Lenci, A. and Monachini, M.},
TITLE = {Resources Landscape (First Release)},
YEAR = {2003},
ABSTRACT = {ELSNET-4 Deliverable D6.2},
KEYWORDS = {Language Resources, Landscapes},
URL = {https://iris.cnr.it/handle/20.500.14243/288896},
}
@TECHREPORT{BARONI_2003_TECHREPORT_BCFLM_195188,
AUTHOR = {Baroni, P. and Calzolari, N. and Fiorentini, G. and Lenci, A. and Monachini, M.},
TITLE = {Resources Landscape Map (1st release)},
YEAR = {2003},
URL = {https://iris.cnr.it/handle/20.500.14243/195188},
}
@TECHREPORT{BARONI_2003_TECHREPORT_BCL_195154,
AUTHOR = {Baroni, P. and Calzolari, N. and Lenci, A.},
TITLE = {Extended Configuration of the Network and Final Report},
YEAR = {2003},
ABSTRACT = {ENABLER Deliverable D1.2},
KEYWORDS = {Language Resources, Networks},
PAGES = {21},
URL = {https://iris.cnr.it/handle/20.500.14243/195154},
}
@TECHREPORT{BERTAGNA_2003_TECHREPORT_BCLM_195155,
AUTHOR = {Bertagna, F. and Calzolari, N. and Lenci, A. and Monachini, M.},
TITLE = {Report on the Feasibility and the Organisational Requirements for the Construction of Multilingual LRs},
YEAR = {2003},
URL = {https://iris.cnr.it/handle/20.500.14243/195155},
}
@TECHREPORT{CALZOLARI_2003_TECHREPORT_CBLM_195178,
AUTHOR = {Calzolari, N. and Bertagna, F. and Lenci, A. and Monachini, M.},
TITLE = {MILE Users' Evaluation and Feedback},
YEAR = {2003},
URL = {https://iris.cnr.it/handle/20.500.14243/195178},
}
@TECHREPORT{CALZOLARI_2003_TECHREPORT_CBLM_195157,
AUTHOR = {Calzolari, N. and Bertagna, F. and Lenci, A. and Monachini, M.},
TITLE = {Standards and Best Practice for Multilingual Computational Lexicons-MILE (the Multilingual ISLE Lexical Entry)},
YEAR = {2003},
URL = {https://iris.cnr.it/handle/20.500.14243/195157},
}
@TECHREPORT{CALZOLARI_2003_TECHREPORT_CGP_195180,
AUTHOR = {Calzolari, N. and Grishman, R. and Palmer, M.},
TITLE = {Introduction to the CLWG Guidelines},
YEAR = {2003},
URL = {https://iris.cnr.it/handle/20.500.14243/195180},
}
@TECHREPORT{CALZOLARI_2003_TECHREPORT_CW_195158,
AUTHOR = {Calzolari, N. and Wittenburg, P.},
TITLE = {Report of the ISO Preparation Workshop on Lexicons},
YEAR = {2003},
URL = {https://iris.cnr.it/handle/20.500.14243/195158},
}
@TECHREPORT{CAMMELLI_2003_TECHREPORT_CS_147784,
AUTHOR = {Cammelli, A. and Sassi, M.},
TITLE = {Strumenti e metodi per uno studio lessicale della Costituzione della Repubblica Bolivariana del Venezuela},
YEAR = {2003},
URL = {https://iris.cnr.it/handle/20.500.14243/147784},
}
@TECHREPORT{CECCOTTI_2003_TECHREPORT_CS_195886,
AUTHOR = {Ceccotti, M. L. and Sassi, M.},
TITLE = {Iterazioni gaddiane},
YEAR = {2003},
URL = {https://iris.cnr.it/handle/20.500.14243/195886},
}
@TECHREPORT{CECCOTTI_2003_TECHREPORT_CS_195887,
AUTHOR = {Ceccotti, M. and Sassi, M.},
TITLE = {Annotazioni su composti in -cola. Da Dante a Gadda},
YEAR = {2003},
URL = {https://iris.cnr.it/handle/20.500.14243/195887},
}
@TECHREPORT{CECCOTTI_2003_TECHREPORT_CS_195888,
AUTHOR = {Ceccotti, M. and Sassi, M.},
TITLE = {Concordanze del Pasticciaccio},
YEAR = {2003},
URL = {https://iris.cnr.it/handle/20.500.14243/195888},
}
@TECHREPORT{ENEA_2003_TECHREPORT_E_195159,
AUTHOR = {Enea, A.},
TITLE = {Webmail: un'interfaccia Web per la posta elettronica},
YEAR = {2003},
URL = {https://iris.cnr.it/handle/20.500.14243/195159},
}
@TECHREPORT{ENEA_2003_TECHREPORT_E_195160,
AUTHOR = {Enea, A.},
TITLE = {Una soluzione AntiVirus e AntiSpam},
YEAR = {2003},
URL = {https://iris.cnr.it/handle/20.500.14243/195160},
}
@TECHREPORT{ENEA_2003_TECHREPORT_EF_195161,
AUTHOR = {Enea, A. and Fiorentini, G.},
TITLE = {Il nuovo sito Internet dell'Istituto di Linguistica Computazionale},
YEAR = {2003},
URL = {https://iris.cnr.it/handle/20.500.14243/195161},
}
@TECHREPORT{ENEA_2003_TECHREPORT_EPOF_195181,
AUTHOR = {Enea, A. and Pardelli, G. and Orsolini, P. and Fiorentini, G.},
TITLE = {Pubblicazioni ILC sul WEB},
YEAR = {2003},
URL = {https://iris.cnr.it/handle/20.500.14243/195181},
}
@TECHREPORT{GAVRILIDOU_2003_TECHREPORT_GDLCMS_195162,
AUTHOR = {Gavrilidou, M. and Desipri, E. and Labropoulo, P. and Calzolari, N. and Monachini, M. and Soria, C.},
TITLE = {Technical Specifications for the Selection and Encoding of Multilingual Resources},
YEAR = {2003},
URL = {https://iris.cnr.it/handle/20.500.14243/195162},
}
@TECHREPORT{HEID_2003_TECHREPORT_HMPS_195182,
AUTHOR = {Heid, U. and Maci, E. and Pirrelli, V. and Soria, C.},
TITLE = {NITE Interim Evaluation Report},
YEAR = {2003},
URL = {https://iris.cnr.it/handle/20.500.14243/195182},
}
@TECHREPORT{LENCI_2003_TECHREPORT_LCM_195186,
AUTHOR = {Lenci, A. and Calzolari, N. and Monachini, M.},
TITLE = {Report on LR Related Activities to Be Promoted},
YEAR = {2003},
URL = {https://iris.cnr.it/handle/20.500.14243/195186},
}
@TECHREPORT{MARZI_2003_TECHREPORT_MPA_195183,
AUTHOR = {Marzi, C. and Petrongolo, C. and Aprile, N.},
TITLE = {GLARS: Contratti dei servizi comuni di Area},
YEAR = {2003},
ABSTRACT = {Revisione dei contratti di appalto dei servizi di Mensa, vigilanza, e pulizie, per una ottimizzazione dei servizi e risparmio dei costi},
KEYWORDS = {contratti servizi, Area della Ricerca Pisa},
URL = {https://iris.cnr.it/handle/20.500.14243/195183},
}
@TECHREPORT{MONACHINI_2003_TECHREPORT_MBCL_195163,
AUTHOR = {Monachini, M. and Bertagna, F. and Calzolari, N. and Lenci, A.},
TITLE = {Improving Harmonisation between Resources: Divergence/Convergence between Specifications and de-facto Standards},
YEAR = {2003},
URL = {https://iris.cnr.it/handle/20.500.14243/195163},
}
@TECHREPORT{MONACHINI_2003_TECHREPORT_MBCUN_195164,
AUTHOR = {Monachini, M. and Bertagna, F. and Calzolari, N. and Underwood, N. and Navarretta, C.},
TITLE = {Towards a Standard for the Creation of Lexica},
YEAR = {2003},
URL = {https://iris.cnr.it/handle/20.500.14243/195164},
}
@TECHREPORT{MONACHINI_2003_TECHREPORT_MS_195165,
AUTHOR = {Monachini, M. and Soria, C.},
TITLE = {Testing Scenario and Quality Assessment Strategy},
YEAR = {2003},
URL = {https://iris.cnr.it/handle/20.500.14243/195165},
}
@TECHREPORT{QUOCHI_2003_TECHREPORT_QJ_195190,
AUTHOR = {Quochi, V. and Jan, O.},
TITLE = {Appendix F: Representing noun compounds and support verbs in MILE (PISA \& XMELLT)},
YEAR = {2003},
URL = {https://iris.cnr.it/handle/20.500.14243/195190},
}
@TECHREPORT{RUIMY_2003_TECHREPORT_RMC_195167,
AUTHOR = {Ruimy, N. and Monachini, M. and Calzolari, N.},
TITLE = {Progetto CLIPS: Specifiche Linguistiche e Manuale di Codifica, Livello semantico},
YEAR = {2003},
URL = {https://iris.cnr.it/handle/20.500.14243/195167},
}
@TECHREPORT{RUIMY_2003_TECHREPORT_RMC_195166,
AUTHOR = {Ruimy, N. and Monachini, M. and Calzolari, N.},
TITLE = {Progetto CLIPS: Specifiche Linguistiche e Manuale di Codifica, Livello sintattico},
YEAR = {2003},
URL = {https://iris.cnr.it/handle/20.500.14243/195166},
}
@TECHREPORT{SABA_2003_TECHREPORT_S_195171,
AUTHOR = {Saba, A.},
TITLE = {Lessico del testo "Arte de la verdadera navegación en que se trata de la máchina del mundo" di Pedro de Siria, (ed. 1602, pp. 167). Trascrizione digitale: A. Saba},
YEAR = {2003},
URL = {https://iris.cnr.it/handle/20.500.14243/195171},
}
@TECHREPORT{SABA_2003_TECHREPORT_S_195169,
AUTHOR = {Saba, A.},
TITLE = {Lessico del testo "Hidrografía: la más curiosa que hasta aquí ha salido a luz [...]" di Andrés de Poza, (ed. 1585, pp. 363). Trascrizione digitale: A. Saba},
YEAR = {2003},
URL = {https://iris.cnr.it/handle/20.500.14243/195169},
}
@TECHREPORT{SABA_2003_TECHREPORT_S_195168,
AUTHOR = {Saba, A.},
TITLE = {"Arte de la verdadera navegación en que se trata de la máchina del mundo" di Pedro de Siria, (ed. 1602, pp. 167)},
YEAR = {2003},
URL = {https://iris.cnr.it/handle/20.500.14243/195168},
}
@TECHREPORT{SABA_2003_TECHREPORT_S_195173,
AUTHOR = {Saba, A.},
TITLE = {"Arte de navegar en que se contienen las reglas, declaraciones, secretos y avisos que a la navegación son necessarios [...]" di Pedro de Medina, (ed. 1545, pp. 211)},
YEAR = {2003},
URL = {https://iris.cnr.it/handle/20.500.14243/195173},
}
@TECHREPORT{SABA_2003_TECHREPORT_S_195172,
AUTHOR = {Saba, A.},
TITLE = {"Hidrografía: la más curiosa que hasta aquí ha salido a luz [...]" di Andrés de Poza, (ed. 1585, pp. 363)},
YEAR = {2003},
URL = {https://iris.cnr.it/handle/20.500.14243/195172},
}
@TECHREPORT{SABA_2003_TECHREPORT_S_195170,
AUTHOR = {Saba, A.},
TITLE = {Lessico del testo "Arte de navegar en que se contienen las reglas, declaraciones, secretos y avisos que a la navegación son necessarios [...]" di Pedro de Medina, (ed. 1545, pp. 211). Trascrizione digitale: B. Periñán},
YEAR = {2003},
URL = {https://iris.cnr.it/handle/20.500.14243/195170},
}
@TECHREPORT{SASSI_2003_TECHREPORT_S_195174,
AUTHOR = {Sassi, M.},
TITLE = {La consultazione dei corpora costituzionali con DBT},
YEAR = {2003},
URL = {https://iris.cnr.it/handle/20.500.14243/195174},
}
@TECHREPORT{SASSI_2003_TECHREPORT_SA_195193,
AUTHOR = {Sassi, M. and Amoroso, Y.},
TITLE = {Il corpus elettronico delle costituzioni ibero-americane},
YEAR = {2003},
URL = {https://iris.cnr.it/handle/20.500.14243/195193},
}
@TECHREPORT{SASSI_2003_TECHREPORT_SA_195175,
AUTHOR = {Sassi, M. and Amoroso, Y.},
TITLE = {Il corpus elettronico delle costituzioni iberoamericane},
YEAR = {2003},
URL = {https://iris.cnr.it/handle/20.500.14243/195175},
}
@TECHREPORT{SASSI_2003_TECHREPORT_SC_195192,
AUTHOR = {Sassi, M. and Ceccotti, M. L.},
TITLE = {Documentazione dell'attività di consulenza svolta sul database Gadda per studiosi in Italia e all'estero (2002-2003)},
YEAR = {2003},
URL = {https://iris.cnr.it/handle/20.500.14243/195192},
}
@TECHREPORT{SASSI_2003_TECHREPORT_SC_195889,
AUTHOR = {Sassi, M. and Ceccotti, M.},
TITLE = {Concordanze della Cognizione del dolore},
YEAR = {2003},
URL = {https://iris.cnr.it/handle/20.500.14243/195889},
}
@MISC{CAPPELLI_2003_MISC_CG_142875,
AUTHOR = {Cappelli, A. and Giovannetti, E.},
TITLE = {L'interazione Uomo-Robot},
YEAR = {2003},
ABSTRACT = {L'Interazione Uomo-Robot (HRI, Human-Robot Interaction) è un'area di ricerca multidisciplinare in costante sviluppo ricca di spunti per ricerche avanzate e trasferimenti di tecnologia. Essa gioca un ruolo fondamentale nella realizzazione di robot che operano in ambienti aperti e cooperano con gli esseri umani. Compiti di questo tipo richiedono lo sviluppo di tecniche che permettano ad utenti inesperti di usare i loro robot in modo semplice e sicuro utilizzando interfacce intuitive e naturali. In questo lavoro, dopo un'introduzione riguardante le questioni fondamentali dell'HRI, saranno indagate le diverse classificazioni di robot e una particolare tassonomia dell'Interazione Uomo-Robot, dopodiché saranno presentate le diverse modalità di interazione possibili tra un robot e un essere umano corredate da una serie di applicazioni di interfacce uomo-robot avanzate con particolare riguardo per i robot di assistenza agli anziani e alle persone diversamente abili},
KEYWORDS = {Robotics, Human-robot interaction, Man-machine interfaces},
URL = {https://iris.cnr.it/handle/20.500.14243/142875},
}
@MISC{CAPPELLI_2003_MISC_C_192721,
AUTHOR = {Cappelli, G.},
TITLE = {Studio Morfosintattico del LSM (Linguaggio dei Segni Messicano)},
YEAR = {2003},
URL = {https://iris.cnr.it/handle/20.500.14243/192721},
}
@MISC{CAPPELLI_2003_MISC_C_192722,
AUTHOR = {Cappelli, G.},
TITLE = {OLISIPPO: estrazione automatica di Vocabolario Basico del Latino},
YEAR = {2003},
URL = {https://iris.cnr.it/handle/20.500.14243/192722},
}
@MISC{CUTUGNO_2003_MISC_CMRR_195890,
AUTHOR = {Cutugno, P. and Marconi, L. and Ratti, D. and Rolando, C.},
TITLE = {Il linguaggio burocratico e l'uso del computer},
YEAR = {2003},
KEYWORDS = {linguaggio, semplificazione, lessico},
URL = {https://iris.cnr.it/handle/20.500.14243/195890},
}
@MISC{DIDONATO_2003_MISC_D_383725,
AUTHOR = {Di Donato, F.},
TITLE = {G. Bocchi, M. Ceruti (a cura di), Origini della scrittura. Genealogie di un'invenzione, Milano, Mondadori, 2002},
YEAR = {2003},
URL = {https://iris.cnr.it/handle/20.500.14243/383725},
ISSN = {1826-4654},
}
@MISC{ENEA_2003_MISC_E_123075,
AUTHOR = {Enea, A.},
TITLE = {Gli ARCHIVI CARTACEI degli Istituti per la storia della Resistenza e della società contemporanea in Italia},
YEAR = {2003},
URL = {http://www.italia-resistenza.it/archivi-insmli-ricerca-semplice},
}
@MISC{ENEA_2003_MISC_EPOF_195177,
AUTHOR = {Enea, A. and Pardelli, G. and Orsolini, P. and Fiorentini, G.},
TITLE = {Banca dati delle Pubblicazioni ILC sul WEB},
YEAR = {2003},
ABSTRACT = {Il repertorio delle pubblicazioni scientifiche dell'Istituto di Linguistica Computazionale disponibile in Internet è strutturato per censire i prodotti dell'attività di ricerca: Libri e loro capitoli; Articoli su riviste scientifiche nazionali e internazionali; Articoli in atti di convegni nazionali e internazionali; Deliverable di progetti comunitari; Rapporti tecnici e CD-Rom. Da pochi anni si sono aggiunte anche le pubblicazioni fruibili da Internet, in particolare dalle riviste elettroniche. A questa nuova tipologia appartengono anche alcuni riferimenti bibliografici delle pubblicazioni ILC. I riferimenti bibliografici si riconducono al: 1) Trattamento Automatico della Lingua, comprendente: risorse linguistiche (corpora testuali, lessici, thesauri), reti concettuali, strumenti di analisi linguistica del testo, strumenti di estrazione e rappresentazione del contenuto testuale; 2) Analisi filologica, letteraria e linguistica del testo: sistemi di gestione di basi di dati testuali, lessicali e dialettali, strumenti multimediali per lo studio della tradizione del testo, strumenti per la documentazione, conservazione e fruizione del patrimonio linguistico-culturale; 3) Applicazioni di varia natura: Traduzione automatica; Strumenti multimediali per la didattica e la disabilità; Tecnologie per il filtraggio di contenuti internet a tutela dei minori; Strumenti multilingue; Generazione automatica; Ontologia; Web Semantico. La descrizione delle scelte tecnologiche e del software utilizzato è descritta nella pubblicazione allegata},
KEYWORDS = {Bibliografia, Linguistica Computazionale},
URL = {http://www.ilc.cnr.it/viewpage.php/sez=ricerca/id=58/vers=ita},
}
@MISC{GIOVANNETTI_2003_MISC_G_264613,
AUTHOR = {Giovannetti, E.},
TITLE = {8° Congresso della Associazione Italiana per l'Intelligenza Artificiale},
YEAR = {2003},
URL = {https://iris.cnr.it/handle/20.500.14243/264613},
}
@MISC{MARCONI_2003_MISC_M_464685,
AUTHOR = {Marconi, L.},
TITLE = {Thesaurus elettronico Italiano-Spagnolo: Strumento per l'insegnamento e la traduzione automatica assistita nelle due lingue},
YEAR = {2003},
URL = {https://iris.cnr.it/handle/20.500.14243/464685},
}
@MISC{MARZI_2003_MISC_M_195184,
AUTHOR = {Marzi, C.},
TITLE = {FONDI STRUTTURALI: linee direttrici},
YEAR = {2003},
ABSTRACT = {Scopo del presente documento è la diffusione delle indicazioni ed istruzione ricevute in occasione del corso di formazione sulla "Preparazione, gestione e rendicontazione dei progetti di ricerca e sviluppo nell'ambito dei finanziamenti nazionali alla ricerca industriale (D.lgs. 297/99)". L'idea del corso nasce dall'importanza crescente annessa al ruolo delle Istituzioni Scientifiche per la crescita della competitività delle imprese, il che investe il CNR di nuovi compiti per lo sviluppo economico dell'Italia. In seguito alla riforma del sistema di incentivi alla ricerca industriale attuata dal MURST (Ministero dell'Università e della Ricerca Scientifica e Tecnologica – oggi MIUR) con l'emanazione di due provvedimenti che hanno riunito la precedente normativa – il Decreto Legislativo n. 297 del 27 luglio 1999 "Riordino della disciplina e snellimento delle procedure per il sostegno della ricerca scientifica e tecnologica, per la diffusione delle tecnologie, per la mobilità dei ricercatori" ed il Decreto Ministeriale n. 593 dell'8 agosto 2000 "Modalità procedurali per la concessione delle agevolazioni previste dal decreto legislativo 297/99" – il CNR, così come le Università e gli altri Enti Pubblici di Ricerca, trovano l'opportunità di collaborazione con le imprese e la possibilità di fruire dei finanziamenti agevolati per la ricerca nelle seguenti forme: presentazione di progetti di ricerca co-intestati tra imprese ed istituti di ricerca; partecipazione a Società e Consorzi per lo sviluppo di attività imprenditoriali; partecipazione ad attività di formazione di ricercatori e tecnici delle imprese},
KEYWORDS = {gestione, rendicontazione, progetti ricerca e sviluppo},
URL = {https://iris.cnr.it/handle/20.500.14243/195184},
}
@MISC{PICCHI_2003_MISC_P_106716,
AUTHOR = {Picchi, E.},
TITLE = {Lessicografia multilingue e trattamento dei testi},
YEAR = {2003},
URL = {https://iris.cnr.it/handle/20.500.14243/106716},
CONFERENCE_NAME = {Actas del Tercero Seminario de la Escuela Interlatina de Altos Estudios en Lingüística Aplicada},
}
@MISC{PIRRELLI_2003_MISC_PL_106713,
AUTHOR = {Pirrelli, V. and Lenci, A.},
TITLE = {Modelli computazionali dell'apprendimento del linguaggio},
YEAR = {2003},
URL = {https://iris.cnr.it/handle/20.500.14243/106713},
CONFERENCE_NAME = {XI Congresso della Società Italiana di Psicofisiologia},
}
@MISC{SASSI_2003_MISC_S_195194,
AUTHOR = {Sassi, M.},
TITLE = {Costituzione della Repubblica Bolivariana del Venezuela},
YEAR = {2003},
URL = {https://iris.cnr.it/handle/20.500.14243/195194},
}
@ARTICLE{BIORCI_2002_ARTICLE_BMRR_65004,
AUTHOR = {Biorci, G. and Marconi, L. and Ratti, D. and Rolando, C.},
TITLE = {La "composante animale" dans les expressions figées italiennes},
YEAR = {2002},
ABSTRACT = {This work involved the collection of Italian clichés and idiomatic phrases portraying an animal as the fulcrum which characterizes the linguistic sequence. The data were updated by insertion of stereotypes, idiomatic phrases, proverbs and locutions frequently used in the Italian language. The methodologies and morphosyntactic rules for the classification were studied and verified in practice. The results obtained were compared with the linguistic data of the Italian reference corpus. The idiomatic expressions collected – about 600 – were sub-divided according to their formal typology. Their morphology and syntax were examined in detail and, wherever possible, the etymology of these expressions was investigated. At the time of their appearance they could be considered to be an invisible nucleus – although not set: verbs can be conjugated, some of the elements of the linguistic stereotypes can be substituted while keeping intact the meaning and the significance of the idiomatic phrase in the particular context. Numerous animals were found in the Italian language, 117 different species have come into every day language through idiomatic expressions and locutions, each processing its own history deeply rooted in the popular tradition, expressing, through metaphor, the commonplace, the folk wisdom, daily life and universal feeling},
KEYWORDS = {fraseologia idiomatica},
PAGES = {141-186},
URL = {https://iris.cnr.it/handle/20.500.14243/65004},
VOLUME = {81},
NUMBER = {2},
ISSN = {0007-9871},
JOURNAL = {CAHIERS DE LEXICOLOGIE},
}
@ARTICLE{CALZOLARI_2002_ARTICLE_CSBB_37683,
AUTHOR = {Calzolari, N. and Soria, C. and Bertagna, F. and Barsotti, F.},
TITLE = {Evaluating Lexical Resources Using Senseval},
YEAR = {2002},
ABSTRACT = {The aim of our paper is twofold: to introduce some general reflections on the task of lexical semantic annotation and the adequacy of existing lexical-semantic reference resources, while giving an overall description of the Italian lexical sample task for the SENSEVAL-2 experiment. We suggest how the SENSEVAL exercise (and comparison between the two editions of the experiment) can be employed to evaluate the lexical reference resources used for annotation. We conclude with a few general remarks on the gap between the lexicon, a partially decontextualised object, and the corpus, where context plays a significant role},
KEYWORDS = {Risorse Lessicali, Disambiguazione, Semantica, Annotazione, Wordnet},
PAGES = {375-390},
URL = {https://iris.cnr.it/handle/20.500.14243/37683},
VOLUME = {8},
NUMBER = {4},
DOI = {10.1017/S1351324902003017},
ISSN = {1469-8110},
JOURNAL = {NATURAL LANGUAGE ENGINEERING (ONLINE)},
}
@ARTICLE{CIGNONI_2002_ARTICLE_CCM_37684,
AUTHOR = {Cignoni, L. and Coffey, S. and Moon, R.},
TITLE = {Idiom Variation in Italian and English: Two Corpus-based Studies},
YEAR = {2002},
KEYWORDS = {Idioms, Variability, Corpora},
PAGES = {279-300},
URL = {https://iris.cnr.it/handle/20.500.14243/37684},
VOLUME = {2},
}
@ARTICLE{GUADAGNINI_2002_ARTICLE_G_275949,
AUTHOR = {Guadagnini, E.},
TITLE = {Scelta di voci del Tesoro della Lingua Italiana delle Origini (sesta serie)},
YEAR = {2002},
ABSTRACT = {Voci bottaccino s. m., bottaccio s. m., bottacciolo s. m., bottaglia s. f., bottaio s. m., bottame s. m., botte s. f., botticella s. f. / botticello s. m., botticina (1) s. f. / botticino s. m., botticina (2) s. f., bottigliere / bottigliero s. m., bottiglierìa s. f. del Tesoro della Lingua Italiana delle Origini (pp. 96-103)},
KEYWORDS = {Lessico, Lessicografia, Lingua Italiana},
PAGES = {41-242},
URL = {https://iris.cnr.it/handle/20.500.14243/275949},
VOLUME = {7},
ISSN = {1591-8254},
JOURNAL = {BOLLETTINO-OPERA DEL VOCABOLARIO ITALIANO},
}
@ARTICLE{GUADAGNINI_2002_ARTICLE_G_312039,
AUTHOR = {Guadagnini, E.},
TITLE = {Riflessi di tradizioni autonome: Blacatz, Blacasset e Guilhem Figueira nei canzonieri IKa},
YEAR = {2002},
ABSTRACT = {Riflessi di tradizioni autonome: Blacatz, Blacasset e Guilhem Figueira nei canzonieri IKa},
URL = {https://iris.cnr.it/handle/20.500.14243/312039},
ISSN = {1593-7259},
JOURNAL = {RIVISTA DI STUDI TESTUALI},
}
@ARTICLE{TURRINI_2002_ARTICLE_TCP_436875,
AUTHOR = {Turrini, G. and Cignoni, L. and Paccosi, A.},
TITLE = {Addizionario: words in your pocket},
YEAR = {2002},
ABSTRACT = {This paper describes Addizionario, a multilingual hypermedia laboratory for native language learning, addressed to children of nursery and primary schools. The features of the tool, which is child-centred, flexible, easy-to-use and interactive, make it suitable not only for normally skilled users, but also for those presenting more or less severe learning difficulties linked to both physical and cognitive impairment. The software, patented by the Italian National Research Council (C.N.R.), is used in numerous schools in Italy and abroad},
KEYWORDS = {Bisogni speciali, Apprendimento, Lingua, Multimedialità, E-learning},
PAGES = {136-139},
URL = {https://iris.cnr.it/handle/20.500.14243/436875},
VOLUME = {2398},
}
@INPROCEEDINGS{GIORGETTI_2002_INPROCEEDINGS_GPS_114022,
AUTHOR = {Giorgetti, D. and Prodanof, I. and Sebastiani, F.},
TITLE = {Automated Coding of Open-ended Surveys: Technical and Ethical Issues},
YEAR = {2002},
ABSTRACT = {This paper presents some technical and ethical issues arising from the use of automated methods to solve a typical social science problem: the coding of surveys including answers to open-ended questions. Coding an open-ended survey, which may include thousands of interviews, means to assign symbolic predefined labels to its answers according to their meaning. The increasing amount of information available from surveys carried out also on the Web, makes it viable the use of (semi)automated systems both to reduce time and human resources cost to analyze and manage it, and to produce results independent from coders' subjective impressions, but on the other hand poses both technical and ethical challenges to be carefully evaluated before being adopted},
KEYWORDS = {Text categorization},
PAGES = {9},
URL = {https://iris.cnr.it/handle/20.500.14243/114022},
CONFERENCE_NAME = {International Conference on Universal Knowledge and Language. ICUKL-2002},
}
@INPROCEEDINGS{GIORGETTI_2002_INPROCEEDINGS_GPS_101823,
AUTHOR = {Giorgetti, D. and Prodanof, I. and Sebastiani, F.},
TITLE = {Mapping an automated survey coding task into a probabilistic text categorization framework},
YEAR = {2002},
ABSTRACT = {This paper describes how to apply a probabilistic Text Categorization method to a different and new domain where documents are answers to open end questionnaires and codes viewed as categories consist of a hierarchical model. A reduced size training set may be used taking advantage of the hierarchical organization of categories. The system developed in this framework aims at helping psychologists in the evaluation of open end surveys inquiring about job candidates' competencies},
KEYWORDS = {Text categorization},
PAGES = {115-124},
URL = {https://link.springer.com/chapter/10.1007/3-540-45433-0_18#citeas},
VOLUME = {2389},
DOI = {10.1007/3-540-45433-0_18},
PUBLISHER = {Springer},
ISBN = {978-3-540-43829-8},
CONFERENCE_NAME = {PorTAL 2002-Third International Conference on Advances in Natural Language Processing},
BOOKTITLE = {Advances in Natural Language Processing},
}
@INPROCEEDINGS{PICCHI_2002_INPROCEEDINGS_PSNCV_222362,
AUTHOR = {Picchi, E. and Sassolini, E. and Nahli, O. and Cucurullo, S. and Vargas Isabel, M.},
TITLE = {Italian Arabic Linguistic Tools},
YEAR = {2002},
URL = {https://iris.cnr.it/handle/20.500.14243/222362},
CONFERENCE_NAME = {LREC 2002},
BOOKTITLE = {Third International Conference on Language Resources and Evaluation},
}
@INPROCEEDINGS{RUIMY_2002_INPROCEEDINGS_RMDGMUCZN_128484,
AUTHOR = {Ruimy, N. and Monachini, M. and Distante, R. and Guazzini, E. and Molino, S. and Ulivieri, M. and Calzolari, N. and Zampolli, A.},
TITLE = {CLIPS, A Multi-level Italian Computational Lexicon: a Glimpse to Data},
YEAR = {2002},
ABSTRACT = {CLIPS is a multi-layered Italian computational lexicon based on the PAROLE-SIMPLE model. In this paper we briefly recall the main characteristics of the model and devote our attention to issues emerging from the encoding of large quantities of data, especially in relation to those types of syntactic and semantic information specific to our lexicon and that reflect innovative features of the underlying model},
URL = {https://iris.cnr.it/handle/20.500.14243/128484},
ISBN = {2-9517408-0-8},
}
@TECHREPORT{SASSOLINI_2002_TECHREPORT_SN_222368,
AUTHOR = {Sassolini, E. and Nahli, O.},
TITLE = {Motore morfologico della lingua araba},
YEAR = {2002},
URL = {https://iris.cnr.it/handle/20.500.14243/222368},
}
@TECHREPORT{STARYNKEVITCH_2002_TECHREPORT_SDTZHIGACMMG_403212,
AUTHOR = {Starynkevitch, B. and Daoudi, M. and Tombelle, C. and Zheng, H. and Hepple, M. and Ireson, N. and Gomezhildago, J. and Allegrini, P. and Calzolari, N. and Marchi, S. and Montemagni, S. and Guerra, S.},
TITLE = {POESIA Software Architecture Definition Document},
YEAR = {2002},
ABSTRACT = {Software Architecture Definition Document},
KEYWORDS = {NLP, Software Engineering},
PAGES = {68-80},
URL = {https://iris.cnr.it/handle/20.500.14243/403212},
}
@MISC{CAMMELLI_2002_MISC_CS_140514,
AUTHOR = {Cammelli, A. and Sassi, M.},
TITLE = {Progetto},
YEAR = {2002},
URL = {https://iris.cnr.it/handle/20.500.14243/140514},
}
@MISC{CECCOTTI_2002_MISC_CPS_17393,
AUTHOR = {Ceccotti, M. and Pardelli, G. and Sassi, M.},
TITLE = {Per un'analisi del lessico linguistico-computazionale: da Weaver all'ALPAC Report},
YEAR = {2002},
ABSTRACT = {In questo report proponiamo una breve presentazione della 'preistoria' della linguistica computazionale, del periodo compreso tra la pubblicazione del memorandum di Warren Weaver del 1949 e del Report dell'Alpac del 1966. La preistoria della CL vuol dire essenzialmente traduzione automatica, dizionari di macchina, etc., attività di ricerca svolte da matematici, fisici. L'inglese è la lingua veicolo di tutto ciò e continuerà ad esserlo ancora per anni prima che anche in Europa-eccezione è l'Inghilterra-e nel resto del mondo siano tentate traduzioni, adattamenti, proposte, che guidano i primi passi della ricerca in questi ambiti},
KEYWORDS = {Lessico linguistico-computazionale},
URL = {https://iris.cnr.it/handle/20.500.14243/17393},
}
@MISC{DIDONATO_2002_MISC_D_383722,
AUTHOR = {Di Donato, F.},
TITLE = {O. de Gouges, Dichiarazione dei diritti della donna e della cittadina},
YEAR = {2002},
ABSTRACT = {Traduzione dall'originale francese di O. de Gouges, Dichiarazione dei diritti della donna e della cittadina},
URL = {https://iris.cnr.it/handle/20.500.14243/383722},
ISSN = {1591-4305},
}
@MISC{DIDONATO_2002_MISC_D_382045,
AUTHOR = {Di Donato, F.},
TITLE = {Gerardo Cunico, Il millennio del filosofo: chiliasmo e teleologia morale in Kant, ETS, Pisa 2001},
YEAR = {2002},
URL = {https://iris.cnr.it/handle/20.500.14243/382045},
ISSN = {1591-4305},
}
@MISC{DIDONATO_2002_MISC_D_406236,
AUTHOR = {Di Donato, F.},
TITLE = {L'approccio filosofico ad una nuova scienza: l'ecologia sociale},
YEAR = {2002},
ABSTRACT = {Workshop La dea ferita. Donne, sviluppo, cooperazione internazionale, Scuola Sant'Anna di Pisa, 14 febbraio 2002},
URL = {https://iris.cnr.it/handle/20.500.14243/406236},
}
@MISC{DIDONATO_2002_MISC_D_382043,
AUTHOR = {Di Donato, F.},
TITLE = {P. Bourdieu, La domination masculine, Edition du Seuil, Paris 1998},
YEAR = {2002},
URL = {https://iris.cnr.it/handle/20.500.14243/382043},
ISSN = {1591-4305},
}
@MISC{GUADAGNINI_2002_MISC_G_265630,
AUTHOR = {Guadagnini, E.},
TITLE = {"Sill, qu'es caps e guitz" (P.-C. 461, 67a): un descort provenzale del secondo quarto del Duecento},
YEAR = {2002},
URL = {https://iris.cnr.it/handle/20.500.14243/265630},
CONFERENCE_NAME = {VII Congresso Internazionale dell'AIEO [Association Internationale d'Études Occitanes]},
}
@MISC{PARDELLI_2002_MISC_POSEG_123610,
AUTHOR = {Pardelli, G. and Orsolini, P. and Sassi, M. and Enea, A. and Gazzetti, S.},
TITLE = {TAL Bibliography (1951-2002). Parte I},
YEAR = {2002},
ABSTRACT = {Il presente catalogo contiene molte delle bibliografie del Trattamento Automatico della Lingua TAL a partire dal secondo dopoguerra ad oggi e diverse bibliografie di opere di linguistica generale variamente collegate alla linguistica Computazionale CL, in varie formulazioni: glossematica, grammatica trasformazionale-generativa, fonetica, stilistica linguistica, psicolinguistica, sociolinguistica, didattica delle lingue, filosofia del linguaggio, storia della lingua, funzionalismo praghese, prosodismo inglese, ecc. Sono compresi, inoltre, alcuni riferimenti alla documentazione di alcuni linguaggi di programmazione evoluti adatti alla elaborazione di dati linguistici. La tipologia delle opere presenti nel seguente catalogo sinteticamente può ricondursi a:-Le prime testimonianze del trattamento automatico del linguaggio: Busa (1951);-Atti di Congressi e Conferenze di varie Associazioni Internazionali (ACL, ALLC, COLING, TAL, ACLA, AILA, ecc.), tra i principali possiamo citare quelli dei congressi di CL tenuti a Yorktown Heights (IBM-64), a Grenoble (CITAL-67), a Praga (1968) e a Bergen (COLING-78);-Opere generali o introduttive delle applicazioni del calcolatore alle ricerche umanistiche e letterarie. Un esempio è dato dalla pubblicazione di F. De Tollenaere: i lavori presentati in questo survey del 1962 si riferiscono a ricerche nel settore Humanities di vari paesi: Stati Uniti, Inghilterra, Francia, Italia, Belgio, Olanda, Unione Sovietica, Cecoslovacchia, ecc. In questo gruppo, per la lessicografia, ricordiamo i due colloqui di Praga (1967) e di Pisa (1970)0;-Opere sull'uso di modelli matematici nella linguistica (Garvin, Maegaard). Gli argomenti trattati in queste opere nella maggior parte dei casi fanno riferimento a: 1. Valutazione statistica: compilazione di liste, dizionari, indici e di ricerche statistiche in genere (livello distribuzionale); 2. 
Elaborazione algoritmica dei sistemi sintattici e di vari modelli di acquisizione del linguaggio (livello sintattico); 3. Elaborazione automatica del contenuto del linguaggio (livello semantico); 4. Traduzione automatica (per le varie lingue); 5. Lessicografia (classica, romanza, slava, germanica, biblica, concordanze, indici e studi dialettologici, ecc.). E' stato possibile individuare le tematiche principali e gli argomenti più ricorrenti della soggettazione attraverso l'analisi di circa 5000 documenti nel settore del TAL. Mantenere una terminologia comune (normalizzazione) della soggettazione non è stato sempre possibile. L'interdisciplinarietà, sempre più praticata dopo gli anni '50, dovuta all'incontro dei metodi della linguistica con altre discipline e la terminologia dei primi anni in questo settore di indagine, ci avrebbero condotto alla dispersione dei soggetti, che sono stati rivisti in funzione di una maggiore omogeinità. I testi che studiano il linguaggio e i sistemi di automazione nelle ricerche e nelle analisi linguistiche sono stati descritti nel database principalmente in inglese e occasionalmente in francese per casi particolari (v. nell'indice dei Soggetti: Traduction Mécanique /Traduction Automatique) per rispettarne le prime testimonianze. Abbiamo preferito mantenere descrittori simili per evidenziare l'evoluzione della terminologia usata nei testi nel corso degli anni (v.: Automatic. /Automated.). Abbiamo evitato, per quanto possibile, l'uso di termini di eccessivo tecnicismo: ciò per rendere più agevole la ricerca attraverso Internet da parte di un'utenza non sempre specialistica. Il lavoro di soggettazione, analisi e selezione dei documenti per la costruzione di questo archivio è stato svolto da Gabriella Pardelli. Il software CDS-ISIS dell'Unesco è stato utilizzato per gli standard catalografici e, allo scopo, è stato attivato un server per l'accesso simultaneo al database. 
Il supporto informatico, anche per ciò che concerne il rilevamento dei dati per le indagini statistiche come il recupero automatico dei tag di sottocampo dei record bibliografici (lingua, paese, argomento, ecc.) è stato fornito interamente da Alessandro Enea. Paola Orsolini e Silvia Gazzetti si sono occupate del lavoro di catalogazione. L'elaborazione del catalogo generato dal database ISIS è stata effettuata da Manuela Sassi},
KEYWORDS = {Bibliografia, Linguistica Computazionale},
PAGES = {1-187},
URL = {http://www.biblos.cnr.it/04_2_TALb.html},
PUBLISHER = {S. T. A. R. Servizio Tecnografico Area Ricerca CNR (Pisa, ITA)},
CONFERENCE_PLACE = {Pisa},
}
@MISC{SASSI_2002_MISC_S_265982,
AUTHOR = {Sassi, M.},
TITLE = {Tratado del Esphera y del arte del marear},
YEAR = {2002},
URL = {https://iris.cnr.it/handle/20.500.14243/265982},
}
@ARTICLE{BOTTINO_2001_ARTICLE_BC_211259,
AUTHOR = {Bottino, R. and Cutugno, P.},
TITLE = {Developing basic key skills through the use of ICT tools},
YEAR = {2001},
ABSTRACT = {In this paper, we seek to establish a link between some basic key skills and the way in which ICT could be used to foster those skills in schools. This is preceded by a brief introduction examining what the term key skill usually stands for. We investigate how ICT can be used to foster the development of skills that are not specifically related to a particular disciplinary field or technical ability but which are relevant and useful in primary and secondary school education and can affect access to future employment. A new element presented in this work concerns the possibility of reflecting about relationships which, thanks to an appropriate use of technology, are being established between processes of innovation in school, teaching practice and the changing abilities and methods required in the world of work},
KEYWORDS = {EDUCATION, KNOWLEDGE AND LEARNING, Education and Life-Long Learning, General Engineering, Learning and Human Resources Development, SCIENCE, ENGINEERING AND TECHNOLOGY},
PAGES = {179-188},
URL = {http://www.ingentaconnect.com/content/ind/ijceell/2001/00000011/00000003/art00001},
VOLUME = {11 (3)},
DOI = {10.1504/IJCEELL.2001.000392},
ISSN = {1560-4624},
JOURNAL = {INTERNATIONAL JOURNAL OF CONTINUING ENGINEERING EDUCATION \& LIFELONG LEARNING},
}
@ARTICLE{CALZOLARI_2001_ARTICLE_CCZ_50335,
AUTHOR = {Calzolari, N. and Corazzari, O. and Zampolli, A.},
TITLE = {Lexical-Semantic Tagging of an Italian Corpus},
YEAR = {2001},
ABSTRACT = {Semantically tagged corpora are becoming an urgent need for training and evaluation within many applications. They are also the natural accompaniment of semantic lexicons, for which they constitute both a useful testbed to evaluate their adequacy and a repository of corpus examples for the attested senses. It is essential that sound criteria are defined for their construction and a specific methodology is set up for the treatment of various semantic phenomena. We present some observations and results concerning the lexical-semantic tagging of an Italian corpus within the framework of two projects: the ELSNET feasibility study, part of a preparatory phase started with Senseval/Romanseval, and an Italian National Project (TAL), where one of the components is the lexical-semantic annotation of larger quantities of texts for an Italian syntactic-semantic Treebank. The results of the ELSNET experiment have been of utmost importance for the definition of the technical guidelines for the lexical-semantic level of annotation of the Treebank},
URL = {https://iris.cnr.it/handle/20.500.14243/50335},
}
@ARTICLE{DIDONATO_2001_ARTICLE_D_382021,
AUTHOR = {Di Donato, F.},
TITLE = {La filosofia è donna? Pensiero femminista e pensiero femminile},
YEAR = {2001},
ABSTRACT = {Le donne sono emarginate dalla sfera pubblica: la presenza e la visibilità di esse nel diritto e nella cultura restano limitate, nonostante le rivendicazioni femministe abbiano mostrato con chiarezza, a partire da almeno due secoli, in che misura il problema influisca tanto sulle condizioni di vita delle donne quanto sull'organizzazione e la struttura della sfera pubblica stessa. Il femminismo, per risolvere la questione delle disuguaglianze legate a questa esclusione e riequilibrare la presenza maschile e femminile nelle istituzioni, presenta due proposte assai diverse: il pensiero della differenza rivendica il riconoscimento della differenza sessuale come fatto che caratterizza essenzialmente le persone, e dunque richiede sul piano dei diritti, diritti sessuati, e, sul piano della cultura, la necessità per le donne di rafforzare gli strumenti propri della femminilità; il femminismo dell'uguaglianza sostiene, di contro, che chiedere di essere riconosciute come soggetti del diritto e della cultura in quanto donne è controproducente, e che non si tratta tanto di rivendicare visibilità per problemi intesi come tipici delle donne, quanto di mostrare in che misura questi problemi riguardino tanto le donne quanto gli uomini. Così, pur partendo da un elemento comune e universalmente riconosciuto, l'emarginazione delle donne dalla sfera pubblica, sul piano politico il femminismo si trova diviso. Per comprendere le implicazioni delle diverse proposte, è necessario soffermarsi sulla lettura che la filosofia femminista dà delle storie della femminilità, vale a dire sul modo in cui questa esclusione viene motivata e argomentata nel pensiero filosofico e politico. Nel tentare di fare ciò, prende in esame le interpretazioni di due argomenti centrali delle storie della femminilità: il nesso tra l'essere donna e la capacità di procreare e quello, che da questo segue, tra femminilità e funzione materna},
URL = {https://iris.cnr.it/handle/20.500.14243/382021},
ISSN = {1591-4305},
JOURNAL = {BOLLETTINO TELEMATICO DI FILOSOFIA POLITICA},
}
@ARTICLE{GUADAGNINI_2001_ARTICLE_G_275952,
AUTHOR = {Guadagnini, E.},
TITLE = {Scelta di voci del Tesoro della Lingua Italiana delle Origini (quinta serie)},
YEAR = {2001},
ABSTRACT = {Voci borsa s. f., borsaio s. m., borsellina s. f., borsellino s. m., borsello s. m., borsetta s. f., borsetto s. m., borsingo agg. del Tesoro della Lingua Italiana delle Origini (pp. 215-220)},
KEYWORDS = {Lessico, Lessicografia, Lingua Italiana},
PAGES = {39-246},
URL = {https://iris.cnr.it/handle/20.500.14243/275952},
VOLUME = {6},
ISSN = {1591-8254},
JOURNAL = {BOLLETTINO-OPERA DEL VOCABOLARIO ITALIANO},
}
@ARTICLE{PICCHI_2001_ARTICLE_PMB_37675,
AUTHOR = {Picchi, E. and Montemagni, S. and Biagini, L.},
TITLE = {DBT-ALT: a System for Storing and Querying the Data of the Atlante Lessicale Toscano (ALT)},
YEAR = {2001},
KEYWORDS = {Atlanti linguistici, Dialettologia comput, Lessicografia dialet, Geolinguistica, Sociolinguistica},
PAGES = {85-103},
URL = {https://iris.cnr.it/handle/20.500.14243/37675},
VOLUME = {9},
}
@BOOK{PICCHI_2001_BOOK_PS_134781,
AUTHOR = {Picchi, E. and Stoppelli, P.},
TITLE = {LIZ 4.0 Letteratura Italiana Zanichelli},
YEAR = {2001},
KEYWORDS = {Analisi testuale, Editoria Elettronica, Letteratura Italiana, Digital Library},
URL = {https://iris.cnr.it/handle/20.500.14243/134781},
PUBLISHER = {Zanichelli (Bologna, ITA)},
CONFERENCE_PLACE = {Bologna},
}
@BOOK{SABA_2001_BOOK_S_134780,
AUTHOR = {Saba, A.},
TITLE = {El léxico del Breve Compendio de la sphera y de la arte de navegar de Martín Cortés},
YEAR = {2001},
KEYWORDS = {Lessicografia, Morfosintassi, Lessico nautico, Text processing},
URL = {https://iris.cnr.it/handle/20.500.14243/134780},
}
@INCOLLECTION{RUIMY_2001_INCOLLECTION_RGM_134778,
AUTHOR = {Ruimy, N. and Gola, E. and Monachini, M.},
TITLE = {Lexicography Informs Lexical Semantics: the SIMPLE Experience},
YEAR = {2001},
ABSTRACT = {This volume is a collection of original contributions from outstanding scholars in linguistics, philosophy and computational linguistics exploring the relation between word meaning and human linguistic creativity},
KEYWORDS = {semantica lessicale, ontologia, templates, lessico elettronico, lessico generativo},
PAGES = {350-362},
URL = {https://iris.cnr.it/handle/20.500.14243/134778},
PUBLISHER = {Cambridge University Press (Cambridge, GBR)},
ISBN = {0521780489},
CONFERENCE_PLACE = {Cambridge},
BOOKTITLE = {The Language of Word Meaning},
EDITOR = {Bouillon, P. and Busa, F. and Bogouraev, B.},
}
@TECHREPORT{CIGNONI_2001_TECHREPORT_C_16626,
AUTHOR = {Cignoni, G. P.},
TITLE = {Entrate Lessicali per il trattamento automatico del linguaggio (TAL)},
YEAR = {2001},
ABSTRACT = {In questo articolo verranno brevemente descritti i contenuti che caratterizzano l'attività di ricerca dell'Istituto di Linguistica Computazionale ILC, e attraverso le entrate lessicali elaborate per le cosiddette digital libraries, cercheremo di rappresentare la produzione scientifica del personale afferente alla struttura di ricerca e i testi presenti in Biblioteca. La prima parte sarà dedicata allo studio dei tempi argomentali più significativi nel settore del trattamento automatico della lingua, la seconda presenterà gli archivi accessibili via rete telematica. Scopo di questo lavoro è quello di poter soddisfare l'utenza in questo settore disciplinare, che spesso può essere specialistica (insegnanti, dottorandi, masterandi, cultori della materia ecc.), ma che può anche appartenere ad altre categorie (studenti medi, studenti universitari ecc.)},
URL = {https://iris.cnr.it/handle/20.500.14243/16626},
}
@MISC{DIDONATO_2001_MISC_D_382047,
AUTHOR = {Di Donato, F.},
TITLE = {J. S. Mill, H. Taylor, Sull'eguaglianza ed emancipazione femminile, Einaudi 2001, trad. it. M. Reichlin, cura di N. Urbinati},
YEAR = {2001},
URL = {https://iris.cnr.it/handle/20.500.14243/382047},
ISSN = {1591-4305},
}
@MISC{DIDONATO_2001_MISC_D_383721,
AUTHOR = {Di Donato, F.},
TITLE = {R. Aramayo, F. Oncina (a cura di), Etica y antropologia. Un dilema kantiano, Editorial Comares, Granada 1999},
YEAR = {2001},
URL = {https://iris.cnr.it/handle/20.500.14243/383721},
ISSN = {0393-2516},
}
@ARTICLE{GUADAGNINI_2000_ARTICLE_G_275955,
AUTHOR = {Guadagnini, E.},
TITLE = {Scelta di voci del Tesoro della Lingua Italiana delle Origini (quarta serie)},
YEAR = {2000},
ABSTRACT = {Voci arenga (1) s. f., civanza s. f., civanzare v. del Tesoro della Lingua Italiana delle Origini},
URL = {https://iris.cnr.it/handle/20.500.14243/275955},
VOLUME = {5},
ISSN = {1591-8254},
JOURNAL = {BOLLETTINO-OPERA DEL VOCABOLARIO ITALIANO},
}
@ARTICLE{LENCI_2000_ARTICLE_LBBCGMOPPRVZ_124413,
AUTHOR = {Lenci, A. and Bel, N. and Busa, F. and Calzolari, N. and Gola, E. and Monachini, M. and Ogonowsky, A. and Peters, I. and Peters, W. and Ruimy, N. and Villegas, M. and Zampolli, A.},
TITLE = {SIMPLE: A General Framework for the Development of Multilingual Lexicons},
YEAR = {2000},
ABSTRACT = {The project LE-SIMPLE is an innovative attempt at building harmonized syntactic-semantic lexicons for twelve European languages, intended for use in different Human Language Technology applications. SIMPLE provides a general design model for the encoding of a large amount of semantic information, ranging from ontological typing, to argument structure and terminology. SIMPLE thus provides a general framework for resource development, where state-of-the-art results in lexical semantics are coupled with the needs of Language Engineering applications accessing semantic information},
URL = {https://iris.cnr.it/handle/20.500.14243/124413},
DOI = {10.1093/ijl/13.4.249},
ISSN = {0950-3846},
JOURNAL = {INTERNATIONAL JOURNAL OF LEXICOGRAPHY},
}
@ARTICLE{PIRRELLI_2000_ARTICLE_PB_264442,
AUTHOR = {Pirrelli, V. and Battista, M.},
TITLE = {The Paradigmatic Dimension of Stem Allomorphy in Italian Verb Inflection},
YEAR = {2000},
ABSTRACT = {This paper is concerned with a detailed analysis of stem allomorphy in Italian Conjugation, carried out from a phonological and paradigmatic perspective. In theory, one would expect these two complementary viewpoints to take care of neatly separable classes of phenomena. In fact, the two dimensions turn out to be interlocked in a complex way, to define a grammatical continuum ranging from minor phonological processes to full suppletion. A formal descriptive framework is proposed here, whereby several insights into the structure of inflectional paradigms (Matthews 1974, Carstairs 1987, Wurzel 1989, Stump 1991, Aronoff 1994) are dealt with from a unifying, purely morphological perspective. In this framework, the structure of a verb paradigm is characterised in terms of a distribution of slots into a number of equivalence classes, or set partition, where each equivalence class is associated with a morphologically distinct stem root. It is shown that, in Italian, a few set partitions account for the structure of all Italian verb paradigms, whether regular or less regular. Moreover, all these partitions are mutually related homomorphically. This well-behaved family of distributions tightly constrains stem allomorphy at an appropriate level of abstraction, independently of whether the origin of allomorphy is morpho-phonological or purely morphological, showing the superiority of the obtained generalisations over more traditional syntagmatic accounts},
KEYWORDS = {Morfologia, allomorfia, paradigmi flessionali},
PAGES = {307-379},
URL = {https://iris.cnr.it/handle/20.500.14243/264442},
VOLUME = {12},
ISSN = {1120-2726},
JOURNAL = {RIVISTA DI LINGUISTICA},
}
@BOOK{MARCONI_2000_BOOK_MBRRM_216329,
AUTHOR = {Marconi, L. and Bermudez, E. M. and Ratti, D. and Rolando, C. and Miyares, L. R.},
TITLE = {Diccionario Ortográfico del Español, basado en el léxico del escolar cubano},
YEAR = {2000},
ABSTRACT = {Edizione a cura dell'Ufficio del Presidente del Consiglio Nazionale delle Ricerche. Realizzato dalla base di un corpus di testi prodotti dai bambini, raccolto in Cuba da un'equipe di Linguisti, il "Diccionario Ortográfico del Español basado en el léxico del escolar cubano" contiene 8. 403 lemmi con la descrizione delle possibili forme, della categoria grammaticale per sostantivi, aggettivi e per le altre categorie grammaticali fatta eccezione per i verbi. Come per l'italiano i verbi sono dotati di un codice di rimando al modello di coniugazione. I modelli di riferimento per questo dizionario sono 77 e rappresentano un consistente insieme dei modelli del verbo spagnolo. Il Dizionario Ortografico dello Spagnolo (ed. CNR, Genova, 2000) basato sul lessico dello scolaro cubano è formato da tre parti distinte.-Una prima parte con le regole più comuni dell'ortografia e dell'accentuazione; alcune irregolarità grafiche dei verbi e delle altre categorie verbali; una breve descrizione della struttura del dizionario.-La seconda parte è formata dai modelli verbali, cioè da una serie di tavole dove ogni verbo coniugato serve di riferimento per tutti i verbi che si comportano nella coniugazione nello stesso modo.-Forma la terza parte la lista delle parole usate dallo scolaro cubano con le relative terminazioni nel caso dei nominali e con il numero che indica la tavola di riferimento nel caso dei verbi},
KEYWORDS = {Diccionario, Español},
PAGES = {I-334},
URL = {http://www.ge.ilc.cnr.it/page.php?ID=dic-cubano\&lingua=it},
ISBN = {8890031824},
}
@BOOK{MARCONI_2000_BOOK_MMRRR_216333,
AUTHOR = {Marconi, L. and Miyares Bermudez, E. and Ratti, D. and Rolando, C. and Ruiz Miyares, L.},
TITLE = {Vocabulario inverso y anagramas del Español, basado en el léxico del escolar cubano},
YEAR = {2000},
ABSTRACT = {A partire dal "Diccionario Ortográfico del Español basado en el léxico del escolar cubano" il "Vocabulario Inverso y Anagramas del Español basado en el léxico del escolar cubano" contiene tutte le forme ordinate in modalità inversa e i relativi anagrammi del lessico scolare cubano. Il "Vocabolario Inverso e Anagrammi dello Spagnolo" (ed. CNR, Genova, 2000) è un complemento del Diccionario Ortográfico del Español, dal momento che contiene le 80305 forme generate a partire dal Diccionario Ortográfico del Español, ordinate in ordine inverso e i 10182 anagrammi},
KEYWORDS = {Vocabulario Inverso, Anagramas, Español},
PAGES = {I-417},
URL = {http://www.ge.ilc.cnr.it/page.php?ID=inverso\&lingua=it},
ISBN = {8890031832},
EDITOR = {Marconi, L. and Bermúdez, E. M. and Ratti, D. and Rolando, C. and Miyares, L. R.},
}
@BOOK{PIRRELLI_2000_BOOK_P_263719,
AUTHOR = {Pirrelli, V.},
TITLE = {Paradigmi in morfologia. Un approccio interdisciplinare alla flessione verbale dell'italiano},
YEAR = {2000},
ABSTRACT = {Cosa vuol dire apprendere le forme flesse di un verbo in una lingua come l'italiano? Attraverso quali processi mentali e quali strutture cognitive un parlante è in grado di memorizzare, strutturare ed estendere a parole mai ascoltate prima i dati morfologici cui è esposto nel corso dell'apprendimento? Quali risposte sono disponibili allo stato attuale delle ricerche, e quanto sono soddisfacenti? E infine, che cosa ci insegnano queste ricerche riguardo al modo in cui la mente umana associa forma e contenuto nel linguaggio? Questo libro cerca di affrontare buona parte di questi problemi attraverso l'analisi di tre fonti primarie di dati. La prima riguarda l'evidenza del sistema verbale dell'italiano, la sua variabilità dal punto di vista formale, e l'apparentemente caotico pullulare di eccezioni e sacche di sotto-regolarità. Considereremo con attenzione come questi dati sono analizzati in morfologia teorica e con quali strumenti formali. In secondo luogo guarderemo ai dati psicolinguistici relativi all'apprendimento delle parole da parte del bambino, ai suoi errori, alle sue generalizzazioni e alle sue difficoltà, per poi confrontare questi dati sia con i modelli della linguistica teorica che con i modelli computazionali di elaborazione e di apprendimento del linguaggio ad oggi disponibili. Infine, daremo uno sguardo al cambiamento linguistico dal punto di vista diacronico, e in particolare alle direzioni che il sistema verbale dell'italiano ha preso nella sua progressiva deriva dal verbo latino attraverso il tempo},
URL = {https://iris.cnr.it/handle/20.500.14243/263719},
ISBN = {88-8147-237-6},
}
@INCOLLECTION{PETERS_2000_INCOLLECTION_PPB_386467,
AUTHOR = {Peters, C. and Picchi, E. and Biagini, L.},
TITLE = {Parallel and comparable bilingual corpora in language teaching and learning},
YEAR = {2000},
ABSTRACT = {An abstract is not available},
KEYWORDS = {Linguistics, Content analysis and indexing. Linguistic processes, Information search and retrieval},
PAGES = {73-85},
URL = {https://iris.cnr.it/handle/20.500.14243/386467},
BOOKTITLE = {Multilingual corpora in teaching and research},
EDITOR = {Botley, S. P. and McEnery, A. M. and Wilson, A.},
}
@INPROCEEDINGS{BEL_2000_INPROCEEDINGS_BBCGLMOPPRVZ_124394,
AUTHOR = {Bel, N. and Busa, F. and Calzolari, N. and Gola, E. and Lenci, A. and Monachini, M. and Ogonowsky, A. and Peters, I. and Peters, W. and Ruimy, N. and Villegas, M. and Zampolli, A.},
TITLE = {SIMPLE: A General Framework for the Development of Multilingual Lexicons},
YEAR = {2000},
ABSTRACT = {The project LE-SIMPLE is an innovative attempt of building harmonized syntactic-semantic lexicons for 12 European languages, aimed at use in different Human Language Technology applications. SIMPLE provides a general design model for the encoding of a large amount of semantic information, spanning from ontological typing, to argument structure and terminology. SIMPLE thus provides a general framework for resource development, where state-of-the-art results in lexical semantics are coupled with the needs of Language Engineering applications accessing semantic information},
URL = {https://iris.cnr.it/handle/20.500.14243/124394},
}
@INPROCEEDINGS{CECCOTTIMARIA_2000_INPROCEEDINGS_CSP_139030,
AUTHOR = {Ceccotti, M. L. and Sassi, M. and Pardelli, G.},
TITLE = {Il soccorso informatico per lo studio di un autore difficile, C. E. Gadda},
YEAR = {2000},
ABSTRACT = {Nella prima parte di questo contributo si illustreranno le caratteristiche dell'Archivio Gadda in DBT, frutto di un lungo lavoro redazionale di transcodifica e di codifica. Nella seconda sarà brevemente descritta e motivata la realizzabilità di un sito web su Gadda, un modello di 'laboratorio culturale' che costituito inizialmente da alcuni brani gaddiani, da nostre recenti pubblicazioni, da dati bibliografici, potrebbe essere arricchito dall'apporto del lettore di Gadda, studioso, studente, curioso},
KEYWORDS = {Gadda C.E.},
PAGES = {149-154},
URL = {https://iris.cnr.it/handle/20.500.14243/139030},
PUBLISHER = {Associazione Italiana per l'Informatica ed il Calcolo Automatico (AICA) (Cesena, ITA)},
CONFERENCE_NAME = {DIDAMATICA 2000, Informatica per la Didattica},
CONFERENCE_PLACE = {Milano},
BOOKTITLE = {Atti 1. Lavori Scientifici},
EDITOR = {Andronico, A. and Casadei, G. and Sacerdoti, G.},
}
@INPROCEEDINGS{CECCOTTI_2000_INPROCEEDINGS_CSP_128391,
AUTHOR = {Ceccotti, M. L. and Sassi, M. and Pardelli, G.},
TITLE = {Un laboratorio multimediale dedicato a Carlo Emilio Gadda: il modello e i primi dati implementati in formato XML},
YEAR = {2000},
ABSTRACT = {In this paper we present a project of the Italian National Council of Research titled "Gadda's Electronic Archive: Lexicographical and bibliographical Tools in XML". The text is made of two sections: in the first, we present Gadda's Electronic Archive, implemented at the ILC, and in the second, we show the project's objectives and the results achieved in the first months of work},
KEYWORDS = {Gadda's Electronic Archive},
PAGES = {267-271},
URL = {https://iris.cnr.it/handle/20.500.14243/128391},
PUBLISHER = {Associazione Italiana per l'Informatica ed il Calcolo Automatico (AICA) (Milano, ITA)},
CONFERENCE_NAME = {XXXVIII Congresso Annuale AICA: Le tecnologie dell'Informazione e della Comunicazione come sviluppo del Paese},
CONFERENCE_PLACE = {Milano},
}
@INPROCEEDINGS{LANZA_2000_INPROCEEDINGS_LP_117889,
AUTHOR = {Lanza, C. and Pardelli, G.},
TITLE = {Una soggettazione automatica di letteratura grigia con algoritmi di rete neurale artificiale. Due esperimenti ICAS e ILC},
YEAR = {2000},
ABSTRACT = {The aim of this work is to create an automatic subject classification of grey literature documents using an artificial neural network. In particular, a software simulator of neural network with back-propagation learning scheme was used; training of the network was carried out on around 300 documents. The prototype developed follows the steps which were performed during the learning, the processing and the network querying phase. The analysis of the final tests provides targets to be referred to the percentage of document classification error for each subject. From this data it is possible to evince possible document-subject correlations and/or subject-subject correlations in order to construct a relational Database of the scientific documents available at the Institute of Computational Linguistics and at the Institute of Instrumental Analytical Chemistry},
KEYWORDS = {Artificial Neural Network, IT for Library, Data Mining},
PAGES = {52-56},
URL = {https://iris.cnr.it/handle/20.500.14243/117889},
PUBLISHER = {Istituto Superiore di Sanità (Roma, ITA)},
ISSN = {0393-5620},
CONFERENCE_NAME = {La letteratura grigia: politica e pratica. 3° Convegno Nazionale},
CONFERENCE_PLACE = {Roma},
BOOKTITLE = {ISTISAN CONGRESSI},
EDITOR = {Alberani, V. and De Castro, P.},
}
@TECHREPORT{BARTOLINI_2000_TECHREPORT_B_365832,
AUTHOR = {Bartolini, R.},
TITLE = {Partizionamento per HD con simmetrie},
YEAR = {2000},
ABSTRACT = {An abstract is not available},
KEYWORDS = {HD},
PAGES = {1-12},
URL = {https://iris.cnr.it/handle/20.500.14243/365832},
}
@TECHREPORT{LENCI_2000_TECHREPORT_LBRGMCPOMPPGV_208538,
AUTHOR = {Lenci, A. and Busa, F. and Ruimy, N. and Gola, E. and Monachini, M. and Calzolari, N. and Pustejovsky, A. Z. J. and Ogonowski, A. and McCawley, C. and Peters, I. and Peters, W. and Gaizauskas, R. and Villegas, M.},
TITLE = {SIMPLE Linguistic Specifications},
YEAR = {2000},
ABSTRACT = {The SIMPLE project represents-at our knowledge-the first attempt to tackle encoding of semantic (argument) frames on a large scale, i. e. for so many languages and with rather wide coverage. Even though it is a real lexicon building project, it must also be seen as having challenging research aspects and will provide a framework for testing and evaluating the maturity of the current state-of-the-art in the realm of lexical semantics grounded on, and connected to, a syntactic foundation. The availability of rather large, uniformly structured lexical resources in so many EU languages will offer the users the benefits of a standardized base. According to the subsidiarity concept, which is at the basis of many EU initiatives, the process started at the EU level will be continued at the national level. This is already happening for a number of languages. The fact that all these LRs will be based on the existing models and standards defined at the European level will create a really large infrastructure of harmonized LR throughout all Europe. This achievement is of major importance in a multilingual country like Europe, where all the difficulties connected with the task of LRs building are multiplied by the language factor. This would have been absolutely impossible without the fundamental role played by the EC LRs and standards projects},
URL = {https://iris.cnr.it/handle/20.500.14243/208538},
}
@MISC{DIDONATO_2000_MISC_D_382046,
  AUTHOR = {Di Donato, F.},
  TITLE  = {A. Giddens, Runaway World. How Globalisation is Reshaping our Lives, Profile Books, 1999 (trad. it. di R. Falcioni, Il mondo che cambia. Come la globalizzazione ridisegna la nostra vita, Il Mulino, Bologna 2000)},
  YEAR   = {2000},
  ISSN   = {1591-4305},
  URL    = {https://iris.cnr.it/handle/20.500.14243/382046},
}
@MISC{DIDONATO_2000_MISC_D_382040,
  AUTHOR = {Di Donato, F.},
  TITLE  = {Sylviane Agacinski, La politica dei sessi, Milano, Ponte alle Grazie, 1998},
  YEAR   = {2000},
  ISSN   = {1591-4305},
  URL    = {https://iris.cnr.it/handle/20.500.14243/382040},
}
@MISC{DIDONATO_2000_MISC_D_382044,
  AUTHOR = {Di Donato, F.},
  TITLE  = {A. Cavarero, Tu che mi guardi, tu che mi racconti. Filosofia della narrazione},
  YEAR   = {2000},
  ISSN   = {1591-4305},
  URL    = {https://iris.cnr.it/handle/20.500.14243/382044},
}
@MISC{DIDONATO_2000_MISC_D_382041,
  AUTHOR = {Di Donato, F.},
  TITLE  = {B. Beccalli (a cura di), Donne in quota. E' giusto riservare posti alle donne nel lavoro e nella politica?},
  YEAR   = {2000},
  ISSN   = {1591-4305},
  URL    = {https://iris.cnr.it/handle/20.500.14243/382041},
}
@MISC{DIDONATO_2000_MISC_D_382048,
  AUTHOR = {Di Donato, F.},
  TITLE  = {T. Pitch, Un diritto per due, Il saggiatore, Milano 1998},
  YEAR   = {2000},
  ISSN   = {1591-4305},
  URL    = {https://iris.cnr.it/handle/20.500.14243/382048},
}
@ARTICLE{PIRRELLI_1999_ARTICLE_PY_264349,
AUTHOR = {Pirrelli, V. and Yvon, F.},
TITLE = {The hidden dimension: a paradigmatic view of data-driven NLP},
YEAR = {1999},
ABSTRACT = {Many tasks in language analysis are described as the maximally economic mapping of one level of linguistic representation onto another such level. Over the past decade, many different machine-learning strategies have been developed to automatically induce such mappings directly from data. In this paper, we contend that the way most learning algorithms have been applied to problems of language analysis reflects a strong bias towards a compositional (or biunique) model of interlevel mapping. Although this is justified in some cases, we contend that biunique inter-level mapping is not a jack of all trades. A model of analogical learning, based on a paradigmatic reanalysis of memorized data, is presented here. The methodological pros and cons of this approach are discussed in relation to a number of germane linguistic issues and illustrated in the context of three case studies: word pronunciation, word analysis, and word sense disambiguation. The evidence produced here seems to suggest that the brain is not designed to carry out the logically simplest and maximally economic way of relating form and function in language. Rather we propose a radical shift of emphasis in language learning from syntagmatic inter-level mapping to paradigmatically-constrained intra-level mapping},
KEYWORDS = {data-driven NLP, memory-based machine learning, analogical language learning},
PAGES = {391--408},
URL = {https://iris.cnr.it/handle/20.500.14243/264349},
VOLUME = {11},
ISSN = {1362-3079},
JOURNAL = {JOURNAL OF EXPERIMENTAL AND THEORETICAL ARTIFICIAL INTELLIGENCE ONLINE},
}
@INCOLLECTION{MONACHINI_1999_INCOLLECTION_MC_115924,
  AUTHOR   = {Monachini, M. and Calzolari, N.},
  TITLE    = {Standardization in the Lexicon},
  YEAR     = {1999},
  DOI      = {10.1007/978-94-015-9273-4_11},
  ISBN     = {0-7923-5896-1},
  URL      = {https://iris.cnr.it/handle/20.500.14243/115924},
  ABSTRACT = {This book provides an in-depth discussion of the field of syntactic wordclass tagging, i. e. the annotation of the words in a text with tags indicating their syntactic properties. Represented are the viewpoints of the two main groups who take an interest in tagging: the users of tagged text and the developers of tagging software. The book starts out by examining the field foremost from the user's point of view. After a brief historical overview, the nature and uses of tagging are discussed and current practice is described. Here the user will find what tagging is and the software developer what it is the user wants. The book then switches to the other point of view and continues with a detailed explanation of the most common computational techniques for automatically tagging large amounts of text. Here the software developer finds information needed for the implementation of a tagger while the user gains insight into the possibilities and impossibilities of automatic tagging and how computer-provided tags should be interpreted},
}
@INPROCEEDINGS{BEDINI_1999_INPROCEEDINGS_BBT_393853,
AUTHOR = {Bedini, L. and Bozzi, A. and Tonazzini, A.},
TITLE = {Digital techniques for character recognition in old printed books and in modern damaged documents},
YEAR = {1999},
ABSTRACT = {An abstract is not available},
KEYWORDS = {Document analysis, Blind image restoration, Optical character recognition, Computational philology, Image processing and computer vision},
PAGES = {959--962},
URL = {https://iris.cnr.it/handle/20.500.14243/393853},
CONFERENCE_NAME = {Second International Congress on Science and Technology for the Safeguard of Cultural Heritage in the Mediterranean Basin},
}
@TECHREPORT{MARINAI_1999_TECHREPORT_MS_219271,
AUTHOR = {Marinai, E. and Sassi, M.},
TITLE = {Manuale d'uso},
YEAR = {1999},
ABSTRACT = {Breve manuale d'uso per dare un orientamento per il recupero delle informazioni contenute nell'archivio "Bibliografia delle edizioni giuridiche antiche in lingua italiana-Testi dottrinali e statutari dal 1470 al 1800" e suggerire dei percorsi di ricerca legati a particolari esigenze. Non si tratta di un manuale esaustivo delle possibilità offerte dal programma di interrogazione (PiSystem di E. Picchi, ILC-CNR) in quanto una loro puntuale descrizione si trova nella "Guida" all'interno del programma stesso},
KEYWORDS = {manuale uso, banca dati storico-giuridica},
PAGES = {47--67},
URL = {http://www.ittig.cnr.it/EditoriaServizi/AttivitaEditoriale/CollanaCD/cd-3.htm},
PUBLISHER = {ESI (Napoli, ITA)},
ISBN = {88-8114-914-1},
CONFERENCE_PLACE = {Napoli},
}
@MISC{DIDONATO_1999_MISC_D_384162,
  AUTHOR   = {Di Donato, F.},
  TITLE    = {La teoria femminista: una bibliografia},
  YEAR     = {1999},
  URL      = {https://iris.cnr.it/handle/20.500.14243/384162},
  ABSTRACT = {Bibliografia ragionata di teoria femminista (1999-2004)},
}
@MISC{PARDELLI_1999_MISC_P_16739,
  AUTHOR          = {Pardelli, G.},
  TITLE           = {I risultati del Progetto BIBLOS},
  YEAR            = {1999},
  CONFERENCE_NAME = {BIBLOS Biblioteca virtuale del settore Storico Filosofico e Filologico del Consiglio Nazionale delle Ricerche: I risultati del Progetto BIBLOS: la telematica al servizio della cultura umanistica},
  URL             = {https://iris.cnr.it/handle/20.500.14243/16739},
  KEYWORDS        = {Biblos Project},
  ABSTRACT        = {Il sito di BIBLOS e' entrato ufficialmente in servizio con questa Conferenza quando e' stato presentato presso la Sede Centrale del CNR (Aula Marconi). In tale occasione i responsabili delle Unità Operative degli Istituti del Comitato 08 hanno presentato i risultati raggiunti, in particolare il catalogo a soggetto. In tale occasione è stato presentato il soggettario e il prototipo bibliografico dell'unità operativa ILC},
}
@ARTICLE{GUADAGNINI_1998_ARTICLE_G_267269,
AUTHOR = {Guadagnini, E.},
TITLE = {Nuove voci del Tesoro della Lingua Italiana delle Origini},
YEAR = {1998},
ABSTRACT = {Voce laidezza s. f. del Tesoro della Lingua Italiana delle Origini},
KEYWORDS = {Lessico, Lessicografia, Lingua Italiana},
PAGES = {5--276},
URL = {https://iris.cnr.it/handle/20.500.14243/267269},
VOLUME = {3},
ISSN = {1591-8254},
JOURNAL = {BOLLETTINO-OPERA DEL VOCABOLARIO ITALIANO},
}
@INCOLLECTION{PETERS_1998_INCOLLECTION_PP_386209,
AUTHOR = {Peters, C. and Picchi, E.},
TITLE = {Bilingual reference corpora for translators and translation studies},
YEAR = {1998},
ABSTRACT = {Sommario non disponibile},
KEYWORDS = {Information retrieval systems, Conten},
PAGES = {91--100},
URL = {https://iris.cnr.it/handle/20.500.14243/386209},
BOOKTITLE = {Unity in Diversity. Current Trends in Translation Studies},
EDITOR = {Bowker, L.},
}
@INCOLLECTION{PICCHI_1998_INCOLLECTION_PP_386210,
AUTHOR = {Picchi, E. and Peters, C.},
TITLE = {Cross-language information retrieval: a system for comparable corpus querying},
YEAR = {1998},
ABSTRACT = {We describe a system that has been designed to process and query comparable text corpora, i. e. collections of texts from pairs or multiples of languages referring to the same domain. The first version of the system has been developed to retrieve natural language lexical equivalents from sets of sublanguage texts in English and Italian; given the necessary lexical and morphological components it could be extended to cover other languages. The initial implementation was made with the needs of language scholars in mind; however, the system could have application in the fields of terminology and crosslingual document retrieval},
KEYWORDS = {Cross-language information retrieval},
PAGES = {81--92},
URL = {https://iris.cnr.it/handle/20.500.14243/386210},
PUBLISHER = {Kluwer (Dordrecht, NLD)},
CONFERENCE_PLACE = {Dordrecht},
BOOKTITLE = {Cross-Language Information Retrieval},
EDITOR = {Grefenstette, G.},
}
@INPROCEEDINGS{AGOSTINIANI_1998_INPROCEEDINGS_AMM_221050,
  AUTHOR          = {Agostiniani, L. and Montemagni, S. and Marinai, E.},
  TITLE           = {Una procedura informatica di accesso intelligente a materiali in trascrizione fonetica: l'esperienza dell'Atlante Lessicale Toscano},
  BOOKTITLE       = {Atti del V° Congresso SILFI},
  CONFERENCE_NAME = {V° Congresso SILFI},
  YEAR            = {1998},
  PAGES           = {18},
  URL             = {https://iris.cnr.it/handle/20.500.14243/221050},
  KEYWORDS        = {trascrizione fonetica},
  ABSTRACT        = {Una procedura informatica di accesso intelligente a materiali in trascrizione fonetica: l'esperienza dell'Atlante Lessicale Toscano},
}
@INPROCEEDINGS{BOTTINO_1998_INPROCEEDINGS_BRCFF_370322,
AUTHOR = {Bottino, R. M. and Cutugno, P. and Furinghetti, F.},
TITLE = {Hypermedia as a means for learning and for thinking about learning},
YEAR = {1998},
ABSTRACT = {The paper refers to a project aimed at designing, implementing and evaluating a hypermedia system, IPER-3, facing the three 'classical' problems in the history of mathematics (trisection of the angle, quadrature of the circle, duplication of the cube). The aim of the project is to study the opportunities offered by this kind of technology to the presentation of mathematical topics both in teacher training courses and in classroom work},
KEYWORDS = {Hypermedia system, Education, History of Mathematics},
PAGES = {144--149},
URL = {https://iris.cnr.it/handle/20.500.14243/370322},
PUBLISHER = {AACE, Association for the advancement of computing in education (Norfolk, Va, USA)},
CONFERENCE_NAME = {ED-MEDIA/ED-TELECOM 98 '10th World Conferences on Educational Multimedia and Hypermedia and on Educational Telecommunications},
CONFERENCE_PLACE = {Norfolk, Va},
BOOKTITLE = {Proceedings of ED-MEDIA/ED-TELECOM 98 '10th World Conferences on Educational Multimedia and Hypermedia and on Educational Telecommunications},
EDITOR = {Ottmann, T. and Tomek, I.},
}
@INPROCEEDINGS{BRASCHLER_1998_INPROCEEDINGS_BPPS_363531,
AUTHOR = {Braschler, M. and Peters, C. and Picchi, E. and Schauble, P.},
TITLE = {Cross-language web querying: The EuroSearch approach},
YEAR = {1998},
ABSTRACT = {Each national site is responsible for maintaining and operating a search service for its own languages, so that the needs of distinct language communities can be catered for by native speakers of that language. The languages covered are currently French, German, Italian and Spanish, plus also English. Differences in the partners' document collections and indexing mechanisms have led to the implementation of different search strategies, depending on the collection to be queried. The cross-language search component of EuroSearch thus consists of an integration of lexicon- and corpus-based search mechanisms and two distinct types of searching will be activated: o query translation using a multilingual lexicon; enhanced by an experimental corpus-based mechanism o similarity thesaurus technology},
KEYWORDS = {Information search and retrieval, Digital libraries},
PAGES = {701--702},
URL = {http://www.scopus.com/inward/record.url?eid=2-s2.0-84945195637\&partnerID=q2rCbXpz},
VOLUME = {1513},
PUBLISHER = {Springer (New York, USA)},
CONFERENCE_NAME = {ECDL'98: Research and advanced technology for digital libraries. Second European Conference},
CONFERENCE_PLACE = {New York},
}
@INPROCEEDINGS{PICCHI_1998_INPROCEEDINGS_PP_389178,
AUTHOR = {Picchi, E. and Peters, C.},
TITLE = {Exploiting lexical resources and linguistic tools in cross-language information retrieval: the euro-search approach},
YEAR = {1998},
ABSTRACT = {Cross-language Information Retrieval (CLIR) is a very new research area in which methodologies and tools developed for Natural Language Processing (NLP) are being integrated with techniques and results coming from the Information Retrieval (IR) field. The EuroSearch project provides an excellent testbed for the application and testing of different kinds of cross-language retrieval methodologies. In EuroSearch, a federation of industrial search engines (Arianna for Italy, Ole for Spain and EuroSpider for Switzerland), using different kinds of search mechanisms, will provide their users with functionalities for cross-language querying. The paper describes and motivates the technology that will be adopted in the implementation of the multilingual interface of the federation, focusing on an approach that enhances the potential of a lexicon-based search through the integration of a corpus-based methodology},
KEYWORDS = {Cross-language Information Retrieval},
PAGES = {865--872},
URL = {https://iris.cnr.it/handle/20.500.14243/389178},
EDITOR = {Rubio, A.},
}
@INPROCEEDINGS{ROVENTINI_1998_INPROCEEDINGS_RBCP_363528,
AUTHOR = {Roventini, A. and Bertagna, F. and Calzolari, N. and Peters, C.},
TITLE = {Building the Italian component of EuroWordNet: a language-specific perspective},
YEAR = {1998},
ABSTRACT = {An abstract is not available},
KEYWORDS = {Lexical semantics, EuroWord-Net, Italian semantic database},
PAGES = {10},
URL = {https://iris.cnr.it/handle/20.500.14243/363528},
CONFERENCE_NAME = {Actes Euralex'98. Communications soumises a Euralex'98. 8eme Congres International de Lexicographie},
}
@INPROCEEDINGS{ROVENTINI_1998_INPROCEEDINGS_RPCB_389176,
AUTHOR = {Roventini, A. and Peters, C. and Calzolari, N. and Bertagna, F.},
TITLE = {Building a semantic network for Italian using existing lexical resources},
YEAR = {1998},
ABSTRACT = {An abstract is not available},
KEYWORDS = {Content analysis and indexing},
PAGES = {377--383},
URL = {https://iris.cnr.it/handle/20.500.14243/389176},
CONFERENCE_NAME = {First International Conference on Language Resource and Evaluation},
EDITOR = {Rubio, A.},
}
@INPROCEEDINGS{MARCONI_1998_INPROCEEDINGS_MRR_20001,
AUTHOR = {Marconi, L. and Ratti, D. and Rolando, C.},
TITLE = {Evaluacion cuantitativa del lexico periodistico},
YEAR = {1998},
ABSTRACT = {Our corpus comprises all editions of the Repubblica newspaper published in 1994. These have been analysed automatically to establish the newspaper's language richness and variety. Since the data have not been lemmatized, our analysis is based on all forms encountered in the corpus. The words in the corpus have been classified according to the following types: news, business and finance, politics, culture entertainment and sport. The classification follows the scheme developed for the Italian corpora project. Various statistical analyses will be presented and discussed},
PAGES = {679--683},
URL = {https://iris.cnr.it/handle/20.500.14243/20001},
CONFERENCE_NAME = {JADT 1998},
BOOKTITLE = {JADT 1998},
EDITOR = {Mellet, S. and La Collaboration De Brunet, A. E. and Juillard, M. and Lebart, L. and Salem, A.},
}
@INPROCEEDINGS{PARDELLI_1998_INPROCEEDINGS_P_16637,
AUTHOR = {Pardelli, C. L.},
TITLE = {Sviluppo delle raccolte e procedure di gestione nelle Biblioteche dell'ICAS e dell'ILC},
YEAR = {1998},
ABSTRACT = {La gestione del materiale bibliografico è rappresentata da una serie di procedure che vanno dall'acquisizione all'accessibilità dei documenti. Nel presente articolo abbiamo cercato di illustrare la situazione attuale delle nostre Biblioteche, il contenuto argomentativo, il servizio informativo, l'importanza della cooperazione tra Biblioteche e la necessità di aggiornamento professionale costante per un settore, l'IT for Library, in continuo divenire},
URL = {https://iris.cnr.it/handle/20.500.14243/16637},
}
% NOTE(review): AUTHOR below has an empty surname (", P. G. R. S."), and the citation key starts with "_" for the same reason. This looks like a garbled export -- confirm the real author list against IRIS handle 16718.
@TECHREPORT{_1998_TECHREPORT_P_16718,
AUTHOR = {, P. G. R. S.},
TITLE = {Progetto BIBLOS: realizzazione del prototipo per la messa in linea con INTERNET della banca dati bibliografica dell'Istituto di Linguistica Computazionale},
YEAR = {1998},
ABSTRACT = {INTRODUZIONE Nel presente lavoro abbiamo cercato di illustrare la tipologia e il contenuto argomentativo del materiale documentario, le relative procedure di selezione, di registrazione e di scarto per arrivare alla costruzione del prototipo bibliografico del progetto BIBLOS. L'Istituto di Linguistica Computazionale (ILC) del Consiglio Nazionale delle Ricerche (CNR) afferisce al Comitato per le Scienze Storiche, Filosofiche e Filologiche. L' Istituto, nell'ambito della propria area disciplinare, gestisce il patrimonio documentario ed eroga i propri servizi in conformità a quanto previsto nel DPR n. 475/87 1 e nel DPR n. 417/95 2. La biblioteca dell'Istituto raccoglie e conserva: a) le pubblicazioni di consultazione generale o specializzate acquistate nell'ambito dell'attività scientifica del CNR, indispensabili per studi e ricerche; b) le pubblicazioni che riguardano la ricerca scientifica e tecnologica edita dal CNR o con il suo contributo o sotto il suo patrocinio. La biblioteca dell' Istituto ha quindi il compito di curare la raccolta e la catalogazione di tutto il materiale in suo possesso nonché quello di coordinare il servizio di informazione, mediante l'accesso alle banche dati, per rendere disponibile il recupero di documenti anche attraverso il ricorso alle procedure di prestito interbibliotecario. L'assolvimento di tali compiti e la necessità di soddisfare un'utenza esigente comportano una continua e attenta valutazione nell'acquisizione delle raccolte, di fatto spesso condizionata dal dinamismo dell'attività scientifica. Tale attività genera una letteratura spesso caratterizzata da rapida obsolescenza, benchè certi documenti possano essere richiesti anche dopo molti anni dalla loro pubblicazione, per il valore culturale e storico. Tutti questi fattori, non disgiunti dalla razionalizzazione dei fondi destinati alla biblioteca e dallo spazio fisico disponibile, determinano un'attenta valutazione dell'intera attività di gestione},
URL = {https://iris.cnr.it/handle/20.500.14243/16718},
}
@TECHREPORT{PARDELLI_1998_TECHREPORT_P_16698,
AUTHOR = {Pardelli, G.},
TITLE = {Verso la costruzione di un soggettario per il Progetto BIBLOS all'Istituto di Linguistica Computazionale},
YEAR = {1998},
ABSTRACT = {This document describes a methodology aimed at building a subject catalogue at the Institute for Computational Linguistics within the framework of the Biblos Project (Virtual Humanities Library of the National Research Council)},
KEYWORDS = {Subject Indexing, Cataloguing Documentation, Progetto BIBLOS},
PAGES = {1--6},
URL = {https://iris.cnr.it/handle/20.500.14243/16698},
}
@MISC{PARDELLI_1998_MISC_PS_193246,
AUTHOR = {Pardelli, G. and Sassi, M.},
TITLE = {I. L. C. Library},
YEAR = {1998},
ABSTRACT = {La stampa del catalogo dell'archivio librario dell'Istituto di Linguistica Computazionale I. L. C. è tratta dall'archivio elettronico. La registrazione del materiale bibliografico viene effettuata con il software CDS/ISIS dell'UNESCO. Tale sistema ci permette di descrivere il documento secondo gli standard internazionali. I dati bibliografici dell'archivio sono stati curati da Gabriella Pardelli, responsabile della Biblioteca dell'Istituto, le procedure informatiche relative all'indicizzazione e alla stampa complessiva del catalogo sono state effettuate da Manuela Sassi, Tecnologo dell'Istituto},
KEYWORDS = {Catalogo, Linguistica Computazionale},
PAGES = {I--253},
URL = {https://iris.cnr.it/handle/20.500.14243/193246},
PUBLISHER = {S. T. A. R. Servizio Tecnografico Area Ricerca CNR (Pisa, ITA)},
CONFERENCE_PLACE = {Pisa},
}
@ARTICLE{BEDINI_1997_ARTICLE_BBT_392172,
  AUTHOR   = {Bedini, L. and Bozzi, A. and Tonazzini, A.},
  TITLE    = {Digital techniques for character recognition in old documents},
  JOURNAL  = {ERCIM NEWS},
  VOLUME   = {28},
  YEAR     = {1997},
  ISSN     = {0926-4981},
  URL      = {https://iris.cnr.it/handle/20.500.14243/392172},
  KEYWORDS = {Digital techniques},
  ABSTRACT = {Two research projects have recently been activated by the Italian National Research Council (CNR) with the objective of designing and developing computerised tools to retrieve and restore textual information contained in ancient documents, accessed as digital images. The first, LAperLA, concerns old printed books, while the second, carried out in the framework of a CNR special project that aims at preserving our cultural heritage, regards old manuscripts. Both projects are aimed at implementing an integrated system that improves the quality of the images and, at the same time, activates optical character recognition (OCR) functions. Three CNR Institutes are involved in this activity: the Istituto di Linguistica Computazionale (ILC-Pisa), the Istituto di Elaborazione della Informazione (IEI-Pisa) and the Istituto di Applicazioni del Calcolo (IAC-Rome)},
}
@ARTICLE{MARCONI_1997_ARTICLE_MRR_216344,
AUTHOR = {Marconi, L. and Ratti, D. and Rolando, C.},
TITLE = {Il lessico scritto dei bambini},
YEAR = {1997},
ABSTRACT = {Il lessico dei bambini è più ricco e fantasioso di quanto normalmente si pensi. Certamente più ricco e vario del lessico usato dagli scrittori dei testi destinati all'infanzia, che sembrano temere di indirizzare la fantasia dei bambini verso coinvolgimenti conflittuali},
PAGES = {22--24},
URL = {https://iris.cnr.it/handle/20.500.14243/216344},
VOLUME = {19 (20-07-1997)},
ISSN = {0042-7349},
JOURNAL = {LA VITA SCOLASTICA},
}
@ARTICLE{MARIABOTTINO_1997_ARTICLE_MCF_227637,
AUTHOR = {Bottino, R. M. and Cutugno, P. and Furinghetti, F.},
TITLE = {PROGETTAZIONE E UTILIZZO DI UN SISTEMA IPERMEDIALE PER LA STORIA DELLA MATEMATICA},
YEAR = {1997},
ABSTRACT = {This paper concerns with a hypermedia system (IPER-3) that we have designed to deal with the three 'famous mathematical problems': the squaring of the circle, the duplication of the cube, the trisection of the angle. The aim of our work is to study the opportunities offered by this kind of technology to the presentation of mathematical topics both in teacher training courses and in classroom work. The paper is organized as follows. In the first part we explain our choice of a topic in field of the history of mathematics. In the second part we present the main features of the IPER-3 system, focusing on the technological choices that rely on interesting didactical issues. In the third part we analyse the experimentation of use of this hypermedia that we have carried out with university students. Eventually we outline some possible developments for such a kind of activities},
PAGES = {838--854},
URL = {https://iris.cnr.it/handle/20.500.14243/227637},
VOLUME = {20 (6)},
ISSN = {1123-7570},
JOURNAL = {L'INSEGNAMENTO DELLA MATEMATICA E DELLE SCIENZE INTEGRATE},
}
@ARTICLE{PETERS_1997_ARTICLE_PP_392214,
AUTHOR = {Peters, C. and Picchi, E.},
TITLE = {Across languages, across cultures: Issues in multilinguality and digital libraries},
YEAR = {1997},
ABSTRACT = {With the recent rapid diffusion over the international computer networks of world-wide distributed document bases, the question of multilingual access and multilingual information retrieval is becoming increasingly relevant. We briefly discuss just some of the issues that must be addressed in order to implement a multilingual interface for a Digital Library system and describe our own approach to this problem},
KEYWORDS = {Multilingual information access, Information Search and Retrieval. Search process},
URL = {http://www.scopus.com/inward/record.url?eid=2-s2.0-0012623761\&partnerID=q2rCbXpz},
VOLUME = {3 (5)},
ISSN = {1082-9873},
JOURNAL = {D-LIB MAGAZINE},
}
@INCOLLECTION{PETERS_1997_INCOLLECTION_PP_363538,
AUTHOR = {Peters, C. and Picchi, E.},
TITLE = {Reference corpora and lexicons for translators and translation studies},
YEAR = {1997},
ABSTRACT = {Translators, especially professional translators, need fast and flexible tools to assist them in the task of rendering a text written in one language as skilfully as possible in another. They require rapid and reliable access to authoritative sources of reference (both dictionaries and texts) that can provide them with guidance in selecting the most appropriate translation equivalent for a given word or expression used in a given context, to suit the particular text type being treated},
KEYWORDS = {Reference corpora},
PAGES = {247--275},
URL = {https://iris.cnr.it/handle/20.500.14243/363538},
PUBLISHER = {John Benjamins Publishing Company (Amsterdam/Philadelphia, USA)},
ISBN = {90-272-1629-0},
CONFERENCE_PLACE = {Amsterdam/Philadelphia},
}
@EDITORIAL{RATTI_1997_EDITORIAL_RB_220025,
AUTHOR = {Ratti, D. and Biorci, G.},
TITLE = {Sinonimi e contrari. Dizionario compatto dei sinonimi e dei contrari di Daniela Ratti e Grazia Biorci},
YEAR = {1997},
PAGES = {1--719},
URL = {https://iris.cnr.it/handle/20.500.14243/220025},
PUBLISHER = {Zanichelli SpA (Bologna, ITA)},
ISBN = {9788808165206},
CONFERENCE_PLACE = {Bologna},
}
@INPROCEEDINGS{PETERS_1997_INPROCEEDINGS_PP_364201,
AUTHOR = {Peters, C. and Picchi, E.},
TITLE = {Using linguistic tools and resources in cross-language retrieval},
YEAR = {1997},
ABSTRACT = {A System to process bilingual/multilingual text corpora is described. The system includes components for cross-language querying on parallel (ie translation equivalent) and comparable (ie domain-specific) collections of texts in more than one language. Both sets of procedures are dependent on lexical resources (bilingual lexical databases) and linguistic tools (morphological procedures). The System was originally designed to meet the requirements of various types of contrastive language studies. However, we are now studying applications to cross-language retrieval},
KEYWORDS = {Cross-language retrieval},
PAGES = {75--84},
URL = {https://iris.cnr.it/handle/20.500.14243/364201},
ISBN = {2912335027},
CONFERENCE_NAME = {DELOS-Cross-language information retrieval: third DELOS workshop},
}
@INPROCEEDINGS{PICCHI_1997_INPROCEEDINGS_PP_364101,
AUTHOR = {Picchi, E. and Peters, C.},
TITLE = {Using reference corpus evidence in computer-assisted translating},
YEAR = {1997},
ABSTRACT = {In recent years at the Istituto di Linguistica Computazionale, Pisa, we have worked on implementing a Translator's Workstation, designed to provide computational tools to assist the translator in the difficult task of identifying the most suitable cross-language equivalences for a given word in a given context. The two main components of the workstation consist of mono- and bilingual lexical databases and mono- and bilingual textual corpora together with sets of procedures to manage, query and analyse these resources in different ways, depending on the particular requirements of the user. At the workshop, we will present a proposal for a new addition to the workstation},
KEYWORDS = {Computer-assisted},
URL = {https://iris.cnr.it/handle/20.500.14243/364101},
CONFERENCE_NAME = {International Workshop of Corpus Use \& Learning to Translate: extended Abstract},
}
@INPROCEEDINGS{ROLANDO_1997_INPROCEEDINGS_RM_217024,
  AUTHOR = {Rolando, C. and Marconi, L.},
  TITLE  = {Standard Italian language and Mistakes in Essays Written by 6-20-Year-Old Primary School Children in Italy},
  YEAR   = {1997},
  URL    = {https://iris.cnr.it/handle/20.500.14243/217024},
}
@INPROCEEDINGS{PETERS_1997_INPROCEEDINGS_PP_366280,
AUTHOR = {Peters, C. and Picchi, E.},
TITLE = {Computational tools for cross-language querying and analysis},
YEAR = {1997},
ABSTRACT = {An abstract is not available},
KEYWORDS = {Cross-language, Information search and retrieval},
URL = {https://iris.cnr.it/handle/20.500.14243/366280},
CONFERENCE_NAME = {Fourth Nordic Symposium on Text-Based Contrastive Studies},
}
@TECHREPORT{ERJAVEC_1997_TECHREPORT_EM_198862,
  AUTHOR = {Erjavec, T. and Monachini, M.},
  TITLE  = {Specifications and notation for lexicon encoding},
  YEAR   = {1997},
  URL    = {https://iris.cnr.it/handle/20.500.14243/198862},
}
@MISC{BEDINI_1997_MISC_BBT_391375,
AUTHOR = {Bedini, L. and Bozzi, A. and Tonazzini, A.},
TITLE = {Digital techniques for characters recognition in old document},
YEAR = {1997},
ABSTRACT = {Two research projects have recently been activated by the Italian National Research Council (CNR) with the objective of designing and developing computerised tools to retrieve and restore textual information contained in ancient documents, accessed as digital images},
KEYWORDS = {Image Restoration, Image Segmentation, Image Processing and Computer Vision. Restoration, Image Processing and computer vision. Segmentation},
PAGES = {24},
URL = {https://iris.cnr.it/handle/20.500.14243/391375},
}
@ARTICLE{MARCONI_1996_ARTICLE_MR_216342,
AUTHOR = {Marconi, L. and Ratti, D.},
TITLE = {Se il bambino scrive luovo},
YEAR = {1996},
ABSTRACT = {In questo lavoro viene analizzata la distribuzione degli errori riferita a 5000 testi liberamente prodotti dai bambini di età compresa tra i 6 e 11 anni. La casistica degli errori è estremamente ampia e variegata: accanto ad errori di ortografia abbiamo trovato errori di concordanza tra le varie parti del discorso, errori sintattici e errori di tipo morfologico},
PAGES = {14--18},
URL = {https://iris.cnr.it/handle/20.500.14243/216342},
VOLUME = {3 (1-10-1996)},
ISSN = {0042-7349},
JOURNAL = {LA VITA SCOLASTICA},
}
@ARTICLE{PETERS_1996_ARTICLE_PP_364606,
AUTHOR = {Peters, C. and Picchi, E.},
TITLE = {A system for cross-language information retrieval},
YEAR = {1996},
ABSTRACT = {An abstract is not available},
KEYWORDS = {Information retrieval},
PAGES = {25--26},
URL = {https://iris.cnr.it/handle/20.500.14243/364606},
VOLUME = {27},
ISSN = {0926-4981},
JOURNAL = {ERCIM NEWS},
}
@INCOLLECTION{CALZOLARI_1996_INCOLLECTION_CM_141713,
  AUTHOR = {Calzolari, N. and Monachini, M.},
  TITLE  = {EAGLES Proposal for Morphosyntactic Standards: in View of a Ready-to-Use Package},
  YEAR   = {1996},
  ISBN   = {0-19-823626-3},
  URL    = {https://iris.cnr.it/handle/20.500.14243/141713},
}
@INPROCEEDINGS{CORAZZARI_1996_INPROCEEDINGS_CMRC_128435,
  AUTHOR = {Corazzari, O. and Monachini, M. and Roventini, A. and Calzolari, N.},
  TITLE  = {Speech Act and Perception Verbs. Generalization and Contrastive Aspects},
  YEAR   = {1996},
  ISBN   = {91-87850-14-1},
  URL    = {https://iris.cnr.it/handle/20.500.14243/128435},
}
@INPROCEEDINGS{PETERS_1996_INPROCEEDINGS_PPB_363117,
AUTHOR = {Peters, C. and Picchi, E. and Biagini, L.},
TITLE = {Parallel and comparable bilingual corpora in language teaching and learning},
YEAR = {1996},
ABSTRACT = {An abstract is not available},
KEYWORDS = {Language},
PAGES = {68--82},
URL = {https://iris.cnr.it/handle/20.500.14243/363117},
CONFERENCE_NAME = {Teaching and Language Corpora},
EDITOR = {Botley, S.},
}
@INPROCEEDINGS{PICCHI_1996_INPROCEEDINGS_PP_360567,
AUTHOR = {Picchi, E. and Peters, C.},
TITLE = {Cross language information retrieval: a system for comparable corpus querying},
YEAR = {1996},
ABSTRACT = {We describe a system that has been designed to process and query comparable text corpora, i. e. collections of texts from pairs or multiples of languages referring to the same domain. The first version of the system has been developed to retrieve natural language lexical equivalents from sets of sublanguage texts in English and Italian; given the necessary lexical and morphological components it could be extended to cover other languages. The initial implementation was made with the needs of language scholars in mind; however, the system could have applications in the fields of terminology and bilingual/multilingual document retrieval},
KEYWORDS = {Language information retrieval},
PAGES = {24-33},
URL = {https://iris.cnr.it/handle/20.500.14243/360567},
CONFERENCE_NAME = {Workshop on Cross-Linguistic Information Retrieval},
}
@TECHREPORT{MONACHINI_1996_TECHREPORT_MC_198792,
AUTHOR = {Monachini, M. and Calzolari, N.},
TITLE = {Synopsis and comparison of morphosyntactic phenomena encoded in lexicons and corpora: A common proposal and applications to European languages},
YEAR = {1996},
ABSTRACT = {Computational lexicons represent an area where a pressing need is felt for the provision of basic large-scale resources which must be actually reusable, interchangeable, shareable and also integrable in a multilingual environment. In terms of costs and effort it is quite expensive to produce such resources in detail. In the construction of large-scale resources and in the definition of annotation strategies reusability is an essential requisite to pursue. The Morphosyntax area was among the first in which EAGLES concentrated its efforts because it is a more mature area where a lot of work has already been done: many systems, approaches and data exist for many languages; this constitutes a solid platform for making reasonable and acceptable proposals for standards},
URL = {https://iris.cnr.it/handle/20.500.14243/198792},
}
@MISC{PETERS_1996_MISC_PP_390684,
AUTHOR = {Peters, C. and Picchi, E.},
TITLE = {Bilingual reference corpora for translators and translation studies},
YEAR = {1996},
ABSTRACT = {A recent trend in corpus linguistics is the construction of bilingual (or multilingual) reference corpora. So far most studies on bilingual text archives have been on parallel corpora, i. e. sets of translationally equivalent texts. Such corpora provide valuable in-depth evidence of how texts written in one language can be rendered in another according to contextual factors, such as style, register, domain, etc., and are thus important sources of data when studying the translation process. However, a criticism made of the results of analyses based on these corpora is that a translation is always influenced by the source text and, therefore, the target language text(s) can never be considered a true representation of that language in usage. It has been suggested that a more reliable source for certain studies, e. g. how a particular concept is expressed independently in different languages, is a comparable corpus. Comparable archives are sets of texts from pairs or multiples of languages that concern a given domain and can be contrasted because of their common features. However, the development of procedures to query data from this kind of corpus is far more problematic than when interrogating parallel archives as it is difficult to identify automatically equivalent expressions in the different languages. We have studied a solution to this problem. We will present procedures that have been developed at the Istituto di Linguistica Computazionale, Pisa, to construct and query both parallel and comparable bilingual text corpora and to extract significant data for translation purposes and contrastive textual studies, giving examples of the different types of results that can be obtained. The procedures form part of an integrated mono-and bilingual text and lexical database system, implemented in a prototypal version at the Institute},
KEYWORDS = {Textual Databases, Bilingual Reference Corpora, Contrastive Textology},
URL = {https://iris.cnr.it/handle/20.500.14243/390684},
CONFERENCE_NAME = {International Translation Studies Conference Unity in Diversity?},
}
@ARTICLE{MONACHINI_1995_ARTICLE_M_118646,
AUTHOR = {Monachini, M.},
TITLE = {Morphosyntactic Annotation},
YEAR = {1995},
URL = {https://iris.cnr.it/handle/20.500.14243/118646},
ISSN = {0392-6907},
JOURNAL = {LINGUISTICA COMPUTAZIONALE},
}
@ARTICLE{PETERS_1995_ARTICLE_PP_386213,
AUTHOR = {Peters, C. and Picchi, E.},
TITLE = {Electronic dictionaries},
YEAR = {1995},
ABSTRACT = {An abstract is not available},
KEYWORDS = {Electronic dictionaries, Content Analysis and Indexing. Dictionaries},
PAGES = {16-16},
URL = {https://iris.cnr.it/handle/20.500.14243/386213},
VOLUME = {20},
ISSN = {0926-4981},
JOURNAL = {ERCIM NEWS},
}
@INPROCEEDINGS{CALZOLARI_1995_INPROCEEDINGS_CM_118633,
AUTHOR = {Calzolari, N. and Monachini, M.},
TITLE = {Standards in Morphosyntax: Towards a Ready-to-use Package},
YEAR = {1995},
URL = {https://iris.cnr.it/handle/20.500.14243/118633},
}
@INPROCEEDINGS{LAUDANNA_1995_INPROCEEDINGS_LTBBM_211265,
AUTHOR = {Laudanna, A. and Thornton, A. M. and Brown, G. and Burani, C. and Marconi, L.},
TITLE = {Un corpus dell'italiano scritto contemporaneo dalla parte del ricevente},
YEAR = {1995},
ABSTRACT = {In this paper we describe the criteria we adopted for the selection of a corpus composed of 3,000,000 words from Italian contemporary written texts. The corpus will give rise to a frequency dictionary, which should have two main characteristics: i) representativeness of the Italian texts which are actually read, rather than of all possible written texts, ii) usefulness for psycholinguistic research},
KEYWORDS = {Corpora, Frequency, Frequency Dictionary, Psycholinguistics},
PAGES = {103-109},
URL = {https://iris.cnr.it/handle/20.500.14243/211265},
PUBLISHER = {CISU (Roma, ITA)},
ISBN = {8879751603},
CONFERENCE_NAME = {JADT 1995 III Giornate Internazionali di ANALISI STATISTICA dei DATI TESTUALI},
CONFERENCE_PLACE = {Roma},
BOOKTITLE = {JADT 1995 III Giornate Internazionali di ANALISI STATISTICA dei DATI TESTUALI},
EDITOR = {Bolasco, S. and Lebart, L. and Salem, A.},
}
@INPROCEEDINGS{MARCONI_1995_INPROCEEDINGS_MMRC_205219,
AUTHOR = {Marconi, L. and Morgavi, G. and Ratti, D. and C Rolando, G. M.},
TITLE = {Hybrid System for Natural Language Processing},
YEAR = {1995},
URL = {https://iris.cnr.it/handle/20.500.14243/205219},
ISBN = {0-88986-222-2},
}
@INPROCEEDINGS{MARCONI_1995_INPROCEEDINGS_MRC_205232,
AUTHOR = {Marconi, L. and Ratti, D. and C Rolando, G. M.},
TITLE = {Analisi statistica della distribuzione degli errori in un corpus costituito da testi scritti dai bambini della scuola elementare},
YEAR = {1995},
URL = {https://iris.cnr.it/handle/20.500.14243/205232},
}
@INPROCEEDINGS{MORGAVI_1995_INPROCEEDINGS_MMRC_205230,
AUTHOR = {Morgavi, G. and Marconi, L. and Ratti, D. and C Rolando, G. M.},
TITLE = {Disambiguazione delle parole italiane omografe attraverso reti neurali artificiali},
YEAR = {1995},
URL = {https://iris.cnr.it/handle/20.500.14243/205230},
ISBN = {88-7975-159-X},
}
@INPROCEEDINGS{MORGAVI_1995_INPROCEEDINGS_MMRR_205211,
AUTHOR = {Morgavi, G. and Marconi, L. and Ratti, D. and Rolando, C.},
TITLE = {Italian word disambiguation by using neural network},
YEAR = {1995},
URL = {https://iris.cnr.it/handle/20.500.14243/205211},
ISBN = {0-88986-212-5},
}
@INPROCEEDINGS{PETERS_1995_INPROCEEDINGS_PP_390696,
AUTHOR = {Peters, C. and Picchi, E.},
TITLE = {Capturing the comparable: a system for querying comparable text corpora},
YEAR = {1995},
ABSTRACT = {We discuss the importance of bilingual and multilingual text corpora in many types of cross language investigations and illustrate the differences between parallel and comparable text archives. The advantages of comparable over parallel data for certain kinds of contrastive linguistic studies are outlined. A prototype version of a system for querying comparable text archives is then described and examples of the first results are given. The system will form part of an integrated workstation for mono-and bilingual lexical and text database management and interrogation under development at the Istituto di Linguistica Computazionale, Pisa},
KEYWORDS = {Textual Databases, Bilingual Reference Corpora, Contrastive Textology, Database management, Information Search and Retrieval},
PAGES = {247-254},
URL = {https://iris.cnr.it/handle/20.500.14243/390696},
CONFERENCE_NAME = {3. Giornate Internazionali di Analisi Statistica dei Dati Testuali = 3rd international conference of Statistical analysis on Textual data = 3. Journ},
}
@INPROCEEDINGS{ROVENTINI_1995_INPROCEEDINGS_RM_128392,
AUTHOR = {Roventini, A. and Monachini, M.},
TITLE = {Perception nouns in the Italian Reference Corpus: argument structure and collocational uses},
YEAR = {1995},
URL = {https://iris.cnr.it/handle/20.500.14243/128392},
}
@TECHREPORT{BONITO_1995_TECHREPORT_BDES_394040,
AUTHOR = {Bonito, A. and Del Chicca, A. and Enea, A. and Sbrana, A.},
TITLE = {Progetto comunicazioni digitali a basso costo radio-gateway},
YEAR = {1995},
ABSTRACT = {An abstract is not available},
KEYWORDS = {Radio-gateway},
PAGES = {22},
URL = {https://iris.cnr.it/handle/20.500.14243/394040},
}
@TECHREPORT{PARDELLI_1995_TECHREPORT_P_17314,
AUTHOR = {Pardelli, G.},
TITLE = {Verso una catalogazione dei testi della Biblioteca dell'ILC},
YEAR = {1995},
ABSTRACT = {Il report focalizza la tipologia del materiale bibliografico e la scelta dei criteri di soggettazione per la LC},
KEYWORDS = {Linguistica Computazionale, soggetti argomentativi},
PAGES = {1-12},
URL = {https://iris.cnr.it/handle/20.500.14243/17314},
}
@TECHREPORT{PICCHI_1995_TECHREPORT_PP_393603,
AUTHOR = {Picchi, E. and Peters, C.},
TITLE = {Specification of tools and user interface},
YEAR = {1995},
ABSTRACT = {This document is the draft of Deliverable 1. 1. 1 produced for September 1994. No revisions to this version have been considered appropriate for Milestone B since from a first analysis, it seems that not all the tools developed so far meet the specifications laid down in the first drafts of this document taking into account the needs of the four User Categories defined in Section 1. 1. It thus appears that more discussion is needed between project partners in order to guarantee that one of the primary objectives of Multext is achieved: the development of a totally integrated set of corpus processing and exploitation tools. However, in order to avoid erroneous interpretations of our task we should like to state firmly here certain guiding principles which we feel cannot be rejected or ignored in the development of the tools. The aim of Multext is to produce not only a multi-lingual language reference corpus consisting of sets of parallel and comparable texts in six European languages, but a complex set of efficient and flexible corpus tools. These tools must be designed to be easy to use for a typically non-expert user, working in some sector of the humanities, and must provide a full range of functions for text querying and analysis, implemented with a common query language. This is why in our first versions of 1. 1. 1 considerable attention was given to the Search and Retrieval functions (section 9), which have been defined in particular detail, and the User Interface (section 10) including definition of higher level tools, essential to provide users with efficient, flexible, easy-to-use tools. The modular Lego development adopted by the project clearly implies a cohesion in the tool design and implementation between the different partners so that a smooth, integrated stream of functionalities can be guaranteed. 
From the beginning of the project, the leaders of this task have attempted to stimulate on-going discussion and exchange of opinions with the developers with the objective of promoting a smooth, coherent development, thus ensuring total integration between the different tools and consensus in the intentions and scopes of the individual products. Unfortunately, this effort has proved only partially successful. At the present moment, certain tools appear to be following an independent line. We hope that it will be possible to smooth over what should be only a momentary lack of accordance in the near future and that the final version of D 1. 1. 1 will be reflected in the actual results of the project},
KEYWORDS = {User interface, Expert system tools and techniques},
PAGES = {37},
URL = {https://iris.cnr.it/handle/20.500.14243/393603},
}
@ARTICLE{BINDI_1994_ARTICLE_BCMPZ_115891,
AUTHOR = {Bindi, R. and Calzolari, N. and Monachini, M. and Pirrelli, V. and Zampolli, A.},
TITLE = {Corpora and Computational Lexica: Integration of Different Methodologies of Lexical Knowledge Acquisition},
YEAR = {1994},
ABSTRACT = {An attempt to integrate different techniques and various perspectives on lexical knowledge acquisition from text corpora is illustrated. In this program we use three distinct methodologies to handle text data, summarized as follows: (1) Simple and traditional stochastic techniques working on pairs of words. (2) A lexicographic approach guided by the techniques mentioned in Section 1, aiming at a formal description of sense disambiguation in terms of rules. (3) More complex and sophisticated statistical methods working on sets of words (possibly belonging to the same semantic field), which allow us to gain a new perspective on the problem of sense disambiguation. The three approaches are complementary to each other and can be contextually used. The overall objective of our work is to try to integrate data and information coming from different sources, i. e. machine-readable dictionaries, text corpora, linguists' or lexicographers' knowledge, within a computational lexicon. We stress the necessity of convergence of (1) lexical and textual projects, (2) computational and traditional lexicography, and (3) statistical and rule based approaches},
URL = {https://iris.cnr.it/handle/20.500.14243/115891},
DOI = {10.1093/llc/9.1.29},
ISSN = {0268-1145},
JOURNAL = {LITERARY \& LINGUISTIC COMPUTING},
}
@ARTICLE{CALZOLARIZAMORANI_1994_ARTICLE_CP_364183,
AUTHOR = {Calzolari Zamorani, N. and Peters, C.},
TITLE = {Lexical knowledge bases},
YEAR = {1994},
ABSTRACT = {One of the major current requirements in real world natural language processing applications is the construction of suitably structured and sufficiently exhaustive computational lexicons or lexical knowledge bases (LKBs). However, this is an extremely difficult, time consuming and expensive task, especially if it is necessary to start from scratch. For this reason, in recent years, researchers have begun to examine the potential of already existing resources, such as machine readable dictionaries and text archives, to see whether it is possible to develop procedures that can capture different kinds of lexical information from them, representing it in a computationally tractable and reusable formal framework},
KEYWORDS = {Lexical databases, Information storage and retrieval. Dictionaries},
PAGES = {10-11},
URL = {https://iris.cnr.it/handle/20.500.14243/364183},
VOLUME = {18},
ISSN = {0926-4981},
JOURNAL = {ERCIM NEWS},
}
@ARTICLE{MARINAI_1994_ARTICLE_MPP_366871,
AUTHOR = {Marinai, E. and Peters, C. and Picchi, E.},
TITLE = {A prototype system for the semi-automatic sense linking and merging of mono-and bilingual LDBs},
YEAR = {1994},
ABSTRACT = {This paper describes a method for the semi-automatic linking of lexical databases (LDBs) based on different source dictionaries and their partial merging. Equivalent entries from different dictionaries are mapped together and links are created between them at the sense level. The results can be modified interactively by the user and saved to form part of a new merged LDB whose entries will contain all the information included in the separate source LDBs. The aim is to provide a tool which makes it easier to compare and study lexical data derived from different sources and also to permit linguistic and lexical analyses of much richer data},
KEYWORDS = {Lexical databases, Databases, Database management, Information search and retrieval},
PAGES = {97-108},
URL = {https://iris.cnr.it/handle/20.500.14243/366871},
VOLUME = {3},
JOURNAL = {RESEARCH IN HUMANITIES COMPUTING},
}
@BOOK{MARCONI_1994_BOOK_MORT_220288,
AUTHOR = {Marconi, L. and Ott, M. and Ratti, D. and Tavella, M.},
TITLE = {Lessico elementare},
YEAR = {1994},
ABSTRACT = {Dati statistici sull'italiano scritto e letto dai bambini delle elementari. Le parole che i bambini usano sono l'immagine delle loro conoscenze, della loro vivacità intellettuale, della loro voglia di apprendere e di comunicare. Il patrimonio linguistico e la competenza sulla lingua orale e scritta sono uno degli elementi fondamentali della cultura moderna, scolastica ed extrascolastica. Su questi presupposti gli autori del Lessico Elementare hanno compilato un dizionario di frequenza aggiornato e completo che costituisse da un lato un saldo punto di partenza per ricerche linguistiche e dall'altro uno strumento di lavoro per tutti gli operatori del settore formazione (insegnanti, autori e editori di libri per bambini, genitori)},
PAGES = {447},
URL = {https://iris.cnr.it/handle/20.500.14243/220288},
PUBLISHER = {Zanichelli (Bologna, ITA)},
ISBN = {880809538X},
CONFERENCE_PLACE = {Bologna},
}
@INCOLLECTION{COTONESCHI_1994_INCOLLECTION_CM_141707,
AUTHOR = {Cotoneschi, P. and Monachini, M.},
TITLE = {An empirical experience on the utilization of the Italian Reference Corpus in Meaning Analysis},
YEAR = {1994},
ABSTRACT = {The spirit of the paper can be summarized in the sentence: "Meaning is the product of context". Our experience is founded on three basic assumptions: context is crucial to restrict and identify the senses of a word and to disambiguate them; meaning is a composite net of connections between word-token and the context; textual corpora are a significant source of knowledge for a contextual approach in sense distinctions},
URL = {https://iris.cnr.it/handle/20.500.14243/141707},
ISBN = {0-19-824064-3},
}
@INPROCEEDINGS{MONACHINI_1994_INPROCEEDINGS_MR_118624,
AUTHOR = {Monachini, M. and Roventini, A.},
TITLE = {Italian Audition Verbs: A Corpus-and Frame-based analysis},
YEAR = {1994},
ABSTRACT = {The study described in this paper was carried out within the framework of the LRE-DELIS project, which proposes a corpus-based lexicographical approach and frame-based semantic theory in dictionary construction},
URL = {https://iris.cnr.it/handle/20.500.14243/118624},
ISBN = {90-900-7537-2},
}
@INPROCEEDINGS{PETERS_1994_INPROCEEDINGS_PFMZ_364141,
AUTHOR = {Peters, C. and Federici, S. and Montemagni, S. and Zamorani, C. N.},
TITLE = {From machine readable dictionaries to lexicons for NLP: the cobuild dictionaries-a different approach},
YEAR = {1994},
ABSTRACT = {We describe the results of a syntactic-semantic parser for Cobuild dictionary definitions. Unlike previous work on the automatic analysis of machine readable dictionaries, the particular structure of the Cobuild definition allows us to derive information that classifies the lexical item mainly in terms of the selectional restrictions or preferences encoded on its arguments. The resulting formalized lexical entries contain data that has generally been lacking in other lexical representations but which is expected to be very useful in a wide range of NLP purposes. We show how this information can be used in dictionary sense disambiguation by creating links throughout the lexicon both on the paradigmatic and the syntagmatic axes},
KEYWORDS = {Lexical databases, Information storage and retrieval. Dictionaries},
PAGES = {147-157},
URL = {https://iris.cnr.it/handle/20.500.14243/364141},
CONFERENCE_NAME = {6th International Congress on Lexicography},
BOOKTITLE = {Euralex 1994 Proceedings},
EDITOR = {Martin, W.},
}
@INPROCEEDINGS{PICCHI_1994_INPROCEEDINGS_PPM_366279,
AUTHOR = {Picchi, E. and Peters, C. and Marinai, E.},
TITLE = {Strumenti computazionali per l'apprendimento delle lingue: una stazione di lavoro integrata},
YEAR = {1994},
ABSTRACT = {Presentiamo un prototipo di stazione di lavoro progettata per essere uno strumento efficiente e facile da usare per coloro che apprendono una seconda lingua. La stazione di lavoro è costituita da due componenti principali: una base di dati lessicali mono e bilingui e un sistema testuale per l'interrogazione di corpora testuali mono e bilingui. Il componente lessicale è corredato di un sistema di interrogazione per l'accesso ai dati dei dizionari monolingui e bilingui (nel prototipo presentato sono utilizzate come lingue di riferimento l'italiano e l'inglese). L'altro componente permette l'interrogazione degli archivi testuali mono e bilingui. Una procedura automatica è in grado di rendere "paralleli" due testi, uno traduzione dell'altro, permettendo una interrogazione simultanea di tali testi. La stazione di lavoro funziona su personal computer operativo MS/DOS e con un'interfaccia user friendly di tipo Windows},
KEYWORDS = {Language, Arts and humanities},
PAGES = {189-200},
URL = {https://iris.cnr.it/handle/20.500.14243/366279},
CONFERENCE_NAME = {Didamatica '94. Informatica per la didattica},
BOOKTITLE = {Atti-Lavori scientifici},
EDITOR = {Andronico, A. and Casadei, G. and Sacerdoti, G.},
}
@TECHREPORT{BARNBROOK_1994_TECHREPORT_BCFHMPSS_424362,
AUTHOR = {Barnbrook, G. and Calzolari, N. and Federici, S. and Hoelter, M. and Montemagni, S. and Peters, C. and Schnelle, H. and Sinclair, J.},
TITLE = {ET10/51-Deliverable 8: Evaluation Report},
YEAR = {1994},
ABSTRACT = {The objective of the work in Pisa has been to translate and produce instantiations of the syntactically parsed definitions of the Cobuild dictionary: provided by Birmingham in a Typed Feature Structure formalism. However, as described in Methodology above, our results have been produced at two different levels: intermediate results; final results in the form of TFS entries. In the following, we will discuss briefly the possible applications of these different results for the three user types recognized in the introduction to this section: i. Human user ii. Human user-assisted by the machine iii. The machine Obviously, the discussion here below refers entirely to the results that would be obtained once the parser has been applied to the whole dictionary},
KEYWORDS = {Language, Computational linguistics, Formal Definitions and Theory},
PAGES = {38},
URL = {https://iris.cnr.it/handle/20.500.14243/424362},
}
@TECHREPORT{CALZOLARI_1994_TECHREPORT_CFMP_424783,
AUTHOR = {Calzolari, N. and Federici, S. and Montemagni, S. and Peters, C.},
TITLE = {ET-10/51-Final Report: Par. 3-Extracting, representing and using syntactic-semantic information from cobuild definitions},
YEAR = {1994},
ABSTRACT = {In May 1992 a new research project brought together the authors of this report. With the help and support of several other people and institutions, they worked steadily for two years, trying to improve the design and building of machine-usable lexicons, for automatic translation and many other applications. The starting point was clear. Around 1989 Helmut Schnelle of the Ruhr-Universität Bochum became interested in the way in which words were defined in a new kind of dictionary called Cobuild. He thought that since they were couched in sentences of apparently ordinary English, and had distinctive and repetitive shapes according to their meanings, it should be possible to represent them in logical form by means of regular rules},
KEYWORDS = {Language, Computational linguistics, Formal Definitions and Theory, Sema},
PAGES = {162},
URL = {https://iris.cnr.it/handle/20.500.14243/424783},
}
@ARTICLE{MONACHINI_1993_ARTICLE_MP_118585,
AUTHOR = {Monachini, M. and Picchi, E.},
TITLE = {Computational Lexicography: A Query System for Tagged Corpora},
YEAR = {1993},
URL = {https://iris.cnr.it/handle/20.500.14243/118585},
ISSN = {1216-8076},
JOURNAL = {ACTA LINGUISTICA HUNGARICA},
}
@ARTICLE{PETERS_1993_ARTICLE_PP_371451,
AUTHOR = {Peters, C. and Picchi, E.},
TITLE = {Computational tools for the translator: an integrated workstation},
YEAR = {1993},
ABSTRACT = {Translators need fast and flexible computational tools to assist them in the task of rendering a text written in one language as skillfully as possible in another. Such tools must be easy-to-use, relatively economic and, wherever possible, portable, as many translators are free-lancers and much translating work is done at home. In the paper, we describe a prototype workstation that has been designed for the translator bearing these requirements in mind},
URL = {https://iris.cnr.it/handle/20.500.14243/371451},
}
@TECHREPORT{CALZOLARI_1993_TECHREPORT_CFPMS_363145,
AUTHOR = {Calzolari, N. and Federici, S. and Peters, C. and Montemagni, S. and Spanu, A.},
TITLE = {Extracting syntactic-semantic information from cobuild definitions and representing it in TFS},
YEAR = {1993},
ABSTRACT = {In this part of the Deliverable, we present (i) the work in Pisa on the design and development of a specialised parser to extract syntactic-semantic information from the definitions contained in the Cobuild Student's Dictionary and (ii) a preliminary proposal for the mapping of such information onto a TFS representation system. The work discussed here concentrates on the analysis and extraction of information from the left hand side (LHS) of the definition and the parser must be considered as a first prototype version, to be further refined and extended as our work progresses. Similarly, once we have been able to assess the first results of the parser, it will be possible to define the most appropriate type system to represent the information extracted from this side of the definition},
KEYWORDS = {Representation languages, Knowledge Representation Formalisms and Methods},
URL = {https://iris.cnr.it/handle/20.500.14243/363145},
}
@TECHREPORT{MONACHINI_1993_TECHREPORT_MP_365921,
AUTHOR = {Monachini, M. and Peters, C.},
TITLE = {Survey of tools for corpus-based lexical description},
YEAR = {1993},
ABSTRACT = {This survey deals with tools and computational approaches for corpus based lexicon building. It concentrates on the tasks of the "chain" of work items of corpus based lexicography for which DELIS will implement tools. The goal of this survey is not to give a full picture of corpus handling tools or of lexicographic workstations, but rather to point to those realizations inside and outside the DELIS consortium which are prominent models for DELIS tool building work. Secondly, the tools available at the DELIS members' sites will be presented and an assessment will be made concerning the feasibility of an integration of the newly built DELIS tools with these tools existing at different sites. This is most relevant in the area of annotation of corpora. The corpus exploration work in DELIS, in view of lexicon construction, must rely on the input it receives for different languages. Consequently, the tools available for each language, the type of output they produce and the possibility of interfacing these tools with elements of the DELIS toolbox must be described},
KEYWORDS = {Lexical semantics, Natural Language Processing},
URL = {https://iris.cnr.it/handle/20.500.14243/365921},
}
@TECHREPORT{MONACHINI_1993_TECHREPORT_MPP_365934,
AUTHOR = {Monachini, M. and Peters, C. and Picchi, E.},
TITLE = {The Pisa tools. A survey of computational tools for corpus-based lexicon building},
YEAR = {1993},
ABSTRACT = {In this report, we give a description of the different tools which have been designed and implemented at Pisa for (i) corpus construction, management, annotation and querying, and (ii) dictionary and lexical database acquisition and processing activities. Almost all of the modules described belong to the PiSystem, a fully integrated modular set of tools, developed over the last ten years at the ILC to meet the various needs of literary and linguistic computing. Most of these tools are now being integrated into a Workstation that provides functions offering online access to both mono-and bilingual text corpora and lexical databases for in-depth search operations and analyses},
KEYWORDS = {Lexical semantics, Natural Language Processing},
PAGES = {1-35},
URL = {https://iris.cnr.it/handle/20.500.14243/365934},
}
@TECHREPORT{PETERS_1993_TECHREPORT_PFMC_363132,
AUTHOR = {Peters, C. and Federici, S. and Montemagni, S. and Calzolari, N.},
TITLE = {Processing the ITU vocabulary: revisions and adaptations to the Pisa syntactic-semantic parser},
YEAR = {1993},
ABSTRACT = {The first version of the Pisa syntactic-semantic parser was described in detail in Deliverable 4, Section 2 and Appendices 2, 3, and 4. The scope of this report is to discuss the testing of the parser on the sample set of vocabulary which has been selected from the ITU Corpus (see Deliverable 6. 1) and to illustrate the revisions and extensions that are now being implemented. The report therefore concentrates on presenting analysis and extraction activities. We need to specify clearly all the kinds of information that we can extract from the Cobuild definitions before completing the description of the type system that will be used to represent them (to appear in Deliverable 7). Our parser takes as input the syntactically parsed definitions from Birmingham (referred to as the Birmingham input from now on) and analyses them, using complex pattern matching techniques, in order to derive and extract syntactic and semantic information. While the testing of the first version has confirmed the validity of the core procedures, it is clear that a strategy based on string matching must be tested over a relatively large sample of data before we can identify all the potentially significant markers that permit us to extract meaningful information. This means that, at least in the early stages, each time we test the parser over new samples of definitions, we expect to have to add to the basic set of rules. This report must thus be considered a description of work in progress. When discussing the changes that are now being implemented, continual reference will be made to the description of the first version of the parser presented in Deliverable 4, and to the templates used to represent the information extracted from the definitions. Examples of the new revised templates are given in the Appendix},
KEYWORDS = {Semantic, Knowledge Representation Formalisms and Methods},
PAGES = {1-17},
URL = {https://iris.cnr.it/handle/20.500.14243/363132},
}
@INPROCEEDINGS{MARINAI_1992_INPROCEEDINGS_MPP_398508,
AUTHOR = {Marinai, E. and Peters, C. and Picchi, E.},
TITLE = {Bilingual reference corpora: creation, querying, applications},
YEAR = {1992},
ABSTRACT = {The paper discusses the importance of bilingual reference corpora as valid sources of real-world renderings of texts written in one language (L1) in a second (L2) and illustrates their potential for exploitation in various kinds of crosslanguage studies. A system that has been developed for the creation, management and interrogation of such corpora is presented and the integration of this system in a Workstation providing facilities to query and extract information from both mono-and bilingual text archives and lexical databases is described},
KEYWORDS = {Bilingual reference corpora},
PAGES = {221-228},
URL = {https://iris.cnr.it/handle/20.500.14243/398508},
CONFERENCE_NAME = {Complex '92},
}
@INPROCEEDINGS{MONACHINI_1992_INPROCEEDINGS_MP_118573,
AUTHOR = {Monachini, M. and Picchi, E.},
TITLE = {Tagged Corpora: A Query System},
YEAR = {1992},
URL = {https://iris.cnr.it/handle/20.500.14243/118573},
}
@INPROCEEDINGS{PICCHI_1992_INPROCEEDINGS_PPM_398506,
AUTHOR = {Picchi, E. and Peters, C. and Marinai, E.},
TITLE = {A translator's workstation},
YEAR = {1992},
ABSTRACT = {A description is given of the present state of development of a workstation that has been designed to provide the translator with efficient and easy-to-use computational tools. The aim is to offer translators fast and flexible on-line access to existing dictionary databases and bilingual text archives and also to supply them with facilities for updating, adding to and personalizing the system data archives with their own material},
KEYWORDS = {translator's workstation},
PAGES = {972--976},
URL = {https://iris.cnr.it/handle/20.500.14243/398506},
CONFERENCE_NAME = {COLING-92},
}
@INPROCEEDINGS{PICCHI_1992_INPROCEEDINGS_PPM_398512,
AUTHOR = {Picchi, E. and Peters, C. and Marinai, E.},
TITLE = {The Pisa lexicographic workstation: the bilingual components},
YEAR = {1992},
ABSTRACT = {The main components of the Pisa Lexicographic Workstation are a full text retrieval system and a lexical database system: each system incorporates procedures that have been implemented to meet the specific needs of the lexicographer. The paper describes the recent tailoring of existing modules and the development of new ones with bilingual lexicography in mind. The aim is to provide a flexible, user friendly system that can be employed in all stages of dictionary compilation, from the acquisition of citation material to the formatting of the entry for printing},
KEYWORDS = {Computational lexicography, Computer-aided lexicography, Bilingual lexicography, Bilingual lexical databases, Parallel text retrieval, acm: J.5 Arts and Humanities},
PAGES = {277--285},
URL = {https://iris.cnr.it/handle/20.500.14243/398512},
VOLUME = {1},
CONFERENCE_NAME = {EURALEX '92},
}
@TECHREPORT{PETERS_1992_TECHREPORT_PR_394898,
  AUTHOR   = {Peters, C. and Roventini, A.},
  TITLE    = {Acquilex: computational model of the dictionary entry},
  YEAR     = {1992},
  ABSTRACT = {Printed dictionary entries are highly structured and very complex pieces of text; the information content depends to a large extent on features of layout and the use of a metalanguage, which is generally (but not always completely) explained in the Introduction and User Notes at the beginning of the dictionary. The entry thus contains a mixture of explicit and implicit information interspersed with codes for type-setting and formatting. However, in a computational model of the entry, the lexical information must be extracted from the rest, interpreted and represented explicitly. At the same time, it is useful to maintain a trace of the entry structure, represented in the printed version by means of particular typographic conventions},
  KEYWORDS = {Acquilex},
  URL      = {https://iris.cnr.it/handle/20.500.14243/394898},
}
@INPROCEEDINGS{BINDI_1991_INPROCEEDINGS_BCMP_117878,
  AUTHOR = {Bindi, R. and Calzolari, N. and Monachini, M. and Pirrelli, V.},
  TITLE  = {Lexical Knowledge Acquisition from Textual Corpora: A Multivariate Statistic Approach as an Integration to Traditional Methodologies},
  YEAR   = {1991},
  URL    = {https://iris.cnr.it/handle/20.500.14243/117878},
}
@INPROCEEDINGS{COTONESCHI_1991_INPROCEEDINGS_CM_118558,
  AUTHOR = {Cotoneschi, P. and Monachini, M.},
  TITLE  = {An Empirical Experience on the Utilization of the Italian Corpus in Meaning Analysis},
  YEAR   = {1991},
  URL    = {https://iris.cnr.it/handle/20.500.14243/118558},
}
@INPROCEEDINGS{MARCONI_1991_INPROCEEDINGS_MR_19985,
AUTHOR = {Marconi, L. and Ratti, D.},
TITLE = {Aplicaciones de redes neuronales al lenguaje natural},
YEAR = {1991},
ABSTRACT = {In the context of current connectivist theories we present a neural network simulating some language learning phenomena, i.e. synonyms, plural, recognition of semantic field. The performance of back-propagation algorithm for such net is computed for specific data. Finally we propose a coding scheme to language application},
PAGES = {699--710},
URL = {https://iris.cnr.it/handle/20.500.14243/19985},
PUBLISHER = {PPU, S. A (Barcelona, ESP)},
ISBN = {84-7665-867-2},
CONFERENCE_NAME = {VI Congreso de Lenguajes Naturales y Lenguajes Formales},
CONFERENCE_PLACE = {Barcelona},
BOOKTITLE = {Lenguajes Naturales y Lenguajes Formales},
EDITOR = {Martín Vide, C.},
}
@INPROCEEDINGS{MARINAI_1991_INPROCEEDINGS_MPP_425240,
AUTHOR = {Marinai, E. and Peters, C. and Picchi, E.},
TITLE = {BILINGUAL REFERENCE CORPORA-A SYSTEM FOR PARALLEL TEXT RETRIEVAL},
YEAR = {1991},
ABSTRACT = {A system for the automatic creation and retrieval of parallel concordances from a Bilingual Reference Corpus is described. At present, the system runs on a test set of Italian/English 'bilingual' texts. A description is given of the different stages of the procedure which aligns and links equivalent texts in the two languages and of the way in which the query system uses these links to construct parallel contexts. The procedure uses a number of the components of the PiSystem, an integrated set of tools for text processing and analysis, including morphological analyzers and generators, and monolingual and bilingual lexical database systems. The user can use the system to query either of the two sets of texts (Italian and English) and, for any form or cooccurrences of forms found in the set of texts for one language, can retrieve parallel contrastive contexts from the other. The system should be of particular interest to bilingual lexicographers, translators and linguists, and should also find applications in the office automation area and in the language industry in general},
KEYWORDS = {BILINGUAL REFERENCE CORPORA, SYSTEM, PARALLEL TEXT RETRIEVAL},
PAGES = {63--70},
URL = {https://iris.cnr.it/handle/20.500.14243/425240},
CONFERENCE_NAME = {Seventh Annual Conference of the UW Centre for the New Oed and Text Research. Using Corpora},
}
@INPROCEEDINGS{MARINAI_1991_INPROCEEDINGS_MPP_425222,
AUTHOR = {Marinai, E. and Peters, C. and Picchi, E.},
TITLE = {A first prototype of a system for the semi-automatic sense linking and merging of mono-and bilingual ldbs},
YEAR = {1991},
ABSTRACT = {A method for the (semi-automatic) linking of lexical data bases based on different source dictionaries and their partial merging is presented. The results can be modified interactively by the user and saved to form part of a new merged LDB whose entries will contain all the information included in the separate source LDBs. The aim is to provide not only a tool which makes it easier to compare and study lexical data derived from different sources but also to permit linguistic and lexical analyses on much richer data},
KEYWORDS = {prototype, system, semi-automatic sense linking mono ldbs, bilingual ldbs},
PAGES = {293--298},
URL = {https://iris.cnr.it/handle/20.500.14243/425222},
CONFERENCE_NAME = {Making connections},
}
@INPROCEEDINGS{RATTI_1991_INPROCEEDINGS_RM_19981,
AUTHOR = {Ratti, D. and Marconi, L.},
TITLE = {Criterios y Metodos para la creacion de un lexico de frecuencia de la lengua escrita conocida y usada por los ninos},
YEAR = {1991},
ABSTRACT = {The aim of this project is to identify the active and passive lexicon possessed, on average, by elementary school children. We use the computer to create and explore, with appropriate methodologies, a reference-corpus of such lexicon},
PAGES = {861--867},
URL = {https://iris.cnr.it/handle/20.500.14243/19981},
PUBLISHER = {PPU, S. A (Barcelona, ESP)},
ISBN = {84-7665-867-2},
CONFERENCE_NAME = {VI Congreso de Lenguajes Naturales y Lenguajes Formales},
CONFERENCE_PLACE = {Barcelona},
BOOKTITLE = {Lenguajes Naturales y Lenguajes Formales},
EDITOR = {Martín Vide, C.},
}
@TECHREPORT{PETERS_1991_TECHREPORT_PP_424609,
  AUTHOR   = {Peters, C. and Picchi, E.},
  TITLE    = {Dictionary browsing tool requirements},
  YEAR     = {1991},
  ABSTRACT = {The main features of a dictionary browsing tool designed to satisfy the requirements of the linguist or lexicographer working on machine-readable dictionary data are discussed. Examples are given of the results which can be obtained using existing tools, and recommendations are made regarding the functions which should be included in a dictionary browsing tool developed within the MULTILEX project},
  KEYWORDS = {Dictionary browsing, tool requirements},
  URL      = {https://iris.cnr.it/handle/20.500.14243/424609},
}
@EDITORIAL{MARCONI_1990_EDITORIAL_MRMR_205582,
AUTHOR = {Marconi, L. and Ratti, D. and Morgavi, G. and Rolando, C.},
TITLE = {Italiano Ortografia},
YEAR = {1990},
ABSTRACT = {Questo libro contiene il formario dell'italiano elaborato a partire dal testo: flessioni rime e anagrammi. In particolare contiene:-Le coniugazioni e declinazioni di 58.000 vocaboli-La classificazione dei verbi in 94 classi-da essere a sedurre -, con indicazione delle varianti e delle irregolarità-I plurali e femminili di sostantivi, pronomi e aggettivi-I femminili dei nomi che indicano mansioni, cariche, professioni e mestieri},
URL = {https://iris.cnr.it/handle/20.500.14243/205582},
ISBN = {9788808068644},
}
@INPROCEEDINGS{ARRIGO_1990_INPROCEEDINGS_ACGMMRRS_312000,
AUTHOR = {Arrigo, P. and Corana, A. and Giuliano, F. and Marconi, L. and Morando, M. and Ridella, S. and Rolando, C. and Scalia, F.},
TITLE = {Neural networks: computer simulation and biomedical applications},
YEAR = {1990},
ABSTRACT = {We present a version of the Back-Propagation (BP) algorithm based on Level 3 BLAS, easily portable onto SIMD and MIMD computers. An implementation is shown for FPS M64 Series Minisupercomputers, where the peak performances of the processor are reached. Some biomedical applications of the proposed algorithm are shown: computer-aided diagnosis of dyspepsia, analysis of PH-metric data and reconstruction of ECG signals},
KEYWORDS = {high-performance computing, neural network simulation, Back-Propagation algorithm, Level 3 BLAS, SIMD computer, MIMD computer, biomedical applications},
PAGES = {205--212},
URL = {https://iris.cnr.it/handle/20.500.14243/312000},
PUBLISHER = {World Scientific Publishing Co (Singapore, SGP)},
CONFERENCE_NAME = {Parallel Architectures and Neural Networks},
CONFERENCE_PLACE = {Singapore},
BOOKTITLE = {Parallel Architectures and Neural Networks},
EDITOR = {Caianiello, E. R.},
}
@INPROCEEDINGS{PICCHI_1990_INPROCEEDINGS_PPC_398463,
AUTHOR = {Picchi, E. and Peters, C. and Calzolari, N.},
TITLE = {Implementing a bilingual lexical database system},
YEAR = {1990},
ABSTRACT = {The current state of progress of a research project for the design and development of a bilingual, Italian-English/English-Italian, lexical database system is presented. The aim is to create an integrated system in which a number of monolingual electronic dictionaries and/or lexical databases can be linked through the medium of a bilingual database. In addition, procedures are being implemented to establish access paths from the dictionary data to archives of texts in machine-readable form and language reference corpora, and vice versa. The system not only provides the standard look-up functions offered by conventional mono- and bilingual dictionaries but the organization of the data on database structures makes it possible to access and exploit the lexical information in many different and new ways. The structuring of the bilingual component is described in some detail and some of the possible applications envisaged for a tool of this type in the fields of pure and applied linguistics, lexicography and language learning are mentioned},
KEYWORDS = {Lexical databases},
PAGES = {317--329},
URL = {https://iris.cnr.it/handle/20.500.14243/398463},
ISBN = {9630558637},
CONFERENCE_NAME = {3rd Euralex International Congress. BudaLEX '88},
BOOKTITLE = {Budalex '88. 3rd Euralex International Congress. Papers (Budapest, 1988)},
EDITOR = {Magay, T. and Zigany, J.},
}
@INPROCEEDINGS{PICCHI_1990_INPROCEEDINGS_PPC_399936,
AUTHOR = {Picchi, E. and Peters, C. and Calzolari, N.},
TITLE = {A tool for the second language learner organizing bilingual dictionary data in an interactive workstation},
YEAR = {1990},
ABSTRACT = {The data contained in a conventional English/Italian, Italian/English dictionary, recorded in machine-readable form and coded for computer typesetting, have been parsed and organized in a database type structure on a personal computer. The aim is to implement an interactive bilingual lexical workstation in order to offer the second language learner and user a tool which overcomes many of the restrictions traditionally imposed by the normal organization of the printed bilingual dictionary and allows him to consult and exploit the lexical material in new ways},
KEYWORDS = {Second language learner, Bilingual dictionary, Workstation},
PAGES = {334--344},
URL = {https://iris.cnr.it/handle/20.500.14243/399936},
ISBN = {2-05-101079-X},
CONFERENCE_NAME = {15th International Conference A. L. L. C},
BOOKTITLE = {TRAVAUX DE LINGUISTIQUE QUANTITATIVE},
EDITOR = {Choueka, Y.},
}
@TECHREPORT{CALZOLARI_1990_TECHREPORT_CPR_396320,
AUTHOR = {Calzolari, N. and Peters, C. and Roventini, A.},
TITLE = {Computational model of the dictionary entry. Preliminary report},
YEAR = {1990},
ABSTRACT = {The description of the computational model of the dictionary entry to be used within the ACQUILEX Project consists of two separate sections. The first part, Section 1, presents a method which can be used to represent in a uniform way the content and structure of the entries of machine-readable dictionaries (MRDs), and contains explicit representation of texts of international explicit purpose, Initiative Computational Linguistics Linguistic Computing (ALLC)},
KEYWORDS = {Computational model, Dictionary entry},
PAGES = {96},
URL = {https://iris.cnr.it/handle/20.500.14243/396320},
}
@TECHREPORT{MARINAI_1990_TECHREPORT_MPP_400790,
  AUTHOR   = {Marinai, E. and Peters, C. and Picchi, E.},
  TITLE    = {The Pisa multi-lexical database. An integrated system for the acquisition, maintenance and interrogation of mono-and bilingual LDBS},
  YEAR     = {1990},
  ABSTRACT = {The objective of the present report is to provide documentation for the 12 month release of the Multi-lexical Database (MLDB) system software, which is now being built at the "Istituto di Linguistica Computazionale", CNR, Pisa, within the context of a description of the various stages of system design and development and includes a preliminary version of the technical description for the Twelve Month Deliverable of the project review workshop in Cambridge, UK, 27-28 November 1990. The scope of the system is to provide fast and flexible access to all the lexical information contained in the component machine-readable dictionaries: morphological, syntactic, semantic and conceptual},
  KEYWORDS = {LDBS, Interrogation, Acquisition, Maintenance},
  PAGES    = {63},
  URL      = {https://iris.cnr.it/handle/20.500.14243/400790},
}
@MISC{BINDI_1989_MISC_BMO_117884,
  AUTHOR = {Bindi, R. and Monachini, M. and Orsolini, P.},
  TITLE  = {Italian Reference Corpus},
  YEAR   = {1989},
  URL    = {https://iris.cnr.it/handle/20.500.14243/117884},
}
@MISC{ZAMPOLLI_1989_MISC_ZMP_17345,
AUTHOR = {Zampolli, A. and Marinelli, R. and Pardelli, G.},
TITLE = {I sistemi di documentazione dell'ILC},
YEAR = {1989},
ABSTRACT = {Il documento si concentra sui punti seguenti: a) Recupero e trasformazione dei materiali codificati su archivi magnetici e costruzione di un sistema informativo per la gestione mista di archivi con dati catalografici normalizzati e dati bibliografici; b) Sistema di gestione dell' d'archivio scientifico per le varie lingue; c) Recupero e trasformazione di informazioni bibliografiche da VM a altro sistema informativo},
KEYWORDS = {Documentazione, Linguistica Computazionale},
PAGES = {1--13},
URL = {https://iris.cnr.it/handle/20.500.14243/17345},
}
@INCOLLECTION{MORGAVI_1988_INCOLLECTION_MAMRS_201240,
  AUTHOR = {Morgavi, G. and Arrigo, P. and Marconi, L. and Ridella, S. and Scalia, F.},
  TITLE  = {Modification of the chaotic/ordered state of biological systems by using electric fields},
  YEAR   = {1988},
  URL    = {https://iris.cnr.it/handle/20.500.14243/201240},
}
@EDITORIAL{MARCONI_1988_EDITORIAL_MRMR_205572,
AUTHOR = {Marconi, L. and Ratti, D. and Morgavi, G. and Rolando, C.},
TITLE = {Flessioni, Rime, Anagrammi: l'italiano in scatola di montaggio},
YEAR = {1988},
ABSTRACT = {Flessioni, Rime, Anagrammi è un'opera formata da tre moduli distinti. Ognuno di essi nasce da un unico elenco di parole-le voci-madri -, costituito da tutte le parole definite ne Il Nuovo Zingarelli minore-Vocabolario della Lingua Italiana-Undicesima edizione minore(1987): Questo elenco di voci-madri è stato smontato e ricomposto in ciascuno dei tre moduli in base a differenti criteri. Il modulo Flessioni è lo strumento che consente di costruire le forme flesse-cioè le forme declinate o coniugate-di ognuna delle voci-madri. Le declinazioni di sostantivi, aggettivi, articoli e pronomi sono indicate tramite l'esplicita menzione delle desinenze di ciascuno di essi. I casi dubbi o con pluralità di forme sono ulteriormente chiariti da note esplicative e di commento. Le coniugazioni dei verbi sono invece riferite, per mezzo di un'indicazione numerica, a uno dei 94 modelli di coniugazione: i loro paradigmi sono riportati-verbo per verbo, da essere a sedurre-nelle pagine iniziali del volume. Il modulo Rime è un dizionario inverso: le voci madri sono qui elencate nel consueto ordine alfabetico dalla A alla Z, ma considerando per prima l'ultima lettera di ogni parola, poi la penultima, poi la terzultima, e così via. In altri termini, mentre nei normali vocabolari compaiono prima le parole che iniziano per A, poi quelle che iniziano per B, etc., qui compaiono prima quelle che finiscono per A, seguite da quelle che finiscono per B, e così via. Perciò si parte da a, si continua con fiaba, gellaba, sillaba, barabba, sabba, sbobba, gobba, giubba, gleba, ameba, foiba, scriba, diatriba, alba, ... e si finisce con gin-fizz. Il modulo Anagrammi è un catalogo ordinato di tutte le parole formate da lettere uguali disposte in ordine diverso: per esempio armi, mari, mira, rima. L'elenco è stato ottenuto confrontando in modo sistematico tutte le forme flesse delle voci-madri: i 172.662 anagrammi così trovati sono suddivisi in più sezioni, a seconda del numero di lettere di ciascuno di essi. In ogni sezione gli anagrammi sono elencati in corrispondenza della voce formata dalle loro stesse lettere disposte in ordine alfabetico: ad esempio il gruppo armi, mari, mira, rima si trova alla voce AIMR della sezione Parole di 4 lettere},
URL = {https://iris.cnr.it/handle/20.500.14243/205572},
ISBN = {8808030520},
}
@INPROCEEDINGS{MORGAVI_1988_INPROCEEDINGS_MAMR_236286,
  AUTHOR = {Morgavi, G. and Arrigo, P. and Marconi, L. and Ridella, S.},
  TITLE  = {Chaotic oscillating membrane extreme high sensitivity to externally applied electric field},
  YEAR   = {1988},
  URL    = {https://iris.cnr.it/handle/20.500.14243/236286},
}
@INCOLLECTION{MORGAVI_1987_INCOLLECTION_MAMRRS_236283,
  AUTHOR = {Morgavi, G. and Arrigo, P. and Marconi, L. and Ridella, S. and Rolando, C. and Scalia, F.},
  TITLE  = {High sensitivity chaotic behaviour in sinusoidally driven Hodgkin-Huxley equations},
  YEAR   = {1987},
  URL    = {https://iris.cnr.it/handle/20.500.14243/236283},
}
@INPROCEEDINGS{CORANA_1987_INPROCEEDINGS_CMMMRR_201227,
AUTHOR = {Corana, A. and Marconi, L. and Martini, C. and Morgavi, G. and Ridella, S. and Rolando, C.},
TITLE = {How to reach maximum theoretical performance in solving linear equations systems on FPS Architecture 38/64 bits},
YEAR = {1987},
ABSTRACT = {A technique for dense linear system solution is presented which reaches maximum performances on attached processors like FPS-120, 5000 and X64 using the Fortran language with calls to the vector routines. Starting from the Dongarra's LU factorization algorithm the key idea is to carry out a pseudo-transposition of the lower triangular matrix L (including the main diagonal) around the minor diagonal. The pseudo-transposition allows to carry out all the matrix vector operations involved in LU factorization with only stride 1 dot product operations which, using the TM Auxiliary Memory and the TMDOT routine, can be executed in the FPS processor obtaining the maximum speed. Since the algorithm uses only vector instructions it is fully portable on all the FPS 38/64 bit machines and in general on all the vector computers with a similar memory structure. Furthermore the algorithm can be easily translated into the new FORTRAN 8X, which will probably become the standard for future SIMD computers for numerical applications},
KEYWORDS = {solution of linear equation, optimized algorithm, vector processor, FPS architecture, performance evaluation},
PAGES = {173--179},
URL = {https://iris.cnr.it/handle/20.500.14243/201227},
CONFERENCE_NAME = {Array Conference},
}
@INPROCEEDINGS{MORGAVI_1987_INPROCEEDINGS_MACMR_201236,
  AUTHOR = {Morgavi, G. and Arrigo, P. and Casaleggio, A. and Marconi, L. and Ridella, S.},
  TITLE  = {Transition between chaotic and ordered state in biological membrane induced by an external electric field},
  YEAR   = {1987},
  URL    = {https://iris.cnr.it/handle/20.500.14243/201236},
}
@INPROCEEDINGS{MORGAVI_1987_INPROCEEDINGS_MAMRS_235717,
  AUTHOR = {Morgavi, G. and Arrigo, P. and Marconi, L. and Ridella, S. and Scalia, F.},
  TITLE  = {How small currents can change from periodic to chaotic state the HH membrane},
  YEAR   = {1987},
  URL    = {https://iris.cnr.it/handle/20.500.14243/235717},
}
@INPROCEEDINGS{MORGAVI_1987_INPROCEEDINGS_MAMRS_201221,
AUTHOR = {Morgavi, G. and Arrigo, P. and Marconi, L. and Ridella, S. and Scalia, F.},
TITLE = {Membrane chaotic and periodic behaviour induced by external current},
YEAR = {1987},
URL = {https://iris.cnr.it/handle/20.500.14243/201221},
}
@INPROCEEDINGS{MORGAVI_1987_INPROCEEDINGS_MACMRS_235724,
  AUTHOR = {Morgavi, G. and Arrigo, P. and Casaleggio, A. and Marconi, L. and Ridella, S. and Scalia, F.},
  TITLE  = {Chaotic behaviour of a self oscillating cell membrane induced by low amplitude electric field},
  YEAR   = {1987},
  URL    = {https://iris.cnr.it/handle/20.500.14243/235724},
}
@ARTICLE{MARCONI_1986_ARTICLE_MMRR_201210,
  AUTHOR   = {Marconi, L. and Morgavi, G. and Ridella, S. and Rolando, C.},
  TITLE    = {Non linear ionic fluxes in an electrically exposed cell},
  YEAR     = {1986},
  ABSTRACT = {In this paper the problem of non-thermal interaction of a low-frequency, low-amplitude electric field with a non-linear cell membrane is considered. The main result of biological interest is that, when the applied time-varying, zero mean electric field is spatially non-uniform, the pattern of the rectified current density looks like the one observed experimentally in the single-cell early developmental stage of the egg of the seaweed Fucus. It is therefore possible that an external field, applied for a very long time, can start developmental processes by mimicking the natural ionic current pattern},
  URL      = {https://iris.cnr.it/handle/20.500.14243/201210},
  DOI      = {10.1016/0302-4598(86)80048-4},
  ISSN     = {0302-4598},
  JOURNAL  = {BIOELECTROCHEMISTRY AND BIOENERGETICS},
}
@INPROCEEDINGS{ARRIGO_1986_INPROCEEDINGS_AMMRRC_237900,
AUTHOR = {Arrigo, P. and Marconi, L. and Morgavi, G. and Ridella, S. and Rolando, C.},
TITLE = {Do externally applied electric fields influence the pattern formation in a developing cell?},
YEAR = {1986},
ABSTRACT = {We consider the problem of nonthermal interaction of a low frequency, low amplitude zero-mean electric field with a cell with nonlinear membrane. If the external electric field is spatially uniform the pattern of the rectified current densities looks like the one observed experimentally in the seaweed Fucus as an occasional 'birth defect' where two roots germinate. If the external electric field is spatially nonuniform the pattern of the rectified current densities looks like the one observed experimentally in a normally developing egg. This result points out the importance of a good characterization of the applied fields in biological experiments and in clinical therapy},
URL = {https://iris.cnr.it/handle/20.500.14243/237900},
ISBN = {0444989862},
}
@INPROCEEDINGS{MORGAVI_1986_INPROCEEDINGS_MMRR_201213,
  AUTHOR = {Morgavi, G. and Marconi, L. and Ridella, S. and Rolando, C.},
  TITLE  = {Influence of externally applied electric field on growth regulation by modification of ionic fluxes and external ion concentration},
  YEAR   = {1986},
  URL    = {https://iris.cnr.it/handle/20.500.14243/201213},
}
@INPROCEEDINGS{MORGAVI_1986_INPROCEEDINGS_MAMRR_201217,
  AUTHOR = {Morgavi, G. and Arrigo, P. and Marconi, L. and Ridella, S. and Rolando, C.},
  TITLE  = {Do externally applied electric fields influence the pattern formation in a developing cell?},
  YEAR   = {1986},
  URL    = {https://iris.cnr.it/handle/20.500.14243/201217},
}
@TECHREPORT{BIANCHIBANDINELLI_1986_TECHREPORT_BBBFFMSV_377410,
AUTHOR = {Bianchi Bandinelli, R. and Beltrame, R. and Bindi, R. and Faconti, G. and Ferrini, R. and Masserotti, M. V. and Severino, G. and Vasarelli, G.},
TITLE = {Relazione tecnica per la revisione del parco stampanti del CNUCE e dell'Istituto di Linguistica Computazionale},
YEAR = {1986},
KEYWORDS = {Park Printers},
PAGES = {20},
URL = {https://iris.cnr.it/handle/20.500.14243/377410},
}