2013 |
Charting the digital library evaluation domain with a semantically enhanced mining methodology (Paper in Conference Proceedings) Afiontzi, Eleni; Kazadeis, Giannis; Papachristopoulos, Leonidas; Sfakakis, Michalis; Tsakonas, Giannis; Papatheodorou, Christos Proceedings of the 13th ACM/IEE-CS joint conference on Digital libraries, JCDL , Pages: 125-134 , 2013. @inproceedings{Afiontzi2013, title = {Charting the digital library evaluation domain with a semantically enhanced mining methodology}, author = {Eleni Afiontzi and Giannis Kazadeis and Leonidas Papachristopoulos and Michalis Sfakakis and Giannis Tsakonas and Christos Papatheodorou}, url = {http://dl.acm.org/citation.cfm?id=2467713}, doi = {10.1145/2467696.2467713}, year = {2013}, date = {2013-07-01}, booktitle = {Proceedings of the 13th ACM/IEE-CS joint conference on Digital libraries, JCDL }, pages = {125-134 }, abstract = {The digital library evaluation field has an evolving nature and it is characterized by a noteworthy proclivity to enfold various methodological orientations. Given the fact that the scientific literature in the specific domain is vast, researchers require tools that will exhibit either commonly acceptable practices, or areas for further investigation. In this paper, a data mining methodology is proposed to identify prominent patterns in the evaluation of digital libraries. Using Machine Learning techniques, all papers presented in the ECDL and JCDL conferences between the years 2001 and 2011 were categorized as relevant or non-relevant to the DL evaluation domain. Then, the relevant papers were semantically annotated according to the Digital Library Evaluation Ontology (DiLEO) vocabulary. The produced set of annotations was clustered to evaluation patterns for the most frequently used tools, methods and goals of the domain. Our findings highlight the expressive nature of DiLEO, place emphasis on semantic annotation as a necessary step in handling domain-centric corpora and underline the potential of the proposed methodology in the profiling of evaluation activities.}, keywords = {}, pubstate = {published}, tppubtype = {inproceedings} } The digital library evaluation field has an evolving nature and it is characterized by a noteworthy proclivity to enfold various methodological orientations. Given the fact that the scientific literature in the specific domain is vast, researchers require tools that will exhibit either commonly acceptable practices, or areas for further investigation. In this paper, a data mining methodology is proposed to identify prominent patterns in the evaluation of digital libraries. Using Machine Learning techniques, all papers presented in the ECDL and JCDL conferences between the years 2001 and 2011 were categorized as relevant or non-relevant to the DL evaluation domain. Then, the relevant papers were semantically annotated according to the Digital Library Evaluation Ontology (DiLEO) vocabulary. The produced set of annotations was clustered to evaluation patterns for the most frequently used tools, methods and goals of the domain. Our findings highlight the expressive nature of DiLEO, place emphasis on semantic annotation as a necessary step in handling domain-centric corpora and underline the potential of the proposed methodology in the profiling of evaluation activities. |
An approach to analyzing working practices of research communities in the humanities (Journal Article) Benardou, Agiatis; Constantopoulos, Panos; Dallas, Costis International Journal of Humanities and Arts Computing, Volume: 7 (1-2), Pages: 105-127, 2013. @article{Benardou2013, title = {An approach to analyzing working practices of research communities in the humanities}, author = {Agiatis Benardou and Panos Constantopoulos and Costis Dallas}, url = {http://www.euppublishing.com/doi/abs/10.3366/ijhac.2013.0084}, year = {2013}, date = {2013-01-03}, journal = {International Journal of Humanities and Arts Computing}, volume = {7}, number = {1-2}, pages = {105-127}, abstract = {The need for a firm understanding of the working practices of researchers in the humanities emerges as a prerequisite for the development of effective digital research infrastructures. This paper will focus on the rationale behind the design and implementation of two related studies conducted in the context of two European e-Infrastructures projects, DARIAH and EHRI. Within DARIAH the challenge involved conducting, analysing and understanding research practices of arts and humanities researchers, a largely ill-defined community encompassing a wide spectrum of disciplines. Each of them deals with a variety of objects employing an extensive number of methods. In the context of EHRI, the challenge is slightly different, due to the involvement of a better-defined research community. Holocaust researchers share well-identified objects, common ground on methods, and handle similar setbacks. In this paper we discuss the approach adopted for designing and implementing qualitative user-centric studies aimed at capturing activities, methods, and types of information objects employed by researchers grounded in identified research goals and questions. It addresses both generic and specific entities and processes, and supports the understanding of researchers’ working practices in settings as diverse and wide as DARIAH, or as specialized as EHRI. The outcomes of the analysis of working practices are used in determining user requirements for digital infrastructures to serve the respective research communities.}, keywords = {}, pubstate = {published}, tppubtype = {article} } The need for a firm understanding of the working practices of researchers in the humanities emerges as a prerequisite for the development of effective digital research infrastructures. This paper will focus on the rationale behind the design and implementation of two related studies conducted in the context of two European e-Infrastructures projects, DARIAH and EHRI. Within DARIAH the challenge involved conducting, analysing and understanding research practices of arts and humanities researchers, a largely ill-defined community encompassing a wide spectrum of disciplines. Each of them deals with a variety of objects employing an extensive number of methods. In the context of EHRI, the challenge is slightly different, due to the involvement of a better-defined research community. Holocaust researchers share well-identified objects, common ground on methods, and handle similar setbacks. In this paper we discuss the approach adopted for designing and implementing qualitative user-centric studies aimed at capturing activities, methods, and types of information objects employed by researchers grounded in identified research goals and questions. It addresses both generic and specific entities and processes, and supports the understanding of researchers’ working practices in settings as diverse and wide as DARIAH, or as specialized as EHRI. The outcomes of the analysis of working practices are used in determining user requirements for digital infrastructures to serve the respective research communities. |
Generating Natural Language Description from OWL Ontologies, the NaturalOWL System (Journal Article) Androutsopoulos, Ion; Lampouras, Gerasimos; Galanis, Dimitris Journal of Artificial Intelligence Research, Volume: 48 , Pages: 671-715, 2013. @article{Androutsopoulos2013, title = {Generating Natural Language Description from OWL Ontologies, the NaturalOWL System}, author = {Ion Androutsopoulos and Gerasimos Lampouras and Dimitris Galanis}, url = {https://www.jair.org/media/4017/live-4017-7471-jair.pdf}, year = {2013}, date = {2013-01-02}, journal = {Journal of Artificial Intelligence Research}, volume = {48}, pages = {671-715}, abstract = {We present NaturalOWL, a natural language generation system that produces texts describing individuals or classes of OWL ontologies. Unlike simpler OWL verbalizers, which typically express a single axiom at a time in controlled, often not entirely fluent natural language primarily for the benefit of domain experts, we aim to generate fluent and coherent multi-sentence texts for end-users. With a system like NaturalOWL, one can publish information in OWL on the Web, along with automatically produced corresponding texts in multiple languages, making the information accessible not only to computer programs and domain experts, but also end-users. We discuss the processing stages of NaturalOWL, the optional domain-dependent linguistic resources that the system can use at each stage, and why they are useful. We also present trials showing that when the domain-dependent llinguistic resources are available, NaturalOWL produces significantly better texts compared to a simpler verbalizer, and that the resources can be created with relatively light effort.}, keywords = {}, pubstate = {published}, tppubtype = {article} } We present NaturalOWL, a natural language generation system that produces texts describing individuals or classes of OWL ontologies. Unlike simpler OWL verbalizers, which typically express a single axiom at a time in controlled, often not entirely fluent natural language primarily for the benefit of domain experts, we aim to generate fluent and coherent multi-sentence texts for end-users. With a system like NaturalOWL, one can publish information in OWL on the Web, along with automatically produced corresponding texts in multiple languages, making the information accessible not only to computer programs and domain experts, but also end-users. We discuss the processing stages of NaturalOWL, the optional domain-dependent linguistic resources that the system can use at each stage, and why they are useful. We also present trials showing that when the domain-dependent llinguistic resources are available, NaturalOWL produces significantly better texts compared to a simpler verbalizer, and that the resources can be created with relatively light effort. |
2012 |
Defining User Requirements for Holocaust Research Infrastractures and Services in the EHRI Project (Paper in Conference Proceedings) Benardou, Agiatis; Dallas, Costis Proceedings of the 2012 iConference, Pages: 644-645, 2012. @inproceedings{Benardou2012, title = {Defining User Requirements for Holocaust Research Infrastractures and Services in the EHRI Project}, author = {Agiatis Benardou and Costis Dallas}, url = {http://dl.acm.org/citation.cfm?doid=2132176.2132322}, year = {2012}, date = {2012-01-02}, booktitle = {Proceedings of the 2012 iConference}, pages = {644-645}, abstract = {The poster presents the background, conceptual framework, methodology and initial results of a mixed research project, investigating information practice and user requirements of historians, humanities scholars and social scientists working on the Holocaust. The results of the study will be a foundation for the specification of functionalities of the European digital infrastructure planned as part of the EU-funded European Holocaust Research Infrastructure project, and consisting of the EHRI search/portal and the EHRI Virtual Research Environment. Particular issues to be dealt with are the summarization of qualitative evidence from semi-open interviews by means of a conceptualization of relevant descriptive codes of research activities, resource types and tools/services; identification of specific user requirements and of different researcher profiles through statistical analysis of an online questionnaire defined on the basis of initial qualitative research; and, identification and theorization of special needs of Holocaust research, seen as a highly multi- and inter-disciplinary field of inquiry.}, keywords = {}, pubstate = {published}, tppubtype = {inproceedings} } The poster presents the background, conceptual framework, methodology and initial results of a mixed research project, investigating information practice and user requirements of historians, humanities scholars and social scientists working on the Holocaust. The results of the study will be a foundation for the specification of functionalities of the European digital infrastructure planned as part of the EU-funded European Holocaust Research Infrastructure project, and consisting of the EHRI search/portal and the EHRI Virtual Research Environment. Particular issues to be dealt with are the summarization of qualitative evidence from semi-open interviews by means of a conceptualization of relevant descriptive codes of research activities, resource types and tools/services; identification of specific user requirements and of different researcher profiles through statistical analysis of an online questionnaire defined on the basis of initial qualitative research; and, identification and theorization of special needs of Holocaust research, seen as a highly multi- and inter-disciplinary field of inquiry. |
2011 |
A New Architecture and Approach to Asset Representation for Europeana Aggregation: The CARARE Way (Paper in Conference Proceedings) Papatheodorou, Christos; Dallas, Costis; Ertmann-Christiansen, Christian; Fernie, Kate; Gavrilis, Dimitris; Masci, Maria Emilia; Constantopoulos, Panos; Angelis, Stavros Metadata and Semantic Research, Proceedings of the 5th International Conference, Communications in Computer and Information Science, Volume: 240 of the series Communications in Computer and Information Science Pages: 412-423, 2011. @inproceedings{Papatheodorou2011, title = {A New Architecture and Approach to Asset Representation for Europeana Aggregation: The CARARE Way}, author = {Christos Papatheodorou and Costis Dallas and Christian Ertmann-Christiansen and Kate Fernie and Dimitris Gavrilis and Maria Emilia Masci and Panos Constantopoulos and Stavros Angelis}, url = {http://www.springerlink.com/content/qh565142q69x0763/}, year = {2011}, date = {2011-10-03}, booktitle = {Metadata and Semantic Research, Proceedings of the 5th International Conference, Communications in Computer and Information Science}, volume = {240}, pages = {412-423}, chapter = {Metadata and Semantic Research}, series = {Communications in Computer and Information Science}, abstract = {This paper presents a new metadata aggregation approach based on a mediating repository that intends to ensure the integrity, authenticity and semantic enrichment of metadata provided to Europeana by heterogeneous collections. Primary metadata are mapped to CARARE schema, a schema suitable for describing archaeological and architectural heritage assets, digital resources, collections, as well as events associated with them. The paper specifies the proposed schema and discusses the overall architecture of the proposed approach.}, keywords = {}, pubstate = {published}, tppubtype = {inproceedings} } This paper presents a new metadata aggregation approach based on a mediating repository that intends to ensure the integrity, authenticity and semantic enrichment of metadata provided to Europeana by heterogeneous collections. Primary metadata are mapped to CARARE schema, a schema suitable for describing archaeological and architectural heritage assets, digital resources, collections, as well as events associated with them. The paper specifies the proposed schema and discusses the overall architecture of the proposed approach. |
A Generate and Rank Approach to Sentence Paraphrasing (Paper in Conference Proceedings) Malakasiotis, Prodromos; Androutsopoulos, Ion Proceedings of the 2011 Conference on Empirical Methods in Natural Language Processing, 2011. @inproceedings{Malakasiotis2011, title = {A Generate and Rank Approach to Sentence Paraphrasing}, author = {Prodromos Malakasiotis and Ion Androutsopoulos}, url = {http://www.aclweb.org/anthology/D11-1009}, year = {2011}, date = {2011-01-03}, booktitle = {Proceedings of the 2011 Conference on Empirical Methods in Natural Language Processing}, abstract = {We present a method that paraphrases a given sentence by first generating candidate paraphrases and then ranking (or classifying) them. The candidates are generated by applying existing paraphrasing rules extracted from parallel corpora. The ranking component considers not only the overall quality of the rules that produced each candidate, but also the extent to which they preserve grammaticality and meaning in the particular context of the input sentence, as well as the degree to which the candidate differs from the input. We experimented with both a Maximum Entropy classifier and an SVR ranker. Experimental results show that incorporating features from an existing paraphrase recognizer in the ranking component improves performance, and that our overall method compares well against a state of the art paraphrase generator, when paraphrasing rules apply to the input sentences. We also propose a new methodology to evaluate the ranking components of generate-and-rank paraphrase generators, which evaluates them across different combinations of weights for grammaticality, meaning preservation, and diversity. The paper is accompanied by a paraphrasing dataset we constructed for evaluations of this kind.}, keywords = {}, pubstate = {published}, tppubtype = {inproceedings} } We present a method that paraphrases a given sentence by first generating candidate paraphrases and then ranking (or classifying) them. The candidates are generated by applying existing paraphrasing rules extracted from parallel corpora. The ranking component considers not only the overall quality of the rules that produced each candidate, but also the extent to which they preserve grammaticality and meaning in the particular context of the input sentence, as well as the degree to which the candidate differs from the input. We experimented with both a Maximum Entropy classifier and an SVR ranker. Experimental results show that incorporating features from an existing paraphrase recognizer in the ranking component improves performance, and that our overall method compares well against a state of the art paraphrase generator, when paraphrasing rules apply to the input sentences. We also propose a new methodology to evaluate the ranking components of generate-and-rank paraphrase generators, which evaluates them across different combinations of weights for grammaticality, meaning preservation, and diversity. The paper is accompanied by a paraphrasing dataset we constructed for evaluations of this kind. |
A New Sentence Compression Dataset and Its Use in an Abstractive Generate-and-Rank Sentence Compressor (Paper in Conference Proceedings) Galanis, Dimitrios; Androutsopoulos, Ion Proceedings of the UCNLG+Eval: Language Generation and Evaluation Workshop, Pages: 1-11, 2011. @inproceedings{Galanis2011, title = {A New Sentence Compression Dataset and Its Use in an Abstractive Generate-and-Rank Sentence Compressor}, author = {Dimitrios Galanis and Ion Androutsopoulos}, url = {http://www.aclweb.org/anthology/W11-2701}, year = {2011}, date = {2011-01-03}, booktitle = {Proceedings of the UCNLG+Eval: Language Generation and Evaluation Workshop}, pages = {1-11}, abstract = {Sentence compression has attracted much interest in recent years, but most sentence compressors are extractive, i.e., they only delete words. There is a lack of appropriate datasets to train and evaluate abstractive sentence compressors, i.e., methods that apart from deleting words can also rephrase expressions. We present a new dataset that contains candidate extractive and abstractive compressions of source sentences. The candidate compressions are annotated with human judgements for grammaticality and meaning preservation. We discuss how the dataset was created, and how it can be used in generate-and-rank abstractive sentence compressors. We also report experimental results with a novel abstractive sentence compressor that uses the dataset. }, keywords = {}, pubstate = {published}, tppubtype = {inproceedings} } Sentence compression has attracted much interest in recent years, but most sentence compressors are extractive, i.e., they only delete words. There is a lack of appropriate datasets to train and evaluate abstractive sentence compressors, i.e., methods that apart from deleting words can also rephrase expressions. We present a new dataset that contains candidate extractive and abstractive compressions of source sentences. The candidate compressions are annotated with human judgements for grammaticality and meaning preservation. We discuss how the dataset was created, and how it can be used in generate-and-rank abstractive sentence compressors. We also report experimental results with a novel abstractive sentence compressor that uses the dataset. |
An ontological representation of the digital library evaluation domain (Journal Article) Tsakonas, Giannis; Papatheodorou, Christos Journal of the American Society for Information Science and Technology (JASIST), Volume: 62 (8), Pages: 1577-1593, 2011. @article{Tsakonas2011, title = {An ontological representation of the digital library evaluation domain}, author = {Giannis Tsakonas and Christos Papatheodorou}, url = {http://onlinelibrary.wiley.com/doi/10.1002/asi.21559/abstract}, year = {2011}, date = {2011-01-01}, journal = {Journal of the American Society for Information Science and Technology (JASIST)}, volume = {62}, number = {8}, pages = {1577-1593}, abstract = {Digital library evaluation is a complex field, as complex as the phenomena it studies. The interest of the digital library society still remains vibrant after all these years of solidification, as these systems have entered real-life applications. However the community has still to reach a consensus on what evaluation is and how it can effectively be planned. In the present article, an ontology of the digital library evaluation domain, named DiLEO, is proposed, aiming to reveal explicitly the main concepts of this domain and their correlations, and it tries to combine creatively and integrate several scientific paradigms, approaches, methods, techniques, and tools. This article demonstrates the added value features of the ontology, which are the support of comparative studies between different evaluation initiatives and the assistance in effective digital library evaluation planning.}, keywords = {}, pubstate = {published}, tppubtype = {article} } Digital library evaluation is a complex field, as complex as the phenomena it studies. The interest of the digital library society still remains vibrant after all these years of solidification, as these systems have entered real-life applications. However the community has still to reach a consensus on what evaluation is and how it can effectively be planned. In the present article, an ontology of the digital library evaluation domain, named DiLEO, is proposed, aiming to reveal explicitly the main concepts of this domain and their correlations, and it tries to combine creatively and integrate several scientific paradigms, approaches, methods, techniques, and tools. This article demonstrates the added value features of the ontology, which are the support of comparative studies between different evaluation initiatives and the assistance in effective digital library evaluation planning. |
2010 |
A curation-aware repository supporting information-intensive scholarly research (Presentation) Angelis, Stavros; Benardou, Agiatis; Constantopoulos, Panos; Dallas, Costis; Gavrilis, Dimitris Poster presented at the 6th International Digital Curation Conference , 2010. @misc{Angelis2010, title = {A curation-aware repository supporting information-intensive scholarly research}, author = {Stavros Angelis and Agiatis Benardou and Panos Constantopoulos and Costis Dallas and Dimitris Gavrilis}, url = {http://dcu.gr/admin/getfile.php?type=3&id=1}, year = {2010}, date = {2010-12-06}, abstract = {Poster presentation and discussion of MOPSEUS, a curation-aware repository supporting information-intensive scholarly research. The latter has been analysed and mapped in the context of DCU's work on Preparing DARIAH}, howpublished = {Poster presented at the 6th International Digital Curation Conference}, keywords = {}, pubstate = {published}, tppubtype = {presentation} } Poster presentation and discussion of MOPSEUS, a curation-aware repository supporting information-intensive scholarly research. The latter has been analysed and mapped in the context of DCU's work on Preparing DARIAH |
MOPSEUS - A Digital Repository System with Semantically Enhanced Preservation Services (Paper in Conference Proceedings) Gavrilis, Dimitris; Angelis, Stavros; Papatheodorou, Christos Proceedings of the 7th International Conference on Preservation of Digital Objects, iPRES2010, Vienna, Austria, September 2010, Pages: 135-143, 2010. @inproceedings{Gavrilis2010, title = {MOPSEUS - A Digital Repository System with Semantically Enhanced Preservation Services}, author = {Dimitris Gavrilis and Stavros Angelis and Christos Papatheodorou}, url = {http://www.ifs.tuwien.ac.at/dp/ipres2010/papers/gavrilis-34.pdf}, year = {2010}, date = {2010-09-01}, booktitle = {Proceedings of the 7th International Conference on Preservation of Digital Objects, iPRES2010, Vienna, Austria, September 2010}, journal = {Proceedings of the 7th International Conference on Preservation of Digital Objects, iPRES2010}, pages = {135-143}, abstract = {Repository platforms offer significant tools aiding institutions to preserve the wealth of their information resources. This paper presents the data model as well as the architectural features of Mopseus, a digital library service, built on top of Fedora-commons middleware, designed to facilitate institutions to develop and preserve their own repositories. The main advantage of Mopseus is that it minimizes the customization and programming effort that Fedora-commons involves. Moreover it provides an added value service which semantically annotates the internal structure of a Digital Object. The paper focuses on the preservation functionalities of Mopseus and presents a mechanism for automated generation of PREMIS metadata for each Digital Object of the repository. This mechanism is activated whenever an object is modified and is based on a mapping of the Mopseus data model to the PREMIS data model that ensures the validity of the transformation of the information stored in a Mopseus repository to semantically equivalent PREMIS metadata. }, keywords = {}, pubstate = {published}, tppubtype = {inproceedings} } Repository platforms offer significant tools aiding institutions to preserve the wealth of their information resources. This paper presents the data model as well as the architectural features of Mopseus, a digital library service, built on top of Fedora-commons middleware, designed to facilitate institutions to develop and preserve their own repositories. The main advantage of Mopseus is that it minimizes the customization and programming effort that Fedora-commons involves. Moreover it provides an added value service which semantically annotates the internal structure of a Digital Object. The paper focuses on the preservation functionalities of Mopseus and presents a mechanism for automated generation of PREMIS metadata for each Digital Object of the repository. This mechanism is activated whenever an object is modified and is based on a mapping of the Mopseus data model to the PREMIS data model that ensures the validity of the transformation of the information stored in a Mopseus repository to semantically equivalent PREMIS metadata. |
Query Transformation in a CIDOC CRM Based Cultural Metadata Integration Environment (Paper in Conference Proceedings) Gergatsoulis, Manolis; Bountouri, Lina; Gaitanou, Panoraia; Papatheodorou, Christos Proceedings of the 14th European Conference Research and Advanced Technology for Digital Libraries, ECDL 2010, Pages: 38-45, 2010. @inproceedings{Gergatsoulis2010, title = {Query Transformation in a CIDOC CRM Based Cultural Metadata Integration Environment}, author = {Manolis Gergatsoulis and Lina Bountouri and Panoraia Gaitanou and Christos Papatheodorou}, url = {http://www.springerlink.com/content/m5m353t715866632/}, year = {2010}, date = {2010-09-01}, booktitle = {Proceedings of the 14th European Conference Research and Advanced Technology for Digital Libraries, ECDL 2010}, pages = {38-45}, abstract = {The wide use of a number of cultural heritage metadata schemas imposes the development of new interoperability techniques that facilitate unified access to cultural resources. In this paper, we focus on the ontology based semantic integration by proposing an expressive mapping language for the specification of the mappings between the XML-based metadata schemas and the CIDOC CRM ontology. We also present an algorithm for the transformation of XPath queries posed on XML-based metadata into equivalent queries on the CIDOC CRM ontology. }, keywords = {}, pubstate = {published}, tppubtype = {inproceedings} } The wide use of a number of cultural heritage metadata schemas imposes the development of new interoperability techniques that facilitate unified access to cultural resources. In this paper, we focus on the ontology based semantic integration by proposing an expressive mapping language for the specification of the mappings between the XML-based metadata schemas and the CIDOC CRM ontology. We also present an algorithm for the transformation of XPath queries posed on XML-based metadata into equivalent queries on the CIDOC CRM ontology. |
Mopseus - A Digital Library Management System Focused on Preservation (Paper in Conference Proceedings) Gavrilis, Dimitris; Papatheodorou, Christos; Constantopoulos, Panos; Angelis, Stavros Proceedings of the 14th European Conference Research and Advanced Technology for Digital Libraries, ECDL 2010, Volume: 6273 Pages: 445-448, 2010. @inproceedings{Gavrilis2010b, title = {Mopseus - A Digital Library Management System Focused on Preservation}, author = {Dimitris Gavrilis and Christos Papatheodorou and Panos Constantopoulos and Stavros Angelis}, url = {http://www.springerlink.com/content/j5025k0058664015/}, year = {2010}, date = {2010-09-01}, booktitle = {Proceedings of the 14th European Conference Research and Advanced Technology for Digital Libraries, ECDL 2010}, volume = {6273}, pages = {445-448}, abstract = {This paper presents Mopseus, a Fedora-commons based digital repository that focuses on preservation. An overview of the general architecture of the system is presented along with some more in-depth details of its semantic structures. Mopseus features dynamic RDF- based relations, a service for defining metadata schemas, a built-in RDBMS synchronization and indexing mechanism, a mechanism for migration from existing repositories and a built-in workflow engine. }, keywords = {}, pubstate = {published}, tppubtype = {inproceedings} } This paper presents Mopseus, a Fedora-commons based digital repository that focuses on preservation. An overview of the general architecture of the system is presented along with some more in-depth details of its semantic structures. Mopseus features dynamic RDF- based relations, a service for defining metadata schemas, a built-in RDBMS synchronization and indexing mechanism, a mechanism for migration from existing repositories and a built-in workflow engine. |
Understanding the information requirements of arts and humanities scholarship: implications for digital curation (Journal Article) Benardou, Agiatis; Constantopoulos, Panos; Dallas, Costis; Gavrilis, Dimitris The International Journal of Digital Curation, Volume: 5 (1), Pages: 18-33, 2010. @article{Benardou2010, title = {Understanding the information requirements of arts and humanities scholarship: implications for digital curation}, author = {Agiatis Benardou and Panos Constantopoulos and Costis Dallas and Dimitris Gavrilis}, url = {http://www.ijdc.net/index.php/ijdc/article/viewFile/144/206}, year = {2010}, date = {2010-01-03}, journal = {The International Journal of Digital Curation}, volume = {5}, number = {1}, pages = {18-33}, abstract = {This paper reports on research of scholarly research practices and requirements conducted in the context of the Preparing DARIAH European e-Infrastructures project, with a view to ensuring current and future fitness for purpose of the planned digital infrastructure, services and tools. It summarises the findings of earlier research, primarily from the field of human information behaviour as applied in scholarly work, it presents a conceptual perspective informed by cultural-historical activity theory, it introduces briefly a formal conceptual model for scholarly research activity compliant with CIDOC CRM, it describes the plan of work and methodology of an empirical research project based on open-questionnaire interviews with arts and humanities researchers, and presents illustrative examples of segmentation, tagging and initial conceptual analysis of the empirical evidence. Finally, it presents plans for future work, consisting, firstly, of a comprehensive re-analysis of interview segments within the framework of the scholarly research activity model, and, secondly, of the integration of this analysis with the extended digital curation process model we presented in earlier work.}, keywords = {}, pubstate = {published}, tppubtype = {article} } This paper reports on research of scholarly research practices and requirements conducted in the context of the Preparing DARIAH European e-Infrastructures project, with a view to ensuring current and future fitness for purpose of the planned digital infrastructure, services and tools. It summarises the findings of earlier research, primarily from the field of human information behaviour as applied in scholarly work, it presents a conceptual perspective informed by cultural-historical activity theory, it introduces briefly a formal conceptual model for scholarly research activity compliant with CIDOC CRM, it describes the plan of work and methodology of an empirical research project based on open-questionnaire interviews with arts and humanities researchers, and presents illustrative examples of segmentation, tagging and initial conceptual analysis of the empirical evidence. Finally, it presents plans for future work, consisting, firstly, of a comprehensive re-analysis of interview segments within the framework of the scholarly research activity model, and, secondly, of the integration of this analysis with the extended digital curation process model we presented in earlier work. |
Exploitation of folksonomies in subject analysis (Journal Article) Kakali, Costantia; Papatheodorou, Christos Library & Information Science Research, Volume: 32 (3), Pages: 192-202, 2010. @article{Kakali2010, title = {Exploitation of folksonomies in subject analysis}, author = {Costantia Kakali and Christos Papatheodorou }, url = {http://www.sciencedirect.com/science/article/pii/S0740818810000368}, year = {2010}, date = {2010-01-03}, journal = {Library & Information Science Research}, volume = {32}, number = {3}, pages = {192-202}, abstract = {Social tagging is one of the most popular of social media applications and has attracted the interest of a number of libraries and museums, which have developed services that facilitate user-community collaboration. This paper presents a methodology for the exploitation of social tagging in subject indexing, and explores that method through a case study in an academic library setting. The findings reveal the characteristics of users' tagging behavior, which mainly enhances the subject description of documents. The results suggest the articulation of alternative policies concerning knowledge organization schemes, technological infrastructures, and information services.}, keywords = {}, pubstate = {published}, tppubtype = {article} } Social tagging is one of the most popular of social media applications and has attracted the interest of a number of libraries and museums, which have developed services that facilitate user-community collaboration. This paper presents a methodology for the exploitation of social tagging in subject indexing, and explores that method through a case study in an academic library setting. The findings reveal the characteristics of users' tagging behavior, which mainly enhances the subject description of documents. The results suggest the articulation of alternative policies concerning knowledge organization schemes, technological infrastructures, and information services. |
Retrieving Information from Hybrid Spaces Using Handhelds (Journal Article) Veronikis, Spyros; Gavrilis, Dimitris; Zoutsou, Kyriaki; Papatheodorou, Christos International Journal on Advances in Systems and Measurements, Volume: 2 (1), Pages: 84-96, 2010. @article{Veronikis2010, title = {Retrieving Information from Hybrid Spaces Using Handhelds}, author = {Spyros Veronikis and Dimitris Gavrilis and Kyriaki Zoutsou and Christos Papatheodorou}, year = {2010}, date = {2010-01-02}, journal = {International Journal on Advances in Systems and Measurements}, volume = {2}, number = {1}, pages = {84-96}, abstract = {Hybrid spaces consist of information resources of both physical and electronic form. With the advent of electronic publishing and WWW hybrid libraries became popular and widely acknowledged for their high informative quality and anytime availability. On the other hand, modern computing handheld devices and wireless communication networks can support their users in accessing and using these information volumes wherever a need arises. Therefore, the user can query an information system about the electronic resources and simultaneously explore the nearby physical resources, in a way that enhances awareness of available information collections and relations among them, and also create a new experience while seeking in a hybrid space. In this paper we present the design methodology of creating such a service in an academic library, as well as the evaluation model, the procedure and the results from assessing satisfaction for the use of that service. Our findings imply that users believe that the unified search for physical and electronic resources is an important feature when seeking information in big physical and electronic collections.}, keywords = {}, pubstate = {published}, tppubtype = {article} } Hybrid spaces consist of information resources of both physical and electronic form. With the advent of electronic publishing and WWW hybrid libraries became popular and widely acknowledged for their high informative quality and anytime availability. On the other hand, modern computing handheld devices and wireless communication networks can support their users in accessing and using these information volumes wherever a need arises. Therefore, the user can query an information system about the electronic resources and simultaneously explore the nearby physical resources, in a way that enhances awareness of available information collections and relations among them, and also create a new experience while seeking in a hybrid space. In this paper we present the design methodology of creating such a service in an academic library, as well as the evaluation model, the procedure and the results from assessing satisfaction for the use of that service. Our findings imply that users believe that the unified search for physical and electronic resources is an important feature when seeking information in big physical and electronic collections. |
Modelling the Public Sector Information through CIDOC Conceptual Reference Model (Paper in Conference Proceedings) Bountouri, Lina; Papatheodorou, Christos; Gergatsoulis, Manolis Proceedings of the 6th International Workshop on Ontology Content, OnToContent 2010, Volume: 6428 Pages: 404-413, 2010. @inproceedings{Bountouri2010, title = {Modelling the Public Sector Information through CIDOC Conceptual Reference Model}, author = {Lina Bountouri and Christos Papatheodorou and Manolis Gergatsoulis }, url = {http://dl.acm.org/citation.cfm?id=1948597&preflayout=flat}, year = {2010}, date = {2010-01-01}, booktitle = {Proceedings of the 6th International Workshop on Ontology Content, OnToContent 2010}, journal = {Proceedings of the 6th International Workshop on Ontology Content, OnToContent 2010}, volume = {6428}, pages = {404-413}, abstract = {Nowadays, due to the growing development of eGovernment information systems, there is an increasing need to handle Public Sector Information (PSI) in a homogeneous way. Ontologies are currently a powerful tool to act as semantic reference models for the development of information systems and as semantic mediators for achieving interoperability. In this paper, we analyze the procedures that lead to the PSI's production and management and we present all the concepts and agents that relate to it. Based on this analysis and given that CIDOC CRM ontology is able to define the rich semantics of the historical records' production and management, we propose the CIDOC CRM to represent the public records' conceptualization and to act as a reference model for PSI. }, keywords = {}, pubstate = {published}, tppubtype = {inproceedings} } Nowadays, due to the growing development of eGovernment information systems, there is an increasing need to handle Public Sector Information (PSI) in a homogeneous way. Ontologies are currently a powerful tool to act as semantic reference models for the development of information systems and as semantic mediators for achieving interoperability. In this paper, we analyze the procedures that lead to the PSI's production and management and we present all the concepts and agents that relate to it. Based on this analysis and given that CIDOC CRM ontology is able to define the rich semantics of the historical records' production and management, we propose the CIDOC CRM to represent the public records' conceptualization and to act as a reference model for PSI. |
2009 |
Finding Short Definitions of Terms on Web Pages (Paper in Conference Proceedings) Lampouras, Gerasimos; Androutsopoulos, Ion Proceedings of the 2009 Conference on Empirical Methods on Natural Language Processing (EMNLP 2009 at ACL/IJCNLP 2009), Suntec, Singapore, 2009, Pages: 1270-1279, 2009, ISBN: 978-1-932432-59-6. @inproceedings{Lampouras2009, title = {Finding Short Definitions of Terms on Web Pages}, author = {Gerasimos Lampouras and Ion Androutsopoulos}, url = {http://nlp.cs.aueb.gr/pubs/emnlp09_paper.pdf}, isbn = {978-1-932432-59-6}, year = {2009}, date = {2009-09-01}, booktitle = {Proceedings of the 2009 Conference on Empirical Methods on Natural Language Processing (EMNLP 2009 at ACL/IJCNLP 2009), Suntec, Singapore, 2009}, pages = {1270-1279}, abstract = {We present a system that finds short definitions of terms on Web pages. It employs a Maximum Entropy classifier, but it is trained on automatically generated examples; hence, it is in effect unsupervised. We use ROUGE-W to generate training examples from encyclopedias and Web snippets, a method that outperforms an alternative centroid-based one. After training, our system can be used to find definitions of terms that are not covered by encyclopedias. The system outperforms a comparable publicly available system, as well as a previously published form of our system.}, keywords = {}, pubstate = {published}, tppubtype = {inproceedings} } We present a system that finds short definitions of terms on Web pages. It employs a Maximum Entropy classifier, but it is trained on automatically generated examples; hence, it is in effect unsupervised. We use ROUGE-W to generate training examples from encyclopedias and Web snippets, a method that outperforms an alternative centroid-based one. After training, our system can be used to find definitions of terms that are not covered by encyclopedias. The system outperforms a comparable publicly available system, as well as a previously published form of our system. |
A Digital Library Service for the Small (Paper in Conference Proceedings) Angelis, Stavros; Constantopoulos, Panos; Gavrilis, Dimitris; Papatheodorou, Christos Proceedings of the 2nd Digital Curation Curriculum Symposium: Digital Curation Practice, Promise and Prospects 2009, 2009. @inproceedings{Angelis2009, title = {A Digital Library Service for the Small}, author = {Stavros Angelis and Panos Constantopoulos and Dimitris Gavrilis and Christos Papatheodorou}, url = {http://users.ionio.gr/~papatheodor/papers/digccurr09.pdf}, year = {2009}, date = {2009-04-01}, booktitle = {Proceedings of the 2nd Digital Curation Curriculum Symposium: Digital Curation Practice, Promise and Prospects 2009}, journal = {DigCCurr 2009: Digital Curation Practice, Promise and Prospects}, abstract = {In this paper, we present MOPSEUS, a lightweight digital library service based on the Fedora system. This service was created to address the needs of small libraries without support from technical staff. Hence, MOPSEUS attempts to balance flexibility against ease of installation, configuration and use. The service is available as a standard Java Web servlet, uses no external databases or other systems and can easily be deployed on top of any Fedora installation. Preliminary tests concerning the ease of installation and use are encouraging. We contend that facilitating the introduction of digital library infrastructures in the small may contribute to spreading digital curation practices.}, keywords = {}, pubstate = {published}, tppubtype = {inproceedings} } In this paper, we present MOPSEUS, a lightweight digital library service based on the Fedora system. This service was created to address the needs of small libraries without support from technical staff. Hence, MOPSEUS attempts to balance flexibility against ease of installation, configuration and use. The service is available as a standard Java Web servlet, uses no external databases or other systems and can easily be deployed on top of any Fedora installation. Preliminary tests concerning the ease of installation and use are encouraging. We contend that facilitating the introduction of digital library infrastructures in the small may contribute to spreading digital curation practices. |
Solving differential equations with constructed neural networks (Journal Article) Tsoulos, Ioannis; Gavrilis, Dimitris; Glavas, Euripidis Neurocomputing, Volume: 72 (10-12), Pages: 2385-2391, 2009. @article{Tsoulos2009, title = {Solving differential equations with constructed neural networks}, author = {Ioannis Tsoulos and Dimitris Gavrilis and Euripidis Glavas}, url = {http://www.sciencedirect.com/science/article/pii/S0925231208005560 http://www.dcu.gr/wp-content/uploads/2016/10/Solving-differential-equations.pdf}, year = {2009}, date = {2009-01-02}, issuetitle = {Lattice Computing and Natural Computing (JCIS 2007) / Neural Networks in Intelligent Systems Designn (ISDA 2007)}, journal = {Neurocomputing}, volume = {72}, number = {10-12}, pages = {2385-2391}, abstract = {A novel hybrid method for the solution of ordinary and partial differential equations is presented here. The method creates trial solutions in neural network form using a scheme based on grammatical evolution. The trial solutions are enhanced periodically using a local optimization procedure. The proposed method is tested on a series of ordinary differential equations, systems of them as well as on partial differential equations with Dirichlet boundary conditions and the results are reported.}, keywords = {}, pubstate = {published}, tppubtype = {article} } A novel hybrid method for the solution of ordinary and partial differential equations is presented here. The method creates trial solutions in neural network form using a scheme based on grammatical evolution. The trial solutions are enhanced periodically using a local optimization procedure. The proposed method is tested on a series of ordinary differential equations, systems of them as well as on partial differential equations with Dirichlet boundary conditions and the results are reported. |
Metadata Interoperability in Public Sector Information (Journal Article) Bountouri, Lina; Papatheodorou, Christos; Soulikias, Vasilis; Stratis, Mathios Journal of Information Science, Volume: 35 , Pages: 204-231, 2009. @article{Bountouri2009, title = {Metadata Interoperability in Public Sector Information}, author = {Lina Bountouri and Christos Papatheodorou and Vasilis Soulikias and Mathios Stratis}, url = {http://jis.sagepub.com/content/35/2/204.short}, year = {2009}, date = {2009-01-02}, journal = {Journal of Information Science}, volume = {35}, pages = {204-231}, abstract = {Over recent years, there has been a worldwide growing need for interoperability among the systems that manage and reuse public sector information. This paper explores the documentation needs for public sector information and focuses on metadata interoperability issues. The research work studies a variety of public sector information metadata standards and guidelines internationally accepted and presents two methodologies to obtain interoperability. The first develops an application profile, while the second is based on the semantic integration approach and results in the creation of an ontology. The outcomes of the two approaches are compared under the prism of their scope and usage in terms of interoperability during the metadata integration process. }, keywords = {}, pubstate = {published}, tppubtype = {article} } Over recent years, there has been a worldwide growing need for interoperability among the systems that manage and reuse public sector information. This paper explores the documentation needs for public sector information and focuses on metadata interoperability issues. The research work studies a variety of public sector information metadata standards and guidelines internationally accepted and presents two methodologies to obtain interoperability. The first develops an application profile, while the second is based on the semantic integration approach and results in the creation of an ontology. The outcomes of the two approaches are compared under the prism of their scope and usage in terms of interoperability during the metadata integration process. |