This paper describes OWL ontology re-engineering from the wiki-based social science codebook (thesaurus) developed by the Seshat: Global History Databank. The ontology describes human history as a set of over 1500 time series variables and supports variable uncertainty, temporal scoping, annotations and bibliographic references. The ontology was developed to transition from traditional social science data collection and storage techniques to an RDF-based approach. RDF supports automated generation of high usability data entry and validation tools, data quality management, incorporation of facts from the web of data and management of the data curation lifecycle.
This ontology re-engineering exercise identified several pitfalls in modelling social science codebooks with semantic web technologies; provided insights into the practical application of OWL to complex, real-world modelling challenges; and has enabled the construction of new, RDF-based tools to support the large-scale Seshat data curation effort. The Seshat ontology is an exemplar of a set of ontology design patterns for modelling uncertainty or temporal bounds in standard RDF. Thus the paper provides guidance for deploying RDF in the social sciences. Within Seshat, OWL-based data quality management will assure the data is suitable for statistical analysis. Publication of Seshat as high-quality, linked open data will enable other researchers to build on it.
%0 Conference Paper
%1 brennan2016building
%A Brennan, Rob
%A Feeney, Kevin
%A Mendel-Gleason, Gavin
%A Bozic, Bojan
%A Turchin, Peter
%A Whitehouse, Harvey
%A Francois, Peter
%A Currie, Thomas
%A Gohmann, Stephanie
%B ESWC 2016: The Semantic Web. Latest Advances and New Domains
%D 2016
%E Sack, Harald
%E Blomqvist, Eva
%E d'Aquin, Mathieu
%E Ghidini, Chiara
%E Ponzetto, Simone Paolo
%E Lange, Christoph
%I Springer
%K aligned-project myown
%T Building the Seshat Ontology for a Global History Databank
%V 9678
%X This paper describes OWL ontology re-engineering from the wiki-based social science codebook (thesaurus) developed by the Seshat: Global History Databank. The ontology describes human history as a set of over 1500 time series variables and supports variable uncertainty, temporal scoping, annotations and bibliographic references. The ontology was developed to transition from traditional social science data collection and storage techniques to an RDF-based approach. RDF supports automated generation of high usability data entry and validation tools, data quality management, incorporation of facts from the web of data and management of the data curation lifecycle.
This ontology re-engineering exercise identified several pitfalls in modelling social science codebooks with semantic web technologies; provided insights into the practical application of OWL to complex, real-world modelling challenges; and has enabled the construction of new, RDF-based tools to support the large-scale Seshat data curation effort. The Seshat ontology is an exemplar of a set of ontology design patterns for modelling uncertainty or temporal bounds in standard RDF. Thus the paper provides guidance for deploying RDF in the social sciences. Within Seshat, OWL-based data quality management will assure the data is suitable for statistical analysis. Publication of Seshat as high-quality, linked open data will enable other researchers to build on it.
@comment{
  brennan2016building: conference paper in the ESWC 2016 proceedings
  (series volume 9678, Springer). The fields added-at, biburl, interhash,
  intrahash, keywords and timestamp are BibSonomy export metadata; standard
  styles ignore them.
  NOTE(review): pages and doi are absent from this record; add them from the
  publisher's page. Also confirm the author spellings "Francois, Peter" and
  "Gohmann, Stephanie" against the published front matter.
}
@inproceedings{brennan2016building,
  abstract  = {This paper describes OWL ontology re-engineering from the wiki-based social science codebook (thesaurus) developed by the Seshat: Global History Databank. The ontology describes human history as a set of over 1500 time series variables and supports variable uncertainty, temporal scoping, annotations and bibliographic references. The ontology was developed to transition from traditional social science data collection and storage techniques to an RDF-based approach. RDF supports automated generation of high usability data entry and validation tools, data quality management, incorporation of facts from the web of data and management of the data curation lifecycle.
This ontology re-engineering exercise identified several pitfalls in modelling social science codebooks with semantic web technologies; provided insights into the practical application of OWL to complex, real-world modelling challenges; and has enabled the construction of new, RDF-based tools to support the large-scale Seshat data curation effort. The Seshat ontology is an exemplar of a set of ontology design patterns for modelling uncertainty or temporal bounds in standard RDF. Thus the paper provides guidance for deploying RDF in the social sciences. Within Seshat, OWL-based data quality management will assure the data is suitable for statistical analysis. Publication of Seshat as high-quality, linked open data will enable other researchers to build on it.},
  added-at  = {2016-04-22T13:34:44.000+0200},
  author    = {Brennan, Rob and Feeney, Kevin and Mendel-Gleason, Gavin and Bozic, Bojan and Turchin, Peter and Whitehouse, Harvey and Francois, Peter and Currie, Thomas and Gohmann, Stephanie},
  biburl    = {https://www.bibsonomy.org/bibtex/248367d1ca822e24913d5a90f2fcd68da/brennanraj},
  booktitle = {{ESWC} 2016: The Semantic Web. Latest Advances and New Domains},
  editor    = {Sack, Harald and Blomqvist, Eva and d'Aquin, Mathieu and Ghidini, Chiara and Ponzetto, Simone Paolo and Lange, Christoph},
  interhash = {3c4e807889b45233b42850f387a88fad},
  intrahash = {48367d1ca822e24913d5a90f2fcd68da},
  keywords  = {aligned-project myown},
  publisher = {Springer},
  series    = {Lecture Notes in Computer Science},
  timestamp = {2016-05-09T15:46:14.000+0200},
  title     = {Building the {Seshat} Ontology for a {Global History Databank}},
  volume    = {9678},
  year      = {2016}
}