@inproceedings{2e684077e04642c9972d83646ce9e198,
title = "HANKE: Hierarchical attention networks for knowledge extraction in political science domain",
abstract = "Extracting structured metadata from unstructured text in different domains is gaining strong attention from multiple research communities. In Political Science, these metadata play a significant role on studying intra and inter-state interactions between political entities. The process of extracting such metadata usually relies on domain specific ontologies and knowledge-based repositories. In particular, Political Scientists regularly use the well-defined ontology CAMEO, which is designed for capturing conflict and mediation relations. Since CAMEO repositories are currently human maintained, the high cost and extensive human effort associated with updating them makes it difficult to include new entries on a regular basis. This paper introduces HANKE: an innovative framework for automatically extracting knowledge representations from unstructured sources, in order to extend CAMEO ontology both in the same domain and towards other related domains in political science. HANKE combines Hierarchical Attention Networks as engine for identifying relevant structures in raw-text and the novel Frequency-Based Ranker approach to obtain a collection of candidate entries for CAMEO's repositories. To show the efficiency of the proposed framework, we evaluate its performance on capturing existing CAMEO representations in a soft-labelled dataset. We also empirically demonstrate the versatility and superiority of HANKE method by applying it to two case studies related to CAMEO extension on its actual domain and towards organized crime domain.",
keywords = "CAMEO, Hierarchical attention networks, Knowledge extraction, Political events",
author = "{Skorupa Parolin}, Erick and Latifur Khan and Javier Osorio and Vito D'Orazio and Brandt, {Patrick T.} and Jennifer Holmes",
note = "Funding Information: The research reported herein was supported in part by NSF awards DMS-1737978, DGE-2039542, OAC-1828467, OAC-1931541, DGE-1906630; and an IBM faculty award (Research). Publisher Copyright: {\textcopyright} 2020 IEEE.; 7th IEEE International Conference on Data Science and Advanced Analytics, DSAA 2020 ; Conference date: 06-10-2020 Through 09-10-2020",
year = "2020",
month = oct,
doi = "10.1109/DSAA49011.2020.00055",
language = "English (US)",
series = "Proceedings - 2020 IEEE 7th International Conference on Data Science and Advanced Analytics, DSAA 2020",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
pages = "410--419",
editor = "Geoff Webb and Zhongfei Zhang and Tseng, {Vincent S.} and Graham Williams and Michalis Vlachos and Longbing Cao",
booktitle = "Proceedings - 2020 IEEE 7th International Conference on Data Science and Advanced Analytics, DSAA 2020",
}