% Conference paper (CARTOCON 2014) published in the edited volume
% "Modern Trends in Cartography" of the Springer series
% "Lecture Notes in Geoinformation and Cartography".
% - Names are stored in "Last, First" form so that parsing does not depend on
%   capitalisation heuristics.
% - `address` holds the publisher's city.
%   NOTE(review): "Cham" is inferred from the "Springer International
%   Publishing Switzerland" copyright line in `note` -- confirm against the
%   book's imprint page.
% - `day`, `language`, `keywords` and `abstract` are not standard BibTeX
%   fields; standard styles ignore them, they are kept as metadata.
% - The percent sign in `abstract` is escaped because a raw one would start a
%   TeX comment if a style ever prints the field.
@inproceedings{bf47870465ad4fa9927bd7c84590121b,
  author    = {Bhattacharya, D. and Pasquali, P. and Komarkova, J. and Sedlak, P. and Saha, A. and Boccardo, P.},
  title     = {Interlinking opensource geo-spatial datasets for optimal utility in ranking},
  booktitle = {Modern Trends in Cartography},
  editor    = {Brus, Jan and Vondrakova, Alena and Vozenilek, Vit},
  series    = {Lecture Notes in Geoinformation and Cartography},
  publisher = {Springer},
  address   = {Cham},
  year      = {2014},
  month     = dec,
  day       = {2},
  pages     = {159--172},
  doi       = {10.1007/978-3-319-07926-4_13},
  isbn      = {9783319079257},
  language  = {English},
  keywords  = {data tables, fuzzy matching, geometry, GeoNames, geospatial, interlinking, label ranking, mapping, metadata, Natural Earth, Open Street Map, open-source data sets, scale ranking},
  abstract  = {The joining of geospatial datasets is required to utilize the complete set of information available in each of them. There are many open source geospatial datasets available such as GeoNames, Open Street Map, Natural Earth and to get a comprehensive dataset with the union of all available information it is important that such datasets are linked optimally without redundancy or loss of information. Many of the geolocations on digital maps are not classified for importance because of the lack of additional information such as population or administrative level. A way to give an importance scale to the names is by linking the GeoNames to other datasets (OSM, natural earth). OpenStreetMap data provides a limited number of place classifications (such as city, town, village). For the best cartographic results we need classes that are a little more comprehensive about how they rank cities. The challenges faced include geometry searching, matching, buffer determination, local regional naming text inclusion and accuracy. This has been achieved by the current research work where presently GeoNames, Natural Earth and Open Street Map data tables have been merged with the union of all their attribute columns resulting in a complete geospatial dataset with place accuracy of at least 95 \% for any given country dataset. The data tables at global level consist of hundreds of thousands of rows with each row depicting a geolocation. The geometry, name and geo-id complete and fuzzy searching and matching around a buffer of 50 km took a minimum of 30 s to maximum 1 min in a commodity computer with 2 GHz, 2 GB memory, according to size and complexity of the query run for a country which could have a list of points ranging from a dozen to several hundreds.
    The future aim is to ultimately do this for global datasets to create an all-encompassing geodata bank having such information as administrative, political, ecological details from important databases as GAUL, SALB, GADM etc.},
  note      = {Funding Information: The Ministry of Education, Youth and Sports of the Czech Republic, Project CZ.1.07/2.3.00/30.0021 ``Strengthening of Research and Development Teams at the University of Pardubice'', financially supported this work. Publisher Copyright: {\textcopyright} Springer International Publishing Switzerland 2015. International cartographic conference, CARTOCON 2014; Conference date: 25-02-2014 Through 28-02-2014},
}