######
# # ## ##### ## ##### # # ####
# # # # # # # # # # # #
# # # # # # # ##### # # ####
# # ###### # ###### # # # # #
# # # # # # # # # # # # #
###### # # # # # ##### #### ####
# Plugin version 1.3-SNAPSHOT - https://github.com/dbpedia/databus-maven-plugin
@prefix databus: <https://databus.dbpedia.org/> .
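@prefix dataid-mt: <http://dataid.dbpedia.org/ns/mt#> . # NOTE(review): namespace IRI reconstructed after extraction loss - confirm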
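@prefix dct: <http://purl.org/dc/terms/> .
@prefix dataid: <http://dataid.dbpedia.org/ns/core#> .
@prefix rdf: <http://www.w3.org/1999/02/22-rdf-syntax-ns#> .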
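@prefix dataid-cv: <http://dataid.dbpedia.org/ns/cv#> . # NOTE(review): namespace IRI reconstructed after extraction loss - confirm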
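@prefix xsd: <http://www.w3.org/2001/XMLSchema#> .
@prefix rdfs: <http://www.w3.org/2000/01/rdf-schema#> .
@prefix dcat: <http://www.w3.org/ns/dcat#> .
@prefix prov: <http://www.w3.org/ns/prov#> .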
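@prefix dataid-debug: <http://dataid.dbpedia.org/ns/debug.ttl#> . # NOTE(review): namespace IRI reconstructed after extraction loss - confirm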
dataid-cv:tag rdfs:subPropertyOf dataid:contentVariant .
a dataid:Version .
a dataid:Dataset ;
rdfs:comment "Geonames provides a malformed RDF/XML dump; we parsed it because we needed it in our project."@en ;
rdfs:label "Geonames parsed to NTriples"@en ;
dataid:account databus:kurzum ;
dataid:artifact ;
dataid:associatedAgent ;
dataid:group ;
dataid:groupdocu "# Cleaned Data group\nMirrors of data that my colleagues and I needed in a cleaner, parseable form\n\n## Attribution\nWe mentioned the place where we downloaded it from and kept the license. \n**Please attribute the original source** \n\n## Version Changelog\nVersions are the same as the original source" ;
dataid:version ;
dataid-debug:documentationLocation
;
dataid-debug:feedbackChannel ;
dataid-debug:issueTracker ;
dct:conformsTo "http://dataid.dbpedia.org/ns/core#" ;
dct:description "## Procedure\nOur use case is to load geonames in our [FlexiFusion project](https://svn.aksw.org/papers/2019/ISWC_FlexiFusion/public.pdf).\nJohannes, Marvin and I needed a while to finally get it working with `parallel`. There were quite a few scripts out there already like [this one](https://swebdev.wordpress.com/2012/10/01/loading-geonames-in-virtuoso/) from 2012, so the problem seems to stay with us. \n```\ncat all-geonames-rdf.txt | grep -v \"^http\" | parallel --pipe -N1 rapper -i rdfxml - urn:base > all-parallel.nt 2> all-paralle.log\n```\nWe are hosting this mainly for ourselves, but as long as it is there, feel free to download and use it. Hopefully, it will save you some hours of work. \nAlso, I put some extra effort into this documentation as a demo for the Databus. Copying Retrieval date, Source and License is recommended, as you also sign this with your private key. But I am very sure I copied and pasted it correctly. \n\n## Source\nretrieved: September 5th, 2019\nfrom: http://www.geonames.org/ontology/documentation.html\n*[RDF dump](http://download.geonames.org/all-geonames-rdf.zip) with 11701589 features and about 176 mio rdf triples (2018 03 11). The dump has one rdf document per toponym on every line of the file. Note: The file is pretty large. Make sure the tool you use to uncompress is able to deal with the size and does not stop after 2GB, an issue that happens with some old (windows) tool versions.* \n\n## License \nretrieved: September 5th, 2019\nfrom: http://download.geonames.org/export/\ncopied relevant parts:\n* \"free : GeoNames data is free, the data is available without costs.\"\n* \"cc-by licence (creative commons attributions license). You should give credit to GeoNames when using data or web services with a link or another reference to GeoNames.\"\n* \"commercial usage is allowed\"\n* \"'as is' : The data is provided \"as is\" without warranty or any representation of accuracy, timeliness or completeness.\"" ;
dct:hasVersion "2018.03.11" ;
dct:issued "2020-06-26T07:19:33Z"^^xsd:dateTime ;
dct:license ;
dct:publisher ;
dct:title "Geonames parsed to NTriples"@en ;
dcat:distribution .
a dataid:DataId ;
rdfs:comment "Metadata created by the DBpedia Databus Maven Plugin: https://github.com/dbpedia/databus-maven-plugin (Version 1.3-SNAPSHOT)\nThe DataID ontology is a metadata omnibus, which can be extended to be interoperable with all metadata formats\nNote that the metadata (the dataid.ttl file) is always CC-0, the files are licensed individually\nMetadata created by https://kurzum.github.io/webid.ttl#this" ;
rdfs:label "DataID metadata for cleaned-data/geonames"@en ;
dataid:associatedAgent ;
dct:conformsTo "http://dataid.dbpedia.org/ns/core#" ;
dct:hasVersion "1.3-SNAPSHOT" ;
dct:issued "2020-06-26T07:19:33Z"^^xsd:dateTime ;
dct:license ;
dct:publisher ;
dct:title "DataID metadata for cleaned-data/geonames"@en .
a dataid:SingleFile ;
dataid:associatedAgent ;
dataid:compression "bzip2" ;
dataid:contentVariant "all" ;
dataid:file ;
dataid:formatExtension "nt" ;
dataid:isDistributionOf ;
dataid:preview " .\n .\n \"Zam\\u012Bn S\\u016Bkhteh\" .\n \"Zam\\u012Bn S\\u016Bkhteh\"@fa .\n \"\\u0632\\u0645\\u064A\\u0646 \\u0633\\u0648\\u062E\\u062A\\u0647\"@fa .\n .\n .\n \"IR\" .\n \"32.45831\" .\n \"48.96335\" ." ;
dataid:sha256sum "14df1d21770a7a6131006b9c50233a776735417f9268cc304c3fb76eb6fca9dd" ;
dataid:signature "lxSAJBcODedcs4ZIP3DfdIZmwfRlN9rQl9Yvqz2423ufXD8cWQxEVBi5Z94mrmorZeZiNrLU7fzBjwSeRFtwu8j4RT7E952JfHC53dykE/82igEk0PxR5tU2g2hvfwR5Bts/e8H4/Dz4rQhNkRT8YAuZ1Vy76+etMZki2slOORL4iFpmMQhWEovgw3U64vBhB2ctQkuB/uGtZ+2UVsqO/UuouegaJcXpsVc1f9sVJn+EdZDt7Na6luJewSD6wAEw/w312HoTj4wMV/Gpdm2g1c8XDaneegd3WH7dum8EZZOwkrlDIdTVQ9EagLxxTobIdmmnJjauX3pDMwOe5yRSRQ==" ;
dataid-cv:tag "all" ;
dct:conformsTo "http://dataid.dbpedia.org/ns/core#" ;
dct:hasVersion "2018.03.11" ;
dct:issued "2020-06-26T07:19:33Z"^^xsd:dateTime ;
dct:license ;
dct:modified "2019-09-05T05:04:36Z"^^xsd:dateTime ;
dct:publisher ;
dcat:byteSize "643561352"^^xsd:decimal ;
dcat:downloadURL ;
dcat:mediaType dataid-mt:ApplicationNTriples .
a dataid:Artifact .
a dataid:Group .
dataid-mt:ApplicationNTriples
a dataid-mt:MediaType ;
dataid:mimetype "application/n-triples" .