PREFIX schema: <http://schema.org/>
PREFIX dc: <http://purl.org/dc/elements/1.1/>
PREFIX sioct: <http://rdfs.org/sioc/types#>
PREFIX skos: <http://www.w3.org/2004/02/skos/core#>
PREFIX projects: <http://aksw.org/Projects/>
PREFIX aiiso: <http://purl.org/vocab/aiiso/schema#>
PREFIX dbr: <http://dbpedia.org/resource/>
PREFIX partner: <http://aksw.org/Partner/>
PREFIX sysont: <http://ns.ontowiki.net/SysOnt/>
PREFIX rdfs: <http://www.w3.org/2000/01/rdf-schema#>
PREFIX vann: <http://purl.org/vocab/vann/>
PREFIX site: <http://ns.ontowiki.net/SysOnt/Site/>
PREFIX projectfunding: <http://vocab.ox.ac.uk/projectfunding#>
PREFIX void: <http://rdfs.org/ns/void#>
PREFIX aksw: <http://aksw.org/schema/>
PREFIX lod2: <http://lod2.eu/schema/>
PREFIX groups: <http://aksw.org/Groups/>
PREFIX content: <http://purl.org/rss/1.0/modules/content/>
PREFIX sioc: <http://rdfs.org/sioc/ns#>
PREFIX dcterms: <http://purl.org/dc/terms/>
PREFIX dbpedia: <http://dbpedia.org/resource/>
PREFIX owl: <http://www.w3.org/2002/07/owl#>
PREFIX sh: <http://www.w3.org/ns/shacl#>
PREFIX doap: <http://usefulinc.com/ns/doap#>
PREFIX dct: <http://purl.org/dc/terms/>
PREFIX rdf: <http://www.w3.org/1999/02/22-rdf-syntax-ns#>
PREFIX v: <http://www.w3.org/2006/vcard/ns#>
PREFIX xsd: <http://www.w3.org/2001/XMLSchema#>
PREFIX ov: <http://open.vocab.org/terms/>
PREFIX people: <http://aksw.org/>
PREFIX foaf: <http://xmlns.com/foaf/0.1/>
PREFIX geo: <http://www.w3.org/2003/01/geo/wgs84_pos#>
PREFIX : <http://aksw.org/>

# Description of the DBpedia NIF dataset project (typed as aksw:DatasetProject).
projects:DBpediaNIF a aksw:DatasetProject;
  aksw:hookline "Open, Large-Scale and Multilingual Knowledge Extraction Corpus";
  aksw:publicationTag "dbpedianif";
  aksw:relatedProject projects:DBpedia;
  # Markdown body of the project page. This is a short ("...") literal, so it must
  # stay on ONE physical line: every line break has to be written as the \n escape,
  # because a raw line break inside a short literal is a Turtle syntax error.
  site:content "Overview\n========\n\nThe DBpedia community has put significant amount of effort on developing technical infrastructure and methods for efficient extraction of structured information from Wikipedia. These\nefforts have been primarily focused on harvesting, refinement and publishing semi-structured information found in Wikipedia articles, such as information from infoboxes, categorization information, images, wikilinks and citations. Nevertheless, still vast amount of valuable information is contained in the unstructured Wikipedia article texts.\nDBpedia NIF aims to fill in these gaps and extract valuable information from Wikipedia article texts.\nIn its core, DBpedia NIF is a large-scale and multilingual knowledge extraction corpus. The purpose of this project is two-fold: to dramatically broaden and deepen the amount of structured information in DBpedia, and to provide large-scale and multilingual language resource for development of various NLP and IR task.\nThe dataset provides the content of all articles for 128 Wikipedia languages. \nIt captures the content as it is found in Wikipedia-it **captures the structure** (sections and paragraphs) and the **annotations** provided by the Wikipedia editors.\n\n![DBpedia NIF](https://docs.google.com/drawings/d/e/2PACX-1vR2bn3jW4zuoQ1MOwFnYRQTc7SZtLAHcHq5QQywy0NJyWdD_DOo5yS50SdlvsZN5wngwlonu9WHuJF5/pub?w=530 \"DBpedia NIF\")\n\nKey Features and Facts\n========\n\n- content in 128 Wikipedia languages\n- over 9 billion RDF triples, which is almost 40% of DBpedia\n- selected partitions published as Linked Data\n- exploited within the [TextExt - DBpedia Open Extraction challenge](http://wiki.dbpedia.org/textext \"TextExt - DBpedia Open Extraction challenge\")\n- available for large-scale training NLP and IR methods\n\nTextExt - DBpedia Open Extraction challenge\n========\nThe DBpedia Open Text Extraction Challenge differs significantly from other challenges in the language technology and other areas in that it is not a one time call, but a continuous growing and expanding challenge with the focus to sustainably advance the state of the art and transcend boundaries in a systematic way. The DBpedia Association and the people behind this challenge are committed to provide the necessary infrastructure and drive the challenge for an indefinite time as well as potentially extend the challenge beyond Wikipedia.\nWe provide data from the DBpedia NIF datasets in 9 different languages and **your task** is to execute your NLP tool on the data and **extract** valuable information such as facts, relations, events, terminology, ontologies as RDF triples, or useful NLP annotations such as pos-tags, dependencies or co-reference.\n\n [Join the challenge](http://wiki.dbpedia.org/textext \"TextExt - DBpedia Open Extraction challenge\") at any time, there are no strict deadlines!\n"^^sysont:Markdown;
  # Plain-text summary of the project.
  dcterms:abstract "DBpedia NIF - a large-scale and multilingual knowledge extraction corpus. The aim of the dataset is two-fold: to dramatically broaden and deepen the amount of structured information in DBpedia, and to\r\nprovide large-scale and multilingual language resource for development of various NLP and IR task. The dataset provides the content of all articles for 128 Wikipedia languages.";
  doap:maintainer people:MilanDojchinovski;
  rdfs:label "DBpedia NIF Dataset";
  foaf:homepage <http://wiki.dbpedia.org/dbpedia-nif-dataset>.