<?php
/**
 * Command-line driver: runs TemplateRedirectExtractor over every page title
 * yielded by AllTemplatesSqlIterator for the configured language.
 *
 * The extraction group is attached to a NullDestination.
 * NOTE(review): presumably the extractor persists its results itself (the
 * group's destination discards output) -- confirm against
 * TemplateRedirectExtractor.
 */

// The bootstrap file supplies the classes used below (assumed from the fact
// that nothing else is loaded here), so a missing file must abort immediately
// instead of surfacing later as a "class not found" error.
require 'dbpedia.php';

error_reporting(E_ALL);

// Measure the wall time of the whole run under a single timer key.
Timer::start("main::Runtime");

// Setup the language version of Wikipedia
$language = Options::getOption('language');

// Page source (database-backed collection) and the titles to iterate over,
// both bound to the same language.
$pageTitles = new AllTemplatesSqlIterator($language);
$job = new ExtractionJob(new DatabaseWikipediaCollection($language), $pageTitles);

// Single extraction group holding the template redirect extractor.
$groupInfoboxes = new ExtractionGroup(new NullDestination());
$groupInfoboxes->addExtractor(new TemplateRedirectExtractor());

// Add the ExtractionGroups to the ExtractionJob
$job->addExtractionGroup($groupInfoboxes);

// Execute the Extraction Job
$manager = new ExtractionManager();
$manager->execute($job);

// Stop the timer started above and report the measured time.
Timer::stop("main::Runtime");
Timer::printTime();
// Driver for the English Wikipedia extraction: builds one ExtractionJob over
// all article titles, attaches one ExtractionGroup per extractor (each with
// its own N-Triples dump file), and hands the job to the ExtractionManager.

// E_ALL already contains E_NOTICE, so no extra flag is needed.
error_reporting(E_ALL);

$manager = new ExtractionManager();

// Titles come from AllArticlesSqlIterator; page content comes from
// LiveWikipedia. NOTE(review): presumably LiveWikipedia fetches pages from
// the live site -- confirm against its implementation.
$pageTitlesEn = new AllArticlesSqlIterator("en");
$jobEnWiki = new ExtractionJob(new LiveWikipedia("en"), $pageTitlesEn);

// LabelExtractor -> articles_label.nt
$groupArticlesLabelEn = new ExtractionGroup(new NTripleDumpDestination("articles_label.nt"));
$groupArticlesLabelEn->addExtractor(new LabelExtractor());
$jobEnWiki->addExtractionGroup($groupArticlesLabelEn);

// ShortAbstractExtractor -> articles_abstract.nt
$groupArticlesShortAbstractEn = new ExtractionGroup(new NTripleDumpDestination("articles_abstract.nt"));
$groupArticlesShortAbstractEn->addExtractor(new ShortAbstractExtractor());
$jobEnWiki->addExtractionGroup($groupArticlesShortAbstractEn);

// ImageExtractor -> articles_image.nt
$groupImages = new ExtractionGroup(new NTripleDumpDestination("articles_image.nt"));
$groupImages->addExtractor(new ImageExtractor());
$jobEnWiki->addExtractionGroup($groupImages);

// WikipageExtractor -> articles_wikipage.nt
$groupWikipages = new ExtractionGroup(new NTripleDumpDestination("articles_wikipage.nt"));
$groupWikipages->addExtractor(new WikipageExtractor());
$jobEnWiki->addExtractionGroup($groupWikipages);

// InfoboxExtractor -> infoboxes.nt, with a second destination
// infoboxes.properties.nt.
// NOTE(review): the role of ExtractionGroup's second destination is not
// visible here (presumably property metadata) -- confirm against
// ExtractionGroup.
$groupInfoboxes = new ExtractionGroup(
    new NTripleDumpDestination("infoboxes.nt"),
    new NTripleDumpDestination("infoboxes.properties.nt")
);
$groupInfoboxes->addExtractor(new InfoboxExtractor());
$jobEnWiki->addExtractionGroup($groupInfoboxes);

// SemanticExtractor -> semantic.nt
$groupSemantic = new ExtractionGroup(new NTripleDumpDestination("semantic.nt"));
$groupSemantic->addExtractor(new SemanticExtractor());
$jobEnWiki->addExtractionGroup($groupSemantic);

// DBpediaLinkExtractor -> dbpedia_links.nt
$groupDBpedia = new ExtractionGroup(new NTripleDumpDestination("dbpedia_links.nt"));
$groupDBpedia->addExtractor(new DBpediaLinkExtractor());
$jobEnWiki->addExtractionGroup($groupDBpedia);

// WcGeoExtractor -> geocodes.nt
$groupGeoCodes = new ExtractionGroup(new NTripleDumpDestination("geocodes.nt"));
$groupGeoCodes->addExtractor(new WcGeoExtractor());
$jobEnWiki->addExtractionGroup($groupGeoCodes);

// Run every registered group over the English job.
$manager->execute($jobEnWiki);