/s3db3.5.10/pearlib/arc/parsers/ARC2_RDFParser.php
PHP | 111 lines | 73 code | 21 blank | 17 comment | 5 complexity | 9fbc7f64fad1c60210f90af775bc2c79 MD5 | raw file
- <?php
- /*
- homepage: http://arc.semsol.org/
- license: http://arc.semsol.org/license
-
- class: ARC2 RDF Parser (generic)
- author: Benjamin Nowack
- version: 2008-07-15 (Addition: SG API JSON support)
- */
-
- ARC2::inc('Class');
-
- class ARC2_RDFParser extends ARC2_Class {
-
- function __construct($a = '', &$caller) {
- parent::__construct($a, $caller);
- }
-
- function ARC2_RDFParser($a = '', &$caller) {
- $this->__construct($a, $caller);
- }
-
- function __init() {/* proxy_host, proxy_port, proxy_skip, http_accept_header, http_user_agent_header, max_redirects, reader, skip_dupes */
- parent::__init();
- $this->a['format'] = $this->v('format', false, $this->a);
- $this->triples = array();
- $this->t_count = 0;
- $this->added_triples = array();
- $this->skip_dupes = $this->v('skip_dupes', false, $this->a);
- $this->bnode_prefix = $this->v('bnode_prefix', 'arc'.substr(md5(uniqid(rand())), 0, 4).'b', $this->a);
- $this->bnode_id = 0;
- }
-
- /* */
-
- function setReader(&$reader) {
- $this->reader =& $reader;
- }
-
- function parse($path, $data = '') {
- /* reader */
- if (!isset($this->reader)) {
- ARC2::inc('Reader');
- $this->reader = & new ARC2_Reader($this->a, $this);
- }
- $this->reader->activate($path, $data) ;
- /* format detection */
- $mappings = array(
- 'rdfxml' => 'RDFXML',
- 'turtle' => 'Turtle',
- 'sparqlxml' => 'SPOG',
- 'ntriples' => 'Turtle',
- 'html' => 'SemHTML',
- 'rss' => 'RSS',
- 'sgajson' => 'SGAJSON'
- );
- $format = $this->reader->getFormat();
- if (!$format || !isset($mappings[$format])) {
- return $this->addError('No parser available for "' . $format . '".');
- }
- /* format parser */
- $suffix = $mappings[$format] . 'Parser';
- ARC2::inc($suffix);
- $cls = 'ARC2_' . $suffix;
- $this->parser =& new $cls($this->a, $this);
- $this->parser->setReader($this->reader);
- return $this->parser->parse($path, $data);
- }
-
- function parseData($data) {
- return $this->parse(ARC2::getScriptURI(), $data);
- }
-
- /* */
-
- function done() {
- }
-
- /* */
-
- function getTriples() {
- return $this->v('parser') ? $this->m('getTriples', false, array(), $this->v('parser')) : array();
- }
-
- function countTriples() {
- return $this->v('parser') ? $this->m('countTriples', false, 0, $this->v('parser')) : 0;
- }
-
- function getSimpleIndex($flatten_objects = 1, $vals = '') {
- return ARC2::getSimpleIndex($this->getTriples(), $flatten_objects, $vals);
- }
-
- /* */
-
- function extractRDF($formats = '') {
- if (method_exists($this->parser, 'extractRDF')) {
- return $this->parser->extractRDF($formats);
- }
- }
-
- /* */
-
- function getEncoding($src = 'config') {
- if (method_exists($this->parser, 'getEncoding')) {
- return $this->parser->getEncoding($src);
- }
- }
-
- /* */
-
- }