/usr/share/php/arc/extractors/ARC2_DcExtractor.php is in libarc-php 2~20101006-2.
This file is owned by root:root, with mode 0o644.
The actual contents of the file can be viewed below.
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 | <?php
/*
homepage: http://arc.semsol.org/
license: http://arc.semsol.org/license
class: ARC2 DC Extractor
author: Benjamin Nowack
version: 2010-11-16
*/
ARC2::inc('RDFExtractor');
class ARC2_DcExtractor extends ARC2_RDFExtractor {
function __construct($a, &$caller) {
parent::__construct($a, $caller);
}
function __init() {
parent::__init();
$this->a['ns']['dc'] = 'http://purl.org/dc/elements/1.1/';
}
/* */
function extractRDF() {
$t_vals = array();
$t = '';
foreach ($this->nodes as $n) {
foreach (array('title', 'link', 'meta') as $tag) {
if ($n['tag'] == $tag) {
$m = 'extract' . ucfirst($tag);
list ($t_vals, $t) = $this->$m($n, $t_vals, $t);
}
}
}
if ($t) {
$doc = $this->getFilledTemplate($t, $t_vals, $n['doc_base']);
$this->addTs(ARC2::getTriplesFromIndex($doc));
}
}
/* */
function extractTitle($n, $t_vals, $t) {
if ($t_vals['title'] = $this->getPlainContent($n)) {
$t .= '<' . $n['doc_url'] . '> dc:title ?title . ';
}
return array($t_vals, $t);
}
/* */
function extractLink($n, $t_vals, $t) {
if ($this->hasRel($n, 'alternate') || $this->hasRel($n, 'meta')) {
if ($href = $this->v('href uri', '', $n['a'])) {
$t .= '<' . $n['doc_url'] . '> rdfs:seeAlso <' . $href . '> . ';
if ($v = $this->v('type', '', $n['a'])) {
$t .= '<' .$href. '> dc:format "' . $v . '" . ';
}
if ($v = $this->v('title', '', $n['a'])) {
$t .= '<' .$href. '> dc:title "' . $v . '" . ';
}
}
}
return array($t_vals, $t);
}
function extractMeta($n, $t_vals, $t) {
if ($this->hasAttribute('http-equiv', $n, 'Content-Type') || $this->hasAttribute('http-equiv', $n, 'content-type')) {
if ($v = $this->v('content', '', $n['a'])) {
$t .= '<' . $n['doc_url'] . '> dc:format "' . $v . '" . ';
}
}
return array($t_vals, $t);
}
/* */
}
|