Blame view
sources/apps/search_lucene/document/OpenDocument.php
2.45 KB
|
42e4f8d60
|
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 |
<?php
namespace OCA\Search_Lucene\Document;
/**
 * Abstract Zend Lucene document with shared helpers for OpenDocument packages.
 *
 * Offers metadata extraction from the package's "meta.xml" entry and
 * normalisation of paths that point inside the zip package.
 */
abstract class OpenDocument extends \Zend_Search_Lucene_Document
{
    // XPath expressions used to look up the individual metadata fields in meta.xml.
    const OASIS_XPATH_TITLE = '//dc:title';
    const OASIS_XPATH_SUBJECT = '//dc:subject';
    const OASIS_XPATH_CREATOR = '//meta:initial-creator';
    const OASIS_XPATH_KEYWORDS = '//meta:keyword';
    const OASIS_XPATH_CREATED = '//meta:creation-date';
    const OASIS_XPATH_MODIFIED = '//dc:date';

    /**
     * Extract metadata from document
     *
     * Reads the "meta.xml" entry of the package and collects the values found
     * under the OASIS_XPATH_* expressions. Multiple matches for one field are
     * joined with a single space.
     *
     * @param \ZipArchive $package ZipArchive OpenDocument package
     * @return array Key-value pairs containing document meta data with the keys
     *               'title', 'subject', 'creator', 'keywords', 'created' and
     *               'modified'; an empty array when "meta.xml" cannot be read
     *               or parsed
     */
    protected function extractMetaData(\ZipArchive $package)
    {
        // Data holders
        $coreProperties = array();

        // getFromName() returns false when the entry is missing or unreadable;
        // do not hand a non-string (or nothing at all) to the XML parser.
        $metaXml = $package->getFromName("meta.xml");
        if (!is_string($metaXml) || $metaXml === '') {
            return $coreProperties;
        }

        // Read relations and search for core properties
        $sxe = simplexml_load_string($metaXml);
        if (!($sxe instanceof \SimpleXMLElement)) {
            return $coreProperties;
        }

        $coreProperties['title'] = $this->extractTermsFromMetadata($sxe, static::OASIS_XPATH_TITLE);
        $coreProperties['subject'] = $this->extractTermsFromMetadata($sxe, static::OASIS_XPATH_SUBJECT);
        $coreProperties['creator'] = $this->extractTermsFromMetadata($sxe, static::OASIS_XPATH_CREATOR);
        $coreProperties['keywords'] = $this->extractTermsFromMetadata($sxe, static::OASIS_XPATH_KEYWORDS);

        // Replace the 'T' in the date strings with a space,
        // e.g. '2013-01-01T10:00:00' becomes '2013-01-01 10:00:00'.
        $coreProperties['created'] = str_replace(
            'T',
            ' ',
            $this->extractTermsFromMetadata($sxe, static::OASIS_XPATH_CREATED)
        );
        $coreProperties['modified'] = str_replace(
            'T',
            ' ',
            $this->extractTermsFromMetadata($sxe, static::OASIS_XPATH_MODIFIED)
        );

        return $coreProperties;
    }

    /**
     * Collect the text of every node matched by an XPath expression.
     *
     * @param \SimpleXMLElement $sxe  Parsed XML to search
     * @param string            $path XPath expression to evaluate
     * @return string Text of all matching nodes joined with a single space;
     *                an empty string when nothing matches or the expression
     *                cannot be evaluated
     */
    private function extractTermsFromMetadata(\SimpleXMLElement $sxe, $path)
    {
        // xpath() does not return an array when evaluation fails (for example
        // when the document does not declare a namespace prefix used in $path),
        // so guard before iterating.
        $nodes = $sxe->xpath($path);
        if (!is_array($nodes)) {
            return '';
        }

        $terms = array();
        foreach ($nodes as $value) {
            $terms[] = (string)$value;
        }

        return implode(' ', $terms);
    }

    /**
     * Determine absolute zip path
     *
     * Treats both '/' and '\' as separators, drops empty and '.' segments and
     * resolves '..' against the segments collected so far, e.g.
     * 'a/./b/../c' becomes 'a/c'. A '..' with no preceding segment is ignored.
     *
     * @param string $path
     * @return string Normalised path using '/' as separator, without a leading
     *                or trailing slash
     */
    protected function absoluteZipPath($path)
    {
        // Normalise straight to '/', so the result does not depend on the
        // platform's DIRECTORY_SEPARATOR.
        $path = str_replace('\\', '/', $path);
        $parts = array_filter(explode('/', $path), 'strlen');

        $absolutes = array();
        foreach ($parts as $part) {
            if ('.' === $part) {
                continue;
            }
            if ('..' === $part) {
                array_pop($absolutes);
            } else {
                $absolutes[] = $part;
            }
        }

        return implode('/', $absolutes);
    }
}
|