Blame view

sources/apps/search_lucene/document/OpenDocument.php 2.55 KB
d1bafeea1   Kload   [fix] Upgrade to ...
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
  <?php
  
  namespace OCA\Search_Lucene\Document;
  /**
   * OpenDocument document for Zend_Search_Lucene.
   *
   * Bundles helpers for subclasses: reading the metadata stored in the
   * package's meta.xml entry and normalising paths inside the zip package.
   */
  abstract class OpenDocument extends \Zend_Search_Lucene_Document
  {
      // XPath expressions used to locate the metadata elements in meta.xml.
      const OASIS_XPATH_TITLE    = '//dc:title';
      const OASIS_XPATH_SUBJECT  = '//dc:subject';
      const OASIS_XPATH_CREATOR  = '//meta:initial-creator';
      const OASIS_XPATH_KEYWORDS = '//meta:keyword';
      const OASIS_XPATH_CREATED  = '//meta:creation-date';
      const OASIS_XPATH_MODIFIED = '//dc:date';
  
      /**
       * Extract metadata from the package's meta.xml entry.
       *
       * @param \ZipArchive $package ZipArchive OpenDocument package
       * @return array Key-value pairs containing document meta data (keys: title,
       *               subject, creator, keywords, created, modified). Empty when
       *               meta.xml is missing or cannot be parsed.
       */
      protected function extractMetaData(\ZipArchive $package)
      {
          // Data holder
          $coreProperties = array();
  
          // getFromName() yields false when the entry is absent or unreadable;
          // bail out instead of handing a non-string to the XML parser.
          $metaXml = $package->getFromName('meta.xml');
          if (!is_string($metaXml) || $metaXml === '') {
              return $coreProperties;
          }
  
          // libxml_disable_entity_loader() is deprecated as of PHP 8.0, which
          // requires a libxml version that does not load external entities by
          // default. Only toggle the loader on older runtimes.
          $toggleEntityLoader = \PHP_VERSION_ID < 80000;
          $loadEntities = false;
          if ($toggleEntityLoader) {
              $loadEntities = libxml_disable_entity_loader(true);
          }
          $sxe = simplexml_load_string($metaXml);
          if ($toggleEntityLoader) {
              // Restore whatever setting was active before this call.
              libxml_disable_entity_loader($loadEntities);
          }
  
          // simplexml_load_string() returns false when the XML cannot be parsed.
          if (!($sxe instanceof \SimpleXMLElement)) {
              return $coreProperties;
          }
  
          $coreProperties['title']    = $this->extractTermsFromMetadata($sxe, static::OASIS_XPATH_TITLE);
          $coreProperties['subject']  = $this->extractTermsFromMetadata($sxe, static::OASIS_XPATH_SUBJECT);
          $coreProperties['creator']  = $this->extractTermsFromMetadata($sxe, static::OASIS_XPATH_CREATOR);
          $coreProperties['keywords'] = $this->extractTermsFromMetadata($sxe, static::OASIS_XPATH_KEYWORDS);
  
          // Replace T in the date strings with ' '.
          $coreProperties['created']  = str_replace(
              'T',
              ' ',
              $this->extractTermsFromMetadata($sxe, static::OASIS_XPATH_CREATED)
          );
          $coreProperties['modified'] = str_replace(
              'T',
              ' ',
              $this->extractTermsFromMetadata($sxe, static::OASIS_XPATH_MODIFIED)
          );
  
          return $coreProperties;
      }
  
      /**
       * Collect the text of every node matching an XPath expression.
       *
       * @param \SimpleXMLElement $sxe  Parsed meta.xml document
       * @param string            $path XPath expression to evaluate
       * @return string Matched node values joined by a single space; empty string
       *                when nothing matches or the expression cannot be evaluated.
       */
      private function extractTermsFromMetadata(\SimpleXMLElement $sxe, $path)
      {
          // xpath() does not always return an array: it yields false on error,
          // e.g. when the document does not declare a namespace prefix used in
          // the expression. Iterating over that would raise a further warning.
          $nodes = $sxe->xpath($path);
          if (!is_array($nodes)) {
              return '';
          }
  
          $terms = array();
          foreach ($nodes as $node) {
              $terms[] = (string)$node;
          }
  
          return implode(' ', $terms);
      }
  
      /**
       * Determine absolute zip path.
       *
       * Resolves '.' and '..' segments and returns the remaining segments joined
       * by '/', without a leading or trailing slash. A '..' that would climb above
       * the root is dropped.
       *
       * @param string $path Path using '/' or '\' as separator
       * @return string
       */
      protected function absoluteZipPath($path)
      {
          $path = str_replace(array('/', '\\'), DIRECTORY_SEPARATOR, $path);
  
          // 'strlen' as the filter drops empty segments (duplicate or leading
          // separators) while keeping a segment such as "0", which the default
          // array_filter() callback would discard.
          $parts = array_filter(explode(DIRECTORY_SEPARATOR, $path), 'strlen');
  
          $absolutes = array();
          foreach ($parts as $part) {
              if ('.' === $part) {
                  continue;
              }
              if ('..' === $part) {
                  // array_pop() on an empty array is a no-op.
                  array_pop($absolutes);
              } else {
                  $absolutes[] = $part;
              }
          }
  
          return implode('/', $absolutes);
      }
  }