/** * @param string $content * @param Document $document * @param int $offset * * @return bool|ElementHexa */ public static function parse($content, Document $document = null, &$offset = 0) { if (preg_match('/^\\s*\\<(?P<name>[A-F0-9]+)\\>/is', $content, $match)) { $name = $match['name']; $offset += strpos($content, '<' . $name) + strlen($name) + 2; // 1 for '>' // repackage string as standard $name = '(' . self::decode($name, $document) . ')'; $element = false; if (!($element = ElementDate::parse($name, $document))) { $element = ElementString::parse($name, $document); } return $element; } return false; }
/** * @param $type * @param $value * @param $document * * @return Element|Header * @throws \Exception */ protected function parseHeaderElement($type, $value, $document) { switch ($type) { case '<<': return $this->parseHeader($value, $document); case 'numeric': return new ElementNumeric($value, $document); case 'boolean': return new ElementBoolean($value, $document); case 'null': return new ElementNull($value, $document); case '(': if ($date = ElementDate::parse('(' . $value . ')', $document)) { return $date; } else { return ElementString::parse('(' . $value . ')', $document); } case '<': return $this->parseHeaderElement('(', ElementHexa::decode($value, $document), $document); case '/': return ElementName::parse('/' . $value, $document); case 'ojbref': // old mistake in tcpdf parser // old mistake in tcpdf parser case 'objref': return new ElementXRef($value, $document); case '[': $values = array(); foreach ($value as $sub_element) { $sub_type = $sub_element[0]; $sub_value = $sub_element[1]; $values[] = $this->parseHeaderElement($sub_type, $sub_value, $document); } return new ElementArray($values, $document); case 'endstream': case 'obj': //I don't know what it means but got my project fixed. //I don't know what it means but got my project fixed. case '': // Nothing to do with. break; default: throw new \Exception('Invalid type: "' . $type . '".'); } }
public function testParse() { // Skipped. $offset = 0; $element = \Smalot\PdfParser\Element\ElementDate::parse('ABC', null, $offset); $this->assert->boolean($element)->isEqualTo(false); $this->assert->integer($offset)->isEqualTo(0); $offset = 0; $element = \Smalot\PdfParser\Element\ElementDate::parse(' [ (ABC) 5 6 ]', null, $offset); $this->assert->boolean($element)->isEqualTo(false); $this->assert->integer($offset)->isEqualTo(0); $offset = 0; $element = \Smalot\PdfParser\Element\ElementDate::parse(' << (invalid) >>', null, $offset); $this->assert->boolean($element)->isEqualTo(false); $this->assert->integer($offset)->isEqualTo(0); $offset = 0; $element = \Smalot\PdfParser\Element\ElementDate::parse(' / (FlateDecode) ', null, $offset); $this->assert->boolean($element)->isEqualTo(false); $this->assert->integer($offset)->isEqualTo(0); $offset = 0; $element = \Smalot\PdfParser\Element\ElementDate::parse(' 0 (FlateDecode) ', null, $offset); $this->assert->boolean($element)->isEqualTo(false); $this->assert->integer($offset)->isEqualTo(0); $offset = 0; $element = \Smalot\PdfParser\Element\ElementDate::parse(" 0 \n (FlateDecode) ", null, $offset); $this->assert->boolean($element)->isEqualTo(false); $this->assert->integer($offset)->isEqualTo(0); // Valid. $offset = 0; $element = \Smalot\PdfParser\Element\ElementDate::parse(' (D:20130901235555+02\'00\') ', null, $offset); $element->setFormat('c'); $this->assert->object($element->getContent())->isInstanceOf('\\DateTime'); $this->assert->castToString($element)->isEqualTo('2013-09-01T23:55:55+02:00'); $this->assert->integer($offset)->isEqualTo(26); $offset = 0; $element = \Smalot\PdfParser\Element\ElementDate::parse(' (D:20130901235555+02\'00\') ', null, $offset); $element->setFormat('c'); $this->assert->object($element->getContent())->isInstanceOf('\\DateTime'); $this->assert->castToString($element)->isEqualTo('2013-09-01T23:55:55+02:00'); $this->assert->integer($offset)->isEqualTo(26); $offset = 0; $element = \Smalot\PdfParser\Element\ElementDate::parse(' (D:20130901235555+02\'00\')', null, $offset); $element->setFormat('c'); $this->assert->object($element->getContent())->isInstanceOf('\\DateTime'); $this->assert->castToString($element)->isEqualTo('2013-09-01T23:55:55+02:00'); $this->assert->integer($offset)->isEqualTo(26); $offset = 0; $element = \Smalot\PdfParser\Element\ElementDate::parse('(D:20130901235555+02\'00\')', null, $offset); $element->setFormat('c'); $this->assert->object($element->getContent())->isInstanceOf('\\DateTime'); $this->assert->castToString($element)->isEqualTo('2013-09-01T23:55:55+02:00'); $this->assert->integer($offset)->isEqualTo(25); $offset = 0; $element = \Smalot\PdfParser\Element\ElementDate::parse(" \n (D:20130901235555+02'00') ", null, $offset); $element->setFormat('c'); $this->assert->object($element->getContent())->isInstanceOf('\\DateTime'); $this->assert->castToString($element)->isEqualTo('2013-09-01T23:55:55+02:00'); $this->assert->integer($offset)->isEqualTo(28); $offset = 0; $element = \Smalot\PdfParser\Element\ElementDate::parse(" \n (D:20130901235555) ", null, $offset); $element->setFormat('c'); $this->assert->object($element->getContent())->isInstanceOf('\\DateTime'); $this->assert->boolean($element->equals(new \DateTime('2013-09-01T23:55:55')))->isEqualTo(true); $this->assert->integer($offset)->isEqualTo(21); $offset = 0; $element = \Smalot\PdfParser\Element\ElementDate::parse("(D:20131206091846Z00'00')", null, $offset); $element->setFormat('c'); $this->assert->object($element->getContent())->isInstanceOf('\\DateTime'); //$this->assert->boolean($element->equals(new \DateTime('2013-09-01T23:55:55')))->isEqualTo(true); $this->assert->integer($offset)->isEqualTo(25); // Format invalid $offset = 0; $element = \Smalot\PdfParser\Element\ElementDate::parse(" \n (D:2013+02'00') ", null, $offset); $this->assert->boolean($element)->isEqualTo(false); $this->assert->integer($offset)->isEqualTo(0); }
/** * @param string $content * @param Document $document * @param int $position * * @return array * @throws \Exception */ public static function parse($content, Document $document = null, &$position = 0) { $args = func_get_args(); $only_values = isset($args[3]) ? $args[3] : false; $content = trim($content); $values = array(); do { $old_position = $position; if (!$only_values) { if (!preg_match('/^\\s*(?P<name>\\/[A-Z0-9\\._]+)(?P<value>.*)/si', substr($content, $position), $match)) { break; } else { $name = ltrim($match['name'], '/'); $value = $match['value']; $position = strpos($content, $value, $position + strlen($match['name'])); } } else { $name = count($values); $value = substr($content, $position); } if ($element = ElementName::parse($value, $document, $position)) { $values[$name] = $element; } elseif ($element = ElementXRef::parse($value, $document, $position)) { $values[$name] = $element; } elseif ($element = ElementNumeric::parse($value, $document, $position)) { $values[$name] = $element; } elseif ($element = ElementStruct::parse($value, $document, $position)) { $values[$name] = $element; } elseif ($element = ElementBoolean::parse($value, $document, $position)) { $values[$name] = $element; } elseif ($element = ElementNull::parse($value, $document, $position)) { $values[$name] = $element; } elseif ($element = ElementDate::parse($value, $document, $position)) { $values[$name] = $element; } elseif ($element = ElementString::parse($value, $document, $position)) { $values[$name] = $element; } elseif ($element = ElementHexa::parse($value, $document, $position)) { $values[$name] = $element; } elseif ($element = ElementArray::parse($value, $document, $position)) { $values[$name] = $element; } else { $position = $old_position; break; } } while ($position < strlen($content)); return $values; }