* @date 2017-01-03
 * @license LGPLv3
 * @url
 *
 * PdfParser is a pdf library written in PHP, extraction oriented.
 * Copyright (C) 2017 - Sébastien MALOT
 *
 * This program is free software: you can redistribute it and/or modify
 * it under the terms of the GNU Lesser General Public License as published by
 * the Free Software Foundation, either version 3 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 * GNU Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public License
 * along with this program.
 * If not, see <http://www.gnu.org/licenses/>.
 *
 */

namespace Smalot\PdfParser\Element;

use Smalot\PdfParser\Element;
use Smalot\PdfParser\Document;
use Smalot\PdfParser\Header;

/**
 * Class ElementStruct
 *
 * Recognises a '<<' ... '>>' delimited structure at the start of a content
 * string and turns its inner content into a Header.
 *
 * @package Smalot\PdfParser\Element
 */
class ElementStruct extends Element
{
    /**
     * Parses a '<<' ... '>>' structure located at the beginning of $content.
     *
     * Nested '<<' / '>>' pairs are tracked so that the structure ends at the
     * '>>' balancing the opening '<<'. The text between the outer delimiters
     * is handed to Element::parse() and the result is wrapped in a Header.
     *
     * @param string   $content  Raw content to inspect.
     * @param Document $document Document forwarded to Element::parse() and Header.
     * @param int      $offset   Incremented by the position of the opening '<<'
     *                           in $content plus the length of the consumed
     *                           structure text.
     *
     * @return bool|Header The resulting Header, or false when $content does not
     *                     start (after optional whitespace) with '<<'.
     */
    public static function parse($content, Document $document = null, &$offset = 0)
    {
        // Only the '<<' prefix matters here; nothing is captured from this test.
        if (!preg_match('/^\s*<</', $content)) {
            return false;
        }

        // Split into chunks that each end with exactly one '<<' or '>>' delimiter.
        preg_match_all('/(.*?)(<<|>>)/s', trim($content), $matches);

        $level = 0;
        $sub = '';

        foreach ($matches[0] as $index => $part) {
            $sub .= $part;
            // The second capture group is the delimiter terminating this chunk.
            $level += ($matches[2][$index] === '<<' ? 1 : -1);

            // Stop as soon as the opening '<<' has been balanced.
            if ($level <= 0) {
                break;
            }
        }

        // $sub was built from the trimmed content, so the leading whitespace is
        // accounted for through the position of the first '<<' in $content.
        $offset += strpos($content, '<<') + strlen(rtrim($sub));

        // Removes '<<' and '>>'.
        $sub = trim(preg_replace('/^\s*<<(.*)>>\s*$/s', '\\1', $sub));

        $position = 0;
        $elements = Element::parse($sub, $document, $position);

        return new Header($elements, $document);
    }
}