entityRepo = $entityRepo; } /** * Convert a page to a self-contained HTML file. * Includes required CSS & image content. Images are base64 encoded into the HTML. * @param Page $page * @return mixed|string */ public function pageToContainedHtml(Page $page) { $pageHtml = view('pages/export', [ 'page' => $page, 'pageContent' => $this->entityRepo->renderPage($page) ])->render(); return $this->containHtml($pageHtml); } /** * Convert a book to a self-contained HTML file. * @param Book $book * @return mixed|string */ public function bookToContainedHtml(Book $book) { $bookTree = $this->entityRepo->getBookChildren($book, true, true); $html = view('books/export', [ 'book' => $book, 'bookChildren' => $bookTree ])->render(); return $this->containHtml($html); } /** * Convert a page to a PDF file. * @param Page $page * @return mixed|string */ public function pageToPdf(Page $page) { $html = view('pages/pdf', [ 'page' => $page, 'pageContent' => $this->entityRepo->renderPage($page) ])->render(); return $this->htmlToPdf($html); } /** * Convert a book to a PDF file * @param Book $book * @return string */ public function bookToPdf(Book $book) { $bookTree = $this->entityRepo->getBookChildren($book, true, true); $html = view('books/export', [ 'book' => $book, 'bookChildren' => $bookTree ])->render(); return $this->htmlToPdf($html); } /** * Convert normal webpage HTML to a PDF. * @param $html * @return string */ protected function htmlToPdf($html) { $containedHtml = $this->containHtml($html); $useWKHTML = config('snappy.pdf.binary') !== false; if ($useWKHTML) { $pdf = \SnappyPDF::loadHTML($containedHtml); $pdf->setOption('print-media-type', true); } else { $pdf = \PDF::loadHTML($containedHtml); } return $pdf->output(); } /** * Bundle of the contents of a html file to be self-contained. * @param $htmlContent * @return mixed|string */ protected function containHtml($htmlContent) { $imageTagsOutput = []; preg_match_all("/\/i", $htmlContent, $imageTagsOutput); // Replace image src with base64 encoded image strings if (isset($imageTagsOutput[0]) && count($imageTagsOutput[0]) > 0) { foreach ($imageTagsOutput[0] as $index => $imgMatch) { $oldImgString = $imgMatch; $srcString = $imageTagsOutput[2][$index]; $isLocal = strpos(trim($srcString), 'http') !== 0; if ($isLocal) { $pathString = public_path(trim($srcString, '/')); } else { $pathString = $srcString; } if ($isLocal && !file_exists($pathString)) continue; try { $imageContent = file_get_contents($pathString); $imageEncoded = 'data:image/' . pathinfo($pathString, PATHINFO_EXTENSION) . ';base64,' . base64_encode($imageContent); $newImageString = str_replace($srcString, $imageEncoded, $oldImgString); } catch (\ErrorException $e) { $newImageString = ''; } $htmlContent = str_replace($oldImgString, $newImageString, $htmlContent); } } $linksOutput = []; preg_match_all("/\/i", $htmlContent, $linksOutput); // Replace image src with base64 encoded image strings if (isset($linksOutput[0]) && count($linksOutput[0]) > 0) { foreach ($linksOutput[0] as $index => $linkMatch) { $oldLinkString = $linkMatch; $srcString = $linksOutput[2][$index]; if (strpos(trim($srcString), 'http') !== 0) { $newSrcString = url($srcString); $newLinkString = str_replace($srcString, $newSrcString, $oldLinkString); $htmlContent = str_replace($oldLinkString, $newLinkString, $htmlContent); } } } // Replace any relative links with system domain return $htmlContent; } /** * Converts the page contents into simple plain text. * This method filters any bad looking content to provide a nice final output. * @param Page $page * @return mixed */ public function pageToPlainText(Page $page) { $html = $this->entityRepo->renderPage($page); $text = strip_tags($html); // Replace multiple spaces with single spaces $text = preg_replace('/\ {2,}/', ' ', $text); // Reduce multiple horrid whitespace characters. $text = preg_replace('/(\x0A|\xA0|\x0A|\r|\n){2,}/su', "\n\n", $text); $text = html_entity_decode($text); // Add title $text = $page->name . "\n\n" . $text; return $text; } /** * Convert a book into a plain text string. * @param Book $book * @return string */ public function bookToPlainText(Book $book) { $bookTree = $this->entityRepo->getBookChildren($book, true, true); $text = $book->name . "\n\n"; foreach ($bookTree as $bookChild) { if ($bookChild->isA('chapter')) { $text .= $bookChild->name . "\n\n"; $text .= $bookChild->description . "\n\n"; foreach ($bookChild->pages as $page) { $text .= $this->pageToPlainText($page); } } else { $text .= $this->pageToPlainText($bookChild); } } return $text; } }