X-Git-Url: http://source.bookstackapp.com/bookstack/blobdiff_plain/ea2e16cabb5ca5815dd1ee5b8eb1ac6a32bac57e..refs/pull/261/head:/app/Services/ExportService.php diff --git a/app/Services/ExportService.php b/app/Services/ExportService.php index 05ba85dd1..78cef41a4 100644 --- a/app/Services/ExportService.php +++ b/app/Services/ExportService.php @@ -1,11 +1,23 @@ entityRepo = $entityRepo; + } /** * Convert a page to a self-contained HTML file. @@ -15,31 +27,146 @@ class ExportService */ public function pageToContainedHtml(Page $page) { - $cssContent = file_get_contents(public_path('/css/export-styles.css')); - $pageHtml = view('pages/pdf', ['page' => $page, 'css' => $cssContent])->render(); + $pageHtml = view('pages/export', [ + 'page' => $page, + 'pageContent' => $this->entityRepo->renderPage($page) + ])->render(); + return $this->containHtml($pageHtml); + } + + /** + * Convert a chapter to a self-contained HTML file. + * @param Chapter $chapter + * @return mixed|string + */ + public function chapterToContainedHtml(Chapter $chapter) + { + $pages = $this->entityRepo->getChapterChildren($chapter); + $pages->each(function($page) { + $page->html = $this->entityRepo->renderPage($page); + }); + $html = view('chapters/export', [ + 'chapter' => $chapter, + 'pages' => $pages + ])->render(); + return $this->containHtml($html); + } + + /** + * Convert a book to a self-contained HTML file. + * @param Book $book + * @return mixed|string + */ + public function bookToContainedHtml(Book $book) + { + $bookTree = $this->entityRepo->getBookChildren($book, true, true); + $html = view('books/export', [ + 'book' => $book, + 'bookChildren' => $bookTree + ])->render(); + return $this->containHtml($html); + } + + /** + * Convert a page to a PDF file. + * @param Page $page + * @return mixed|string + */ + public function pageToPdf(Page $page) + { + $html = view('pages/pdf', [ + 'page' => $page, + 'pageContent' => $this->entityRepo->renderPage($page) + ])->render(); + return $this->htmlToPdf($html); + } + + /** + * Convert a chapter to a PDF file. + * @param Chapter $chapter + * @return mixed|string + */ + public function chapterToPdf(Chapter $chapter) + { + $pages = $this->entityRepo->getChapterChildren($chapter); + $pages->each(function($page) { + $page->html = $this->entityRepo->renderPage($page); + }); + $html = view('chapters/export', [ + 'chapter' => $chapter, + 'pages' => $pages + ])->render(); + return $this->htmlToPdf($html); + } + + /** + * Convert a book to a PDF file + * @param Book $book + * @return string + */ + public function bookToPdf(Book $book) + { + $bookTree = $this->entityRepo->getBookChildren($book, true, true); + $html = view('books/export', [ + 'book' => $book, + 'bookChildren' => $bookTree + ])->render(); + return $this->htmlToPdf($html); + } + + /** + * Convert normal webpage HTML to a PDF. + * @param $html + * @return string + */ + protected function htmlToPdf($html) + { + $containedHtml = $this->containHtml($html); + $useWKHTML = config('snappy.pdf.binary') !== false; + if ($useWKHTML) { + $pdf = \SnappyPDF::loadHTML($containedHtml); + $pdf->setOption('print-media-type', true); + } else { + $pdf = \PDF::loadHTML($containedHtml); + } + return $pdf->output(); + } + /** + * Bundle of the contents of a html file to be self-contained. + * @param $htmlContent + * @return mixed|string + */ + protected function containHtml($htmlContent) + { $imageTagsOutput = []; - preg_match_all("/\/i", $pageHtml, $imageTagsOutput); + preg_match_all("/\/i", $htmlContent, $imageTagsOutput); // Replace image src with base64 encoded image strings if (isset($imageTagsOutput[0]) && count($imageTagsOutput[0]) > 0) { foreach ($imageTagsOutput[0] as $index => $imgMatch) { $oldImgString = $imgMatch; $srcString = $imageTagsOutput[2][$index]; - if (strpos(trim($srcString), 'http') !== 0) { - $pathString = public_path($srcString); + $isLocal = strpos(trim($srcString), 'http') !== 0; + if ($isLocal) { + $pathString = public_path(trim($srcString, '/')); } else { $pathString = $srcString; } - $imageContent = file_get_contents($pathString); - $imageEncoded = 'data:image/' . pathinfo($pathString, PATHINFO_EXTENSION) . ';base64,' . base64_encode($imageContent); - $newImageString = str_replace($srcString, $imageEncoded, $oldImgString); - $pageHtml = str_replace($oldImgString, $newImageString, $pageHtml); + if ($isLocal && !file_exists($pathString)) continue; + try { + $imageContent = file_get_contents($pathString); + $imageEncoded = 'data:image/' . pathinfo($pathString, PATHINFO_EXTENSION) . ';base64,' . base64_encode($imageContent); + $newImageString = str_replace($srcString, $imageEncoded, $oldImgString); + } catch (\ErrorException $e) { + $newImageString = ''; + } + $htmlContent = str_replace($oldImgString, $newImageString, $htmlContent); } } $linksOutput = []; - preg_match_all("/\/i", $pageHtml, $linksOutput); + preg_match_all("/\/i", $htmlContent, $linksOutput); // Replace image src with base64 encoded image strings if (isset($linksOutput[0]) && count($linksOutput[0]) > 0) { @@ -49,13 +176,79 @@ class ExportService if (strpos(trim($srcString), 'http') !== 0) { $newSrcString = url($srcString); $newLinkString = str_replace($srcString, $newSrcString, $oldLinkString); - $pageHtml = str_replace($oldLinkString, $newLinkString, $pageHtml); + $htmlContent = str_replace($oldLinkString, $newLinkString, $htmlContent); } } } // Replace any relative links with system domain - return $pageHtml; + return $htmlContent; + } + + /** + * Converts the page contents into simple plain text. + * This method filters any bad looking content to provide a nice final output. + * @param Page $page + * @return mixed + */ + public function pageToPlainText(Page $page) + { + $html = $this->entityRepo->renderPage($page); + $text = strip_tags($html); + // Replace multiple spaces with single spaces + $text = preg_replace('/\ {2,}/', ' ', $text); + // Reduce multiple horrid whitespace characters. + $text = preg_replace('/(\x0A|\xA0|\x0A|\r|\n){2,}/su', "\n\n", $text); + $text = html_entity_decode($text); + // Add title + $text = $page->name . "\n\n" . $text; + return $text; + } + + /** + * Convert a chapter into a plain text string. + * @param Chapter $chapter + * @return string + */ + public function chapterToPlainText(Chapter $chapter) + { + $text = $chapter->name . "\n\n"; + $text .= $chapter->description . "\n\n"; + foreach ($chapter->pages as $page) { + $text .= $this->pageToPlainText($page); + } + return $text; + } + + /** + * Convert a book into a plain text string. + * @param Book $book + * @return string + */ + public function bookToPlainText(Book $book) + { + $bookTree = $this->entityRepo->getBookChildren($book, true, true); + $text = $book->name . "\n\n"; + foreach ($bookTree as $bookChild) { + if ($bookChild->isA('chapter')) { + $text .= $this->chapterToPlainText($bookChild); + } else { + $text .= $this->pageToPlainText($bookChild); + } + } + return $text; } -} \ No newline at end of file +} + + + + + + + + + + + +