| 
									
										
										
										
											2018-09-25 19:30:50 +08:00
										 |  |  | <?php namespace BookStack\Entities; | 
					
						
							| 
									
										
										
										
											2016-01-21 06:13:13 +08:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2019-10-05 19:55:01 +08:00
										 |  |  | use BookStack\Entities\Managers\BookContents; | 
					
						
							|  |  |  | use BookStack\Entities\Managers\PageContent; | 
					
						
							| 
									
										
										
										
											2018-09-25 19:30:50 +08:00
										 |  |  | use BookStack\Uploads\ImageService; | 
					
						
							| 
									
										
										
										
											2019-10-05 19:55:01 +08:00
										 |  |  | use DomPDF; | 
					
						
							|  |  |  | use Exception; | 
					
						
							|  |  |  | use SnappyPDF; | 
					
						
							|  |  |  | use Throwable; | 
					
						
							| 
									
										
										
										
											2016-01-21 06:13:13 +08:00
										 |  |  | 
 | 
					
						
							|  |  |  | class ExportService | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2018-04-22 19:23:43 +08:00
										 |  |  |     protected $imageService; | 
					
						
							| 
									
										
										
										
											2017-01-21 21:53:00 +08:00
										 |  |  | 
 | 
					
						
							|  |  |  |     /** | 
					
						
							|  |  |  |      * ExportService constructor. | 
					
						
							|  |  |  |      */ | 
					
						
							| 
									
										
										
										
											2019-10-05 19:55:01 +08:00
										 |  |  |     public function __construct(ImageService $imageService) | 
					
						
							| 
									
										
										
										
											2017-01-21 21:53:00 +08:00
										 |  |  |     { | 
					
						
							| 
									
										
										
										
											2018-04-22 19:23:43 +08:00
										 |  |  |         $this->imageService = $imageService; | 
					
						
							| 
									
										
										
										
											2017-01-21 21:53:00 +08:00
										 |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2016-01-21 06:13:13 +08:00
										 |  |  |     /** | 
					
						
							|  |  |  |      * Convert a page to a self-contained HTML file. | 
					
						
							|  |  |  |      * Includes required CSS & image content. Images are base64 encoded into the HTML. | 
					
						
							| 
									
										
										
										
											2019-10-05 19:55:01 +08:00
										 |  |  |      * @throws Throwable | 
					
						
							| 
									
										
										
										
											2016-01-21 06:13:13 +08:00
										 |  |  |      */ | 
					
						
							|  |  |  |     public function pageToContainedHtml(Page $page) | 
					
						
							| 
									
										
										
										
											2016-02-01 01:53:30 +08:00
										 |  |  |     { | 
					
						
							| 
									
										
										
										
											2019-10-05 19:55:01 +08:00
										 |  |  |         $page->html = (new PageContent($page))->render(); | 
					
						
							| 
									
										
										
										
											2017-02-26 21:26:51 +08:00
										 |  |  |         $pageHtml = view('pages/export', [ | 
					
						
							| 
									
										
										
										
											2017-08-28 20:38:32 +08:00
										 |  |  |             'page' => $page | 
					
						
							| 
									
										
										
										
											2017-02-26 21:26:51 +08:00
										 |  |  |         ])->render(); | 
					
						
							| 
									
										
										
										
											2016-02-01 01:53:30 +08:00
										 |  |  |         return $this->containHtml($pageHtml); | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2017-02-26 22:25:02 +08:00
										 |  |  |     /** | 
					
						
							|  |  |  |      * Convert a chapter to a self-contained HTML file. | 
					
						
							| 
									
										
										
										
											2019-10-05 19:55:01 +08:00
										 |  |  |      * @throws Throwable | 
					
						
							| 
									
										
										
										
											2017-02-26 22:25:02 +08:00
										 |  |  |      */ | 
					
						
							|  |  |  |     public function chapterToContainedHtml(Chapter $chapter) | 
					
						
							|  |  |  |     { | 
					
						
							| 
									
										
										
										
											2019-10-05 19:55:01 +08:00
										 |  |  |         $pages = $chapter->getVisiblePages(); | 
					
						
							| 
									
										
										
										
											2018-01-29 00:58:52 +08:00
										 |  |  |         $pages->each(function ($page) { | 
					
						
							| 
									
										
										
										
											2019-10-05 19:55:01 +08:00
										 |  |  |             $page->html = (new PageContent($page))->render(); | 
					
						
							| 
									
										
										
										
											2017-02-26 22:25:02 +08:00
										 |  |  |         }); | 
					
						
							|  |  |  |         $html = view('chapters/export', [ | 
					
						
							|  |  |  |             'chapter' => $chapter, | 
					
						
							|  |  |  |             'pages' => $pages | 
					
						
							|  |  |  |         ])->render(); | 
					
						
							|  |  |  |         return $this->containHtml($html); | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2016-02-01 01:53:30 +08:00
										 |  |  |     /** | 
					
						
							| 
									
										
										
										
											2017-02-26 21:26:51 +08:00
										 |  |  |      * Convert a book to a self-contained HTML file. | 
					
						
							| 
									
										
										
										
											2019-10-05 19:55:01 +08:00
										 |  |  |      * @throws Throwable | 
					
						
							| 
									
										
										
										
											2017-02-26 21:26:51 +08:00
										 |  |  |      */ | 
					
						
							|  |  |  |     public function bookToContainedHtml(Book $book) | 
					
						
							|  |  |  |     { | 
					
						
							| 
									
										
										
										
											2019-10-05 19:55:01 +08:00
										 |  |  |         $bookTree = (new BookContents($book))->getTree(false, true); | 
					
						
							| 
									
										
										
										
											2017-02-26 21:26:51 +08:00
										 |  |  |         $html = view('books/export', [ | 
					
						
							|  |  |  |             'book' => $book, | 
					
						
							|  |  |  |             'bookChildren' => $bookTree | 
					
						
							|  |  |  |         ])->render(); | 
					
						
							|  |  |  |         return $this->containHtml($html); | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     /** | 
					
						
							|  |  |  |      * Convert a page to a PDF file. | 
					
						
							| 
									
										
										
										
											2019-10-05 19:55:01 +08:00
										 |  |  |      * @throws Throwable | 
					
						
							| 
									
										
										
										
											2016-02-01 01:53:30 +08:00
										 |  |  |      */ | 
					
						
							|  |  |  |     public function pageToPdf(Page $page) | 
					
						
							| 
									
										
										
										
											2016-01-21 06:13:13 +08:00
										 |  |  |     { | 
					
						
							| 
									
										
										
										
											2019-10-05 19:55:01 +08:00
										 |  |  |         $page->html = (new PageContent($page))->render(); | 
					
						
							| 
									
										
										
										
											2017-02-26 21:26:51 +08:00
										 |  |  |         $html = view('pages/pdf', [ | 
					
						
							| 
									
										
										
										
											2017-08-28 20:38:32 +08:00
										 |  |  |             'page' => $page | 
					
						
							| 
									
										
										
										
											2017-02-26 21:26:51 +08:00
										 |  |  |         ])->render(); | 
					
						
							|  |  |  |         return $this->htmlToPdf($html); | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2017-02-26 22:25:02 +08:00
										 |  |  |     /** | 
					
						
							|  |  |  |      * Convert a chapter to a PDF file. | 
					
						
							| 
									
										
										
										
											2019-10-05 19:55:01 +08:00
										 |  |  |      * @throws Throwable | 
					
						
							| 
									
										
										
										
											2017-02-26 22:25:02 +08:00
										 |  |  |      */ | 
					
						
							|  |  |  |     public function chapterToPdf(Chapter $chapter) | 
					
						
							|  |  |  |     { | 
					
						
							| 
									
										
										
										
											2019-10-05 19:55:01 +08:00
										 |  |  |         $pages = $chapter->getVisiblePages(); | 
					
						
							| 
									
										
										
										
											2018-01-29 00:58:52 +08:00
										 |  |  |         $pages->each(function ($page) { | 
					
						
							| 
									
										
										
										
											2019-10-05 19:55:01 +08:00
										 |  |  |             $page->html = (new PageContent($page))->render(); | 
					
						
							| 
									
										
										
										
											2017-02-26 22:25:02 +08:00
										 |  |  |         }); | 
					
						
							| 
									
										
										
										
											2019-10-05 19:55:01 +08:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2017-02-26 22:25:02 +08:00
										 |  |  |         $html = view('chapters/export', [ | 
					
						
							|  |  |  |             'chapter' => $chapter, | 
					
						
							|  |  |  |             'pages' => $pages | 
					
						
							|  |  |  |         ])->render(); | 
					
						
							| 
									
										
										
										
											2019-10-05 19:55:01 +08:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2017-02-26 22:25:02 +08:00
										 |  |  |         return $this->htmlToPdf($html); | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2017-02-26 21:26:51 +08:00
										 |  |  |     /** | 
					
						
							| 
									
										
										
										
											2019-10-05 19:55:01 +08:00
										 |  |  |      * Convert a book to a PDF file. | 
					
						
							|  |  |  |      * @throws Throwable | 
					
						
							| 
									
										
										
										
											2017-02-26 21:26:51 +08:00
										 |  |  |      */ | 
					
						
							|  |  |  |     public function bookToPdf(Book $book) | 
					
						
							|  |  |  |     { | 
					
						
							| 
									
										
										
										
											2019-10-05 19:55:01 +08:00
										 |  |  |         $bookTree = (new BookContents($book))->getTree(false, true); | 
					
						
							| 
									
										
										
										
											2017-02-26 21:26:51 +08:00
										 |  |  |         $html = view('books/export', [ | 
					
						
							|  |  |  |             'book' => $book, | 
					
						
							|  |  |  |             'bookChildren' => $bookTree | 
					
						
							|  |  |  |         ])->render(); | 
					
						
							|  |  |  |         return $this->htmlToPdf($html); | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     /** | 
					
						
							| 
									
										
										
										
											2019-10-05 19:55:01 +08:00
										 |  |  |      * Convert normal web-page HTML to a PDF. | 
					
						
							|  |  |  |      * @throws Exception | 
					
						
							| 
									
										
										
										
											2017-02-26 21:26:51 +08:00
										 |  |  |      */ | 
					
						
							| 
									
										
										
										
											2019-10-05 19:55:01 +08:00
										 |  |  |     protected function htmlToPdf(string $html): string | 
					
						
							| 
									
										
										
										
											2017-02-26 21:26:51 +08:00
										 |  |  |     { | 
					
						
							|  |  |  |         $containedHtml = $this->containHtml($html); | 
					
						
							| 
									
										
										
										
											2017-01-01 20:20:30 +08:00
										 |  |  |         $useWKHTML = config('snappy.pdf.binary') !== false; | 
					
						
							|  |  |  |         if ($useWKHTML) { | 
					
						
							| 
									
										
										
										
											2019-10-05 19:55:01 +08:00
										 |  |  |             $pdf = SnappyPDF::loadHTML($containedHtml); | 
					
						
							| 
									
										
										
										
											2017-02-26 21:26:51 +08:00
										 |  |  |             $pdf->setOption('print-media-type', true); | 
					
						
							| 
									
										
										
										
											2017-01-01 20:20:30 +08:00
										 |  |  |         } else { | 
					
						
							| 
									
										
										
										
											2019-10-05 19:55:01 +08:00
										 |  |  |             $pdf = DomPDF::loadHTML($containedHtml); | 
					
						
							| 
									
										
										
										
											2017-01-01 20:20:30 +08:00
										 |  |  |         } | 
					
						
							| 
									
										
										
										
											2016-02-01 01:53:30 +08:00
										 |  |  |         return $pdf->output(); | 
					
						
							|  |  |  |     } | 
					
						
							| 
									
										
										
										
											2016-01-21 06:13:13 +08:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2016-02-01 01:53:30 +08:00
										 |  |  |     /** | 
					
						
							|  |  |  |      * Bundle of the contents of a html file to be self-contained. | 
					
						
							| 
									
										
										
										
											2019-10-05 19:55:01 +08:00
										 |  |  |      * @throws Exception | 
					
						
							| 
									
										
										
										
											2016-02-01 01:53:30 +08:00
										 |  |  |      */ | 
					
						
							| 
									
										
										
										
											2019-10-05 19:55:01 +08:00
										 |  |  |     protected function containHtml(string $htmlContent): string | 
					
						
							| 
									
										
										
										
											2016-02-01 01:53:30 +08:00
										 |  |  |     { | 
					
						
							| 
									
										
										
										
											2016-01-21 06:13:13 +08:00
										 |  |  |         $imageTagsOutput = []; | 
					
						
							| 
									
										
										
										
											2016-02-01 01:53:30 +08:00
										 |  |  |         preg_match_all("/\<img.*src\=(\'|\")(.*?)(\'|\").*?\>/i", $htmlContent, $imageTagsOutput); | 
					
						
							| 
									
										
										
										
											2016-01-21 06:13:13 +08:00
										 |  |  | 
 | 
					
						
							|  |  |  |         // Replace image src with base64 encoded image strings
 | 
					
						
							|  |  |  |         if (isset($imageTagsOutput[0]) && count($imageTagsOutput[0]) > 0) { | 
					
						
							|  |  |  |             foreach ($imageTagsOutput[0] as $index => $imgMatch) { | 
					
						
							| 
									
										
										
										
											2018-04-22 19:23:43 +08:00
										 |  |  |                 $oldImgTagString = $imgMatch; | 
					
						
							| 
									
										
										
										
											2016-01-21 06:13:13 +08:00
										 |  |  |                 $srcString = $imageTagsOutput[2][$index]; | 
					
						
							| 
									
										
										
										
											2018-04-22 19:23:43 +08:00
										 |  |  |                 $imageEncoded = $this->imageService->imageUriToBase64($srcString); | 
					
						
							|  |  |  |                 if ($imageEncoded === null) { | 
					
						
							|  |  |  |                     $imageEncoded = $srcString; | 
					
						
							| 
									
										
										
										
											2017-01-21 21:53:00 +08:00
										 |  |  |                 } | 
					
						
							| 
									
										
										
										
											2018-04-22 19:23:43 +08:00
										 |  |  |                 $newImgTagString = str_replace($srcString, $imageEncoded, $oldImgTagString); | 
					
						
							|  |  |  |                 $htmlContent = str_replace($oldImgTagString, $newImgTagString, $htmlContent); | 
					
						
							| 
									
										
										
										
											2016-01-21 06:13:13 +08:00
										 |  |  |             } | 
					
						
							|  |  |  |         } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         $linksOutput = []; | 
					
						
							| 
									
										
										
										
											2016-02-01 01:53:30 +08:00
										 |  |  |         preg_match_all("/\<a.*href\=(\'|\")(.*?)(\'|\").*?\>/i", $htmlContent, $linksOutput); | 
					
						
							| 
									
										
										
										
											2016-01-21 06:13:13 +08:00
										 |  |  | 
 | 
					
						
							|  |  |  |         // Replace image src with base64 encoded image strings
 | 
					
						
							|  |  |  |         if (isset($linksOutput[0]) && count($linksOutput[0]) > 0) { | 
					
						
							|  |  |  |             foreach ($linksOutput[0] as $index => $linkMatch) { | 
					
						
							|  |  |  |                 $oldLinkString = $linkMatch; | 
					
						
							|  |  |  |                 $srcString = $linksOutput[2][$index]; | 
					
						
							|  |  |  |                 if (strpos(trim($srcString), 'http') !== 0) { | 
					
						
							|  |  |  |                     $newSrcString = url($srcString); | 
					
						
							|  |  |  |                     $newLinkString = str_replace($srcString, $newSrcString, $oldLinkString); | 
					
						
							| 
									
										
										
										
											2016-02-01 01:53:30 +08:00
										 |  |  |                     $htmlContent = str_replace($oldLinkString, $newLinkString, $htmlContent); | 
					
						
							| 
									
										
										
										
											2016-01-21 06:13:13 +08:00
										 |  |  |                 } | 
					
						
							|  |  |  |             } | 
					
						
							|  |  |  |         } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         // Replace any relative links with system domain
 | 
					
						
							| 
									
										
										
										
											2016-02-01 01:53:30 +08:00
										 |  |  |         return $htmlContent; | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     /** | 
					
						
							|  |  |  |      * Converts the page contents into simple plain text. | 
					
						
							| 
									
										
										
										
											2017-01-21 21:53:00 +08:00
										 |  |  |      * This method filters any bad looking content to provide a nice final output. | 
					
						
							| 
									
										
										
										
											2016-02-01 01:53:30 +08:00
										 |  |  |      */ | 
					
						
							| 
									
										
										
										
											2019-10-05 19:55:01 +08:00
										 |  |  |     public function pageToPlainText(Page $page): string | 
					
						
							| 
									
										
										
										
											2016-02-01 01:53:30 +08:00
										 |  |  |     { | 
					
						
							| 
									
										
										
										
											2019-10-05 19:55:01 +08:00
										 |  |  |         $html = (new PageContent($page))->render(); | 
					
						
							| 
									
										
										
										
											2017-01-21 21:53:00 +08:00
										 |  |  |         $text = strip_tags($html); | 
					
						
							| 
									
										
										
										
											2016-02-01 01:53:30 +08:00
										 |  |  |         // Replace multiple spaces with single spaces
 | 
					
						
							|  |  |  |         $text = preg_replace('/\ {2,}/', ' ', $text); | 
					
						
							|  |  |  |         // Reduce multiple horrid whitespace characters.
 | 
					
						
							|  |  |  |         $text = preg_replace('/(\x0A|\xA0|\x0A|\r|\n){2,}/su', "\n\n", $text); | 
					
						
							|  |  |  |         $text = html_entity_decode($text); | 
					
						
							|  |  |  |         // Add title
 | 
					
						
							|  |  |  |         $text = $page->name . "\n\n" . $text; | 
					
						
							|  |  |  |         return $text; | 
					
						
							| 
									
										
										
										
											2016-01-21 06:13:13 +08:00
										 |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2017-02-26 22:25:02 +08:00
										 |  |  |     /** | 
					
						
							|  |  |  |      * Convert a chapter into a plain text string. | 
					
						
							|  |  |  |      */ | 
					
						
							| 
									
										
										
										
											2019-10-05 19:55:01 +08:00
										 |  |  |     public function chapterToPlainText(Chapter $chapter): string | 
					
						
							| 
									
										
										
										
											2017-02-26 22:25:02 +08:00
										 |  |  |     { | 
					
						
							|  |  |  |         $text = $chapter->name . "\n\n"; | 
					
						
							|  |  |  |         $text .= $chapter->description . "\n\n"; | 
					
						
							|  |  |  |         foreach ($chapter->pages as $page) { | 
					
						
							|  |  |  |             $text .= $this->pageToPlainText($page); | 
					
						
							|  |  |  |         } | 
					
						
							|  |  |  |         return $text; | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2017-02-26 21:26:51 +08:00
										 |  |  |     /** | 
					
						
							|  |  |  |      * Convert a book into a plain text string. | 
					
						
							|  |  |  |      */ | 
					
						
							| 
									
										
										
										
											2019-10-05 19:55:01 +08:00
										 |  |  |     public function bookToPlainText(Book $book): string | 
					
						
							| 
									
										
										
										
											2017-02-26 21:26:51 +08:00
										 |  |  |     { | 
					
						
							| 
									
										
										
										
											2019-10-05 19:55:01 +08:00
										 |  |  |         $bookTree = (new BookContents($book))->getTree(false, true); | 
					
						
							| 
									
										
										
										
											2017-02-26 21:26:51 +08:00
										 |  |  |         $text = $book->name . "\n\n"; | 
					
						
							|  |  |  |         foreach ($bookTree as $bookChild) { | 
					
						
							|  |  |  |             if ($bookChild->isA('chapter')) { | 
					
						
							| 
									
										
										
										
											2017-02-26 22:25:02 +08:00
										 |  |  |                 $text .= $this->chapterToPlainText($bookChild); | 
					
						
							| 
									
										
										
										
											2017-02-26 21:26:51 +08:00
										 |  |  |             } else { | 
					
						
							|  |  |  |                 $text .= $this->pageToPlainText($bookChild); | 
					
						
							|  |  |  |             } | 
					
						
							|  |  |  |         } | 
					
						
							|  |  |  |         return $text; | 
					
						
							|  |  |  |     } | 
					
						
							| 
									
										
										
										
											2016-02-01 01:53:30 +08:00
										 |  |  | } |