| 
									
										
										
										
											2016-01-21 06:13:13 +08:00
										 |  |  | <?php namespace BookStack\Services; | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2017-02-26 21:26:51 +08:00
										 |  |  | use BookStack\Book; | 
					
						
							| 
									
										
										
										
											2017-02-26 22:25:02 +08:00
										 |  |  | use BookStack\Chapter; | 
					
						
							| 
									
										
										
										
											2016-01-21 06:13:13 +08:00
										 |  |  | use BookStack\Page; | 
					
						
							| 
									
										
										
										
											2017-01-21 21:53:00 +08:00
										 |  |  | use BookStack\Repos\EntityRepo; | 
					
						
							| 
									
										
										
										
											2016-01-21 06:13:13 +08:00
										 |  |  | 
 | 
					
						
							|  |  |  | class ExportService | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2017-01-21 21:53:00 +08:00
										 |  |  |     protected $entityRepo; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     /** | 
					
						
							|  |  |  |      * ExportService constructor. | 
					
						
							|  |  |  |      * @param $entityRepo | 
					
						
							|  |  |  |      */ | 
					
						
							|  |  |  |     public function __construct(EntityRepo $entityRepo) | 
					
						
							|  |  |  |     { | 
					
						
							|  |  |  |         $this->entityRepo = $entityRepo; | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2016-01-21 06:13:13 +08:00
										 |  |  |     /** | 
					
						
							|  |  |  |      * Convert a page to a self-contained HTML file. | 
					
						
							|  |  |  |      * Includes required CSS & image content. Images are base64 encoded into the HTML. | 
					
						
							|  |  |  |      * @param Page $page | 
					
						
							|  |  |  |      * @return mixed|string | 
					
						
							|  |  |  |      */ | 
					
						
							|  |  |  |     public function pageToContainedHtml(Page $page) | 
					
						
							| 
									
										
										
										
											2016-02-01 01:53:30 +08:00
										 |  |  |     { | 
					
						
							| 
									
										
										
										
											2017-08-28 20:38:32 +08:00
										 |  |  |         $this->entityRepo->renderPage($page); | 
					
						
							| 
									
										
										
										
											2017-02-26 21:26:51 +08:00
										 |  |  |         $pageHtml = view('pages/export', [ | 
					
						
							| 
									
										
										
										
											2017-08-28 20:38:32 +08:00
										 |  |  |             'page' => $page | 
					
						
							| 
									
										
										
										
											2017-02-26 21:26:51 +08:00
										 |  |  |         ])->render(); | 
					
						
							| 
									
										
										
										
											2016-02-01 01:53:30 +08:00
										 |  |  |         return $this->containHtml($pageHtml); | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2017-02-26 22:25:02 +08:00
										 |  |  |     /** | 
					
						
							|  |  |  |      * Convert a chapter to a self-contained HTML file. | 
					
						
							|  |  |  |      * @param Chapter $chapter | 
					
						
							|  |  |  |      * @return mixed|string | 
					
						
							|  |  |  |      */ | 
					
						
							|  |  |  |     public function chapterToContainedHtml(Chapter $chapter) | 
					
						
							|  |  |  |     { | 
					
						
							|  |  |  |         $pages = $this->entityRepo->getChapterChildren($chapter); | 
					
						
							| 
									
										
										
										
											2018-01-29 00:58:52 +08:00
										 |  |  |         $pages->each(function ($page) { | 
					
						
							| 
									
										
										
										
											2017-02-26 22:25:02 +08:00
										 |  |  |             $page->html = $this->entityRepo->renderPage($page); | 
					
						
							|  |  |  |         }); | 
					
						
							|  |  |  |         $html = view('chapters/export', [ | 
					
						
							|  |  |  |             'chapter' => $chapter, | 
					
						
							|  |  |  |             'pages' => $pages | 
					
						
							|  |  |  |         ])->render(); | 
					
						
							|  |  |  |         return $this->containHtml($html); | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2016-02-01 01:53:30 +08:00
										 |  |  |     /** | 
					
						
							| 
									
										
										
										
											2017-02-26 21:26:51 +08:00
										 |  |  |      * Convert a book to a self-contained HTML file. | 
					
						
							|  |  |  |      * @param Book $book | 
					
						
							|  |  |  |      * @return mixed|string | 
					
						
							|  |  |  |      */ | 
					
						
							|  |  |  |     public function bookToContainedHtml(Book $book) | 
					
						
							|  |  |  |     { | 
					
						
							|  |  |  |         $bookTree = $this->entityRepo->getBookChildren($book, true, true); | 
					
						
							|  |  |  |         $html = view('books/export', [ | 
					
						
							|  |  |  |             'book' => $book, | 
					
						
							|  |  |  |             'bookChildren' => $bookTree | 
					
						
							|  |  |  |         ])->render(); | 
					
						
							|  |  |  |         return $this->containHtml($html); | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     /** | 
					
						
							|  |  |  |      * Convert a page to a PDF file. | 
					
						
							| 
									
										
										
										
											2016-02-01 01:53:30 +08:00
										 |  |  |      * @param Page $page | 
					
						
							|  |  |  |      * @return mixed|string | 
					
						
							|  |  |  |      */ | 
					
						
							|  |  |  |     public function pageToPdf(Page $page) | 
					
						
							| 
									
										
										
										
											2016-01-21 06:13:13 +08:00
										 |  |  |     { | 
					
						
							| 
									
										
										
										
											2017-08-28 20:38:32 +08:00
										 |  |  |         $this->entityRepo->renderPage($page); | 
					
						
							| 
									
										
										
										
											2017-02-26 21:26:51 +08:00
										 |  |  |         $html = view('pages/pdf', [ | 
					
						
							| 
									
										
										
										
											2017-08-28 20:38:32 +08:00
										 |  |  |             'page' => $page | 
					
						
							| 
									
										
										
										
											2017-02-26 21:26:51 +08:00
										 |  |  |         ])->render(); | 
					
						
							|  |  |  |         return $this->htmlToPdf($html); | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2017-02-26 22:25:02 +08:00
										 |  |  |     /** | 
					
						
							|  |  |  |      * Convert a chapter to a PDF file. | 
					
						
							|  |  |  |      * @param Chapter $chapter | 
					
						
							|  |  |  |      * @return mixed|string | 
					
						
							|  |  |  |      */ | 
					
						
							|  |  |  |     public function chapterToPdf(Chapter $chapter) | 
					
						
							|  |  |  |     { | 
					
						
							|  |  |  |         $pages = $this->entityRepo->getChapterChildren($chapter); | 
					
						
							| 
									
										
										
										
											2018-01-29 00:58:52 +08:00
										 |  |  |         $pages->each(function ($page) { | 
					
						
							| 
									
										
										
										
											2017-02-26 22:25:02 +08:00
										 |  |  |             $page->html = $this->entityRepo->renderPage($page); | 
					
						
							|  |  |  |         }); | 
					
						
							|  |  |  |         $html = view('chapters/export', [ | 
					
						
							|  |  |  |             'chapter' => $chapter, | 
					
						
							|  |  |  |             'pages' => $pages | 
					
						
							|  |  |  |         ])->render(); | 
					
						
							|  |  |  |         return $this->htmlToPdf($html); | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2017-02-26 21:26:51 +08:00
										 |  |  |     /** | 
					
						
							|  |  |  |      * Convert a book to a PDF file | 
					
						
							|  |  |  |      * @param Book $book | 
					
						
							|  |  |  |      * @return string | 
					
						
							|  |  |  |      */ | 
					
						
							|  |  |  |     public function bookToPdf(Book $book) | 
					
						
							|  |  |  |     { | 
					
						
							|  |  |  |         $bookTree = $this->entityRepo->getBookChildren($book, true, true); | 
					
						
							|  |  |  |         $html = view('books/export', [ | 
					
						
							|  |  |  |             'book' => $book, | 
					
						
							|  |  |  |             'bookChildren' => $bookTree | 
					
						
							|  |  |  |         ])->render(); | 
					
						
							|  |  |  |         return $this->htmlToPdf($html); | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     /** | 
					
						
							|  |  |  |      * Convert normal webpage HTML to a PDF. | 
					
						
							|  |  |  |      * @param $html | 
					
						
							|  |  |  |      * @return string | 
					
						
							|  |  |  |      */ | 
					
						
							|  |  |  |     protected function htmlToPdf($html) | 
					
						
							|  |  |  |     { | 
					
						
							|  |  |  |         $containedHtml = $this->containHtml($html); | 
					
						
							| 
									
										
										
										
											2017-01-01 20:20:30 +08:00
										 |  |  |         $useWKHTML = config('snappy.pdf.binary') !== false; | 
					
						
							|  |  |  |         if ($useWKHTML) { | 
					
						
							|  |  |  |             $pdf = \SnappyPDF::loadHTML($containedHtml); | 
					
						
							| 
									
										
										
										
											2017-02-26 21:26:51 +08:00
										 |  |  |             $pdf->setOption('print-media-type', true); | 
					
						
							| 
									
										
										
										
											2017-01-01 20:20:30 +08:00
										 |  |  |         } else { | 
					
						
							| 
									
										
										
										
											2017-12-05 01:59:53 +08:00
										 |  |  |             $pdf = \DomPDF::loadHTML($containedHtml); | 
					
						
							| 
									
										
										
										
											2017-01-01 20:20:30 +08:00
										 |  |  |         } | 
					
						
							| 
									
										
										
										
											2016-02-01 01:53:30 +08:00
										 |  |  |         return $pdf->output(); | 
					
						
							|  |  |  |     } | 
					
						
							| 
									
										
										
										
											2016-01-21 06:13:13 +08:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2016-02-01 01:53:30 +08:00
										 |  |  |     /** | 
					
						
							|  |  |  |      * Bundle of the contents of a html file to be self-contained. | 
					
						
							|  |  |  |      * @param $htmlContent | 
					
						
							|  |  |  |      * @return mixed|string | 
					
						
							| 
									
										
										
										
											2017-10-07 03:49:25 +08:00
										 |  |  |      * @throws \Exception | 
					
						
							| 
									
										
										
										
											2016-02-01 01:53:30 +08:00
										 |  |  |      */ | 
					
						
							|  |  |  |     protected function containHtml($htmlContent) | 
					
						
							|  |  |  |     { | 
					
						
							| 
									
										
										
										
											2016-01-21 06:13:13 +08:00
										 |  |  |         $imageTagsOutput = []; | 
					
						
							| 
									
										
										
										
											2016-02-01 01:53:30 +08:00
										 |  |  |         preg_match_all("/\<img.*src\=(\'|\")(.*?)(\'|\").*?\>/i", $htmlContent, $imageTagsOutput); | 
					
						
							| 
									
										
										
										
											2016-01-21 06:13:13 +08:00
										 |  |  | 
 | 
					
						
							|  |  |  |         // Replace image src with base64 encoded image strings
 | 
					
						
							|  |  |  |         if (isset($imageTagsOutput[0]) && count($imageTagsOutput[0]) > 0) { | 
					
						
							|  |  |  |             foreach ($imageTagsOutput[0] as $index => $imgMatch) { | 
					
						
							|  |  |  |                 $oldImgString = $imgMatch; | 
					
						
							|  |  |  |                 $srcString = $imageTagsOutput[2][$index]; | 
					
						
							| 
									
										
										
										
											2016-09-04 02:24:58 +08:00
										 |  |  |                 $isLocal = strpos(trim($srcString), 'http') !== 0; | 
					
						
							|  |  |  |                 if ($isLocal) { | 
					
						
							|  |  |  |                     $pathString = public_path(trim($srcString, '/')); | 
					
						
							| 
									
										
										
										
											2016-01-21 06:13:13 +08:00
										 |  |  |                 } else { | 
					
						
							|  |  |  |                     $pathString = $srcString; | 
					
						
							|  |  |  |                 } | 
					
						
							| 
									
										
										
										
											2017-10-07 03:49:25 +08:00
										 |  |  | 
 | 
					
						
							|  |  |  |                 // Attempt to find local files even if url not absolute
 | 
					
						
							|  |  |  |                 $base = baseUrl('/'); | 
					
						
							|  |  |  |                 if (strpos($srcString, $base) === 0) { | 
					
						
							|  |  |  |                     $isLocal = true; | 
					
						
							|  |  |  |                     $relString = str_replace($base, '', $srcString); | 
					
						
							|  |  |  |                     $pathString = public_path(trim($relString, '/')); | 
					
						
							|  |  |  |                 } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2018-01-29 00:58:52 +08:00
										 |  |  |                 if ($isLocal && !file_exists($pathString)) { | 
					
						
							|  |  |  |                     continue; | 
					
						
							|  |  |  |                 } | 
					
						
							| 
									
										
										
										
											2017-01-21 21:53:00 +08:00
										 |  |  |                 try { | 
					
						
							| 
									
										
										
										
											2017-10-07 03:49:25 +08:00
										 |  |  |                     if ($isLocal) { | 
					
						
							|  |  |  |                         $imageContent = file_get_contents($pathString); | 
					
						
							|  |  |  |                     } else { | 
					
						
							|  |  |  |                         $ch = curl_init(); | 
					
						
							|  |  |  |                         curl_setopt_array($ch, [CURLOPT_URL => $pathString, CURLOPT_RETURNTRANSFER => 1, CURLOPT_CONNECTTIMEOUT => 5]); | 
					
						
							|  |  |  |                         $imageContent = curl_exec($ch); | 
					
						
							|  |  |  |                         $err = curl_error($ch); | 
					
						
							|  |  |  |                         curl_close($ch); | 
					
						
							| 
									
										
										
										
											2018-01-29 00:58:52 +08:00
										 |  |  |                         if ($err) { | 
					
						
							|  |  |  |                             throw new \Exception("Image fetch failed, Received error: " . $err); | 
					
						
							|  |  |  |                         } | 
					
						
							| 
									
										
										
										
											2017-10-07 03:49:25 +08:00
										 |  |  |                     } | 
					
						
							| 
									
										
										
										
											2017-01-21 21:53:00 +08:00
										 |  |  |                     $imageEncoded = 'data:image/' . pathinfo($pathString, PATHINFO_EXTENSION) . ';base64,' . base64_encode($imageContent); | 
					
						
							|  |  |  |                     $newImageString = str_replace($srcString, $imageEncoded, $oldImgString); | 
					
						
							|  |  |  |                 } catch (\ErrorException $e) { | 
					
						
							|  |  |  |                     $newImageString = ''; | 
					
						
							|  |  |  |                 } | 
					
						
							| 
									
										
										
										
											2016-02-01 01:53:30 +08:00
										 |  |  |                 $htmlContent = str_replace($oldImgString, $newImageString, $htmlContent); | 
					
						
							| 
									
										
										
										
											2016-01-21 06:13:13 +08:00
										 |  |  |             } | 
					
						
							|  |  |  |         } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         $linksOutput = []; | 
					
						
							| 
									
										
										
										
											2016-02-01 01:53:30 +08:00
										 |  |  |         preg_match_all("/\<a.*href\=(\'|\")(.*?)(\'|\").*?\>/i", $htmlContent, $linksOutput); | 
					
						
							| 
									
										
										
										
											2016-01-21 06:13:13 +08:00
										 |  |  | 
 | 
					
						
							|  |  |  |         // Replace image src with base64 encoded image strings
 | 
					
						
							|  |  |  |         if (isset($linksOutput[0]) && count($linksOutput[0]) > 0) { | 
					
						
							|  |  |  |             foreach ($linksOutput[0] as $index => $linkMatch) { | 
					
						
							|  |  |  |                 $oldLinkString = $linkMatch; | 
					
						
							|  |  |  |                 $srcString = $linksOutput[2][$index]; | 
					
						
							|  |  |  |                 if (strpos(trim($srcString), 'http') !== 0) { | 
					
						
							|  |  |  |                     $newSrcString = url($srcString); | 
					
						
							|  |  |  |                     $newLinkString = str_replace($srcString, $newSrcString, $oldLinkString); | 
					
						
							| 
									
										
										
										
											2016-02-01 01:53:30 +08:00
										 |  |  |                     $htmlContent = str_replace($oldLinkString, $newLinkString, $htmlContent); | 
					
						
							| 
									
										
										
										
											2016-01-21 06:13:13 +08:00
										 |  |  |                 } | 
					
						
							|  |  |  |             } | 
					
						
							|  |  |  |         } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         // Replace any relative links with system domain
 | 
					
						
							| 
									
										
										
										
											2016-02-01 01:53:30 +08:00
										 |  |  |         return $htmlContent; | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     /** | 
					
						
							|  |  |  |      * Converts the page contents into simple plain text. | 
					
						
							| 
									
										
										
										
											2017-01-21 21:53:00 +08:00
										 |  |  |      * This method filters any bad looking content to provide a nice final output. | 
					
						
							| 
									
										
										
										
											2016-02-01 01:53:30 +08:00
										 |  |  |      * @param Page $page | 
					
						
							|  |  |  |      * @return mixed | 
					
						
							|  |  |  |      */ | 
					
						
							|  |  |  |     public function pageToPlainText(Page $page) | 
					
						
							|  |  |  |     { | 
					
						
							| 
									
										
										
										
											2017-01-21 21:53:00 +08:00
										 |  |  |         $html = $this->entityRepo->renderPage($page); | 
					
						
							|  |  |  |         $text = strip_tags($html); | 
					
						
							| 
									
										
										
										
											2016-02-01 01:53:30 +08:00
										 |  |  |         // Replace multiple spaces with single spaces
 | 
					
						
							|  |  |  |         $text = preg_replace('/\ {2,}/', ' ', $text); | 
					
						
							|  |  |  |         // Reduce multiple horrid whitespace characters.
 | 
					
						
							|  |  |  |         $text = preg_replace('/(\x0A|\xA0|\x0A|\r|\n){2,}/su', "\n\n", $text); | 
					
						
							|  |  |  |         $text = html_entity_decode($text); | 
					
						
							|  |  |  |         // Add title
 | 
					
						
							|  |  |  |         $text = $page->name . "\n\n" . $text; | 
					
						
							|  |  |  |         return $text; | 
					
						
							| 
									
										
										
										
											2016-01-21 06:13:13 +08:00
										 |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2017-02-26 22:25:02 +08:00
										 |  |  |     /** | 
					
						
							|  |  |  |      * Convert a chapter into a plain text string. | 
					
						
							|  |  |  |      * @param Chapter $chapter | 
					
						
							|  |  |  |      * @return string | 
					
						
							|  |  |  |      */ | 
					
						
							|  |  |  |     public function chapterToPlainText(Chapter $chapter) | 
					
						
							|  |  |  |     { | 
					
						
							|  |  |  |         $text = $chapter->name . "\n\n"; | 
					
						
							|  |  |  |         $text .= $chapter->description . "\n\n"; | 
					
						
							|  |  |  |         foreach ($chapter->pages as $page) { | 
					
						
							|  |  |  |             $text .= $this->pageToPlainText($page); | 
					
						
							|  |  |  |         } | 
					
						
							|  |  |  |         return $text; | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2017-02-26 21:26:51 +08:00
										 |  |  |     /** | 
					
						
							|  |  |  |      * Convert a book into a plain text string. | 
					
						
							|  |  |  |      * @param Book $book | 
					
						
							|  |  |  |      * @return string | 
					
						
							|  |  |  |      */ | 
					
						
							|  |  |  |     public function bookToPlainText(Book $book) | 
					
						
							|  |  |  |     { | 
					
						
							|  |  |  |         $bookTree = $this->entityRepo->getBookChildren($book, true, true); | 
					
						
							|  |  |  |         $text = $book->name . "\n\n"; | 
					
						
							|  |  |  |         foreach ($bookTree as $bookChild) { | 
					
						
							|  |  |  |             if ($bookChild->isA('chapter')) { | 
					
						
							| 
									
										
										
										
											2017-02-26 22:25:02 +08:00
										 |  |  |                 $text .= $this->chapterToPlainText($bookChild); | 
					
						
							| 
									
										
										
										
											2017-02-26 21:26:51 +08:00
										 |  |  |             } else { | 
					
						
							|  |  |  |                 $text .= $this->pageToPlainText($bookChild); | 
					
						
							|  |  |  |             } | 
					
						
							|  |  |  |         } | 
					
						
							|  |  |  |         return $text; | 
					
						
							|  |  |  |     } | 
					
						
							| 
									
										
										
										
											2016-02-01 01:53:30 +08:00
										 |  |  | } |