include 'vendor/autoload.php';
use Gufy\PdfToHtml\Pdf;
use PHPHtmlParser\Dom;
use DateTime;
/**
 * Convert an uploaded single-page PDF to HTML and echo the text of each paragraph.
 *
 * Reads the uploaded file from the `csv_file` request field, converts it with
 * gufy/pdftohtml-php, parses the result with PHPHtmlParser and echoes the text
 * of every <p> element with non-breaking spaces replaced by ordinary spaces.
 * When the PDF's page count is not 1, nothing is output.
 *
 * NOTE(review): the `public` modifier implies this is a method of a class
 * (presumably a Laravel controller) whose declaration is not visible here.
 *
 * @param \Illuminate\Http\Request $request Request carrying the upload under `csv_file`.
 */
public function parsePdf(\Illuminate\Http\Request $request)
{
    $pdf = new Pdf($request->file('csv_file'));
    $html = $pdf->html();
    $dom = new Dom;
    $total_pages = $pdf->getPages();

    // Loose comparison kept on purpose: getPages() may return a numeric
    // string rather than an int -- TODO confirm before switching to ===.
    if ($total_pages == 1) {
        $html->goToPage(1);
        $dom->load($html);
        $paragraphs = collect($dom->find('p'));

        foreach ($paragraphs as $p) {
            // The pattern matches the byte pair C2 A0, i.e. a UTF-8 encoded
            // non-breaking space, and swaps it for a plain space.
            $datestring = preg_replace('/\xc2\xa0/', ' ', trim($p->text));
            echo $datestring;
        }
    }
}
以上代码用于在 Laravel 中将 PDF 转换为 HTML。使用前需要先通过 Composer 安装依赖包:
composer require gufy/pdftohtml-php:~2
此外还需要安装 Poppler-Utils(如果您使用的是 Ubuntu 发行版,可以直接通过 apt 安装):sudo apt-get install poppler-utils