From 0aaf337889928b48e55745a53d06751ff40d6f46 Mon Sep 17 00:00:00 2001 From: krzysiej Date: Fri, 3 Oct 2025 15:21:57 +0200 Subject: [PATCH] Update search to website changes (#1) MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Co-authored-by: Krzysztof Płaczek Reviewed-on: https://git.techtube.pl/krzysiej/bookinfo/pulls/1 --- README.md | 8 +++++++- composer.json | 4 ++-- src/Api/AbstractBookInfo.php | 5 ++++- src/BookFinder.php | 2 +- src/DataParser.php | 11 +++++++++-- 5 files changed, 23 insertions(+), 7 deletions(-) diff --git a/README.md b/README.md index 47f6796..d70b9f0 100644 --- a/README.md +++ b/README.md @@ -10,7 +10,13 @@ Place this in the composer.json. }] } ``` -Then execute +Then execute to get latest version: + +```bash +composer require techtube/bookinfo +``` + +or this to get specific version: ```bash composer require techtube/bookinfo:"1.0.4" diff --git a/composer.json b/composer.json index 02395e3..a8a3cc3 100644 --- a/composer.json +++ b/composer.json @@ -13,8 +13,8 @@ }, "authors": [ { - "name": "kplaczek", - "email": "kplaczek@wi.ps.pl" + "name": "Krzysztof Płaczek", + "email": "krzysztofplaczek@techtube.pl" } ] } diff --git a/src/Api/AbstractBookInfo.php b/src/Api/AbstractBookInfo.php index 99cecb4..75410d2 100644 --- a/src/Api/AbstractBookInfo.php +++ b/src/Api/AbstractBookInfo.php @@ -9,12 +9,15 @@ abstract class AbstractBookInfo public string $isbn; public string $description; public string $title; + public string $originalTitle; public string $category; public array $cover_url; public int $pages; public string $cycle; - public int $volume; + public string $cycleUrl; + public string $volume; public ?string $language; public string $datePublished; public ?string $publisher; + public ?string $translator; } \ No newline at end of file diff --git a/src/BookFinder.php b/src/BookFinder.php index ee7ec90..d0c8389 100644 --- a/src/BookFinder.php +++ b/src/BookFinder.php @@ -28,7 +28,7 @@ class BookFinder private function getSearchUrl(string $phrase): string { - return self::$searchUrl . $phrase; + return sprintf('%s%s', self::$searchUrl, $phrase); } } diff --git a/src/DataParser.php b/src/DataParser.php index 189113d..d0722a7 100644 --- a/src/DataParser.php +++ b/src/DataParser.php @@ -4,6 +4,7 @@ namespace Techtube\Bookinfo; use DiDom\Document; use DiDom\Exceptions\InvalidSelectorException; +use DiDom\Query; use JetBrains\PhpStorm\ArrayShape; use Techtube\Bookinfo\Api\AbstractBookInfo; @@ -24,6 +25,7 @@ class DataParser $info->isbn = $document->first('meta[property="books:isbn"]')->getAttribute('content'); $info->description = trim($document->first('#book-description p')->text()); $info->title = trim($document->first('h1.book__title')->text()); + $info->originalTitle = trim($document->first("//*[contains(text(), 'Tytuł oryginału:')]", Query::TYPE_XPATH)?->nextSibling('dd')?->text() ?? ''); $info->category = trim($document->first('.book__category')->text()); $info->cover_url = $this->generateCoverUrls( $document->first('meta[property="og:image"]')->getAttribute('content') @@ -35,6 +37,7 @@ class DataParser } $info->language = $jsonInfo?->inLanguage ?? trim($document->xpath("//*[contains(text(), 'Język:')]")[0]->nextSibling('dd')->text()); $info->datePublished = $jsonInfo?->datePublished ?? null; + $info->translator = trim($document->first("//*[contains(text(), 'Tłumacz:')]", Query::TYPE_XPATH)?->nextSibling('dd')?->text() ?? ''); return $info; } @@ -46,8 +49,7 @@ class DataParser */ public function searchPage(Document $document): array { - $books = $document->find('#search .authorAllBooks__single'); - + $books = $document->find('#ksiazki .authorAllBooks__single'); $booksInfo = []; if ($document->has('#searchksiazki')) { foreach ($books as $book) { @@ -56,6 +58,11 @@ class DataParser $bookInfo->author = trim($book->first('.authorAllBooks__singleTextAuthor')->text()); $bookInfo->url = $book->first('button[data-book-url]')->getAttribute('data-book-url'); $bookInfo->cover_url = $this->generateCoverUrls($book->first('.img-fluid')->getAttribute('data-src')); + if (preg_match('#(.*) \(tom (.*)\)#ism', trim($book->first('a[href*="/cykl/"]')?->text() ?? ''), $series)) { + $bookInfo->cycle = $series[1]; + $bookInfo->volume = $series[2]; + $bookInfo->cycleUrl = $book->first('a[href*="/cykl/"]')?->href; + } $booksInfo[] = $bookInfo; } }