2025-02-19 00:44:49 +01:00
|
|
|
<?php
|
|
|
|
/*
|
|
|
|
* This file is part of Part-DB (https://github.com/Part-DB/Part-DB-symfony).
|
|
|
|
*
|
|
|
|
* Copyright (C) 2019 - 2025 Jan Böhmer (https://github.com/jbtronics)
|
|
|
|
*
|
|
|
|
* This program is free software: you can redistribute it and/or modify
|
|
|
|
* it under the terms of the GNU Affero General Public License as published
|
|
|
|
* by the Free Software Foundation, either version 3 of the License, or
|
|
|
|
* (at your option) any later version.
|
|
|
|
*
|
|
|
|
* This program is distributed in the hope that it will be useful,
|
|
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
* GNU Affero General Public License for more details.
|
|
|
|
*
|
|
|
|
* You should have received a copy of the GNU Affero General Public License
|
|
|
|
* along with this program. If not, see <https://www.gnu.org/licenses/>.
|
|
|
|
*/
|
|
|
|
|
|
|
|
declare(strict_types=1);
|
|
|
|
|
|
|
|
|
|
|
|
namespace App\Services\InfoProviderSystem\Providers;
|
|
|
|
|
2025-02-19 23:55:58 +01:00
|
|
|
use App\Services\InfoProviderSystem\DTOs\FileDTO;
|
2025-02-20 00:18:05 +01:00
|
|
|
use App\Services\InfoProviderSystem\DTOs\ParameterDTO;
|
2025-02-19 00:44:49 +01:00
|
|
|
use App\Services\InfoProviderSystem\DTOs\PartDetailDTO;
|
|
|
|
use App\Services\InfoProviderSystem\DTOs\SearchResultDTO;
|
|
|
|
use Symfony\Component\DomCrawler\Crawler;
|
|
|
|
use Symfony\Contracts\HttpClient\HttpClientInterface;
|
|
|
|
|
|
|
|
class ReicheltProvider implements InfoProviderInterface
|
|
|
|
{
|
|
|
|
|
|
|
|
private const SEARCH_ENDPOINT = "https://www.reichelt.com/index.html?ACTION=446&LA=0&nbc=1&q=%s";
|
|
|
|
|
|
|
|
public function __construct(private readonly HttpClientInterface $client)
|
|
|
|
{
|
|
|
|
}
|
|
|
|
|
|
|
|
public function getProviderInfo(): array
|
|
|
|
{
|
|
|
|
return [
|
|
|
|
'name' => 'Reichelt',
|
|
|
|
'description' => 'TODO',
|
|
|
|
'url' => 'https://www.reichelt.de/',
|
|
|
|
'disabled_help' => 'TODO'
|
|
|
|
];
|
|
|
|
}
|
|
|
|
|
|
|
|
public function getProviderKey(): string
|
|
|
|
{
|
|
|
|
return 'reichelt';
|
|
|
|
}
|
|
|
|
|
|
|
|
public function isActive(): bool
|
|
|
|
{
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
public function searchByKeyword(string $keyword): array
|
|
|
|
{
|
|
|
|
//Lowercase the keyword and urlencode it
|
|
|
|
$keyword = urlencode($keyword);
|
|
|
|
$response = $this->client->request('GET', sprintf(self::SEARCH_ENDPOINT, $keyword));
|
|
|
|
$html = $response->getContent();
|
|
|
|
|
|
|
|
//Parse the HTML and return the results
|
|
|
|
$dom = new Crawler($html);
|
|
|
|
//Iterate over all div.al_gallery_article elements
|
|
|
|
$results = [];
|
|
|
|
$dom->filter('div.al_gallery_article')->each(function (Crawler $element) use (&$results) {
|
|
|
|
|
2025-02-19 23:55:58 +01:00
|
|
|
//Extract product id from data-product attribute
|
|
|
|
$artId = json_decode($element->attr('data-product'), true, 2, JSON_THROW_ON_ERROR)['artid'];
|
|
|
|
|
2025-02-19 00:44:49 +01:00
|
|
|
$productID = $element->filter('meta[itemprop="productID"]')->attr('content');
|
|
|
|
$name = $element->filter('meta[itemprop="name"]')->attr('content');
|
|
|
|
$sku = $element->filter('meta[itemprop="sku"]')->attr('content');
|
|
|
|
|
|
|
|
//Try to extract a picture URL:
|
|
|
|
$pictureURL = $element->filter("div.al_artlogo img")->attr('src');
|
|
|
|
|
|
|
|
$results[] = new SearchResultDTO(
|
|
|
|
provider_key: $this->getProviderKey(),
|
2025-02-19 23:55:58 +01:00
|
|
|
provider_id: $artId,
|
2025-02-19 00:44:49 +01:00
|
|
|
name: $productID,
|
|
|
|
description: $name,
|
|
|
|
category: null,
|
|
|
|
manufacturer: $sku,
|
|
|
|
preview_image_url: $pictureURL,
|
|
|
|
provider_url: $element->filter('a.al_artinfo_link')->attr('href')
|
|
|
|
);
|
|
|
|
});
|
|
|
|
|
|
|
|
return $results;
|
|
|
|
}
|
|
|
|
|
|
|
|
public function getDetails(string $id): PartDetailDTO
|
|
|
|
{
|
2025-02-19 23:55:58 +01:00
|
|
|
//Check that the ID is a number
|
|
|
|
if (!is_numeric($id)) {
|
|
|
|
throw new \InvalidArgumentException("Invalid ID");
|
|
|
|
}
|
|
|
|
|
|
|
|
//Use this endpoint to resolve the artID to a product page
|
|
|
|
$response = $this->client->request('GET', sprintf('https://www.reichelt.com/?ACTION=514&id=74&article=%s&LANGUAGE=EN&CCOUNTRY=DE', $id));
|
|
|
|
$json = $response->toArray();
|
|
|
|
|
|
|
|
//Retrieve the product page from the response
|
|
|
|
$productPage = $this->getBaseURL() . '/shop/product' . $json[0]['article_path'];
|
|
|
|
|
|
|
|
|
|
|
|
$response = $this->client->request('GET', $productPage);
|
|
|
|
$html = $response->getContent();
|
|
|
|
$dom = new Crawler($html);
|
|
|
|
|
|
|
|
//Extract the product notes
|
|
|
|
$notes = $dom->filter('p[itemprop="description"]')->html();
|
|
|
|
|
|
|
|
//Extract datasheets
|
|
|
|
$datasheets = [];
|
|
|
|
$dom->filter('div.articleDatasheet a')->each(function (Crawler $element) use (&$datasheets) {
|
|
|
|
$datasheets[] = new FileDTO($element->attr('href'), $element->filter('span')->text());
|
|
|
|
});
|
|
|
|
|
|
|
|
//Create part object
|
|
|
|
return new PartDetailDTO(
|
|
|
|
provider_key: $this->getProviderKey(),
|
|
|
|
provider_id: $id,
|
|
|
|
name: $json[0]['article_artnr'],
|
|
|
|
description: $json[0]['article_besch'],
|
|
|
|
manufacturer: $json[0]['manufacturer_name'],
|
|
|
|
preview_image_url: $json[0]['article_picture'],
|
|
|
|
provider_url: $productPage,
|
|
|
|
notes: $notes,
|
2025-02-20 00:18:05 +01:00
|
|
|
datasheets: $datasheets,
|
|
|
|
parameters: $this->parseParameters($dom)
|
2025-02-19 23:55:58 +01:00
|
|
|
);
|
|
|
|
|
|
|
|
}
|
|
|
|
|
2025-02-20 00:18:05 +01:00
|
|
|
private function parseParameters(Crawler $dom): array
|
|
|
|
{
|
|
|
|
$parameters = [];
|
|
|
|
//Iterate over each ul.articleTechnicalData which contains the specifications of each group
|
|
|
|
$dom->filter('ul.articleTechnicalData')->each(function (Crawler $groupElement) use (&$parameters) {
|
|
|
|
$groupName = $groupElement->filter('li.articleTechnicalHeadline')->text();
|
|
|
|
|
|
|
|
//Iterate over each second li in ul.articleAttribute, which contains the specifications
|
|
|
|
$groupElement->filter('ul.articleAttribute li:nth-child(2n)')->each(function (Crawler $specElement) use (&$parameters, $groupName) {
|
|
|
|
$parameters[] = ParameterDTO::parseValueField(
|
|
|
|
name: $specElement->previousAll()->text(),
|
|
|
|
value: $specElement->text(),
|
|
|
|
group: $groupName
|
|
|
|
);
|
|
|
|
});
|
|
|
|
});
|
|
|
|
|
|
|
|
return $parameters;
|
|
|
|
}
|
|
|
|
|
2025-02-19 23:55:58 +01:00
|
|
|
private function getBaseURL(): string
|
|
|
|
{
|
|
|
|
//Without the trailing slash
|
|
|
|
return 'https://www.reichelt.com/de/en';
|
2025-02-19 00:44:49 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
public function getCapabilities(): array
|
|
|
|
{
|
|
|
|
return [
|
|
|
|
ProviderCapabilities::BASIC,
|
|
|
|
ProviderCapabilities::PICTURE,
|
|
|
|
ProviderCapabilities::DATASHEET,
|
|
|
|
ProviderCapabilities::PRICE,
|
|
|
|
];
|
|
|
|
}
|
|
|
|
}
|