150 lines
5.4 KiB
PHP
150 lines
5.4 KiB
PHP
<?php
|
|
|
|
namespace App\Parser;
|
|
|
|
use App\ParsedHome;
|
|
use App\Parser;
|
|
use GuzzleHttp\Exception\GuzzleException;
|
|
use Symfony\Component\DomCrawler\Crawler;
|
|
|
|
/**
|
|
* Thanks to https://github.com/axeleroy/untoitpourcaramel/issues/3
|
|
* Class SeLoger
|
|
* @package App\Parser
|
|
*/
|
|
class SeLoger extends Parser
|
|
{
|
|
public const TOKEN_URL = 'https://api-seloger.svc.groupe-seloger.com/api/v1/security/authenticate';
|
|
public const LISTING_URL = 'https://api-seloger.svc.groupe-seloger.com/api/v1/listings/';
|
|
public const SELOGER_TOKEN = 'eyJ0eXAiOiJKV1QiLCJhbGciOiJIUzI1NiJ9.eyJpc3MiOiJTZUxvZ2VyLW1vYmlsZSIsImFwcCI6IjYzZWU3MTRkLWE2MmEtNGEyNy05ZmJlLTQwYjdhMmMzMThlNCIsImlhdCI6MTUzOTQ0MjMyMCwianRpIjoiNWYzODRhNDYtZjk5MS00ODZkLWFkN2YtMmE2M2YxZTdkM2UwIiwiYXVkIjoiU2VMb2dlci1Nb2JpbGUtNi4wIn0.Qib13Y4395f_bi5Df0IhMQRvIxQZEfpf8Ac66oTfyiA';
|
|
public const SELOGER_GUID = '63ee714d-a62a-4a27-9fbe-40b7a2c318e4';
|
|
|
|
/**
|
|
* @inheritDoc
|
|
*/
|
|
public function parse(): ParsedHome
|
|
{
|
|
$token = $this->retrieveToken();
|
|
$idAnnonce = $this->getIdAnnonceFromUrl($this->url);
|
|
$url = sprintf('%s%s', self::LISTING_URL, $idAnnonce);
|
|
try {
|
|
$request = $this->client->request(
|
|
'GET',
|
|
$url,
|
|
[
|
|
'headers' => [
|
|
'AppToken' => $token,
|
|
],
|
|
]
|
|
);
|
|
} catch (GuzzleException $e) {
|
|
return $this->parseHTML();
|
|
}
|
|
$annonce = json_decode($request->getBody()->getContents(), true);
|
|
|
|
$parsedHome = new ParsedHome();
|
|
$parsedHome->city = $annonce['city'];
|
|
//ex: Vente maison 110 m² Tréguier (22220)
|
|
$parsedHome->title = $annonce['title'];
|
|
$parsedHome->price = $annonce['price'];
|
|
$parsedHome->surface = $annonce['livingArea'];
|
|
$parsedHome->rooms = $annonce['rooms'];
|
|
$parsedHome->energy = $annonce['energy']['grade'];
|
|
$parsedHome->description = $annonce['description'];
|
|
$parsedHome->pictures = $annonce['photos'];
|
|
$location = $annonce['coordinates'];
|
|
$parsedHome->map = ['lat' => $location['latitude'], 'lng' => $location['longitude']];
|
|
|
|
return $parsedHome;
|
|
}
|
|
|
|
/**
|
|
* @param string $url
|
|
*
|
|
* @return string
|
|
*/
|
|
private function getIdAnnonceFromUrl($url)
|
|
{
|
|
// ex : https://www.seloger.com/annonces/achat/maison/franconville-95/vieux-marche-mare-des-noues/159100953.htm
|
|
$url = parse_url($url, PHP_URL_PATH);
|
|
return collect(explode('.', collect(explode('/', $url))->last()))->first();
|
|
}
|
|
|
|
/**
|
|
* @return string
|
|
* @throws \GuzzleHttp\Exception\GuzzleException
|
|
*/
|
|
private function retrieveToken()
|
|
{
|
|
$request = $this->client->request(
|
|
'GET',
|
|
self::TOKEN_URL,
|
|
[
|
|
'headers' => [
|
|
'AppToken' => self::SELOGER_TOKEN,
|
|
'AppGuid' => self::SELOGER_GUID,
|
|
],
|
|
]
|
|
);
|
|
|
|
return trim($request->getBody()->getContents(), '"');
|
|
}
|
|
|
|
/**
|
|
* @return \App\ParsedHome
|
|
*/
|
|
private function parseHTML()
|
|
{
|
|
$request = $this->client->get(
|
|
$this->url,
|
|
[
|
|
'headers' => [
|
|
'User-Agent' => 'Mozilla/5.0 (X11; Ubuntu; Linux x86_64; rv:85.0) Gecko/20100101 Firefox/85.0',
|
|
'Accept' => 'text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,*/*;q=0.8',
|
|
'Accept-Encoding' => 'gzip, deflate, br',
|
|
'Accept-Language' => 'fr,fr-FR;q=0.8,en-US;q=0.5,en;q=0.3',
|
|
'Cache-Control' => 'no-cache',
|
|
'Connection' => 'keep-alive',
|
|
]
|
|
]
|
|
);
|
|
$body = $request->getBody()->getContents();
|
|
$crawler = new Crawler($body);
|
|
|
|
$parsed_home = new ParsedHome();
|
|
|
|
$parsed_home->title = $crawler->filter('h1')->text();
|
|
$parsed_home->description = $crawler->filter('#showcase-description > div')->first()->text();
|
|
$parsed_home->price = (int) str_replace(' ', '', $crawler->filter('[class^=Summarystyled__PriceText]')->text());
|
|
$parsed_home->city = $crawler->filter('[class^=Summarystyled__Address]')->text();
|
|
$parsed_home->energy = $this->calculateDPE(
|
|
(int)$crawler->filter('[class^=Preview__PreviewTooltipValue]')->first()->text()
|
|
);
|
|
$parsed_home->ges = $this->calculateGES(
|
|
(int)$crawler->filter('[class^=Preview__PreviewTooltipValue]')->eq(1)->text()
|
|
);
|
|
|
|
$crawler
|
|
->filter('[class^=Summarystyled__TagsWrapper] > div')
|
|
->each(static function (Crawler $property____information, $i) use (&$parsed_home) {
|
|
$element = $property____information->children()->eq(1)->text();
|
|
if ('pièces' === mb_substr($element, -6)) {
|
|
$parsed_home->rooms = (int) $element;
|
|
}
|
|
if ('m²' === mb_substr($element, -2) && strpos($element, '/') === false) {
|
|
$parsed_home->surface = (int) $element;
|
|
}
|
|
});
|
|
|
|
$parsed_home->pictures = $crawler
|
|
->filter('.swiper-wrapper')
|
|
->first()
|
|
->filter('[data-background]')
|
|
->each(static function ($img) {
|
|
return $img->attr('data-background');
|
|
});
|
|
|
|
return $parsed_home;
|
|
}
|
|
}
|