3 namespace Rapsys\AirBundle\Command
; 
   5 use Doctrine\Bundle\DoctrineBundle\Command\DoctrineCommand
; 
   6 use Symfony\Component\Console\Input\InputInterface
; 
   7 use Symfony\Component\Console\Output\OutputInterface
; 
   8 use Symfony\Component\Filesystem\Exception\IOExceptionInterface
; 
   9 use Symfony\Component\Filesystem\Filesystem
; 
  10 use Rapsys\AirBundle\Entity\Session
; 
  12 class WeatherCommand 
extends DoctrineCommand 
{ 
  13         //Set failure constant 
  16         ///Set success constant 
  21                 //Mostly useless in fact 
  23                 //Required to simplify simplexml transition 
  25                 //Required to avoid xml errors 
  26                 'quote-nbsp' => false, 
  27                 //Required to fix code 
  31         ///Set accuweather uris 
  32         private $accuweather = [ 
  35                         75001 => 'https://www.accuweather.com/en/fr/paris-01-louvre/75001/hourly-weather-forecast/179142_pc?day=', 
  36                         75004 => 'https://www.accuweather.com/en/fr/paris-04-hotel-de-ville/75004/hourly-weather-forecast/179145_pc?day=', 
  37                         75005 => 'https://www.accuweather.com/en/fr/paris-05-pantheon/75005/hourly-weather-forecast/179146_pc?day=', 
  38                         75007 => 'https://www.accuweather.com/en/fr/paris-07-palais-bourbon/75007/hourly-weather-forecast/179148_pc?day=', 
  39                         75009 => 'https://www.accuweather.com/en/fr/paris-09-opera/75009/hourly-weather-forecast/179150_pc?day=', 
  40                         75013 => 'https://www.accuweather.com/en/fr/paris-13-gobelins/75013/hourly-weather-forecast/179154_pc?day=', 
  41                         75015 => 'https://www.accuweather.com/en/fr/paris-15-vaugirard/75015/hourly-weather-forecast/179156_pc?day=', 
  42                         75019 => 'https://www.accuweather.com/en/fr/paris-19-buttes-chaumont/75019/hourly-weather-forecast/179160_pc?day=', 
  43                         75116 => 'https://www.accuweather.com/en/fr/paris-16-passy/75116/hourly-weather-forecast/179246_pc?day=' 
  47                         75001 => 'https://www.accuweather.com/en/fr/paris-01-louvre/75001/daily-weather-forecast/179142_pc', 
  48                         75004 => 'https://www.accuweather.com/en/fr/paris-04-hotel-de-ville/75004/daily-weather-forecast/179145_pc', 
  49                         75005 => 'https://www.accuweather.com/en/fr/paris-05-pantheon/75005/daily-weather-forecast/179146_pc', 
  50                         75007 => 'https://www.accuweather.com/en/fr/paris-07-palais-bourbon/75007/daily-weather-forecast/179148_pc', 
  51                         75009 => 'https://www.accuweather.com/en/fr/paris-09-opera/75009/daily-weather-forecast/179150_pc', 
  52                         75013 => 'https://www.accuweather.com/en/fr/paris-13-gobelins/75013/daily-weather-forecast/179154_pc', 
  53                         75015 => 'https://www.accuweather.com/en/fr/paris-15-vaugirard/75015/daily-weather-forecast/179156_pc', 
  54                         75019 => 'https://www.accuweather.com/en/fr/paris-19-buttes-chaumont/75019/daily-weather-forecast/179160_pc', 
  55                         75116 => 'https://www.accuweather.com/en/fr/paris-16-passy/75116/daily-weather-forecast/179246_pc' 
  62         ///Configure attribute command 
  63         protected function configure() { 
  67                         ->setName('rapsysair:weather') 
  68                         //Set description shown with bin/console list 
  69                         ->setDescription('Updates session rain and temperature fields') 
  70                         //Set description shown with bin/console --help airlibre:attribute 
  71                         ->setHelp('This command updates session rain and temperature fields in next three days') 
  72                         //Add daily and hourly aliases 
  73                         ->setAliases(['rapsysair:weather:daily', 'rapsysair:weather:hourly']); 
  76         ///Process the attribution 
  77         protected function execute(InputInterface 
$input, OutputInterface 
$output) { 
  79                 $doctrine = $this->getDoctrine(); 
  82                 $manager = $doctrine->getManager(); 
  93                 //Process hourly accuweather 
  94                 if (($command = $input->getFirstArgument()) == 'rapsysair:weather:hourly' || $command == 'rapsysair:weather') { 
  95                         //Fetch hourly sessions to attribute 
  96                         $types['hourly'] = $doctrine->getRepository(Session
::class)->findAllPendingHourlyWeather(); 
  98                         //Iterate on each session 
  99                         foreach($types['hourly'] as $sessionId => $session) { 
 101                                 $zipcode = $session->getLocation()->getZipcode(); 
 104                                 $start = $session->getStart(); 
 107                                 $day = $start->diff((new \
DateTime('now'))->setTime(0, 0, 0))->d + 
1; 
 109                                 //Check if zipcode is set 
 110                                 if (!isset($zipcodes[$zipcode])) { 
 111                                         $zipcodes[$zipcode] = []; 
 114                                 //Check if zipcode date is set 
 115                                 if (!isset($zipcodes[$zipcode][$day])) { 
 116                                         $zipcodes[$zipcode][$day] = [ $sessionId => $sessionId ]; 
 118                                         $zipcodes[$zipcode][$day][$sessionId] = $sessionId; 
 122                                 $stop = $session->getStop(); 
 125                                 $day = $stop->diff((new \
DateTime('now'))->setTime(0, 0, 0))->d + 
1; 
 127                                 //Check if zipcode date is set 
 128                                 if (!isset($zipcodes[$zipcode][$day])) { 
 129                                         $zipcodes[$zipcode][$day] = [ $sessionId => $sessionId ]; 
 131                                         $zipcodes[$zipcode][$day][$sessionId] = $sessionId; 
 136                 //Process daily accuweather 
 137                 if ($command == 'rapsysair:weather:daily' || $command == 'rapsysair:weather') { 
 138                         //Fetch daily sessions to attribute 
 139                         $types['daily'] = $doctrine->getRepository(Session
::class)->findAllPendingDailyWeather(); 
 141                         //Iterate on each session 
 142                         foreach($types['daily'] as $sessionId => $session) { 
 144                                 $zipcode = $session->getLocation()->getZipcode(); 
 147                                 $start = $session->getStart(); 
 152                                 //Check if zipcode is set 
 153                                 if (!isset($zipcodes[$zipcode])) { 
 154                                         $zipcodes[$zipcode] = []; 
 157                                 //Check if zipcode date is set 
 158                                 if (!isset($zipcodes[$zipcode][$day])) { 
 159                                         $zipcodes[$zipcode][$day] = [ $sessionId => $sessionId ]; 
 161                                         $zipcodes[$zipcode][$day][$sessionId] = $sessionId; 
 167                 $filesystem = new Filesystem(); 
 170                 //XXX: worst case scenario we have 3 files per zipcode 
 171                 if (!is_dir($tmpdir = sys_get_temp_dir().'/accuweather')) { 
 174                             $filesystem->mkdir($tmpdir, 0775); 
 175                         } catch (IOExceptionInterface 
$exception) { 
 177                                 echo 'Create dir '.$exception->getPath().' failed'."\n"; 
 190                 //Iterate on zipcodes 
 191                 foreach($zipcodes as $zipcode => $days) { 
 193                         foreach($days as $day => $null) { 
 194                                 //Try to load content from cache 
 195                                 if (!is_file($file = $tmpdir.'/'.$zipcode.'.'.$day.'.html') || stat($file)['ctime'] <= (time() - ($day == 'daily' ? 4 : 2)*3600) || ($content = file_get_contents($file)) === false) { 
 196                                         //Prevent timing detection 
 197                                         //XXX: from 0.1 to 5 seconds 
 198                                         usleep(rand(1,50) * 100000);  
 201                                         //TODO: for daily we may load data for requested quarter of the day 
 202                                         $content = $this->curl_get($day == 'daily' ? $this->accuweather
['daily'][$zipcode] : $this->accuweather
['hourly'][$zipcode].$day); 
 205                                         if (file_put_contents($tmpdir.'/'.$zipcode.'.'.$day.'.html', $content) === false) { 
 207                                                 echo 'Write to '.$tmpdir.'/'.$zipcode.'.'.$day.'.html failed'."\n"; 
 215                                 $tidy->parseString($content, $this->config
, 'utf8'); 
 218                                 //XXX: don't care about theses errors, tidy is here to fix... 
 219                                 #if (!empty($tidy->errorBuffer)) { 
 220                                 #       var_dump($tidy->errorBuffer); 
 221                                 #       die('Tidy errors'); 
 225                                 //XXX: trash all xmlns= broken tags 
 226                                 $sx = new \
SimpleXMLElement(str_replace(['xmlns=', 'xlink:href='], ['xns=', 'href='], $tidy)); 
 229                                 if ($day == 'daily') { 
 230                                         //Iterate on each link containing data 
 231                                         foreach($sx->xpath('//a[@class="daily-forecast-card"]') as $node) { 
 233                                                 $dsm = trim($node->div
[0]->h2
[0]->span
[1]); 
 236                                                 $temperature = str_replace('°', '', $node->div
[0]->div
[0]->span
[0]); 
 239                                                 $rainrisk = str_replace('%', '', trim($node->div
[2]))/100; 
 242                                                 $data[$zipcode][$dsm]['daily'] = [ 
 243                                                         'temperature' => $temperature, 
 244                                                         'rainrisk' => $rainrisk 
 249                                         //Iterate on each div containing data 
 250                                         #(string)$sx->xpath('//div[@class="hourly-card-nfl"]')[0]->attributes()->value 
 251                                         #/html/body/div[1]/div[5]/div[1]/div[1]/div[1]/div[1]/div[1]/div/h2/span[1] 
 252                                         foreach($sx->xpath('//div[@data-shared="false"]') as $node) { 
 254                                                 $hour = trim($node->div
[0]->div
[0]->h2
[0]->span
[0]); 
 257                                                 $dsm = trim($node->div
[0]->div
[0]->h2
[0]->span
[1]); 
 260                                                 $temperature = str_replace('°', '', $node->div
[0]->div
[0]->div
[0]); 
 263                                                 $realfeel = str_replace(['RealFeel® ', '°'], '', trim($node->div
[0]->div
[0]->span
[0])); 
 266                                                 $rainrisk = str_replace('%', '', trim($node->div
[0]->div
[0]->div
[1]))/100; 
 268                                                 //Label is Rain when we have a rainfall 
 269                                                 if (($pluviolabel = trim($node->div
[1]->div
[0]->div
[0]->div
[1]->p
[1])) == 'Rain') { 
 271                                                         $rainfall = str_replace(' mm', '', $node->div
[1]->div
[0]->div
[0]->div
[1]->p
[1]->span
[0]); 
 272                                                 //Cloud Cover, no rainfall 
 274                                                         //Set rainfall to 0 (mm) 
 279                                                 $data[$zipcode][$dsm][$hour] = [ 
 280                                                         'temperature' => $temperature, 
 281                                                         'realfeel' => $realfeel, 
 282                                                         'rainrisk' => $rainrisk, 
 283                                                         'rainfall' => $rainfall 
 294                 foreach($types as $type => $sessions) { 
 295                         //Iterate on each type 
 296                         foreach($sessions as $sessionId => $session) { 
 298                                 $zipcode = $session->getLocation()->getZipcode(); 
 301                                 $start = $session->getStart(); 
 304                                 if ($type == 'daily') { 
 306                                         $period = [ $start ]; 
 310                                         $stop = $session->getStop(); 
 313                                         $period = new \
DatePeriod( 
 316                                                 //Iterate on each hour 
 317                                                 new \
DateInterval('PT1H'), 
 318                                                 //End with begin + length 
 328                                         'realfeelmin' => null, 
 329                                         'realfeelmax' => null, 
 331                                         'temperaturemin' => null, 
 332                                         'temperaturemax' => null 
 335                                 //Iterate on the period 
 336                                 foreach($period as $time) { 
 338                                         $dsm = $time->format('d/m'); 
 341                                         $hour = $type=='daily'?$type:$time->format('H'); 
 343                                         //Check data availability 
 344                                         //XXX: should never happen 
 345                                         #if (!isset($data[$zipcode][$dsm][$hour])) { 
 346                                         #       //Skip unavailable data 
 351                                         $info = $data[$zipcode][$dsm][$hour]; 
 353                                         //Check if rainrisk is higher 
 354                                         if ($meteo['rainrisk'] === null || $info['rainrisk'] > $meteo['rainrisk']) { 
 355                                                 //Set highest rain risk 
 356                                                 $meteo['rainrisk'] = floatval($info['rainrisk']); 
 359                                         //Check if rainfall is set 
 360                                         if (isset($info['rainfall'])) { 
 362                                                 $meteo['rainfall'] +
= floatval($info['rainfall']); 
 366                                         $meteo['temperature'][$hour] = $info['temperature']; 
 369                                         if ($type != 'daily') { 
 370                                                 //Check min temperature 
 371                                                 if ($meteo['temperaturemin'] === null || $info['temperature'] < $meteo['temperaturemin']) { 
 372                                                         $meteo['temperaturemin'] = floatval($info['temperature']); 
 375                                                 //Check max temperature 
 376                                                 if ($meteo['temperaturemax'] === null || $info['temperature'] > $meteo['temperaturemax']) { 
 377                                                         $meteo['temperaturemax'] = floatval($info['temperature']); 
 381                                         //Check if realfeel is set 
 382                                         if (isset($info['realfeel'])) { 
 384                                                 $meteo['realfeel'][$hour] = $info['realfeel']; 
 387                                                 if ($meteo['realfeelmin'] === null || $info['realfeel'] < $meteo['realfeelmin']) { 
 388                                                         $meteo['realfeelmin'] = floatval($info['realfeel']); 
 392                                                 if ($meteo['realfeelmax'] === null || $info['realfeel'] > $meteo['realfeelmax']) { 
 393                                                         $meteo['realfeelmax'] = floatval($info['realfeel']); 
 398                                 //Check if rainfall is set and differ 
 399                                 if ($session->getRainfall() !== $meteo['rainfall']) { 
 401                                         $session->setRainfall($meteo['rainfall']); 
 404                                 //Check if rainrisk differ 
 405                                 if ($session->getRainrisk() !== $meteo['rainrisk']) { 
 407                                         $session->setRainrisk($meteo['rainrisk']); 
 410                                 //Check realfeel array 
 411                                 if ($meteo['realfeel'] !== []) { 
 413                                         $realfeel = floatval(round(array_sum($meteo['realfeel'])/count($meteo['realfeel']),1)); 
 415                                         //Check if realfeel differ 
 416                                         if ($session->getRealfeel() !== $realfeel) { 
 417                                                 //Set average realfeel 
 418                                                 #$meteo['realfeel'] = array_sum($meteo['realfeel'])/count($meteo['realfeel']); 
 419                                                 $session->setRealfeel($realfeel); 
 422                                         //Check if realfeelmin differ 
 423                                         if ($session->getRealfeelmin() !== $meteo['realfeelmin']) { 
 425                                                 $session->setRealfeelmin($meteo['realfeelmin']); 
 428                                         //Check if realfeelmax differ 
 429                                         if ($session->getRealfeelmax() !== $meteo['realfeelmax']) { 
 431                                                 $session->setRealfeelmax($meteo['realfeelmax']); 
 435                                 //Check temperature array 
 436                                 if ($meteo['temperature'] !== []) { 
 437                                         //Compute temperature 
 438                                         $temperature = floatval(round(array_sum($meteo['temperature'])/count($meteo['temperature']),1)); 
 440                                         //Check if temperature differ 
 441                                         if ($session->getTemperature() !== $temperature) { 
 442                                                 //Set average temperature 
 443                                                 #$meteo['temperature'] = array_sum($meteo['temperature'])/count($meteo['temperature']); 
 444                                                 $session->setTemperature($temperature); 
 447                                         //Check if temperaturemin differ 
 448                                         if ($session->getTemperaturemin() !== $meteo['temperaturemin']) { 
 450                                                 $session->setTemperaturemin($meteo['temperaturemin']); 
 453                                         //Check if temperaturemax differ 
 454                                         if ($session->getTemperaturemax() !== $meteo['temperaturemax']) { 
 456                                                 $session->setTemperaturemax($meteo['temperaturemax']); 
 462                 //Flush to get the ids 
 469                 return self
::SUCCESS
; 
 475          * @return bool|void Return success or exit 
 477         function curl_init() { 
 479                 if (($this->ch 
= curl_init()) === false) { 
 481                         echo 'Curl init failed: '.curl_error($this->ch
)."\n"; 
 492                                         CURLOPT_HTTP_VERSION 
=> CURL_HTTP_VERSION_2_0
, 
 494                                         CURLOPT_HTTPHEADER 
=> [ 
 495                                                 //XXX: it seems that you can disable akamai fucking protection with Pragma: akamai-x-cache-off 
 496                                                 //XXX: see https://support.globaldots.com/hc/en-us/articles/115003996705-Akamai-Pragma-Headers-overview 
 497                                                 #'Pragma: akamai-x-cache-off', 
 498                                                 //XXX: working curl command 
 499                                                 #curl --http2 --cookie file.jar --cookie-jar file.jar -v -i -k -H 'Accept: text/html,application/xhtml+xml,application/xml;q=0.9,image/avif,image/webp,image/apng,*/*;q=0.8,application/signed-exchange;v=b3;q=0.9' -H 'Accept-Language: en-GB,en;q=0.9' -H 'Cache-Control: no-cache' -H 'Connection: keep-alive' -H 'Host: www.accuweather.com' -H 'Pragma: no-cache' -H 'Upgrade-Insecure-Requests: 1' -H 'User-Agent: Mozilla/5.0 (Windows NT 6.1; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/86.0.4240.198 Safari/537.36' 'https://www.accuweather.com/' 
 501                                                 'Accept: text/html,application/xhtml+xml,application/xml;q=0.9,image/avif,image/webp,image/apng,*/*;q=0.8,application/signed-exchange;v=b3;q=0.9', 
 502                                                 //Set accept language 
 503                                                 'Accept-Language: en-GB,en;q=0.9', 
 505                                                 'Cache-Control: no-cache', 
 506                                                 //Keep connection alive 
 507                                                 'Connection: keep-alive', 
 510                                                 //Force secure requests 
 511                                                 'Upgrade-Insecure-Requests: 1', 
 513                                                 'User-Agent: Mozilla/5.0 (Windows NT 6.1; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/86.0.4240.198 Safari/537.36', 
 514                                                 //Force akamai cookie 
 515                                                 //XXX: seems to come from http request 
 519                                         CURLOPT_COOKIEFILE 
=> '', 
 520                                         //Disable location following 
 521                                         CURLOPT_FOLLOWLOCATION 
=> false, 
 523                                         #CURLOPT_URL => $url = 'https://www.accuweather.com/', 
 525                                         CURLOPT_HEADER 
=> true, 
 527                                         CURLOPT_RETURNTRANSFER 
=> true, 
 530                                         CURLINFO_HEADER_OUT 
=> true 
 535                         echo 'Curl setopt array failed: '.curl_error($this->ch
)."\n"; 
 547          * @return string|void Return url content or exit 
 549         function curl_get($url) { 
 551                 if (curl_setopt($this->ch
, CURLOPT_URL
, $url) === false) { 
 553                         echo 'Setopt for '.$url.' failed: '.curl_error($this->ch
)."\n"; 
 556                         curl_close($this->ch
); 
 562                 //Check return status 
 563                 if (($response = curl_exec($this->ch
)) === false) { 
 565                         echo 'Get for '.$url.' failed: '.curl_error($this->ch
)."\n"; 
 567                         //Display sent headers 
 568                         var_dump(curl_getinfo($this->ch
, CURLINFO_HEADER_OUT
)); 
 574                         curl_close($this->ch
); 
 581                 if (empty($hs = curl_getinfo($this->ch
, CURLINFO_HEADER_SIZE
))) { 
 583                         echo 'Getinfo for '.$url.' failed: '.curl_error($this->ch
)."\n"; 
 585                         //Display sent headers 
 586                         var_dump(curl_getinfo($this->ch
, CURLINFO_HEADER_OUT
)); 
 592                         curl_close($this->ch
); 
 599                 if (empty($header = substr($response, 0, $hs))) { 
 601                         echo 'Header for '.$url.' empty: '.curl_error($this->ch
)."\n"; 
 603                         //Display sent headers 
 604                         var_dump(curl_getinfo($this->ch
, CURLINFO_HEADER_OUT
)); 
 610                         curl_close($this->ch
); 
 616                 //Check request success 
 617                 if (strlen($header) <= 10 || substr($header, 0, 10) !== 'HTTP/2 200') { 
 619                         echo 'Status for '.$url.' failed: '.curl_error($this->ch
)."\n"; 
 621                         //Display sent headers 
 622                         var_dump(curl_getinfo($this->ch
, CURLINFO_HEADER_OUT
)); 
 628                         curl_close($this->ch
); 
 635                 return substr($response, $hs); 
 641          * @return bool Return success or failure 
 643         function curl_close() { 
 644                 return curl_close($this->ch
);