Jacek Kowalski
2019-06-22 45b7eba2cf3654667bf79c35c5525e2674c38341
parse.php
@@ -1,43 +1,39 @@
<?php
require_once(__DIR__.'/vendor/autoload.php');
require_once(__DIR__.'/lib/database.php');
require_once(__DIR__.'/lib/fetch.php');
require_once(__DIR__.'/lib/mapper.php');
// Script-level logger. The per-source loop further down assigns a new
// 'fetch_<name>' logger to this same variable on every iteration.
$logger = new Monolog\Logger('Parse changes');
// Data sources to process, keyed by a short name that the loop below uses in
// log messages and in the per-source logger channel.
// NOTE(review): the processing loop also reads 'gtfsrt', 'gtfsrt_file' and
// 'mapper' entries that are not defined in this literal, and config.php is
// required after it -- confirm which definition of $sources is in effect.
$sources = [
   'buses' => [
      // Remote file passed to ftp_fetch_if_newer() together with 'gtfs_file'.
      'gtfs' => 'ftp://ztp.krakow.pl/VehiclePositions_A.pb',
      // Local file name for the download; the loop prefixes it with __DIR__.'/data/'.
      'gtfs_file' => 'VehiclePositions_A.pb',
      // URL passed to fetch() together with 'ttss_file'.
      'ttss' => 'http://91.223.13.70/internetservice/geoserviceDispatcher/services/vehicleinfo/vehicles',
      // Local file name for the TTSS response; also prefixed with __DIR__.'/data/'.
      'ttss_file' => 'vehicles_A.json',
      // File name handed to the Database constructor (after the data/ prefix is applied).
      'database' => 'mapping_A.sqlite3',
      // Final JSON output; written to '<result>.tmp' first and then renamed into place.
      'result' => 'mapping_A.json',
   ],
];
require_once(__DIR__.'/lib/output.php');
require_once(__DIR__.'/lib/vehicle_types.php');
require_once(__DIR__.'/config.php');
foreach($sources as $name => $source) {
   $logger = new Monolog\Logger('fetch_'.$name);
   try {
      foreach(['gtfs_file', 'ttss_file', 'database', 'result'] as $field) {
         $source[$field] = __DIR__.'/data/'.$source[$field];
      }
      $source['result_temp'] = $source['result'].'.tmp';
      $logger->info('Fetching '.$name.' position data from FTP...');
      $updated = ftp_fetch_if_newer($source['gtfs'], $source['gtfs_file']);
      $updated = ftp_fetch_if_newer($source['gtfsrt'], $source['gtfsrt_file']);
      if(!$updated) {
         $logger->info('Nothing to do, remote file not newer than local one');
         continue;
      }
      
      $logger->info('Fetching '.$name.' positions from TTSS...');
      fetch($source['ttss'],$source['ttss_file']);
      $logger->info('Fetching '.$name.' position data from TTSS...');
      fetch($source['ttss'], $source['ttss_file']);
      
      $logger->info('Loading data...');
      $mapper = new Mapper();
      $mapper->loadTTSS($source['ttss_file']);
      $mapper->loadGTFS($source['gtfs_file']);
      $timeDifference = time() - $mapper->getTTSSDate();
      if(abs($timeDifference) > 120) {
         throw new Exception('TTSS timestamp difference ('.$timeDifference.'s) is too high, aborting!');
      }
      $mapper->loadGTFSRT($source['gtfsrt_file']);
      $timeDifference = time() - $mapper->getGTFSRTDate();
      if(abs($timeDifference) > 120) {
         throw new Exception('GTFSRT timestamp difference ('.$timeDifference.'s) is too high, aborting!');
      }
      
      $db = new Database($source['database']);
      
@@ -48,58 +44,51 @@
      }
      
      $logger->info('Got offset '.$offset.', creating mapping...');
      $mapping = $mapper->getMapping($offset);
      $mapping = $mapper->mapUsingOffset($offset);
      
      $logger->info('Checking the data for correctness...');
      $weight = count($mapping);
      $replace = 0;
      $ignore = 0;
      foreach($mapping as $id => $vehicle) {
      $correct = 0;
      $incorrect = 0;
      $old = 0;
      $maxWeight = 0;
      foreach($mapping as $id => $num) {
         $dbVehicle = $db->getById($id);
         if($dbVehicle) {
            if((int)substr($vehicle['num'], 2) != (int)$dbVehicle['num']) {
               if($weight > $dbVehicle['weight']) {
                  $replace += 1;
                  $logger->warn($vehicle['num'].' voting to replace '.$dbVehicle['num'].' (same ID: '.$id.')');
               } else {
                  $ignore += 1;
                  $logger->warn($vehicle['num'].' voting to ignore '.$dbVehicle['num'].' (same ID: '.$id.')');
               }
            $maxWeight = max($maxWeight, (int)$dbVehicle['weight']);
            if($num === $dbVehicle['num']) {
               $correct += 1;
            } else {
               $incorrect += 1;
            }
            continue;
         }
         
         $dbVehicle = $db->getByNum($vehicle['num']);
         if($dbVehicle && $dbVehicle['id'] != $id) {
            $replace += 1;
            $logger->warn($vehicle['id'].' voting to replace '.$dbVehicle['id'].' (same num: '.$vehicle['num'].')');
         $dbVehicle = $db->getByNum($num);
         if($dbVehicle && $dbVehicle['id'] !== $id) {
            $old += 1;
         }
      }
      $logger->info('Weight: '.$weight.', ignore: '.$ignore.', replace: '.$replace);
      $logger->info('Weight: '.$weight.', correct: '.$correct.', incorrect: '.$incorrect.', old: '.$old);
      
      $previousMapping = NULL;
      if($ignore > 0 && $ignore >= $replace) {
      if($incorrect > $correct && $maxWeight > $weight) {
         throw new Exception('Ignoring result due to better data already present');
      } elseif($replace > 0) {
         $logger->warn('Replacing DB data with the mapping');
         $db->clear();
      } else {
         $previousMapping = @json_decode(@file_get_contents($source['result']), TRUE);
      }
      $logger->info('Creating mapping...');
      
      $db->addMapping($mapping);
      
      if(is_array($previousMapping)) {
         $logger->info('Merging previous data with current mapping');
         $mapping = $previousMapping + $mapping;
         ksort($mapping);
      }
      $finalMapping = createMapping($db, $source['mapper'], $source);
      
      $json = json_encode($mapping);
      if(!file_put_contents($source['result_temp'], $json)) {
         throw new Exception('Result save failed');
      }
      rename($source['result_temp'], $source['result']);
      $logger->info('Creating vehicle list...');
      createVehiclesList($mapper->getTTSSTrips(), $finalMapping, $source);
      $logger->info('Finished');
   } catch(Throwable $e) {
      $logger->error($e->getMessage(), ['exception' => $e, 'exception_string' => (string)$e]);