[Kraken] Fix aging problem when both kirin & chaos are active #3909

Merged: 8 commits, merged on Jan 18, 2023

Changes from 2 commits
23 changes: 14 additions & 9 deletions source/kraken/apply_disruption.cpp
@@ -98,6 +98,14 @@ nt::VehicleJourney* create_vj_from_old_vj(nt::MetaVehicleJourney* mvj,
     return new_vj;
 }
 
+std::string make_new_vj_uri(const std::string& mvj_uri,
+                            nt::RTLevel rt_level,
+                            int nb_rt_vj,
+                            const std::string& disruption_uri) {
+    return "vehicle_journey:" + mvj_uri + ":" + type::get_string_from_rt_level(rt_level) + ":"
+           + std::to_string(nb_rt_vj) + ":" + disruption_uri;
+}
+
 struct apply_impacts_visitor : public boost::static_visitor<> {
     boost::shared_ptr<nt::disruption::Impact> impact;
     nt::PT_Data& pt_data;
@@ -152,7 +160,7 @@ struct apply_impacts_visitor : public boost::static_visitor<> {
         // we cannot ensure that all VJ of a MetaVJ are on the same route,
         // and since we want all actions to operate on MetaVJ, we collect all MetaVJ of the route
         // (but we'll change only the route's vj)
-        std::set<nt::MetaVehicleJourney*> mvjs;
+        std::unordered_set<nt::MetaVehicleJourney*> mvjs;
         route->for_each_vehicle_journey([&mvjs](nt::VehicleJourney& vj) {
             mvjs.insert(vj.meta_vj);
             return true;
@@ -318,8 +326,8 @@ struct add_impacts_visitor : public apply_impacts_visitor {
         }
 
         auto nb_rt_vj = mvj->get_rt_vj().size();
-        std::string new_vj_uri =
-            "vehicle_journey:" + mvj->uri + ":modified:" + std::to_string(nb_rt_vj) + ":" + impact->disruption->uri;
+        auto new_vj_uri = make_new_vj_uri(mvj->uri, rt_level, nb_rt_vj, impact->disruption->uri);
 
         std::vector<type::StopTime> stoptimes;  // we copy all the stoptimes
         for (const auto& stu : impact->aux_info.stop_times) {
             stoptimes.push_back(stu.stop_time);
@@ -491,8 +499,7 @@ struct add_impacts_visitor : public apply_impacts_visitor {
                 continue;
             }
             auto nb_rt_vj = mvj->get_vjs_at(rt_level).size();
-            std::string new_vj_uri = vj->uri + ":" + type::get_string_from_rt_level(rt_level) + ":"
-                                     + std::to_string(nb_rt_vj) + ":" + impact->disruption->uri;
+            auto new_vj_uri = make_new_vj_uri(mvj->uri, rt_level, nb_rt_vj, impact->disruption->uri);
 
             new_vp.days = new_vp.days & (vj->validity_patterns[rt_level]->days >> vj->shift);
 
@@ -560,8 +567,7 @@ struct add_impacts_visitor : public apply_impacts_visitor {
                 continue;
             }
             auto nb_rt_vj = mvj->get_vjs_at(rt_level).size();
-            std::string new_vj_uri = vj->uri + ":" + type::get_string_from_rt_level(rt_level) + ":"
-                                     + std::to_string(nb_rt_vj) + ":" + impact->disruption->uri;
+            auto new_vj_uri = make_new_vj_uri(mvj->uri, rt_level, nb_rt_vj, impact->disruption->uri);
 
             new_vp.days = new_vp.days & (vj->validity_patterns[rt_level]->days >> vj->shift);
 
@@ -716,8 +722,7 @@ struct add_impacts_visitor : public apply_impacts_visitor {
             mvj->push_unique_impact(impact);
 
             auto nb_rt_vj = mvj->get_vjs_at(rt_level).size();
-            std::string new_vj_uri = "vehicle_journey:" + mvj->uri + ":" + type::get_string_from_rt_level(rt_level)
-                                     + ":" + std::to_string(nb_rt_vj) + concatenate_impact_uris(*mvj);
+            auto new_vj_uri = make_new_vj_uri(mvj->uri, rt_level, nb_rt_vj, impact->disruption->uri);
 
             new_vp.days = new_vp.days & (vj->validity_patterns[rt_level]->days >> vj->shift);
 
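A plausible reading of the refactor above (the diff itself doesn't spell it out): two of the old call sites seeded the new URI from vj->uri, which for a realtime VJ is itself an already generated "vehicle_journey:..." URI, and one appended concatenate_impact_uris(*mvj), so URIs could keep growing while kirin and chaos updates alternated on the same MetaVJ. make_new_vj_uri now seeds every call site from the stable MetaVJ URI. An illustrative, self-contained sketch of the difference; all helper names and URI values below are made up:

#include <iostream>
#include <string>

// old_style mimics seeding from the previous VJ's uri: each update builds on
// the last generated uri, so the string grows with every realtime update.
std::string old_style(const std::string& base_vj_uri, int n, const std::string& disruption) {
    return base_vj_uri + ":realtime:" + std::to_string(n) + ":" + disruption;
}

// new_style mimics make_new_vj_uri: always derived from the stable MetaVJ uri.
std::string new_style(const std::string& mvj_uri, int n, const std::string& disruption) {
    return "vehicle_journey:" + mvj_uri + ":realtime:" + std::to_string(n) + ":" + disruption;
}

int main() {
    std::string vj_uri = "vehicle_journey:vj:1";
    vj_uri = old_style(vj_uri, 0, "d1");  // vehicle_journey:vj:1:realtime:0:d1
    vj_uri = old_style(vj_uri, 1, "d2");  // vehicle_journey:vj:1:realtime:0:d1:realtime:1:d2
    std::cout << vj_uri << "\n";          // keeps growing with each update

    std::cout << new_style("mvj:1", 1, "d2") << "\n";  // vehicle_journey:mvj:1:realtime:1:d2
}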
12 changes: 11 additions & 1 deletion source/kraken/configuration.cpp
@@ -92,7 +92,9 @@ po::options_description get_options_description(const boost::optional<std::strin
     ("BROKER.vhost", po::value<std::string>()->default_value("/"), "vhost for rabbitmq")
     ("BROKER.exchange", po::value<std::string>()->default_value("navitia"), "exchange used in rabbitmq")
     ("BROKER.rt_topics", po::value<std::vector<std::string>>(), "list of realtime topics for this instance")
-    ("BROKER.timeout", po::value<int>()->default_value(100), "timeout for maintenance worker, in milliseconds")
+    ("BROKER.timeout", po::value<int>()->default_value(200), "timeout for maintenance worker, in milliseconds")
+    ("BROKER.max_batch_nb", po::value<int>()->default_value(5000), "max number of realtime messages consumed in one batch")
+    ("BROKER.retrieving_timeout", po::value<int>()->default_value(10000), "max duration, in milliseconds, the worker may spend retrieving messages")
     ("BROKER.sleeptime", po::value<int>()->default_value(1), "sleeptime for maintenance worker, in seconds")
     ("BROKER.reconnect_wait", po::value<int>()->default_value(1), "wait duration between connection attempts to rabbitmq, in seconds")
     ("BROKER.queue", po::value<std::string>(), "rabbitmq's queue name to be bound")
@@ -232,6 +234,14 @@ int Configuration::broker_timeout() const {
     return vm["BROKER.timeout"].as<int>();
 }
 
+int Configuration::retrieving_timeout() const {
+    return vm["BROKER.retrieving_timeout"].as<int>();
+}
+
+int Configuration::broker_max_batch_nb() const {
+    return vm["BROKER.max_batch_nb"].as<int>();
+}
+
 int Configuration::broker_sleeptime() const {
     return vm["BROKER.sleeptime"].as<int>();
 }
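For operators, a hypothetical kraken INI excerpt wiring up the new knobs. The key names and defaults come from get_options_description above; the file layout and the surrounding host/port keys are illustrative assumptions, not taken from this PR:

[BROKER]
host = localhost
port = 5672
# per-message polling timeout for the maintenance worker, in milliseconds
# (default raised from 100 to 200 in this PR)
timeout = 200
# new in this PR: cap on the number of realtime messages consumed in one batch
max_batch_nb = 5000
# new in this PR: upper bound, in milliseconds, on the time spent retrieving one batch
retrieving_timeout = 10000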
2 changes: 2 additions & 0 deletions source/kraken/configuration.h
@@ -64,6 +64,8 @@ class Configuration {
     bool broker_queue_auto_delete() const;
     int broker_queue_expire() const;
     int broker_timeout() const;
+    int retrieving_timeout() const;
+    int broker_max_batch_nb() const;
     int broker_sleeptime() const;
     int broker_reconnect_wait() const;
     bool is_realtime_enabled() const;
17 changes: 14 additions & 3 deletions source/kraken/maintenance_worker.cpp
@@ -43,6 +43,7 @@ www.navitia.io
 #include <boost/algorithm/string/join.hpp>
 #include <boost/optional.hpp>
 #include <boost/thread/thread.hpp>
+#include <boost/range/adaptor/reversed.hpp>
 
 #include <chrono>
 #include <csignal>
@@ -364,7 +365,9 @@ void MaintenanceWorker::handle_rt_in_batch(const std::vector<AmqpClient::Envelop
     pt::ptime begin = pt::microsec_clock::universal_time();
     bool autocomplete_rebuilding_activated = false;
     auto rt_action = RTAction::chaos;
-    for (auto& envelope : envelopes) {
+
+    std::unordered_set<std::string> applied_visited_id;
+    for (auto& envelope : boost::adaptors::reverse(envelopes)) {
         const auto routing_key = envelope->RoutingKey();
         LOG4CPLUS_DEBUG(logger, "realtime info received from " << routing_key);
         assert(envelope);
@@ -375,6 +378,10 @@
         }
         LOG4CPLUS_TRACE(logger, "received entity: " << feed_message.DebugString());
         for (const auto& entity : feed_message.entity()) {
+            auto res = applied_visited_id.insert(entity.id());
+            if (!res.second) {
+                continue;
+            }
Contributor:

Suggested change:
     auto res = applied_visited_id.insert(entity.id());
+    // a newer disruption with the same id has already been seen, so we can ignore this one
     if (!res.second) {
         continue;
     }
I am a bit worried about this "ignore disruptions whose id has already been seen":

  • Do we receive kirin disruptions with the same id? When that happens, are we sure we only need to take the last one into account? Can we have two disruptions with the same id that affect different VJs? poke @pbougue
  • What about chaos disruptions? In particular, when we cancel a disruption, don't we get the same id twice?

pbougue (Contributor), Jan 18, 2023:
This may deserve a code comment, as the three of us asked ourselves the same question 😃

  • For kirin, it is guaranteed that the entity ID is the same only when the VJ is the same, and that taking only the last message in the queue is valid.
    Details: this is actually less clear-cut with parallelism on kirin, but the guarantee is that it will be as good as it was (nothing else can currently be used to decide which message is the last one). Actually, even with parallelism it is guaranteed (there is no concurrent processing of the same VJ in Kirin).
    💡 This may deserve a comment in https://github.com/hove-io/chaos-proto/blob/master/kirin_proto_doc.rs ? (I can have a shot at it if you agree.)

  • For chaos, this was discussed with the chaos team and seemed OK, but I don't know about that particular case; I'll let @xlqian reply if he knows.

pbench (Contributor), Jan 18, 2023:
Alright, if this has been checked it sounds good to me.
I do agree that some comments (here and in the proto doc) explaining this would be useful.

> For kirin, it is guaranteed that the entity ID is the same only when the VJ is the same

Same VJ and same date?

Contributor:
Yes, same VJ and same date 👍

✅ I'll try to add a little something into kirin_proto_doc.rs

xlqian (Member, Author), Jan 18, 2023:
@pbench Now I'm having second thoughts because of your comment, and after thinking it through I believe I made a mistake...
@pbougue I'm going to remove this trick (reversing the vector) from this PR and open another PR to tackle the problem, so that if I messed it up we don't have to revert the whole thing.

Contributor:
We also have to reverse the order of the entities within each message to be sure we still get the same result (although it would be weird for someone to send the same entity multiple times in one message).

Contributor:
After discussion: this was reverted from this PR because of uncertainty around chaos.
Tracked in JIRA https://navitia.atlassian.net/browse/NAV-1878

         if (!data) {
             pt::ptime copy_begin = pt::microsec_clock::universal_time();
             data = data_manager.get_data_clone();
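For readers following the thread above: the (later reverted) deduplication walks the batch newest-first and keeps only the first occurrence of each entity id, i.e. a last-wins policy. A minimal self-contained sketch of that idea, using made-up entity and payload types rather than kraken's protobuf ones:

#include <boost/range/adaptor/reversed.hpp>
#include <iostream>
#include <string>
#include <unordered_set>
#include <vector>

struct Entity {
    std::string id;
    std::string payload;
};

int main() {
    // Oldest to newest, in the order they were consumed from the queue.
    std::vector<Entity> entities = {
        {"vj:1", "delay 5 min"}, {"vj:2", "cancel"}, {"vj:1", "delay 10 min"}};

    std::unordered_set<std::string> applied_visited_id;
    // Walk newest-first: the first time an id shows up is its most recent update,
    // so any later (i.e. older) occurrence of the same id is skipped.
    for (const auto& entity : boost::adaptors::reverse(entities)) {
        if (!applied_visited_id.insert(entity.id).second) {
            continue;  // an older update for an id that was already applied
        }
        std::cout << entity.id << " -> " << entity.payload << "\n";
    }
    // Prints "vj:1 -> delay 10 min" then "vj:2 -> cancel"; the older
    // "delay 5 min" update for vj:1 is ignored.
}

Applying newest-first is only safe if a later message fully supersedes an earlier one with the same id, which is exactly the kirin guarantee discussed above and the open question for chaos.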
@@ -452,7 +459,11 @@ std::vector<AmqpClient::Envelope::ptr_t> MaintenanceWorker::consume_in_batch(con
     std::vector<AmqpClient::Envelope::ptr_t> envelopes;
     envelopes.reserve(max_nb);
     size_t consumed_nb = 0;
-    while (consumed_nb < max_nb) {
+    auto begin = pt::microsec_clock::universal_time();
+
+    auto retrieving_timeout = conf.retrieving_timeout();
+    while (consumed_nb < max_nb
+           && (pt::microsec_clock::universal_time() - begin).total_milliseconds() < retrieving_timeout) {
         AmqpClient::Envelope::ptr_t envelope{};
 
         /* !
@@ -499,7 +510,7 @@ void MaintenanceWorker::listen_rabbitmq() {
 
     // Arbitrary number: we suppose that disruptions can be handled very quickly, so that,
     // in theory, we can also handle a batch of 5000 disruptions very quickly.
-    size_t max_batch_nb = 5000;
+    size_t max_batch_nb = conf.broker_max_batch_nb();
 
     try {
         auto rt_envelopes = consume_in_batch(rt_tag, max_batch_nb, timeout_ms, no_ack);
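A plausible back-of-the-envelope reading of how the new bound limits the "aging" in the PR title, assuming each consume call in the loop may wait up to BROKER.timeout for one message:

  • Before: the batch loop stops only after max_batch_nb messages, so with a slow but steady producer it could spin for up to 5000 × 200 ms ≈ 16 minutes (with the new defaults) before anything is applied, while the loaded data keeps aging.
  • After: the same loop is additionally capped by BROKER.retrieving_timeout (10 000 ms by default), so a batch is handed to handle_rt_in_batch at least every ~10 seconds regardless of how messages trickle in.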