[Author Prev][Author Next][Thread Prev][Thread Next][Author Index][Thread Index]

[tor-commits] [sbws/master] Merge branch 'ticket28565_rebased'



commit f9df7658807b51434b93570add232b3becd0797f
Merge: 3db367b 127cf46
Author: juga0 <juga@xxxxxxxxxx>
Date:   Thu Mar 21 12:46:01 2019 +0000

    Merge branch 'ticket28565_rebased'

 sbws/lib/v3bwfile.py            | 130 +++++++++++++++++++++++++++++++---------
 tests/unit/lib/test_v3bwfile.py |  44 +++++++++++---
 2 files changed, 139 insertions(+), 35 deletions(-)

diff --cc sbws/lib/v3bwfile.py
index 61657b9,e6dcde1..6a433d0
--- a/sbws/lib/v3bwfile.py
+++ b/sbws/lib/v3bwfile.py
@@@ -67,19 -89,7 +89,9 @@@ BW_HEADER_KEYVALUES_MONITOR = 
      # something else we don't know yet
      # So far is the number of ResultError
      'recent_measurement_failure_count',
-     # The number of success results should be:
-     # the number of attempts - the number of failures
-     # 4.6 header: the number of successful results, created in the last 5 days,
-     # that were excluded by a filter
-     # This is the sum of the following 3 + not success results
-     # 'recent_measurement_exclusion_count',
-     'recent_measurement_exclusion_not_distanciated_count',
-     'recent_measurement_exclusion_not_recent_count',
-     'recent_measurement_exclusion_not_min_num_count',
- 
 +    # The time it took to report about half of the network.
 +    'time_to_report_half_network',
- ]
+ ] + BW_HEADER_KEYVALUES_RECENT_MEASUREMENTS_EXCLUDED
  BANDWIDTH_HEADER_KEY_VALUES_INIT = \
      ['earliest_bandwidth', 'generator_started',
       'scanner_country', 'destinations_countries']\
@@@ -435,59 -453,15 +455,68 @@@ class V3BWHeader(object)
          [setattr(self, k, str(v)) for k, v in kwargs.items()
           if k in STATS_KEYVALUES]
  
 +    def add_time_report_half_network(self):
 +        """Add to the header the time it took to measure half of the network.
 +
 +        It is not the time the scanner actually takes on measuring all the
 +        network, but the ``number_eligible_relays`` that are reported in the
 +        bandwidth file and directory authorities will vote on.
 +
 +        This is calculated for half of the network, so that failed or not
 +        reported relays do not affect too much.
 +
 +        For instance, if there are 6500 relays in the network, half of the
 +        network would be 3250. And if there were 4000 eligible relays
 +        measured in an interval of 3 days, the time to measure half of the
 +        network would be 3 days * 3250 / 4000.
 +
 +        Since the elapsed time is calculated from the earliest and the
 +        latest measurement and a relay might have more than 2 measurements,
 +        this would give an estimate on how long it would take to measure
 +        the network including all the valid measurements.
 +
 +        Log also an estimated on how long it would take with the current
 +        number of relays included in the bandwidth file.
 +        """
 +        # NOTE: in future refactor do not convert attributes to str until
 +        # writing to the file, so that they do not need to be converted back
 +        # to do some calculations.
 +        elapsed_time = (
 +            (isostr_to_dt_obj(self.latest_bandwidth)
 +             - isostr_to_dt_obj(self.earliest_bandwidth))
 +            .total_seconds())
 +
 +        # This attributes were added later and some tests that
 +        # do not initialize them would fail.
 +        eligible_relays = int(getattr(self, 'number_eligible_relays', 0))
 +        consensus_relays = int(getattr(self, 'number_consensus_relays', 0))
 +        if not(eligible_relays and consensus_relays):
 +            return
 +
 +        half_network = consensus_relays / 2
 +        # Calculate the time it would take to measure half of the network
 +        if eligible_relays >= half_network:
 +            time_half_network = round(
 +                elapsed_time * half_network / eligible_relays
 +            )
 +            self.time_to_report_half_network = str(time_half_network)
 +
 +        # In any case log an estimated on the time to measure all the network.
 +        estimated_time = round(
 +            elapsed_time * consensus_relays / eligible_relays
 +        )
 +        log.info("Estimated time to measure the network: %s hours.",
 +                 round(estimated_time / 60 / 60))
 +
+     def add_relays_excluded_counters(self, exclusion_dict):
+         """
+         Add the monitoring KeyValues to the header about the number of
+         relays not included because they were not ``eligible``.
+         """
+         log.debug("Adding relays excluded counters.")
+         for k, v in exclusion_dict.items():
+             setattr(self, k, str(v))
+ 
  
  class V3BWLine(object):
      """



_______________________________________________
tor-commits mailing list
tor-commits@xxxxxxxxxxxxxxxxxxxx
https://lists.torproject.org/cgi-bin/mailman/listinfo/tor-commits