[tor-commits] [chutney/master] Move network tests to separate Python files

teor at torproject.org teor at torproject.org
Sat Jul 2 10:01:04 UTC 2016


commit 14bb7b862174734fced8fc290d33ffb377d1df49
Author: cypherpunks <cypherpunks at torproject.org>
Date:   Fri Jul 1 13:32:49 2016 +0000

    Move network tests to separate Python files
    
    Based on a patch from chobe.
    
    Closes ticket 9087.
---
 README                            |   5 +
 chutney                           |   2 +-
 lib/chutney/TorNet.py             | 219 +++++---------------------------------
 scripts/chutney_tests/__init__.py |   0
 scripts/chutney_tests/verify.py   | 203 +++++++++++++++++++++++++++++++++++
 5 files changed, 233 insertions(+), 196 deletions(-)

diff --git a/README b/README
index e0eb457..d11da52 100644
--- a/README
+++ b/README
@@ -69,3 +69,8 @@ The working files:
 
   You can override the directory "./net" with the CHUTNEY_DATA_DIR
   environment variable.
+
+Test scripts:
+  The test scripts are stored in the "scripts/chutney_tests" directory. These
+  Python files must define a "run_test(network)" function. Files starting with
+  an underscore ("_") are ignored.
diff --git a/chutney b/chutney
index 2076185..da8d97d 100755
--- a/chutney
+++ b/chutney
@@ -3,7 +3,7 @@
 set -o errexit
 set -o nounset
 
-export PYTHONPATH="$(dirname "${0}")/lib:${PYTHONPATH-}"
+export PYTHONPATH="$(dirname "${0}")/lib:$(dirname "${0}")/scripts:${PYTHONPATH-}"
 
 binaries="python2 python"
 
diff --git a/lib/chutney/TorNet.py b/lib/chutney/TorNet.py
index a952944..87c5dab 100644
--- a/lib/chutney/TorNet.py
+++ b/lib/chutney/TorNet.py
@@ -19,6 +19,7 @@ import re
 import errno
 import time
 import shutil
+import importlib
 
 import chutney.Templating
 import chutney.Traffic
@@ -903,199 +904,6 @@ class Network(object):
             for c in controllers:
                 c.check(listNonRunning=False)
 
-    def verify(self):
-        print("Verifying data transmission:")
-        status = self._verify_traffic()
-        print("Transmission: %s" % ("Success" if status else "Failure"))
-        if not status:
-            # TODO: allow the debug flag to be passed as an argument to
-            # src/test/test-network.sh and chutney
-            print("Set 'debug_flag = True' in Traffic.py to diagnose.")
-        return status
-
-    def _verify_traffic(self):
-        """Verify (parts of) the network by sending traffic through it
-        and verify what is received."""
-        LISTEN_PORT = 4747  # FIXME: Do better! Note the default exit policy.
-        # HSs must have a HiddenServiceDir with
-        # "HiddenServicePort <HS_PORT> <CHUTNEY_LISTEN_ADDRESS>:<LISTEN_PORT>"
-        HS_PORT = 5858
-        # The amount of data to send between each source-sink pair,
-        # each time the source connects.
-        # We create a source-sink pair for each (bridge) client to an exit,
-        # and a source-sink pair for a (bridge) client to each hidden service
-        DATALEN = self._dfltEnv['data_bytes']
-        # Print a dot each time a sink verifies this much data
-        DOTDATALEN = 5 * 1024 * 1024  # Octets.
-        TIMEOUT = 3                   # Seconds.
-        # Calculate the amount of random data we should use
-        randomlen = self._calculate_randomlen(DATALEN)
-        reps = self._calculate_reps(DATALEN, randomlen)
-        # sanity check
-        if reps == 0:
-            DATALEN = 0
-        # Get the random data
-        if randomlen > 0:
-            # print a dot after every DOTDATALEN data is verified, rounding up
-            dot_reps = self._calculate_reps(DOTDATALEN, randomlen)
-            # make sure we get at least one dot per transmission
-            dot_reps = min(reps, dot_reps)
-            with open('/dev/urandom', 'r') as randfp:
-                tmpdata = randfp.read(randomlen)
-        else:
-            dot_reps = 0
-            tmpdata = {}
-        # now make the connections
-        bind_to = (DEFAULTS['ip'], LISTEN_PORT)
-        tt = chutney.Traffic.TrafficTester(bind_to, tmpdata, TIMEOUT, reps,
-                                           dot_reps)
-        client_list = filter(lambda n:
-                             n._env['tag'] == 'c' or n._env['tag'] == 'bc',
-                             self._nodes)
-        exit_list = filter(lambda n:
-                           ('exit' in n._env.keys()) and n._env['exit'] == 1,
-                           self._nodes)
-        hs_list = filter(lambda n:
-                         n._env['tag'] == 'h',
-                         self._nodes)
-        if len(client_list) == 0:
-            print("  Unable to verify network: no client nodes available")
-            return False
-        if len(exit_list) == 0 and len(hs_list) == 0:
-            print("  Unable to verify network: no exit/hs nodes available")
-            print("  Exit nodes must be declared 'relay=1, exit=1'")
-            print("  HS nodes must be declared 'tag=\"hs\"'")
-            return False
-        print("Connecting:")
-        # the number of tor nodes in paths which will send DATALEN data
-        # if a node is used in two paths, we count it twice
-        # this is a lower bound, as cannabilised circuits are one node longer
-        total_path_node_count = 0
-        total_path_node_count += self._configure_exits(tt, bind_to, tmpdata,
-                                                       reps, client_list,
-                                                       exit_list, LISTEN_PORT)
-        total_path_node_count += self._configure_hs(tt, tmpdata, reps,
-                                                    client_list, hs_list,
-                                                    HS_PORT, LISTEN_PORT)
-        print("Transmitting Data:")
-        start_time = time.clock()
-        status = tt.run()
-        end_time = time.clock()
-        # if we fail, don't report the bandwidth
-        if not status:
-            return status
-        # otherwise, report bandwidth used, if sufficient data was transmitted
-        self._report_bandwidth(DATALEN, total_path_node_count,
-                               start_time, end_time)
-        return status
-
-    # In order to performance test a tor network, we need to transmit
-    # several hundred megabytes of data or more. Passing around this
-    # much data in Python has its own performance impacts, so we provide
-    # a smaller amount of random data instead, and repeat it to DATALEN
-    def _calculate_randomlen(self, datalen):
-        MAX_RANDOMLEN = 128 * 1024   # Octets.
-        if datalen > MAX_RANDOMLEN:
-            return MAX_RANDOMLEN
-        else:
-            return datalen
-
-    def _calculate_reps(self, datalen, replen):
-        # sanity checks
-        if datalen == 0 or replen == 0:
-            return 0
-        # effectively rounds datalen up to the nearest replen
-        if replen < datalen:
-            return (datalen + replen - 1) / replen
-        else:
-            return 1
-
-    # if there are any exits, each client / bridge client transmits
-    # via 4 nodes (including the client) to an arbitrary exit
-    # Each client binds directly to <CHUTNEY_LISTEN_ADDRESS>:LISTEN_PORT
-    # via an Exit relay
-    def _configure_exits(self, tt, bind_to, tmpdata, reps, client_list,
-                         exit_list, LISTEN_PORT):
-        CLIENT_EXIT_PATH_NODES = 4
-        connection_count = self._dfltEnv['connection_count']
-        exit_path_node_count = 0
-        if len(exit_list) > 0:
-            exit_path_node_count += (len(client_list) *
-                                     CLIENT_EXIT_PATH_NODES *
-                                     connection_count)
-            for op in client_list:
-                print("  Exit to %s:%d via client %s:%s"
-                      % (DEFAULTS['ip'], LISTEN_PORT,
-                         'localhost', op._env['socksport']))
-                for i in range(connection_count):
-                    proxy = ('localhost', int(op._env['socksport']))
-                    tt.add(chutney.Traffic.Source(tt, bind_to, tmpdata, proxy,
-                                                  reps))
-        return exit_path_node_count
-
-    # The HS redirects .onion connections made to hs_hostname:HS_PORT
-    # to the Traffic Tester's CHUTNEY_LISTEN_ADDRESS:LISTEN_PORT
-    # an arbitrary client / bridge client transmits via 8 nodes
-    # (including the client and hs) to each hidden service
-    # Instead of binding directly to LISTEN_PORT via an Exit relay,
-    # we bind to hs_hostname:HS_PORT via a hidden service connection
-    def _configure_hs(self, tt, tmpdata, reps, client_list, hs_list, HS_PORT,
-                      LISTEN_PORT):
-        CLIENT_HS_PATH_NODES = 8
-        connection_count = self._dfltEnv['connection_count']
-        hs_path_node_count = (len(hs_list) * CLIENT_HS_PATH_NODES *
-                              connection_count)
-        # Each client in hs_client_list connects to each hs
-        if self._dfltEnv['hs_multi_client']:
-            hs_client_list = client_list
-            hs_path_node_count *= len(client_list)
-        else:
-            # only use the first client in the list
-            hs_client_list = client_list[:1]
-        # Setup the connections from each client in hs_client_list to each hs
-        for hs in hs_list:
-            hs_bind_to = (hs._env['hs_hostname'], HS_PORT)
-            for client in hs_client_list:
-                print("  HS to %s:%d (%s:%d) via client %s:%s"
-                      % (hs._env['hs_hostname'], HS_PORT,
-                         DEFAULTS['ip'], LISTEN_PORT,
-                         'localhost', client._env['socksport']))
-                for i in range(connection_count):
-                    proxy = ('localhost', int(client._env['socksport']))
-                    tt.add(chutney.Traffic.Source(tt, hs_bind_to, tmpdata,
-                                                  proxy, reps))
-        return hs_path_node_count
-
-    # calculate the single stream bandwidth and overall tor bandwidth
-    # the single stream bandwidth is the bandwidth of the
-    # slowest stream of all the simultaneously transmitted streams
-    # the overall bandwidth estimates the simultaneous bandwidth between
-    # all tor nodes over all simultaneous streams, assuming:
-    # * minimum path lengths (no cannibalized circuits)
-    # * unlimited network bandwidth (that is, localhost)
-    # * tor performance is CPU-limited
-    # This be used to estimate the bandwidth capacity of a CPU-bound
-    # tor relay running on this machine
-    def _report_bandwidth(self, data_length, total_path_node_count,
-                          start_time, end_time):
-        # otherwise, if we sent at least 5 MB cumulative total, and
-        # it took us at least a second to send, report bandwidth
-        MIN_BWDATA = 5 * 1024 * 1024  # Octets.
-        MIN_ELAPSED_TIME = 1.0        # Seconds.
-        cumulative_data_sent = total_path_node_count * data_length
-        elapsed_time = end_time - start_time
-        if (cumulative_data_sent >= MIN_BWDATA and
-                elapsed_time >= MIN_ELAPSED_TIME):
-            # Report megabytes per second
-            BWDIVISOR = 1024*1024
-            single_stream_bandwidth = (data_length / elapsed_time / BWDIVISOR)
-            overall_bandwidth = (cumulative_data_sent / elapsed_time /
-                                 BWDIVISOR)
-            print("Single Stream Bandwidth: %.2f MBytes/s"
-                  % single_stream_bandwidth)
-            print("Overall tor Bandwidth: %.2f MBytes/s"
-                  % overall_bandwidth)
-
 
 def ConfigureNodes(nodelist):
     network = _THE_NETWORK
@@ -1106,11 +914,22 @@ def ConfigureNodes(nodelist):
             network._dfltEnv['hasbridgeauth'] = True
 
 
+def getTests():
+    tests = []
+    for x in os.listdir("scripts/chutney_tests/"):
+        if not x.startswith("_") and os.path.splitext(x)[1] == ".py":
+            tests.append(os.path.splitext(x)[0])
+    return tests
+
+
 def usage(network):
-    return "\n".join(["Usage: chutney {command} {networkfile}",
+    return "\n".join(["Usage: chutney {command/test} {networkfile}",
                       "Known commands are: %s" % (
                           " ".join(x for x in dir(network)
-                                   if not x.startswith("_")))])
+                                   if not x.startswith("_"))),
+                      "Known tests are: %s" % (
+                          " ".join(getTests()))
+                      ])
 
 
 def exit_on_error(err_msg):
@@ -1128,6 +947,16 @@ def runConfigFile(verb, data):
     exec(data, _GLOBALS)
     network = _GLOBALS['_THE_NETWORK']
 
+    # let's check if the verb is a valid test and run it
+    if verb in getTests():
+        test_module = importlib.import_module("chutney_tests.{}".format(verb))
+        try:
+            return test_module.run_test(network)
+        except AttributeError:
+            print("Test {!r} has no 'run_test(network)' function".format(verb))
+            return False
+
+    # tell the user we don't know what their verb meant
     if not hasattr(network, verb):
         print(usage(network))
         print("Error: I don't know how to %s." % verb)
diff --git a/scripts/chutney_tests/__init__.py b/scripts/chutney_tests/__init__.py
new file mode 100644
index 0000000..e69de29
diff --git a/scripts/chutney_tests/verify.py b/scripts/chutney_tests/verify.py
new file mode 100644
index 0000000..480cf97
--- /dev/null
+++ b/scripts/chutney_tests/verify.py
@@ -0,0 +1,203 @@
+import time
+import chutney
+
+
+def run_test(network):
+    print("Verifying data transmission:")
+    status = _verify_traffic(network)
+    print("Transmission: %s" % ("Success" if status else "Failure"))
+    if not status:
+        # TODO: allow the debug flag to be passed as an argument to
+        # src/test/test-network.sh and chutney
+        print("Set 'debug_flag = True' in Traffic.py to diagnose.")
+    return status
+
+
+def _verify_traffic(network):
+    """Verify (parts of) the network by sending traffic through it
+    and verify what is received."""
+    LISTEN_ADDR = network._dfltEnv['ip']
+    LISTEN_PORT = 4747  # FIXME: Do better! Note the default exit policy.
+    # HSs must have a HiddenServiceDir with
+    # "HiddenServicePort <HS_PORT> <CHUTNEY_LISTEN_ADDRESS>:<LISTEN_PORT>"
+    HS_PORT = 5858
+    # The amount of data to send between each source-sink pair,
+    # each time the source connects.
+    # We create a source-sink pair for each (bridge) client to an exit,
+    # and a source-sink pair for a (bridge) client to each hidden service
+    DATALEN = network._dfltEnv['data_bytes']
+    # Print a dot each time a sink verifies this much data
+    DOTDATALEN = 5 * 1024 * 1024  # Octets.
+    TIMEOUT = 3                   # Seconds.
+    # Calculate the amount of random data we should use
+    randomlen = _calculate_randomlen(DATALEN)
+    reps = _calculate_reps(DATALEN, randomlen)
+    connection_count = network._dfltEnv['connection_count']
+    # sanity check
+    if reps == 0:
+        DATALEN = 0
+    # Get the random data
+    if randomlen > 0:
+        # print a dot after every DOTDATALEN data is verified, rounding up
+        dot_reps = _calculate_reps(DOTDATALEN, randomlen)
+        # make sure we get at least one dot per transmission
+        dot_reps = min(reps, dot_reps)
+        with open('/dev/urandom', 'r') as randfp:
+            tmpdata = randfp.read(randomlen)
+    else:
+        dot_reps = 0
+        tmpdata = {}
+    # now make the connections
+    bind_to = (LISTEN_ADDR, LISTEN_PORT)
+    tt = chutney.Traffic.TrafficTester(bind_to, tmpdata, TIMEOUT, reps,
+                                       dot_reps)
+    client_list = filter(lambda n:
+                         n._env['tag'] == 'c' or n._env['tag'] == 'bc',
+                         network._nodes)
+    exit_list = filter(lambda n:
+                       ('exit' in n._env.keys()) and n._env['exit'] == 1,
+                       network._nodes)
+    hs_list = filter(lambda n:
+                     n._env['tag'] == 'h',
+                     network._nodes)
+    if len(client_list) == 0:
+        print("  Unable to verify network: no client nodes available")
+        return False
+    if len(exit_list) == 0 and len(hs_list) == 0:
+        print("  Unable to verify network: no exit/hs nodes available")
+        print("  Exit nodes must be declared 'relay=1, exit=1'")
+        print("  HS nodes must be declared 'tag=\"hs\"'")
+        return False
+    print("Connecting:")
+    # the number of tor nodes in paths which will send DATALEN data
+    # if a node is used in two paths, we count it twice
+    # this is a lower bound, as cannibalized circuits are one node longer
+    total_path_node_count = 0
+    total_path_node_count += _configure_exits(tt, bind_to, tmpdata, reps,
+                                              client_list, exit_list,
+                                              LISTEN_ADDR, LISTEN_PORT,
+                                              connection_count)
+    total_path_node_count += _configure_hs(tt, tmpdata, reps, client_list,
+                                           hs_list, HS_PORT, LISTEN_ADDR,
+                                           LISTEN_PORT, connection_count,
+                                           network._dfltEnv['hs_multi_client'])
+    print("Transmitting Data:")
+    start_time = time.clock()
+    status = tt.run()
+    end_time = time.clock()
+    # if we fail, don't report the bandwidth
+    if not status:
+        return status
+    # otherwise, report bandwidth used, if sufficient data was transmitted
+    _report_bandwidth(DATALEN, total_path_node_count, start_time, end_time)
+    return status
+
+
+# In order to performance test a tor network, we need to transmit
+# several hundred megabytes of data or more. Passing around this
+# much data in Python has its own performance impacts, so we provide
+# a smaller amount of random data instead, and repeat it to DATALEN
+def _calculate_randomlen(datalen):
+    MAX_RANDOMLEN = 128 * 1024   # Octets.
+    if datalen > MAX_RANDOMLEN:
+        return MAX_RANDOMLEN
+    else:
+        return datalen
+
+
+def _calculate_reps(datalen, replen):
+    # sanity checks
+    if datalen == 0 or replen == 0:
+        return 0
+    # effectively rounds datalen up to the nearest replen
+    if replen < datalen:
+        return (datalen + replen - 1) / replen
+    else:
+        return 1
+
+
+# if there are any exits, each client / bridge client transmits
+# via 4 nodes (including the client) to an arbitrary exit
+# Each client binds directly to <CHUTNEY_LISTEN_ADDRESS>:LISTEN_PORT
+# via an Exit relay
+def _configure_exits(tt, bind_to, tmpdata, reps, client_list, exit_list,
+                     LISTEN_ADDR, LISTEN_PORT, connection_count):
+    CLIENT_EXIT_PATH_NODES = 4
+    exit_path_node_count = 0
+    if len(exit_list) > 0:
+        exit_path_node_count += (len(client_list) *
+                                 CLIENT_EXIT_PATH_NODES *
+                                 connection_count)
+        for op in client_list:
+            print("  Exit to %s:%d via client %s:%s"
+                  % (LISTEN_ADDR, LISTEN_PORT,
+                     'localhost', op._env['socksport']))
+            for _ in range(connection_count):
+                proxy = ('localhost', int(op._env['socksport']))
+                tt.add(chutney.Traffic.Source(tt, bind_to, tmpdata, proxy,
+                                              reps))
+    return exit_path_node_count
+
+
+# The HS redirects .onion connections made to hs_hostname:HS_PORT
+# to the Traffic Tester's CHUTNEY_LISTEN_ADDRESS:LISTEN_PORT
+# an arbitrary client / bridge client transmits via 8 nodes
+# (including the client and hs) to each hidden service
+# Instead of binding directly to LISTEN_PORT via an Exit relay,
+# we bind to hs_hostname:HS_PORT via a hidden service connection
+def _configure_hs(tt, tmpdata, reps, client_list, hs_list, HS_PORT,
+                  LISTEN_ADDR, LISTEN_PORT, connection_count, hs_multi_client):
+    CLIENT_HS_PATH_NODES = 8
+    hs_path_node_count = (len(hs_list) * CLIENT_HS_PATH_NODES *
+                          connection_count)
+    # Each client in hs_client_list connects to each hs
+    if hs_multi_client:
+        hs_client_list = client_list
+        hs_path_node_count *= len(client_list)
+    else:
+        # only use the first client in the list
+        hs_client_list = client_list[:1]
+    # Setup the connections from each client in hs_client_list to each hs
+    for hs in hs_list:
+        hs_bind_to = (hs._env['hs_hostname'], HS_PORT)
+        for client in hs_client_list:
+            print("  HS to %s:%d (%s:%d) via client %s:%s"
+                  % (hs._env['hs_hostname'], HS_PORT,
+                     LISTEN_ADDR, LISTEN_PORT,
+                     'localhost', client._env['socksport']))
+            for _ in range(connection_count):
+                proxy = ('localhost', int(client._env['socksport']))
+                tt.add(chutney.Traffic.Source(tt, hs_bind_to, tmpdata,
+                                              proxy, reps))
+    return hs_path_node_count
+
+
+# calculate the single stream bandwidth and overall tor bandwidth
+# the single stream bandwidth is the bandwidth of the
+# slowest stream of all the simultaneously transmitted streams
+# the overall bandwidth estimates the simultaneous bandwidth between
+# all tor nodes over all simultaneous streams, assuming:
+# * minimum path lengths (no cannibalized circuits)
+# * unlimited network bandwidth (that is, localhost)
+# * tor performance is CPU-limited
+# This can be used to estimate the bandwidth capacity of a CPU-bound
+# tor relay running on this machine
+def _report_bandwidth(data_length, total_path_node_count, start_time,
+                      end_time):
+    # only report bandwidth if we sent at least 5 MB cumulative total,
+    # and it took us at least a second to send
+    MIN_BWDATA = 5 * 1024 * 1024  # Octets.
+    MIN_ELAPSED_TIME = 1.0        # Seconds.
+    cumulative_data_sent = total_path_node_count * data_length
+    elapsed_time = end_time - start_time
+    if (cumulative_data_sent >= MIN_BWDATA and
+            elapsed_time >= MIN_ELAPSED_TIME):
+        # Report megabytes per second
+        BWDIVISOR = 1024*1024
+        single_stream_bandwidth = (data_length / elapsed_time / BWDIVISOR)
+        overall_bandwidth = (cumulative_data_sent / elapsed_time /
+                             BWDIVISOR)
+        print("Single Stream Bandwidth: %.2f MBytes/s"
+              % single_stream_bandwidth)
+        print("Overall tor Bandwidth: %.2f MBytes/s"
+              % overall_bandwidth)





More information about the tor-commits mailing list