[tor-commits] [stem/master] Exposing the validate arg through parse_file()
atagar at torproject.org
atagar at torproject.org
Sun Jan 20 22:04:13 UTC 2013
commit 998abb262eb4ed6a3d88a7be865412685ab26d3a
Author: Damian Johnson <atagar at torproject.org>
Date: Sun Jan 20 13:59:05 2013 -0800
Exposing the validate arg through parse_file()
Users may want to opt out of validation, either for performance or to accept
quasi-malformed content. This change gives them that option.
---
stem/descriptor/__init__.py | 36 +++++++++++++++++++-----------------
1 files changed, 19 insertions(+), 17 deletions(-)
diff --git a/stem/descriptor/__init__.py b/stem/descriptor/__init__.py
index f6d76c0..0e4a3e1 100644
--- a/stem/descriptor/__init__.py
+++ b/stem/descriptor/__init__.py
@@ -40,7 +40,7 @@ PGP_BLOCK_START = re.compile("^-----BEGIN ([%s%s]+)-----$" % (KEYWORD_CHAR, WHIT
PGP_BLOCK_END = "-----END %s-----"
-def parse_file(descriptor_file, descriptor_type = None, path = None):
+def parse_file(descriptor_file, descriptor_type = None, path = None, validate = True):
"""
Simple function to read the descriptor contents from a file, providing an
iterator for its :class:`~stem.descriptor.__init__.Descriptor` contents.
@@ -83,6 +83,8 @@ def parse_file(descriptor_file, descriptor_type = None, path = None):
:param file descriptor_file: opened file with the descriptor contents
:param str descriptor_type: `descriptor type <https://metrics.torproject.org/formats.html#descriptortypes>`_, this is guessed if not provided
:param str path: absolute path to the file's location on disk
+ :param bool validate: checks the validity of the descriptor's content if
+ **True**, skips these checks otherwise
:returns: iterator for :class:`~stem.descriptor.__init__.Descriptor` instances in the file
@@ -116,25 +118,25 @@ def parse_file(descriptor_file, descriptor_type = None, path = None):
if descriptor_type_match:
desc_type, major_version, minor_version = descriptor_type_match.groups()
- file_parser = lambda f: _parse_metrics_file(desc_type, int(major_version), int(minor_version), f)
+ file_parser = lambda f: _parse_metrics_file(desc_type, int(major_version), int(minor_version), f, validate)
else:
raise ValueError("The descriptor_type must be of the form '<type> <major_version>.<minor_version>'")
elif metrics_header_match:
# Metrics descriptor handling
desc_type, major_version, minor_version = metrics_header_match.groups()
- file_parser = lambda f: _parse_metrics_file(desc_type, int(major_version), int(minor_version), f)
+ file_parser = lambda f: _parse_metrics_file(desc_type, int(major_version), int(minor_version), f, validate)
else:
# Cached descriptor handling. These contain multiple descriptors per file.
if filename == "cached-descriptors":
- file_parser = stem.descriptor.server_descriptor._parse_file
+ file_parser = lambda f: stem.descriptor.server_descriptor._parse_file(f, validate = validate)
elif filename == "cached-extrainfo":
- file_parser = stem.descriptor.extrainfo_descriptor._parse_file
+ file_parser = lambda f: stem.descriptor.extrainfo_descriptor._parse_file(f, validate = validate)
elif filename == "cached-consensus":
- file_parser = stem.descriptor.networkstatus._parse_file
+ file_parser = lambda f: stem.descriptor.networkstatus._parse_file(f, validate = validate)
elif filename == "cached-microdesc-consensus":
- file_parser = lambda f: stem.descriptor.networkstatus._parse_file(f, is_microdescriptor = True)
+ file_parser = lambda f: stem.descriptor.networkstatus._parse_file(f, is_microdescriptor = True, validate = validate)
if file_parser:
for desc in file_parser(descriptor_file):
@@ -150,7 +152,7 @@ def parse_file(descriptor_file, descriptor_type = None, path = None):
raise TypeError("Unable to determine the descriptor's type. filename: '%s', first line: '%s'" % (filename, first_line))
-def _parse_metrics_file(descriptor_type, major_version, minor_version, descriptor_file):
+def _parse_metrics_file(descriptor_type, major_version, minor_version, descriptor_file, validate):
# Parses descriptor files from metrics, yielding individual descriptors. This
# throws a TypeError if the descriptor_type or version isn't recognized.
import stem.descriptor.server_descriptor
@@ -158,41 +160,41 @@ def _parse_metrics_file(descriptor_type, major_version, minor_version, descripto
import stem.descriptor.networkstatus
if descriptor_type == "server-descriptor" and major_version == 1:
- for desc in stem.descriptor.server_descriptor._parse_file(descriptor_file, is_bridge = False):
+ for desc in stem.descriptor.server_descriptor._parse_file(descriptor_file, is_bridge = False, validate = validate):
yield desc
elif descriptor_type == "bridge-server-descriptor" and major_version == 1:
- for desc in stem.descriptor.server_descriptor._parse_file(descriptor_file, is_bridge = True):
+ for desc in stem.descriptor.server_descriptor._parse_file(descriptor_file, is_bridge = True, validate = validate):
yield desc
elif descriptor_type == "extra-info" and major_version == 1:
- for desc in stem.descriptor.extrainfo_descriptor._parse_file(descriptor_file, is_bridge = False):
+ for desc in stem.descriptor.extrainfo_descriptor._parse_file(descriptor_file, is_bridge = False, validate = validate):
yield desc
elif descriptor_type == "bridge-extra-info" and major_version == 1:
# version 1.1 introduced a 'transport' field...
# https://trac.torproject.org/6257
- for desc in stem.descriptor.extrainfo_descriptor._parse_file(descriptor_file, is_bridge = True):
+ for desc in stem.descriptor.extrainfo_descriptor._parse_file(descriptor_file, is_bridge = True, validate = validate):
yield desc
elif descriptor_type == "network-status-2" and major_version == 1:
document_type = stem.descriptor.networkstatus.NetworkStatusDocumentV2
- for desc in stem.descriptor.networkstatus._parse_file(descriptor_file, document_type):
+ for desc in stem.descriptor.networkstatus._parse_file(descriptor_file, document_type, validate = validate):
yield desc
elif descriptor_type == "dir-key-certificate-3" and major_version == 1:
- yield stem.descriptor.networkstatus.KeyCertificate(descriptor_file.read())
+ yield stem.descriptor.networkstatus.KeyCertificate(descriptor_file.read(), validate = validate)
elif descriptor_type in ("network-status-consensus-3", "network-status-vote-3") and major_version == 1:
document_type = stem.descriptor.networkstatus.NetworkStatusDocumentV3
- for desc in stem.descriptor.networkstatus._parse_file(descriptor_file, document_type):
+ for desc in stem.descriptor.networkstatus._parse_file(descriptor_file, document_type, validate = validate):
yield desc
elif descriptor_type == "network-status-microdesc-consensus-3" and major_version == 1:
document_type = stem.descriptor.networkstatus.NetworkStatusDocumentV3
- for desc in stem.descriptor.networkstatus._parse_file(descriptor_file, document_type, is_microdescriptor = True):
+ for desc in stem.descriptor.networkstatus._parse_file(descriptor_file, document_type, is_microdescriptor = True, validate = validate):
yield desc
elif descriptor_type == "bridge-network-status" and major_version == 1:
document_type = stem.descriptor.networkstatus.BridgeNetworkStatusDocument
- for desc in stem.descriptor.networkstatus._parse_file(descriptor_file, document_type):
+ for desc in stem.descriptor.networkstatus._parse_file(descriptor_file, document_type, validate = validate):
yield desc
else:
raise TypeError("Unrecognized metrics descriptor format. type: '%s', version: '%i.%i'" % (descriptor_type, major_version, minor_version))
More information about the tor-commits
mailing list