[or-cvs] r9965: Refactor router/directory parsing backend: use a separate token table for everything that we parse (in tor/trunk: . src/or)
nickm at seul.org
Mon Apr 16 04:18:27 UTC 2007
Author: nickm
Date: 2007-04-16 00:18:21 -0400 (Mon, 16 Apr 2007)
New Revision: 9965
Modified:
tor/trunk/
tor/trunk/ChangeLog
tor/trunk/src/or/routerparse.c
Log:
r12387 at catbus: nickm | 2007-04-16 00:06:40 -0400
Refactor router/directory parsing backend: use a separate token table for everything that we parse, and enforce the correct count of each item.
Property changes on: tor/trunk
___________________________________________________________________
svk:merge ticket from /tor/trunk [r12387] on 8246c3cf-6607-4228-993b-4d95d33730f1
Modified: tor/trunk/ChangeLog
===================================================================
--- tor/trunk/ChangeLog 2007-04-16 04:18:06 UTC (rev 9964)
+++ tor/trunk/ChangeLog 2007-04-16 04:18:21 UTC (rev 9965)
@@ -53,6 +53,8 @@
- Don't save non-general-purpose router descriptors to the disk cache,
because we have no way of remembering what their purpose was when
we restart.
+ - Correctly enforce that elements of directory objects do not appear
+ more often than they are allowed to appear.
o Minor bugfixes (controller), reported by daejees:
- Make 'getinfo fingerprint' return a 551 error if we're not a
Modified: tor/trunk/src/or/routerparse.c
===================================================================
--- tor/trunk/src/or/routerparse.c 2007-04-16 04:18:06 UTC (rev 9964)
+++ tor/trunk/src/or/routerparse.c 2007-04-16 04:18:21 UTC (rev 9965)
@@ -22,7 +22,7 @@
* not-a-token.
*/
typedef enum {
- K_ACCEPT,
+ K_ACCEPT = 0,
K_DIRECTORY_SIGNATURE,
K_RECOMMENDED_SOFTWARE,
K_REJECT,
@@ -77,7 +77,7 @@
int n_args; /**< Number of elements in args */
char **args; /**< Array of arguments from keyword line. */
char *object_type; /**< -----BEGIN [object_type]-----*/
- size_t object_size; /**< Bytes in object_body */
+ size_t object_size; /**< Bytes in object_body */
char *object_body; /**< Contents of object, base64-decoded. */
crypto_pk_env_t *key; /**< For public keys only. */
const char *error; /**< For _ERR tokens only. */
@@ -102,63 +102,105 @@
OBJ_OK, /**< Object is optional. */
} obj_syntax;
-/** Rules for where a keyword can appear. */
-typedef enum {
- DIR = 1, /**< Appears only in directory. */
- RTR = 2, /**< Appears only in router descriptor or runningrouters. */
- NETSTATUS = 4, /**< v2 or later ("versioned") network status. */
- ANYSIGNED = 7, /**< Any "full" document (that is, not a router status.) */
- RTRSTATUS = 8, /**< Router-status portion of a versioned network status. */
- EXTRAINFO = 16, /**< DOCDOC */
- ANY = 31, /**< Appears in any document type. */
-} where_syntax;
+/** DOCDOC */
+typedef struct token_rule_t {
+ const char *t; directory_keyword v; arg_syntax s; obj_syntax os;
+ int min_cnt; int max_cnt;
+} token_rule_t;
-/** Table mapping keywords to token value and to argument rules. */
-static struct {
- const char *t; directory_keyword v; arg_syntax s; obj_syntax os; int ws;
-} token_table[] = {
- { "accept", K_ACCEPT, ARGS, NO_OBJ, RTR },
- { "directory-signature", K_DIRECTORY_SIGNATURE, ARGS, NEED_OBJ,
- DIR|NETSTATUS},
- { "r", K_R, ARGS, NO_OBJ, RTRSTATUS },
- { "s", K_S, ARGS, NO_OBJ, RTRSTATUS },
- { "v", K_V, CONCAT_ARGS, NO_OBJ, RTRSTATUS },
- { "reject", K_REJECT, ARGS, NO_OBJ, RTR },
- { "router", K_ROUTER, ARGS, NO_OBJ, RTR },
- { "recommended-software",K_RECOMMENDED_SOFTWARE,ARGS, NO_OBJ, DIR },
- { "signed-directory", K_SIGNED_DIRECTORY, NO_ARGS, NO_OBJ, DIR },
- { "signing-key", K_SIGNING_KEY, NO_ARGS, NEED_KEY,RTR },
- { "onion-key", K_ONION_KEY, NO_ARGS, NEED_KEY,RTR },
- { "router-signature", K_ROUTER_SIGNATURE, NO_ARGS, NEED_OBJ,RTR|EXTRAINFO },
- { "running-routers", K_RUNNING_ROUTERS, ARGS, NO_OBJ, DIR },
- { "router-status", K_ROUTER_STATUS, ARGS, NO_OBJ, DIR },
- { "bandwidth", K_BANDWIDTH, ARGS, NO_OBJ, RTR },
- { "platform", K_PLATFORM, CONCAT_ARGS, NO_OBJ, RTR },
- { "published", K_PUBLISHED, CONCAT_ARGS, NO_OBJ, ANYSIGNED|EXTRAINFO },
- { "opt", K_OPT, CONCAT_ARGS, OBJ_OK, ANY },
- { "contact", K_CONTACT, CONCAT_ARGS, NO_OBJ, ANYSIGNED },
- { "network-status", K_NETWORK_STATUS, NO_ARGS, NO_OBJ, DIR },
- { "uptime", K_UPTIME, ARGS, NO_OBJ, RTR },
- { "dir-signing-key", K_DIR_SIGNING_KEY, ARGS, OBJ_OK,
- DIR|NETSTATUS},
- { "family", K_FAMILY, ARGS, NO_OBJ, RTR },
- { "fingerprint", K_FINGERPRINT, CONCAT_ARGS, NO_OBJ, ANYSIGNED },
- { "hibernating", K_HIBERNATING, ARGS, NO_OBJ, RTR },
- { "read-history", K_READ_HISTORY, ARGS, NO_OBJ, RTR|EXTRAINFO },
- { "write-history", K_WRITE_HISTORY, ARGS, NO_OBJ, RTR|EXTRAINFO },
- { "network-status-version", K_NETWORK_STATUS_VERSION,
- ARGS, NO_OBJ, NETSTATUS },
- { "dir-source", K_DIR_SOURCE, ARGS, NO_OBJ, NETSTATUS },
- { "dir-options", K_DIR_OPTIONS, ARGS, NO_OBJ, NETSTATUS },
- { "client-versions", K_CLIENT_VERSIONS, ARGS, NO_OBJ, NETSTATUS },
- { "server-versions", K_SERVER_VERSIONS, ARGS, NO_OBJ, NETSTATUS },
- { "eventdns", K_EVENTDNS, ARGS, NO_OBJ, RTR },
- { "extra-info", K_EXTRA_INFO, ARGS, NO_OBJ, EXTRAINFO },
- { "extra-info-digest", K_EXTRA_INFO_DIGEST, ARGS, NO_OBJ, RTR },
- { "caches-extra-info", K_CACHES_EXTRA_INFO, NO_ARGS, NO_OBJ, RTR },
- { NULL, _NIL, NO_ARGS, NO_OBJ, ANY }
+/** DOCDOC */
+#define END_OF_TABLE { NULL, _NIL, NO_ARGS, NO_OBJ, 0, INT_MAX }
+#define T(s,t,a,o) { s, t, a, o, 0, INT_MAX }
+#define T0N(s,t,a,o) { s, t, a, o, 0, INT_MAX }
+#define T1(s,t,a,o) { s, t, a, o, 1, 1 }
+#define T01(s,t,a,o) { s, t, a, o, 0, 1 }
+
+/** DOCDOC */
+static token_rule_t routerdesc_token_table[] = {
+ T0N("accept", K_ACCEPT, ARGS, NO_OBJ ),
+ T0N("reject", K_REJECT, ARGS, NO_OBJ ),
+ T1( "router", K_ROUTER, ARGS, NO_OBJ ),
+ T1( "signing-key", K_SIGNING_KEY, NO_ARGS, NEED_KEY ),
+ T1( "onion-key", K_ONION_KEY, NO_ARGS, NEED_KEY ),
+ T1( "router-signature", K_ROUTER_SIGNATURE, NO_ARGS, NEED_OBJ ),
+ T1( "published", K_PUBLISHED, CONCAT_ARGS, NO_OBJ ),
+ T0N("opt", K_OPT, CONCAT_ARGS, OBJ_OK ),
+ T01("contact", K_CONTACT, CONCAT_ARGS, NO_OBJ ),
+ T01("uptime", K_UPTIME, ARGS, NO_OBJ ),
+ T01("family", K_FAMILY, ARGS, NO_OBJ ),
+ T01("fingerprint", K_FINGERPRINT, CONCAT_ARGS, NO_OBJ ),
+ T01("hibernating", K_HIBERNATING, ARGS, NO_OBJ ),
+ T01("read-history", K_READ_HISTORY, ARGS, NO_OBJ ),
+ T01("write-history", K_WRITE_HISTORY, ARGS, NO_OBJ ),
+ T01("eventdns", K_EVENTDNS, ARGS, NO_OBJ ),
+ T01("extra-info-digest", K_EXTRA_INFO_DIGEST, ARGS, NO_OBJ ),
+ T01("caches-extra-info", K_CACHES_EXTRA_INFO, NO_ARGS, NO_OBJ ),
+ T1("bandwidth", K_BANDWIDTH, ARGS, NO_OBJ ),
+ T01("platform", K_PLATFORM, CONCAT_ARGS, NO_OBJ ),
+
+ END_OF_TABLE
};
+static token_rule_t extrainfo_token_table[] = {
+ T1( "router-signature", K_ROUTER_SIGNATURE, NO_ARGS, NEED_OBJ ),
+ T1( "published", K_PUBLISHED, CONCAT_ARGS, NO_OBJ ),
+ T0N("opt", K_OPT, CONCAT_ARGS, OBJ_OK ),
+ T01("read-history", K_READ_HISTORY, ARGS, NO_OBJ ),
+ T01("write-history", K_WRITE_HISTORY, ARGS, NO_OBJ ),
+ T1( "extra-info", K_EXTRA_INFO, ARGS, NO_OBJ ),
+
+ END_OF_TABLE
+};
+
+static token_rule_t rtrstatus_token_table[] = {
+ T1( "r", K_R, ARGS, NO_OBJ ),
+ T1( "s", K_S, ARGS, NO_OBJ ),
+ T01("v", K_V, CONCAT_ARGS, NO_OBJ ),
+ T0N("opt", K_OPT, CONCAT_ARGS, OBJ_OK ),
+ END_OF_TABLE
+};
+
+static token_rule_t netstatus_token_table[] = {
+ T1( "published", K_PUBLISHED, CONCAT_ARGS, NO_OBJ ),
+ T0N("opt", K_OPT, CONCAT_ARGS, OBJ_OK ),
+ T1( "contact", K_CONTACT, CONCAT_ARGS, NO_OBJ ),
+ T1( "dir-signing-key", K_DIR_SIGNING_KEY, ARGS, OBJ_OK ),
+ T1( "fingerprint", K_FINGERPRINT, CONCAT_ARGS, NO_OBJ ),
+ T1( "network-status-version", K_NETWORK_STATUS_VERSION,
+ ARGS, NO_OBJ ),
+ T1( "dir-source", K_DIR_SOURCE, ARGS, NO_OBJ ),
+ T01("dir-options", K_DIR_OPTIONS, ARGS, NO_OBJ ),
+ T01("client-versions", K_CLIENT_VERSIONS, ARGS, NO_OBJ ),
+ T01("server-versions", K_SERVER_VERSIONS, ARGS, NO_OBJ ),
+
+ END_OF_TABLE
+};
+
+static token_rule_t dir_footer_token_table[] = {
+ T1( "directory-signature", K_DIRECTORY_SIGNATURE, ARGS, NEED_OBJ ),
+ END_OF_TABLE
+};
+
+static token_rule_t dir_token_table[] = {
+ /* don't enforce counts; this is obsolete. */
+ T( "network-status", K_NETWORK_STATUS, NO_ARGS, NO_OBJ ),
+ T( "directory-signature", K_DIRECTORY_SIGNATURE, ARGS, NEED_OBJ ),
+ T( "recommended-software",K_RECOMMENDED_SOFTWARE,ARGS, NO_OBJ ),
+ T( "signed-directory", K_SIGNED_DIRECTORY, NO_ARGS, NO_OBJ ),
+
+ T( "running-routers", K_RUNNING_ROUTERS, ARGS, NO_OBJ ),
+ T( "router-status", K_ROUTER_STATUS, ARGS, NO_OBJ ),
+ T( "published", K_PUBLISHED, CONCAT_ARGS, NO_OBJ ),
+ T( "opt", K_OPT, CONCAT_ARGS, OBJ_OK ),
+ T( "contact", K_CONTACT, CONCAT_ARGS, NO_OBJ ),
+ T( "dir-signing-key", K_DIR_SIGNING_KEY, ARGS, OBJ_OK ),
+ T( "fingerprint", K_FINGERPRINT, CONCAT_ARGS, NO_OBJ ),
+
+ END_OF_TABLE
+};
+
+#undef T
+
/* static function prototypes */
static int router_add_exit_policy(routerinfo_t *router,directory_token_t *tok);
static addr_policy_t *router_parse_addr_policy(directory_token_t *tok);
@@ -171,8 +213,10 @@
static directory_token_t *find_first_by_keyword(smartlist_t *s,
directory_keyword keyword);
static int tokenize_string(const char *start, const char *end,
- smartlist_t *out, where_syntax where);
-static directory_token_t *get_next_token(const char **s, where_syntax where);
+ smartlist_t *out,
+ struct token_rule_t *table);
+static directory_token_t *get_next_token(const char **s,
+ struct token_rule_t *table);
static int check_directory_signature(const char *digest,
directory_token_t *tok,
crypto_pk_env_t *pkey,
@@ -402,7 +446,7 @@
}
++cp;
tokens = smartlist_create();
- if (tokenize_string(cp,strchr(cp,'\0'),tokens,DIR)) {
+ if (tokenize_string(cp,strchr(cp,'\0'),tokens,dir_token_table)) {
log_warn(LD_DIR, "Error tokenizing directory signature"); goto err;
}
if (smartlist_len(tokens) != 1) {
@@ -431,7 +475,7 @@
}
tokens = smartlist_create();
- if (tokenize_string(str,end,tokens,DIR)) {
+ if (tokenize_string(str,end,tokens,dir_token_table)) {
log_warn(LD_DIR, "Error tokenizing directory"); goto err;
}
@@ -481,7 +525,7 @@
goto err;
}
tokens = smartlist_create();
- if (tokenize_string(str,str+strlen(str),tokens,DIR)) {
+ if (tokenize_string(str,str+strlen(str),tokens,dir_token_table)) {
log_warn(LD_DIR, "Error tokenizing running-routers"); goto err;
}
tok = smartlist_get(tokens,0);
@@ -540,7 +584,7 @@
return NULL;
++cp; /* Now cp points to the start of the token. */
- tok = get_next_token(&cp, DIR);
+ tok = get_next_token(&cp, dir_token_table);
if (!tok) {
log_warn(LD_DIR, "Unparseable dir-signing-key token");
return NULL;
@@ -772,7 +816,7 @@
return NULL;
}
tokens = smartlist_create();
- if (tokenize_string(s,end,tokens,RTR)) {
+ if (tokenize_string(s,end,tokens,routerdesc_token_table)) {
log_warn(LD_DIR, "Error tokeninzing router descriptor.");
goto err;
}
@@ -1038,7 +1082,7 @@
return NULL;
}
tokens = smartlist_create();
- if (tokenize_string(s,end,tokens,EXTRAINFO)) {
+ if (tokenize_string(s,end,tokens,extrainfo_token_table)) {
log_warn(LD_DIR, "Error tokeninzing router descriptor.");
goto err;
}
@@ -1162,7 +1206,7 @@
eos = find_start_of_next_routerstatus(*s);
- if (tokenize_string(*s, eos, tokens, RTRSTATUS)) {
+ if (tokenize_string(*s, eos, tokens, rtrstatus_token_table)) {
log_warn(LD_DIR, "Error tokenizing router status");
goto err;
}
@@ -1297,6 +1341,7 @@
{
const char *eos;
smartlist_t *tokens = smartlist_create();
+ smartlist_t *footer_tokens = smartlist_create();
networkstatus_t *ns = NULL;
char ns_digest[DIGEST_LEN];
char tmp_digest[DIGEST_LEN];
@@ -1310,7 +1355,7 @@
}
eos = find_start_of_next_routerstatus(s);
- if (tokenize_string(s, eos, tokens, NETSTATUS)) {
+ if (tokenize_string(s, eos, tokens, netstatus_token_table)) {
log_warn(LD_DIR, "Error tokenizing network-status header.");
goto err;
}
@@ -1433,15 +1478,15 @@
smartlist_uniq(ns->entries, _compare_routerstatus_entries,
_free_duplicate_routerstatus_entry);
- if (tokenize_string(s, NULL, tokens, NETSTATUS)) {
+ if (tokenize_string(s, NULL, footer_tokens, dir_footer_token_table)) {
log_warn(LD_DIR, "Error tokenizing network-status footer.");
goto err;
}
- if (smartlist_len(tokens) < 1) {
+ if (smartlist_len(footer_tokens) < 1) {
log_warn(LD_DIR, "Too few items in network-status footer.");
goto err;
}
- tok = smartlist_get(tokens, smartlist_len(tokens)-1);
+ tok = smartlist_get(footer_tokens, smartlist_len(footer_tokens)-1);
if (tok->tp != K_DIRECTORY_SIGNATURE) {
log_warn(LD_DIR,
"Expected network-status footer to end with a signature.");
@@ -1460,6 +1505,8 @@
done:
SMARTLIST_FOREACH(tokens, directory_token_t *, t, token_free(t));
smartlist_free(tokens);
+ SMARTLIST_FOREACH(footer_tokens, directory_token_t *, t, token_free(t));
+ smartlist_free(footer_tokens);
return ns;
}
@@ -1494,7 +1541,7 @@
tor_free(tmp);
cp = tmp = new_str;
}
- tok = get_next_token(&cp, RTR);
+ tok = get_next_token(&cp, routerdesc_token_table);
if (tok->tp == _ERR) {
log_warn(LD_DIR, "Error reading address policy: %s", tok->error);
goto err;
@@ -1668,11 +1715,10 @@
}
/** Helper function: read the next token from *s, advance *s to the end
- * of the token, and return the parsed token. If 'where' is DIR
- * or RTR, reject all tokens of the wrong type.
+ * of the token, and return the parsed token. DOCDOC table
*/
static directory_token_t *
-get_next_token(const char **s, where_syntax where)
+get_next_token(const char **s, struct token_rule_t *table)
{
const char *next, *obstart;
int i, done, allocated, is_opt;
@@ -1710,23 +1756,12 @@
RET_ERR("opt without keyword");
}
}
- for (i = 0; token_table[i].t ; ++i) {
- if (!strncmp(token_table[i].t, *s, next-*s)) {
+ for (i = 0; table[i].t ; ++i) {
+ if (!strncmp(table[i].t, *s, next-*s)) {
/* We've found the keyword. */
- tok->tp = token_table[i].v;
- a_syn = token_table[i].s;
- o_syn = token_table[i].os;
- if (!(token_table[i].ws & where)) {
- if (where == DIR) {
- RET_ERR("Found an out-of-place token in a directory section");
- } else if (where == RTR) {
- RET_ERR("Found an out-of-place token in a router descriptor");
- } else if (where == NETSTATUS) {
- RET_ERR("Found an out-of-place token in a network-status header");
- } else {
- RET_ERR("Found an out-of-place token in a router status body");
- }
- }
+ tok->tp = table[i].v;
+ a_syn = table[i].s;
+ o_syn = table[i].os;
if (a_syn == ARGS) {
/* This keyword takes multiple arguments. */
i = 0;
@@ -1846,28 +1881,45 @@
}
/** Read all tokens from a string between <b>start</b> and <b>end</b>, and add
- * them to <b>out</b>. If <b>is_dir</b> is true, reject all non-directory
- * tokens; else reject all non-routerdescriptor tokens.
+ * them to <b>out</b>. DOCDOC table.
*/
static int
tokenize_string(const char *start, const char *end, smartlist_t *out,
- where_syntax where)
+ token_rule_t *table)
{
const char **s;
directory_token_t *tok = NULL;
+ int counts[_NIL];
+ int i;
+
s = &start;
if (!end)
end = start+strlen(start);
+ memset(counts, 0, sizeof(counts));
+ for (i = 0; i < _NIL; ++i)
+ counts[i] = 0;
while (*s < end && (!tok || tok->tp != _EOF)) {
- tok = get_next_token(s, where);
+ tok = get_next_token(s, table);
if (tok->tp == _ERR) {
log_warn(LD_DIR, "parse error: %s", tok->error);
return -1;
}
+ ++counts[tok->tp];
smartlist_add(out, tok);
*s = eat_whitespace(*s);
}
+ for (i = 0; table[i].t; ++i) {
+ if (counts[table[i].v] < table[i].min_cnt) {
+ log_warn(LD_DIR, "Parse error: missing %s element.", table[i].t);
+ tor_assert(0);
+ return -1;
+ }
+ if (counts[table[i].v] > table[i].max_cnt) {
+ log_warn(LD_DIR, "Parse error: too many %s elements.", table[i].t);
+ return -1;
+ }
+ }
return 0;
}
More information about the tor-commits mailing list