[tor-commits] [onionperf/master] Add JSON schema for analysis file format 3.0.

karsten at torproject.org karsten at torproject.org
Mon Aug 10 09:30:41 UTC 2020


commit 7c1ae345effc8197e35ffffde86d318893d42285
Author: Karsten Loesing <karsten.loesing at gmx.net>
Date:   Sun Jul 12 17:43:08 2020 +0200

    Add JSON schema for analysis file format 3.0.
    
    This schema can be used to validate an analysis file using version 3.0
    by using the following commands:
    
    ```
    pip3 install jsonschema
    unxz final_onionperf.analysis.json.xz
    jsonschema -i final_onionperf.analysis.json onionperf-3.0.json
    ```
    
    Implements tpo/metrics/onionperf#40003.
---
 schema/onionperf-3.0.json | 546 ++++++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 546 insertions(+)

diff --git a/schema/onionperf-3.0.json b/schema/onionperf-3.0.json
new file mode 100644
index 0000000..f670c4c
--- /dev/null
+++ b/schema/onionperf-3.0.json
@@ -0,0 +1,546 @@
+{
+  "$schema": "http://json-schema.org/draft-07/schema",
+  "$id": "https://gitlab.torproject.org/tpo/metrics/onionperf/-/raw/master/schema/onionperf-3.0.json",
+  "type": "object",
+  "title": "OnionPerf analysis JSON file format 3.0",
+  "required": [
+    "data",
+    "type",
+    "version"
+  ],
+  "properties": {
+    "data": {
+      "type": "object",
+      "title": "Measurement data by source name",
+      "propertyNames": {
+        "pattern": "^[A-Za-z0-9-]+$"
+      },
+      "additionalProperties": {
+        "type": "object",
+        "title": "Measurement data from a single source",
+        "required": [
+          "measurement_ip",
+          "tgen",
+          "tor"
+        ],
+        "properties": {
+          "measurement_ip": {
+            "type": "string",
+            "title": "Public IP address of the measuring host."
+          },
+          "tgen": {
+            "type": "object",
+            "title": "Measurement data obtained from client-side TGen logs",
+            "required": [
+              "streams"
+            ],
+            "properties": {
+              "streams": {
+                "type": "object",
+                "title": "Measurement data, by TGen stream identifier",
+                "additionalProperties": {
+                  "type": "object",
+                  "title": "Information on a single measurement, obtained from a single [stream-success] or [stream-error] log message (except for elapsed_seconds)",
+                  "required": [
+                    "byte_info",
+                    "is_complete",
+                    "is_error",
+                    "is_success",
+                    "stream_id",
+                    "stream_info",
+                    "time_info",
+                    "transport_info",
+                    "unix_ts_end",
+                    "unix_ts_start"
+                  ],
+                  "properties": {
+                    "byte_info": {
+                      "type": "object",
+                      "title": "Information on sent and received bytes",
+                      "required": [
+                        "payload-bytes-recv",
+                        "payload-bytes-send",
+                        "payload-progress-recv",
+                        "payload-progress-send",
+                        "total-bytes-recv",
+                        "total-bytes-send"
+                      ],
+                      "properties": {
+                        "payload-bytes-recv": {
+                          "type": "string",
+                          "pattern": "^[0-9]+$",
+                          "title": "Number of payload bytes received"
+                        },
+                        "payload-bytes-send": {
+                          "type": "string",
+                          "pattern": "^[0-9]+$",
+                          "title": "Number of payload bytes sent"
+                        },
+                        "payload-progress-recv": {
+                          "type": "string",
+                          "pattern": "^[0-9]+\\.[0-9]+%$",
+                          "title": "Progress of receiving payload in percent"
+                        },
+                        "payload-progress-send": {
+                          "type": "string",
+                          "pattern": "^[0-9]+\\.[0-9]+%$",
+                          "title": "Progress of sending payload in percent"
+                        },
+                        "total-bytes-recv": {
+                          "type": "string",
+                          "pattern": "^[0-9]+$",
+                          "title": "Total number of bytes received"
+                        },
+                        "total-bytes-send": {
+                          "type": "string",
+                          "pattern": "^[0-9]+$",
+                          "title": "Total number of bytes sent"
+                        }
+                      }
+                    },
+                    "elapsed_seconds": {
+                      "type": "object",
+                      "title": "Elapsed seconds until a given number or fraction of payload bytes have been received or sent, obtained from [stream-status], [stream-success], and [stream-error] log messages, only included if the measurement was a success",
+                      "properties": {
+                        "payload_bytes_recv": {
+                          "type": "object",
+                          "title": "Number of received payload bytes",
+                          "propertyNames": {
+                            "pattern": "^[0-9]+$"
+                          },
+                          "additionalProperties": {
+                            "type": "number",
+                            "title": "Elapsed seconds"
+                          }
+                        },
+                        "payload_bytes_send": {
+                          "type": "object",
+                          "title": "Number of sent payload bytes",
+                          "propertyNames": {
+                            "pattern": "^[0-9]+$"
+                          },
+                          "additionalProperties": {
+                            "type": "number",
+                            "title": "Elapsed seconds"
+                          }
+                        },
+                        "payload_progress_recv": {
+                          "type": "object",
+                          "title": "Fraction of received payload bytes",
+                          "propertyNames": {
+                            "pattern": "^[01]\\.[0-9]$"
+                          },
+                          "additionalProperties": {
+                            "type": "number",
+                            "title": "Elapsed seconds"
+                          }
+                        },
+                        "payload_progress_send": {
+                          "type": "object",
+                          "title": "Fraction of sent payload bytes",
+                          "propertyNames": {
+                            "pattern": "^[01]\\.[0-9]$"
+                          },
+                          "additionalProperties": {
+                            "type": "number",
+                            "title": "Elapsed seconds"
+                          }
+                        }
+                      }
+                    },
+                    "is_complete": {
+                      "type": "boolean",
+                      "title": "Whether the stream finished, no matter the error state, which is always true, or otherwise the measurement would not be included here"
+                    },
+                    "is_error": {
+                      "type": "boolean",
+                      "title": "Whether an error occurred"
+                    },
+                    "is_success": {
+                      "type": "boolean",
+                      "title": "Whether the measurement was a success"
+                    },
+                    "stream_id": {
+                      "type": "string",
+                      "title": "Stream identifier"
+                    },
+                    "stream_info": {
+                      "type": "object",
+                      "title": "Information about the TGen stream",
+                      "required": [
+                        "error",
+                        "id",
+                        "name",
+                        "peername",
+                        "recvsize",
+                        "recvstate",
+                        "sendsize",
+                        "sendstate",
+                        "vertexid"
+                      ],
+                      "properties": {
+                        "error": {
+                          "type": "string",
+                          "title": "Error code, or NONE if no error occurred"
+                        },
+                        "id": {
+                          "type": "string",
+                          "title": "Stream numerical identifier, or 0 if the stream failed"
+                        },
+                        "name": {
+                          "type": "string",
+                          "title": "Hostname of the TGen client"
+                        },
+                        "peername": {
+                          "type": "string",
+                          "title": "Hostname of the TGen server"
+                        },
+                        "recvsize": {
+                          "type": "string",
+                          "title": "Number of expected payload bytes in the response"
+                        },
+                        "recvstate": {
+                          "type": "string",
+                          "title": "Last recorded receive state of the stream, one of RECV_{NONE,AUTHENTICATE,HEADER,MODEL,PAYLOAD,CHECKSUM,SUCCESS,ERROR}"
+                        },
+                        "sendsize": {
+                          "type": "string",
+                          "title": "Number of expected payload bytes in the request"
+                        },
+                        "sendstate": {
+                          "type": "string",
+                          "title": "Last recorded send state of the stream, one of SEND_{NONE,COMMAND,RESPONSE,PAYLOAD,CHECKSUM,FLUSH,SUCCESS,ERROR}"
+                        },
+                        "vertexid": {
+                          "type": "string",
+                          "title": "Vertex identifier in the TGen model"
+                        }
+                      }
+                    },
+                    "time_info": {
+                      "type": "object",
+                      "title": "Elapsed time until reaching given substeps in a measurement",
+                      "required": [
+                        "created-ts",
+                        "now-ts",
+                        "usecs-to-checksum-recv",
+                        "usecs-to-checksum-send",
+                        "usecs-to-command",
+                        "usecs-to-first-byte-recv",
+                        "usecs-to-first-byte-send",
+                        "usecs-to-last-byte-recv",
+                        "usecs-to-last-byte-send",
+                        "usecs-to-proxy-choice",
+                        "usecs-to-proxy-init",
+                        "usecs-to-proxy-request",
+                        "usecs-to-proxy-response",
+                        "usecs-to-response",
+                        "usecs-to-socket-connect",
+                        "usecs-to-socket-create"
+                      ],
+                      "properties": {
+                        "created-ts": {
+                          "type": "string",
+                          "title": "Montonic system time when TGen created this stream, in microseconds since some arbitrary, fixed point in the past."
+                        },
+                        "now-ts": {
+                          "type": "string",
+                          "title": "Montonic system time when TGen computed elapsed microseconds for this stream, in microseconds since some arbitrary, fixed point in the past."
+                        },
+                        "usecs-to-checksum-recv": {
+                          "type": "string",
+                          "title": "Elapsed microseconds until the TGen client has received the checksum from the TGen server, or -1 if missing (step 11)"
+                        },
+                        "usecs-to-checksum-send": {
+                          "type": "string",
+                          "title": "Elapsed microseconds until the TGen client has sent the checksum to the TGen server, or -1 if missing (step 11)"
+                        },
+                        "usecs-to-command": {
+                          "type": "string",
+                          "title": "Elapsed microseconds until the TGen client has sent the command to the TGen server, or -1 if missing (step 7)"
+                        },
+                        "usecs-to-first-byte-recv": {
+                          "type": "string",
+                          "title": "Elapsed microseconds until the TGen client has received the first payload byte, or -1 if missing (step 9)"
+                        },
+                        "usecs-to-first-byte-send": {
+                          "type": "string",
+                          "title": "Elapsed microseconds until the TGen client has sent the first payload byte, or -1 if missing (step 9)"
+                        },
+                        "usecs-to-last-byte-recv": {
+                          "type": "string",
+                          "title": "Elapsed microseconds until the TGen client has received the last payload byte, or -1 if missing (step 10)"
+                        },
+                        "usecs-to-last-byte-send": {
+                          "type": "string",
+                          "title": "Elapsed microseconds until the TGen client has sent the last payload byte, or -1 if missing (step 10)"
+                        },
+                        "usecs-to-proxy-choice": {
+                          "type": "string",
+                          "title": "Elapsed microseconds until the TGen client has received the SOCKS choice from the Tor client, or -1 if missing (step 4)"
+                        },
+                        "usecs-to-proxy-init": {
+                          "type": "string",
+                          "title": "Elapsed microseconds until the TGen client has sent the SOCKS initialization to the Tor client, or -1 if missing (step 3)"
+                        },
+                        "usecs-to-proxy-request": {
+                          "type": "string",
+                          "title": "Elapsed microseconds until the TGen client has sent the SOCKS request to the Tor client, or -1 if missing (step 5)"
+                        },
+                        "usecs-to-proxy-response": {
+                          "type": "string",
+                          "title": "Elapsed microseconds until the TGen client has received the SOCKS response from the Tor client, or -1 if missing (step 6)"
+                        },
+                        "usecs-to-response": {
+                          "type": "string",
+                          "title": "Elapsed microseconds until the TGen client has received the command from the TGen server, or -1 if missing (step 8)"
+                        },
+                        "usecs-to-socket-connect": {
+                          "type": "string",
+                          "title": "Elapsed microseconds until the TGen client has connected to the Tor client's SOCKS port, or -1 if missing (step 2)"
+                        },
+                        "usecs-to-socket-create": {
+                          "type": "string",
+                          "title": "Elapsed microseconds until the TGen client has opened a TCP connection to the Tor client's SOCKS port, or -1 if missing (step 1)"
+                        }
+                      }
+                    },
+                    "transport_info": {
+                      "type": "object",
+                      "title": "Information about the TGen transport",
+                      "required": [
+                        "error",
+                        "fd",
+                        "local",
+                        "proxy",
+                        "remote",
+                        "state"
+                      ],
+                      "properties": {
+                        "error": {
+                          "type": "string",
+                          "title": "Error code, or NONE if no error occurred"
+                        },
+                        "fd": {
+                          "type": "string",
+                          "title": "File descriptor"
+                        },
+                        "local": {
+                          "type": "string",
+                          "title": "Local host name, IP address, and TCP port"
+                        },
+                        "proxy": {
+                          "type": "string",
+                          "title": "Proxy host name, IP address, and TCP port"
+                        },
+                        "remote": {
+                          "type": "string",
+                          "title": "Remote host name, IP address, and TCP port"
+                        },
+                        "state": {
+                          "type": "string",
+                          "title": "Last recorded state of the transport, one of CONNECT,INIT,CHOICE,REQUEST,AUTH_{REQUEST,RESPONSE},RESPONSE_{STATUS,TYPE,IPV4,NAMELEN,NAME},SUCCESS_{OPEN,EOF},ERROR"
+                        }
+                      }
+                    },
+                    "unix_ts_end": {
+                      "type": "number",
+                      "title": "Final end time of the measurement, obtained from the log time of the [stream-success] or [stream-error] log message, given in seconds since the epoch"
+                    },
+                    "unix_ts_start": {
+                      "type": "number",
+                      "title": "Initial start time of the measurement, obtained by subtracting the largest number of elapsed microseconds in time_info from unix_ts_end, given in seconds since the epoch"
+                    }
+                  }
+                }
+              }
+            }
+          },
+          "tor": {
+            "type": "object",
+            "title": "Metadata obtained from client-side Tor controller logs",
+            "required": [
+              "circuits",
+              "streams"
+            ],
+            "properties": {
+              "circuits": {
+                "type": "object",
+                "title": "Information about Tor circuits, by circuit identifier, obtained from CIRC and CIRC_MINOR events, for all circuits created by the Tor client",
+                "propertyNames": {
+                  "pattern": "^[0-9]+$"
+                },
+                "additionalProperties": {
+                  "type": "object",
+                  "title": "Information about a Tor circuit",
+                  "required": [
+                    "circuit_id",
+                    "elapsed_seconds",
+                    "unix_ts_end",
+                    "unix_ts_start"
+                  ],
+                  "additionalProperties": false,
+                  "properties": {
+                    "build_quantile": {
+                      "type": "number",
+                      "title": "Circuit build time quantile, obtained from the most recent BUILDTIMEOUT_SET event preceding the CIRC LAUNCHED event"
+                    },
+                    "build_timeout": {
+                      "type": "integer",
+                      "title": "Circuit build time in milliseconds, obtained from the most recent BUILDTIMEOUT_SET event preceding the CIRC event with status LAUNCHED"
+                    },
+                    "buildtime_seconds": {
+                      "type": "number",
+                      "title": "Build time in seconds, computed as time elapsed between CIRC LAUNCHED and CIRC BUILT events"
+                    },
+                    "circuit_id": {
+                      "type": "integer",
+                      "title": "Circuit identifier, obtained from CIRC and CIRC_MINOR events"
+                    },
+                    "elapsed_seconds": {
+                      "type": "array",
+                      "title": "Elapsed seconds until receiving and logging CIRC and CIRC_MINOR events",
+                      "items": {
+                        "type": "array",
+                        "title": "Elapsed seconds until reaching a given circuit status change",
+                        "items": [
+                          {
+                            "type": "string",
+                            "title": "Circuit status change"
+                          },
+                          {
+                            "type": "number",
+                            "title": "Elapsed seconds"
+                          }
+                        ]
+                      }
+                    },
+                    "failure_reason_local": {
+                      "type": "string",
+                      "title": "Local failure reason, obtained from CIRC FAILED events"
+                    },
+                    "failure_reason_remote": {
+                      "type": "string",
+                      "title": "Remote failure reason, obtained from CIRC FAILED events"
+                    },
+                    "path": {
+                      "type": "array",
+                      "title": "Path information",
+                      "items": {
+                        "type": "array",
+                        "title": "Elapsed seconds until extending the circuit to a given relay",
+                        "items": [
+                          {
+                            "type": "string",
+                            "pattern": "^\\$[0-9A-Z]{40}~[0-9a-zA-Z]{1,19}$",
+                            "title": "Relay fingerprint and nickname"
+                          },
+                          {
+                            "type": "number",
+                            "minimum": 0,
+                            "title": "Elapsed seconds"
+                          }
+                        ]
+                      }
+                    },
+                    "unix_ts_end": {
+                      "type": "number",
+                      "title": "Final end time of the circuit, obtained from the log time of the last CIRC CLOSED or CIRC FAILED event, given in seconds since the epoch"
+                    },
+                    "unix_ts_start": {
+                      "type": "number",
+                      "title": "Initial start time of the circuit, obtained from the log time of the CIRC LAUNCHED event, given in seconds since the epoch"
+                    }
+                  }
+                }
+              },
+              "streams": {
+                "type": "object",
+                "title": "Information about Tor stream, by stream identifier, obtained from STREAM events, for all streams created by the Tor client",
+                "propertyNames": {
+                  "pattern": "^[0-9]+$"
+                },
+                "additionalProperties": {
+                  "type": "object",
+                  "title": "Information about a Tor stream",
+                  "required": [
+                    "circuit_id",
+                    "elapsed_seconds",
+                    "stream_id",
+                    "target",
+                    "unix_ts_end",
+                    "unix_ts_start"
+                  ],
+                  "additionalProperties": false,
+                  "properties": {
+                    "circuit_id": {
+                      "title": "Circuit identifier, obtained from STREAM events"
+                    },
+                    "elapsed_seconds": {
+                      "type": "array",
+                      "title": "Elapsed seconds until receiving and logging STREAM events",
+                      "items": {
+                        "type": "array",
+                        "items": [
+                          {
+                            "type": "string",
+                            "title": "Stream purpose and STREAM event status"
+                          },
+                          {
+                            "type": "number",
+                            "title": "Elapsed seconds"
+                          }
+                        ]
+                      }
+                    },
+                    "failure_reason_local": {
+                      "type": "string",
+                      "title": "Local failure reason, obtained from STREAM FAILED events"
+                    },
+                    "failure_reason_remote": {
+                      "type": "string",
+                      "title": "Remote failure reason, obtained from STREAM FAILED events"
+                    },
+                    "source": {
+                      "type": "string",
+                      "title": "Stream source IP address and TCP port, obtained from STREAM NEW or STREAM NEWRESOLVE events"
+                    },
+                    "stream_id": {
+                      "type": "integer",
+                      "title": "Stream identifier, unique at least for the lifetime of this stream"
+                    },
+                    "target": {
+                      "type": "string",
+                      "title": "Stream target domain name and TCP port, obtained from STREAM events",
+                      "examples": [
+                        "jzxfvaupigl7hkemf4jhfi2vrruvbb7ucyiwdolkkc2hf3xlm34f3qyd.onion:8080"
+                      ]
+                    },
+                    "unix_ts_end": {
+                      "type": "number",
+                      "title": "Final end time of the stream, obtained from the log time of the last STREAM CLOSED or STREAM FAILED event, given in seconds since the epoch"
+                    },
+                    "unix_ts_start": {
+                      "type": "number",
+                      "title": "Initial start time of the stream, obtained from the log time of the first STREAM NEW or STREAM NEWRESOLVE event, given in seconds since the epoch"
+                    }
+                  }
+                }
+              }
+            }
+          }
+        }
+      }
+    },
+    "type": {
+      "type": "string",
+      "title": "Document type",
+      "const": "onionperf"
+    },
+    "version": {
+      "type": "string",
+      "title": "Document version",
+      "pattern": "^3\\.[0-9]+$"
+    }
+  }
+}





More information about the tor-commits mailing list