[tor-commits] [metrics-web/release] Make bandwidth.csv independent of import order.

karsten at torproject.org karsten at torproject.org
Sat Nov 9 21:45:07 UTC 2019


commit 1fd062c11e45ca5c4cb166f6db8a27eabaf60e48
Author: Karsten Loesing <karsten.loesing at gmx.net>
Date:   Fri Mar 8 15:08:08 2019 +0100

    Make bandwidth.csv independent of import order.
    
    With this patch we're not overwriting bandwidth history parts with
    whichever history comes last, but we're computing the maximum value
    for each 15-minute interval of all imported bandwidth histories. This
    makes bandwidth.csv independent of descriptor import order.
---
 src/main/sql/bwhist/tordir.sql | 41 ++++++++++++++++++++++-------------------
 1 file changed, 22 insertions(+), 19 deletions(-)

diff --git a/src/main/sql/bwhist/tordir.sql b/src/main/sql/bwhist/tordir.sql
index dfe7b5d..047f18e 100644
--- a/src/main/sql/bwhist/tordir.sql
+++ b/src/main/sql/bwhist/tordir.sql
@@ -122,6 +122,24 @@ CREATE TABLE updates (
     date DATE
 );
 
+-- Merge two BIGINT arrays index by index, from the lowest to the highest
+-- index found in either array: an index present in only one array keeps that
+-- array's element, an index present in both keeps the greater element.
+-- Declared RETURNS NULL ON NULL INPUT, so a NULL argument yields NULL.
+CREATE OR REPLACE FUNCTION array_merge(first BIGINT[], second BIGINT[])
+RETURNS BIGINT[] AS $$
+DECLARE
+  merged BIGINT[];
+BEGIN
+  FOR i IN LEAST(array_lower(first, 1), array_lower(second, 1))..
+      GREATEST(array_upper(first, 1), array_upper(second, 1)) LOOP
+    merged[i] := GREATEST(first[i], second[i]);
+  END LOOP;
+RETURN merged;
+END;
+$$ LANGUAGE plpgsql
+STABLE RETURNS NULL ON NULL INPUT;
+
 CREATE OR REPLACE FUNCTION array_sum (BIGINT[]) RETURNS BIGINT AS $$
   SELECT SUM($1[i])::bigint
   FROM generate_series(array_lower($1, 1), array_upper($1, 1)) index(i);
@@ -143,25 +161,10 @@ CREATE OR REPLACE FUNCTION insert_bwhist(
   ELSE
     BEGIN
     UPDATE bwhist
-    SET read[array_lower(insert_read, 1):
-          array_upper(insert_read, 1)] = insert_read,
-        written[array_lower(insert_written, 1):
-          array_upper(insert_written, 1)] = insert_written,
-        dirread[array_lower(insert_dirread, 1):
-          array_upper(insert_dirread, 1)] = insert_dirread,
-        dirwritten[array_lower(insert_dirwritten, 1):
-          array_upper(insert_dirwritten, 1)] = insert_dirwritten
-    WHERE fingerprint = insert_fingerprint AND date = insert_date;
-    -- Updating twice is an ugly workaround for PostgreSQL bug 5840
-    UPDATE bwhist
-    SET read[array_lower(insert_read, 1):
-          array_upper(insert_read, 1)] = insert_read,
-        written[array_lower(insert_written, 1):
-          array_upper(insert_written, 1)] = insert_written,
-        dirread[array_lower(insert_dirread, 1):
-          array_upper(insert_dirread, 1)] = insert_dirread,
-        dirwritten[array_lower(insert_dirwritten, 1):
-          array_upper(insert_dirwritten, 1)] = insert_dirwritten
+    SET read = array_merge(read, insert_read),
+        written = array_merge(written, insert_written),
+        dirread = array_merge(dirread, insert_dirread),
+        dirwritten = array_merge(dirwritten, insert_dirwritten)
     WHERE fingerprint = insert_fingerprint AND date = insert_date;
     END;
   END IF;





More information about the tor-commits mailing list