Add "data optimization" which treats empty fields in data.csv as equivalent to the previous entry.

This optimization reduces the data size from 41 MB to 16 MB — roughly a 60% reduction — which is huge!
pull/11602/head
Andriy Dzikh 2021-06-01 12:15:16 -07:00
parent 424c954770
commit 419f2506e6
2 changed files with 7 additions and 1 deletions

View File

@ -49,12 +49,15 @@ async function loadTestData() {
}
const testData = [];
let lineData = ["", "", "", "", "", ""];
for await (const line of lines) {
const splitLine = line.split(",");
let splitLine = line.split(",");
if (splitLine.length != 6) {
console.warn(`Found line with wrong number of fields. Actual: ${splitLine.length} Expected: 6. Line: "${line}"`);
continue;
}
splitLine = splitLine.map((value, index) => value === "" ? lineData[index] : value);
lineData = splitLine;
if (!isValidEnumValue(testStatus, splitLine[4])) {
console.warn(`Invalid test status provided. Actual: ${splitLine[4]} Expected: One of ${Object.values(testStatus).join(", ")}`);
continue;

View File

@ -0,0 +1,3 @@
#!/bin/bash
# Delta-compress a CSV stream: blank out any field that is identical to the
# same field in the previous row. The reader reconstructs blanks by carrying
# the prior row's value forward. Reads stdin, writes stdout.
awk -F, '
BEGIN { OFS = FS }
{
  for (col = 1; col <= NF; col++) {
    if ($col == prev[col]) {
      # Unchanged since the previous row: emit an empty field.
      $col = ""
    } else {
      # New value: remember it for subsequent rows.
      prev[col] = $col
    }
  }
  print
}'