[
  {
    "name": {
      "name": "num_references",
      "split": "test"
    },
    "count": 1,
    "sum": 4.0,
    "sum_squared": 16.0,
    "min": 4.0,
    "max": 4.0,
    "mean": 4.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "num_train_trials",
      "split": "test"
    },
    "count": 1,
    "sum": 1.0,
    "sum_squared": 1.0,
    "min": 1.0,
    "max": 1.0,
    "mean": 1.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "num_prompt_tokens",
      "split": "test"
    },
    "count": 1,
    "sum": 701.7872340425532,
    "sum_squared": 492505.3218650974,
    "min": 701.7872340425532,
    "max": 701.7872340425532,
    "mean": 701.7872340425532,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "num_completion_tokens",
      "split": "test"
    },
    "count": 1,
    "sum": 1.0,
    "sum_squared": 1.0,
    "min": 1.0,
    "max": 1.0,
    "mean": 1.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "num_output_tokens",
      "split": "test"
    },
    "count": 1,
    "sum": 1.0,
    "sum_squared": 1.0,
    "min": 1.0,
    "max": 1.0,
    "mean": 1.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "training_co2_cost",
      "split": "test"
    },
    "count": 0,
    "sum": 0,
    "sum_squared": 0
  },
  {
    "name": {
      "name": "training_energy_cost",
      "split": "test"
    },
    "count": 0,
    "sum": 0,
    "sum_squared": 0
  },
  {
    "name": {
      "name": "inference_runtime",
      "split": "test"
    },
    "count": 1,
    "sum": 0.40838242591695584,
    "sum_squared": 0.16677620579781793,
    "min": 0.40838242591695584,
    "max": 0.40838242591695584,
    "mean": 0.40838242591695584,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "batch_size",
      "split": "test"
    },
    "count": 1,
    "sum": 1.0,
    "sum_squared": 1.0,
    "min": 1.0,
    "max": 1.0,
    "mean": 1.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "finish_reason_length",
      "split": "test"
    },
    "count": 1,
    "sum": 1.0,
    "sum_squared": 1.0,
    "min": 1.0,
    "max": 1.0,
    "mean": 1.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "finish_reason_stop",
      "split": "test"
    },
    "count": 1,
    "sum": 0.0,
    "sum_squared": 0.0,
    "min": 0.0,
    "max": 0.0,
    "mean": 0.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "finish_reason_endoftext",
      "split": "test"
    },
    "count": 1,
    "sum": 0.0,
    "sum_squared": 0.0,
    "min": 0.0,
    "max": 0.0,
    "mean": 0.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "finish_reason_unknown",
      "split": "test"
    },
    "count": 1,
    "sum": 0.0,
    "sum_squared": 0.0,
    "min": 0.0,
    "max": 0.0,
    "mean": 0.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "num_train_instances",
      "split": "test"
    },
    "count": 1,
    "sum": 5.0,
    "sum_squared": 25.0,
    "min": 5.0,
    "max": 5.0,
    "mean": 5.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "prompt_truncated",
      "split": "test"
    },
    "count": 1,
    "sum": 0.0,
    "sum_squared": 0.0,
    "min": 0.0,
    "max": 0.0,
    "mean": 0.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "max_prob",
      "split": "test"
    },
    "count": 1,
    "sum": 1.0,
    "sum_squared": 1.0,
    "min": 1.0,
    "max": 1.0,
    "mean": 1.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "exact_match",
      "split": "test"
    },
    "count": 1,
    "sum": 0.723404255319149,
    "sum_squared": 0.5233137166138525,
    "min": 0.723404255319149,
    "max": 0.723404255319149,
    "mean": 0.723404255319149,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "exact_match@5",
      "split": "test"
    },
    "count": 1,
    "sum": 0.723404255319149,
    "sum_squared": 0.5233137166138525,
    "min": 0.723404255319149,
    "max": 0.723404255319149,
    "mean": 0.723404255319149,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "quasi_exact_match",
      "split": "test"
    },
    "count": 1,
    "sum": 0.723404255319149,
    "sum_squared": 0.5233137166138525,
    "min": 0.723404255319149,
    "max": 0.723404255319149,
    "mean": 0.723404255319149,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "quasi_exact_match@5",
      "split": "test"
    },
    "count": 1,
    "sum": 0.723404255319149,
    "sum_squared": 0.5233137166138525,
    "min": 0.723404255319149,
    "max": 0.723404255319149,
    "mean": 0.723404255319149,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "prefix_exact_match",
      "split": "test"
    },
    "count": 1,
    "sum": 0.723404255319149,
    "sum_squared": 0.5233137166138525,
    "min": 0.723404255319149,
    "max": 0.723404255319149,
    "mean": 0.723404255319149,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "prefix_exact_match@5",
      "split": "test"
    },
    "count": 1,
    "sum": 0.723404255319149,
    "sum_squared": 0.5233137166138525,
    "min": 0.723404255319149,
    "max": 0.723404255319149,
    "mean": 0.723404255319149,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "quasi_prefix_exact_match",
      "split": "test"
    },
    "count": 1,
    "sum": 0.723404255319149,
    "sum_squared": 0.5233137166138525,
    "min": 0.723404255319149,
    "max": 0.723404255319149,
    "mean": 0.723404255319149,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "quasi_prefix_exact_match@5",
      "split": "test"
    },
    "count": 1,
    "sum": 0.723404255319149,
    "sum_squared": 0.5233137166138525,
    "min": 0.723404255319149,
    "max": 0.723404255319149,
    "mean": 0.723404255319149,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "logprob",
      "split": "test"
    },
    "count": 1,
    "sum": 0.0,
    "sum_squared": 0.0,
    "min": 0.0,
    "max": 0.0,
    "mean": 0.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "num_perplexity_tokens",
      "split": "test"
    },
    "count": 1,
    "sum": 1.0,
    "sum_squared": 1.0,
    "min": 1.0,
    "max": 1.0,
    "mean": 1.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "num_bytes",
      "split": "test"
    },
    "count": 1,
    "sum": 1.4893617021276595,
    "sum_squared": 2.218198279764599,
    "min": 1.4893617021276595,
    "max": 1.4893617021276595,
    "mean": 1.4893617021276595,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "num_references",
      "split": "valid"
    },
    "count": 1,
    "sum": 4.0,
    "sum_squared": 16.0,
    "min": 4.0,
    "max": 4.0,
    "mean": 4.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "num_train_trials",
      "split": "valid"
    },
    "count": 1,
    "sum": 1.0,
    "sum_squared": 1.0,
    "min": 1.0,
    "max": 1.0,
    "mean": 1.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "num_prompt_tokens",
      "split": "valid"
    },
    "count": 1,
    "sum": 687.3333333333334,
    "sum_squared": 472427.1111111112,
    "min": 687.3333333333334,
    "max": 687.3333333333334,
    "mean": 687.3333333333334,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "num_completion_tokens",
      "split": "valid"
    },
    "count": 1,
    "sum": 1.0,
    "sum_squared": 1.0,
    "min": 1.0,
    "max": 1.0,
    "mean": 1.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "num_output_tokens",
      "split": "valid"
    },
    "count": 1,
    "sum": 1.0,
    "sum_squared": 1.0,
    "min": 1.0,
    "max": 1.0,
    "mean": 1.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "training_co2_cost",
      "split": "valid"
    },
    "count": 0,
    "sum": 0,
    "sum_squared": 0
  },
  {
    "name": {
      "name": "training_energy_cost",
      "split": "valid"
    },
    "count": 0,
    "sum": 0,
    "sum_squared": 0
  },
  {
    "name": {
      "name": "inference_runtime",
      "split": "valid"
    },
    "count": 1,
    "sum": 0.40913232167561847,
    "sum_squared": 0.16738925663968174,
    "min": 0.40913232167561847,
    "max": 0.40913232167561847,
    "mean": 0.40913232167561847,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "batch_size",
      "split": "valid"
    },
    "count": 1,
    "sum": 1.0,
    "sum_squared": 1.0,
    "min": 1.0,
    "max": 1.0,
    "mean": 1.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "finish_reason_length",
      "split": "valid"
    },
    "count": 1,
    "sum": 1.0,
    "sum_squared": 1.0,
    "min": 1.0,
    "max": 1.0,
    "mean": 1.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "finish_reason_stop",
      "split": "valid"
    },
    "count": 1,
    "sum": 0.0,
    "sum_squared": 0.0,
    "min": 0.0,
    "max": 0.0,
    "mean": 0.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "finish_reason_endoftext",
      "split": "valid"
    },
    "count": 1,
    "sum": 0.0,
    "sum_squared": 0.0,
    "min": 0.0,
    "max": 0.0,
    "mean": 0.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "finish_reason_unknown",
      "split": "valid"
    },
    "count": 1,
    "sum": 0.0,
    "sum_squared": 0.0,
    "min": 0.0,
    "max": 0.0,
    "mean": 0.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "num_train_instances",
      "split": "valid"
    },
    "count": 1,
    "sum": 5.0,
    "sum_squared": 25.0,
    "min": 5.0,
    "max": 5.0,
    "mean": 5.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "prompt_truncated",
      "split": "valid"
    },
    "count": 1,
    "sum": 0.0,
    "sum_squared": 0.0,
    "min": 0.0,
    "max": 0.0,
    "mean": 0.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "max_prob",
      "split": "valid"
    },
    "count": 1,
    "sum": 1.0,
    "sum_squared": 1.0,
    "min": 1.0,
    "max": 1.0,
    "mean": 1.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "exact_match",
      "split": "valid"
    },
    "count": 1,
    "sum": 0.6666666666666666,
    "sum_squared": 0.4444444444444444,
    "min": 0.6666666666666666,
    "max": 0.6666666666666666,
    "mean": 0.6666666666666666,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "exact_match@5",
      "split": "valid"
    },
    "count": 1,
    "sum": 0.6666666666666666,
    "sum_squared": 0.4444444444444444,
    "min": 0.6666666666666666,
    "max": 0.6666666666666666,
    "mean": 0.6666666666666666,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "quasi_exact_match",
      "split": "valid"
    },
    "count": 1,
    "sum": 0.6666666666666666,
    "sum_squared": 0.4444444444444444,
    "min": 0.6666666666666666,
    "max": 0.6666666666666666,
    "mean": 0.6666666666666666,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "quasi_exact_match@5",
      "split": "valid"
    },
    "count": 1,
    "sum": 0.6666666666666666,
    "sum_squared": 0.4444444444444444,
    "min": 0.6666666666666666,
    "max": 0.6666666666666666,
    "mean": 0.6666666666666666,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "prefix_exact_match",
      "split": "valid"
    },
    "count": 1,
    "sum": 0.6666666666666666,
    "sum_squared": 0.4444444444444444,
    "min": 0.6666666666666666,
    "max": 0.6666666666666666,
    "mean": 0.6666666666666666,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "prefix_exact_match@5",
      "split": "valid"
    },
    "count": 1,
    "sum": 0.6666666666666666,
    "sum_squared": 0.4444444444444444,
    "min": 0.6666666666666666,
    "max": 0.6666666666666666,
    "mean": 0.6666666666666666,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "quasi_prefix_exact_match",
      "split": "valid"
    },
    "count": 1,
    "sum": 0.6666666666666666,
    "sum_squared": 0.4444444444444444,
    "min": 0.6666666666666666,
    "max": 0.6666666666666666,
    "mean": 0.6666666666666666,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "quasi_prefix_exact_match@5",
      "split": "valid"
    },
    "count": 1,
    "sum": 0.6666666666666666,
    "sum_squared": 0.4444444444444444,
    "min": 0.6666666666666666,
    "max": 0.6666666666666666,
    "mean": 0.6666666666666666,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "logprob",
      "split": "valid"
    },
    "count": 1,
    "sum": 0.0,
    "sum_squared": 0.0,
    "min": 0.0,
    "max": 0.0,
    "mean": 0.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "num_perplexity_tokens",
      "split": "valid"
    },
    "count": 1,
    "sum": 1.0,
    "sum_squared": 1.0,
    "min": 1.0,
    "max": 1.0,
    "mean": 1.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "num_bytes",
      "split": "valid"
    },
    "count": 1,
    "sum": 1.6666666666666667,
    "sum_squared": 2.777777777777778,
    "min": 1.6666666666666667,
    "max": 1.6666666666666667,
    "mean": 1.6666666666666667,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "perplexity",
      "split": "test"
    },
    "count": 1,
    "sum": 1.0,
    "sum_squared": 1.0,
    "min": 1.0,
    "max": 1.0,
    "mean": 1.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "bits_per_byte",
      "split": "test"
    },
    "count": 1,
    "sum": 0.0,
    "sum_squared": 0.0,
    "min": 0.0,
    "max": 0.0,
    "mean": 0.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "logprob_per_byte",
      "split": "test"
    },
    "count": 1,
    "sum": 0.0,
    "sum_squared": 0.0,
    "min": 0.0,
    "max": 0.0,
    "mean": 0.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "perplexity",
      "split": "valid"
    },
    "count": 1,
    "sum": 1.0,
    "sum_squared": 1.0,
    "min": 1.0,
    "max": 1.0,
    "mean": 1.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "bits_per_byte",
      "split": "valid"
    },
    "count": 1,
    "sum": 0.0,
    "sum_squared": 0.0,
    "min": 0.0,
    "max": 0.0,
    "mean": 0.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "logprob_per_byte",
      "split": "valid"
    },
    "count": 1,
    "sum": 0.0,
    "sum_squared": 0.0,
    "min": 0.0,
    "max": 0.0,
    "mean": 0.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "num_references",
      "split": "test",
      "perturbation": {
        "name": "robustness",
        "robustness": true,
        "fairness": false,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 4.0,
    "sum_squared": 16.0,
    "min": 4.0,
    "max": 4.0,
    "mean": 4.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "num_references",
      "split": "test",
      "perturbation": {
        "name": "fairness",
        "robustness": false,
        "fairness": true,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 4.0,
    "sum_squared": 16.0,
    "min": 4.0,
    "max": 4.0,
    "mean": 4.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "num_train_trials",
      "split": "test",
      "perturbation": {
        "name": "robustness",
        "robustness": true,
        "fairness": false,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 1.0,
    "sum_squared": 1.0,
    "min": 1.0,
    "max": 1.0,
    "mean": 1.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "num_train_trials",
      "split": "test",
      "perturbation": {
        "name": "fairness",
        "robustness": false,
        "fairness": true,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 1.0,
    "sum_squared": 1.0,
    "min": 1.0,
    "max": 1.0,
    "mean": 1.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "num_prompt_tokens",
      "split": "test",
      "perturbation": {
        "name": "robustness",
        "robustness": true,
        "fairness": false,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 701.7872340425532,
    "sum_squared": 492505.3218650974,
    "min": 701.7872340425532,
    "max": 701.7872340425532,
    "mean": 701.7872340425532,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "num_prompt_tokens",
      "split": "test",
      "perturbation": {
        "name": "fairness",
        "robustness": false,
        "fairness": true,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 701.7872340425532,
    "sum_squared": 492505.3218650974,
    "min": 701.7872340425532,
    "max": 701.7872340425532,
    "mean": 701.7872340425532,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "num_completion_tokens",
      "split": "test",
      "perturbation": {
        "name": "robustness",
        "robustness": true,
        "fairness": false,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 1.0,
    "sum_squared": 1.0,
    "min": 1.0,
    "max": 1.0,
    "mean": 1.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "num_completion_tokens",
      "split": "test",
      "perturbation": {
        "name": "fairness",
        "robustness": false,
        "fairness": true,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 1.0,
    "sum_squared": 1.0,
    "min": 1.0,
    "max": 1.0,
    "mean": 1.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "num_output_tokens",
      "split": "test",
      "perturbation": {
        "name": "robustness",
        "robustness": true,
        "fairness": false,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 1.0,
    "sum_squared": 1.0,
    "min": 1.0,
    "max": 1.0,
    "mean": 1.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "num_output_tokens",
      "split": "test",
      "perturbation": {
        "name": "fairness",
        "robustness": false,
        "fairness": true,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 1.0,
    "sum_squared": 1.0,
    "min": 1.0,
    "max": 1.0,
    "mean": 1.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "inference_runtime",
      "split": "test",
      "perturbation": {
        "name": "robustness",
        "robustness": true,
        "fairness": false,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.40838242591695584,
    "sum_squared": 0.16677620579781793,
    "min": 0.40838242591695584,
    "max": 0.40838242591695584,
    "mean": 0.40838242591695584,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "inference_runtime",
      "split": "test",
      "perturbation": {
        "name": "fairness",
        "robustness": false,
        "fairness": true,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.40838242591695584,
    "sum_squared": 0.16677620579781793,
    "min": 0.40838242591695584,
    "max": 0.40838242591695584,
    "mean": 0.40838242591695584,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "batch_size",
      "split": "test",
      "perturbation": {
        "name": "robustness",
        "robustness": true,
        "fairness": false,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 1.0,
    "sum_squared": 1.0,
    "min": 1.0,
    "max": 1.0,
    "mean": 1.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "batch_size",
      "split": "test",
      "perturbation": {
        "name": "fairness",
        "robustness": false,
        "fairness": true,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 1.0,
    "sum_squared": 1.0,
    "min": 1.0,
    "max": 1.0,
    "mean": 1.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "finish_reason_length",
      "split": "test",
      "perturbation": {
        "name": "robustness",
        "robustness": true,
        "fairness": false,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 1.0,
    "sum_squared": 1.0,
    "min": 1.0,
    "max": 1.0,
    "mean": 1.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "finish_reason_length",
      "split": "test",
      "perturbation": {
        "name": "fairness",
        "robustness": false,
        "fairness": true,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 1.0,
    "sum_squared": 1.0,
    "min": 1.0,
    "max": 1.0,
    "mean": 1.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "finish_reason_stop",
      "split": "test",
      "perturbation": {
        "name": "robustness",
        "robustness": true,
        "fairness": false,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.0,
    "sum_squared": 0.0,
    "min": 0.0,
    "max": 0.0,
    "mean": 0.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "finish_reason_stop",
      "split": "test",
      "perturbation": {
        "name": "fairness",
        "robustness": false,
        "fairness": true,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.0,
    "sum_squared": 0.0,
    "min": 0.0,
    "max": 0.0,
    "mean": 0.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "finish_reason_endoftext",
      "split": "test",
      "perturbation": {
        "name": "robustness",
        "robustness": true,
        "fairness": false,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.0,
    "sum_squared": 0.0,
    "min": 0.0,
    "max": 0.0,
    "mean": 0.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "finish_reason_endoftext",
      "split": "test",
      "perturbation": {
        "name": "fairness",
        "robustness": false,
        "fairness": true,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.0,
    "sum_squared": 0.0,
    "min": 0.0,
    "max": 0.0,
    "mean": 0.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "finish_reason_unknown",
      "split": "test",
      "perturbation": {
        "name": "robustness",
        "robustness": true,
        "fairness": false,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.0,
    "sum_squared": 0.0,
    "min": 0.0,
    "max": 0.0,
    "mean": 0.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "finish_reason_unknown",
      "split": "test",
      "perturbation": {
        "name": "fairness",
        "robustness": false,
        "fairness": true,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.0,
    "sum_squared": 0.0,
    "min": 0.0,
    "max": 0.0,
    "mean": 0.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "num_train_instances",
      "split": "test",
      "perturbation": {
        "name": "robustness",
        "robustness": true,
        "fairness": false,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 5.0,
    "sum_squared": 25.0,
    "min": 5.0,
    "max": 5.0,
    "mean": 5.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "num_train_instances",
      "split": "test",
      "perturbation": {
        "name": "fairness",
        "robustness": false,
        "fairness": true,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 5.0,
    "sum_squared": 25.0,
    "min": 5.0,
    "max": 5.0,
    "mean": 5.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "prompt_truncated",
      "split": "test",
      "perturbation": {
        "name": "robustness",
        "robustness": true,
        "fairness": false,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.0,
    "sum_squared": 0.0,
    "min": 0.0,
    "max": 0.0,
    "mean": 0.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "prompt_truncated",
      "split": "test",
      "perturbation": {
        "name": "fairness",
        "robustness": false,
        "fairness": true,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.0,
    "sum_squared": 0.0,
    "min": 0.0,
    "max": 0.0,
    "mean": 0.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "max_prob",
      "split": "test",
      "perturbation": {
        "name": "robustness",
        "robustness": true,
        "fairness": false,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 1.0,
    "sum_squared": 1.0,
    "min": 1.0,
    "max": 1.0,
    "mean": 1.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "max_prob",
      "split": "test",
      "perturbation": {
        "name": "fairness",
        "robustness": false,
        "fairness": true,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 1.0,
    "sum_squared": 1.0,
    "min": 1.0,
    "max": 1.0,
    "mean": 1.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "exact_match",
      "split": "test",
      "perturbation": {
        "name": "robustness",
        "robustness": true,
        "fairness": false,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.723404255319149,
    "sum_squared": 0.5233137166138525,
    "min": 0.723404255319149,
    "max": 0.723404255319149,
    "mean": 0.723404255319149,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "exact_match",
      "split": "test",
      "perturbation": {
        "name": "fairness",
        "robustness": false,
        "fairness": true,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.723404255319149,
    "sum_squared": 0.5233137166138525,
    "min": 0.723404255319149,
    "max": 0.723404255319149,
    "mean": 0.723404255319149,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "exact_match@5",
      "split": "test",
      "perturbation": {
        "name": "robustness",
        "robustness": true,
        "fairness": false,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.723404255319149,
    "sum_squared": 0.5233137166138525,
    "min": 0.723404255319149,
    "max": 0.723404255319149,
    "mean": 0.723404255319149,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "exact_match@5",
      "split": "test",
      "perturbation": {
        "name": "fairness",
        "robustness": false,
        "fairness": true,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.723404255319149,
    "sum_squared": 0.5233137166138525,
    "min": 0.723404255319149,
    "max": 0.723404255319149,
    "mean": 0.723404255319149,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "quasi_exact_match",
      "split": "test",
      "perturbation": {
        "name": "robustness",
        "robustness": true,
        "fairness": false,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.723404255319149,
    "sum_squared": 0.5233137166138525,
    "min": 0.723404255319149,
    "max": 0.723404255319149,
    "mean": 0.723404255319149,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "quasi_exact_match",
      "split": "test",
      "perturbation": {
        "name": "fairness",
        "robustness": false,
        "fairness": true,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.723404255319149,
    "sum_squared": 0.5233137166138525,
    "min": 0.723404255319149,
    "max": 0.723404255319149,
    "mean": 0.723404255319149,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "quasi_exact_match@5",
      "split": "test",
      "perturbation": {
        "name": "robustness",
        "robustness": true,
        "fairness": false,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.723404255319149,
    "sum_squared": 0.5233137166138525,
    "min": 0.723404255319149,
    "max": 0.723404255319149,
    "mean": 0.723404255319149,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "quasi_exact_match@5",
      "split": "test",
      "perturbation": {
        "name": "fairness",
        "robustness": false,
        "fairness": true,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.723404255319149,
    "sum_squared": 0.5233137166138525,
    "min": 0.723404255319149,
    "max": 0.723404255319149,
    "mean": 0.723404255319149,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "prefix_exact_match",
      "split": "test",
      "perturbation": {
        "name": "robustness",
        "robustness": true,
        "fairness": false,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.723404255319149,
    "sum_squared": 0.5233137166138525,
    "min": 0.723404255319149,
    "max": 0.723404255319149,
    "mean": 0.723404255319149,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "prefix_exact_match",
      "split": "test",
      "perturbation": {
        "name": "fairness",
        "robustness": false,
        "fairness": true,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.723404255319149,
    "sum_squared": 0.5233137166138525,
    "min": 0.723404255319149,
    "max": 0.723404255319149,
    "mean": 0.723404255319149,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "prefix_exact_match@5",
      "split": "test",
      "perturbation": {
        "name": "robustness",
        "robustness": true,
        "fairness": false,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.723404255319149,
    "sum_squared": 0.5233137166138525,
    "min": 0.723404255319149,
    "max": 0.723404255319149,
    "mean": 0.723404255319149,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "prefix_exact_match@5",
      "split": "test",
      "perturbation": {
        "name": "fairness",
        "robustness": false,
        "fairness": true,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.723404255319149,
    "sum_squared": 0.5233137166138525,
    "min": 0.723404255319149,
    "max": 0.723404255319149,
    "mean": 0.723404255319149,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "quasi_prefix_exact_match",
      "split": "test",
      "perturbation": {
        "name": "robustness",
        "robustness": true,
        "fairness": false,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.723404255319149,
    "sum_squared": 0.5233137166138525,
    "min": 0.723404255319149,
    "max": 0.723404255319149,
    "mean": 0.723404255319149,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "quasi_prefix_exact_match",
      "split": "test",
      "perturbation": {
        "name": "fairness",
        "robustness": false,
        "fairness": true,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.723404255319149,
    "sum_squared": 0.5233137166138525,
    "min": 0.723404255319149,
    "max": 0.723404255319149,
    "mean": 0.723404255319149,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "quasi_prefix_exact_match@5",
      "split": "test",
      "perturbation": {
        "name": "robustness",
        "robustness": true,
        "fairness": false,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.723404255319149,
    "sum_squared": 0.5233137166138525,
    "min": 0.723404255319149,
    "max": 0.723404255319149,
    "mean": 0.723404255319149,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "quasi_prefix_exact_match@5",
      "split": "test",
      "perturbation": {
        "name": "fairness",
        "robustness": false,
        "fairness": true,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.723404255319149,
    "sum_squared": 0.5233137166138525,
    "min": 0.723404255319149,
    "max": 0.723404255319149,
    "mean": 0.723404255319149,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "logprob",
      "split": "test",
      "perturbation": {
        "name": "robustness",
        "robustness": true,
        "fairness": false,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.0,
    "sum_squared": 0.0,
    "min": 0.0,
    "max": 0.0,
    "mean": 0.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "logprob",
      "split": "test",
      "perturbation": {
        "name": "fairness",
        "robustness": false,
        "fairness": true,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.0,
    "sum_squared": 0.0,
    "min": 0.0,
    "max": 0.0,
    "mean": 0.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "num_perplexity_tokens",
      "split": "test",
      "perturbation": {
        "name": "robustness",
        "robustness": true,
        "fairness": false,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 1.0,
    "sum_squared": 1.0,
    "min": 1.0,
    "max": 1.0,
    "mean": 1.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "num_perplexity_tokens",
      "split": "test",
      "perturbation": {
        "name": "fairness",
        "robustness": false,
        "fairness": true,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 1.0,
    "sum_squared": 1.0,
    "min": 1.0,
    "max": 1.0,
    "mean": 1.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "num_bytes",
      "split": "test",
      "perturbation": {
        "name": "robustness",
        "robustness": true,
        "fairness": false,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 1.4893617021276595,
    "sum_squared": 2.218198279764599,
    "min": 1.4893617021276595,
    "max": 1.4893617021276595,
    "mean": 1.4893617021276595,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "num_bytes",
      "split": "test",
      "perturbation": {
        "name": "fairness",
        "robustness": false,
        "fairness": true,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 1.4893617021276595,
    "sum_squared": 2.218198279764599,
    "min": 1.4893617021276595,
    "max": 1.4893617021276595,
    "mean": 1.4893617021276595,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "num_references",
      "split": "valid",
      "perturbation": {
        "name": "robustness",
        "robustness": true,
        "fairness": false,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 4.0,
    "sum_squared": 16.0,
    "min": 4.0,
    "max": 4.0,
    "mean": 4.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "num_references",
      "split": "valid",
      "perturbation": {
        "name": "fairness",
        "robustness": false,
        "fairness": true,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 4.0,
    "sum_squared": 16.0,
    "min": 4.0,
    "max": 4.0,
    "mean": 4.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "num_train_trials",
      "split": "valid",
      "perturbation": {
        "name": "robustness",
        "robustness": true,
        "fairness": false,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 1.0,
    "sum_squared": 1.0,
    "min": 1.0,
    "max": 1.0,
    "mean": 1.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "num_train_trials",
      "split": "valid",
      "perturbation": {
        "name": "fairness",
        "robustness": false,
        "fairness": true,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 1.0,
    "sum_squared": 1.0,
    "min": 1.0,
    "max": 1.0,
    "mean": 1.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "num_prompt_tokens",
      "split": "valid",
      "perturbation": {
        "name": "robustness",
        "robustness": true,
        "fairness": false,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 687.3333333333334,
    "sum_squared": 472427.1111111112,
    "min": 687.3333333333334,
    "max": 687.3333333333334,
    "mean": 687.3333333333334,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "num_prompt_tokens",
      "split": "valid",
      "perturbation": {
        "name": "fairness",
        "robustness": false,
        "fairness": true,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 687.3333333333334,
    "sum_squared": 472427.1111111112,
    "min": 687.3333333333334,
    "max": 687.3333333333334,
    "mean": 687.3333333333334,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "num_completion_tokens",
      "split": "valid",
      "perturbation": {
        "name": "robustness",
        "robustness": true,
        "fairness": false,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 1.0,
    "sum_squared": 1.0,
    "min": 1.0,
    "max": 1.0,
    "mean": 1.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "num_completion_tokens",
      "split": "valid",
      "perturbation": {
        "name": "fairness",
        "robustness": false,
        "fairness": true,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 1.0,
    "sum_squared": 1.0,
    "min": 1.0,
    "max": 1.0,
    "mean": 1.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "num_output_tokens",
      "split": "valid",
      "perturbation": {
        "name": "robustness",
        "robustness": true,
        "fairness": false,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 1.0,
    "sum_squared": 1.0,
    "min": 1.0,
    "max": 1.0,
    "mean": 1.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "num_output_tokens",
      "split": "valid",
      "perturbation": {
        "name": "fairness",
        "robustness": false,
        "fairness": true,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 1.0,
    "sum_squared": 1.0,
    "min": 1.0,
    "max": 1.0,
    "mean": 1.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "inference_runtime",
      "split": "valid",
      "perturbation": {
        "name": "robustness",
        "robustness": true,
        "fairness": false,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.40913232167561847,
    "sum_squared": 0.16738925663968174,
    "min": 0.40913232167561847,
    "max": 0.40913232167561847,
    "mean": 0.40913232167561847,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "inference_runtime",
      "split": "valid",
      "perturbation": {
        "name": "fairness",
        "robustness": false,
        "fairness": true,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.40913232167561847,
    "sum_squared": 0.16738925663968174,
    "min": 0.40913232167561847,
    "max": 0.40913232167561847,
    "mean": 0.40913232167561847,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "batch_size",
      "split": "valid",
      "perturbation": {
        "name": "robustness",
        "robustness": true,
        "fairness": false,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 1.0,
    "sum_squared": 1.0,
    "min": 1.0,
    "max": 1.0,
    "mean": 1.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "batch_size",
      "split": "valid",
      "perturbation": {
        "name": "fairness",
        "robustness": false,
        "fairness": true,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 1.0,
    "sum_squared": 1.0,
    "min": 1.0,
    "max": 1.0,
    "mean": 1.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "finish_reason_length",
      "split": "valid",
      "perturbation": {
        "name": "robustness",
        "robustness": true,
        "fairness": false,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 1.0,
    "sum_squared": 1.0,
    "min": 1.0,
    "max": 1.0,
    "mean": 1.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "finish_reason_length",
      "split": "valid",
      "perturbation": {
        "name": "fairness",
        "robustness": false,
        "fairness": true,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 1.0,
    "sum_squared": 1.0,
    "min": 1.0,
    "max": 1.0,
    "mean": 1.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "finish_reason_stop",
      "split": "valid",
      "perturbation": {
        "name": "robustness",
        "robustness": true,
        "fairness": false,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.0,
    "sum_squared": 0.0,
    "min": 0.0,
    "max": 0.0,
    "mean": 0.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "finish_reason_stop",
      "split": "valid",
      "perturbation": {
        "name": "fairness",
        "robustness": false,
        "fairness": true,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.0,
    "sum_squared": 0.0,
    "min": 0.0,
    "max": 0.0,
    "mean": 0.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "finish_reason_endoftext",
      "split": "valid",
      "perturbation": {
        "name": "robustness",
        "robustness": true,
        "fairness": false,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.0,
    "sum_squared": 0.0,
    "min": 0.0,
    "max": 0.0,
    "mean": 0.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "finish_reason_endoftext",
      "split": "valid",
      "perturbation": {
        "name": "fairness",
        "robustness": false,
        "fairness": true,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.0,
    "sum_squared": 0.0,
    "min": 0.0,
    "max": 0.0,
    "mean": 0.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "finish_reason_unknown",
      "split": "valid",
      "perturbation": {
        "name": "robustness",
        "robustness": true,
        "fairness": false,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.0,
    "sum_squared": 0.0,
    "min": 0.0,
    "max": 0.0,
    "mean": 0.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "finish_reason_unknown",
      "split": "valid",
      "perturbation": {
        "name": "fairness",
        "robustness": false,
        "fairness": true,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.0,
    "sum_squared": 0.0,
    "min": 0.0,
    "max": 0.0,
    "mean": 0.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "num_train_instances",
      "split": "valid",
      "perturbation": {
        "name": "robustness",
        "robustness": true,
        "fairness": false,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 5.0,
    "sum_squared": 25.0,
    "min": 5.0,
    "max": 5.0,
    "mean": 5.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "num_train_instances",
      "split": "valid",
      "perturbation": {
        "name": "fairness",
        "robustness": false,
        "fairness": true,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 5.0,
    "sum_squared": 25.0,
    "min": 5.0,
    "max": 5.0,
    "mean": 5.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "prompt_truncated",
      "split": "valid",
      "perturbation": {
        "name": "robustness",
        "robustness": true,
        "fairness": false,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.0,
    "sum_squared": 0.0,
    "min": 0.0,
    "max": 0.0,
    "mean": 0.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "prompt_truncated",
      "split": "valid",
      "perturbation": {
        "name": "fairness",
        "robustness": false,
        "fairness": true,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.0,
    "sum_squared": 0.0,
    "min": 0.0,
    "max": 0.0,
    "mean": 0.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "max_prob",
      "split": "valid",
      "perturbation": {
        "name": "robustness",
        "robustness": true,
        "fairness": false,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 1.0,
    "sum_squared": 1.0,
    "min": 1.0,
    "max": 1.0,
    "mean": 1.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "max_prob",
      "split": "valid",
      "perturbation": {
        "name": "fairness",
        "robustness": false,
        "fairness": true,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 1.0,
    "sum_squared": 1.0,
    "min": 1.0,
    "max": 1.0,
    "mean": 1.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "exact_match",
      "split": "valid",
      "perturbation": {
        "name": "robustness",
        "robustness": true,
        "fairness": false,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.6666666666666666,
    "sum_squared": 0.4444444444444444,
    "min": 0.6666666666666666,
    "max": 0.6666666666666666,
    "mean": 0.6666666666666666,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "exact_match",
      "split": "valid",
      "perturbation": {
        "name": "fairness",
        "robustness": false,
        "fairness": true,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.6666666666666666,
    "sum_squared": 0.4444444444444444,
    "min": 0.6666666666666666,
    "max": 0.6666666666666666,
    "mean": 0.6666666666666666,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "exact_match@5",
      "split": "valid",
      "perturbation": {
        "name": "robustness",
        "robustness": true,
        "fairness": false,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.6666666666666666,
    "sum_squared": 0.4444444444444444,
    "min": 0.6666666666666666,
    "max": 0.6666666666666666,
    "mean": 0.6666666666666666,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "exact_match@5",
      "split": "valid",
      "perturbation": {
        "name": "fairness",
        "robustness": false,
        "fairness": true,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.6666666666666666,
    "sum_squared": 0.4444444444444444,
    "min": 0.6666666666666666,
    "max": 0.6666666666666666,
    "mean": 0.6666666666666666,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "quasi_exact_match",
      "split": "valid",
      "perturbation": {
        "name": "robustness",
        "robustness": true,
        "fairness": false,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.6666666666666666,
    "sum_squared": 0.4444444444444444,
    "min": 0.6666666666666666,
    "max": 0.6666666666666666,
    "mean": 0.6666666666666666,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "quasi_exact_match",
      "split": "valid",
      "perturbation": {
        "name": "fairness",
        "robustness": false,
        "fairness": true,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.6666666666666666,
    "sum_squared": 0.4444444444444444,
    "min": 0.6666666666666666,
    "max": 0.6666666666666666,
    "mean": 0.6666666666666666,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "quasi_exact_match@5",
      "split": "valid",
      "perturbation": {
        "name": "robustness",
        "robustness": true,
        "fairness": false,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.6666666666666666,
    "sum_squared": 0.4444444444444444,
    "min": 0.6666666666666666,
    "max": 0.6666666666666666,
    "mean": 0.6666666666666666,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "quasi_exact_match@5",
      "split": "valid",
      "perturbation": {
        "name": "fairness",
        "robustness": false,
        "fairness": true,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.6666666666666666,
    "sum_squared": 0.4444444444444444,
    "min": 0.6666666666666666,
    "max": 0.6666666666666666,
    "mean": 0.6666666666666666,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "prefix_exact_match",
      "split": "valid",
      "perturbation": {
        "name": "robustness",
        "robustness": true,
        "fairness": false,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.6666666666666666,
    "sum_squared": 0.4444444444444444,
    "min": 0.6666666666666666,
    "max": 0.6666666666666666,
    "mean": 0.6666666666666666,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "prefix_exact_match",
      "split": "valid",
      "perturbation": {
        "name": "fairness",
        "robustness": false,
        "fairness": true,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.6666666666666666,
    "sum_squared": 0.4444444444444444,
    "min": 0.6666666666666666,
    "max": 0.6666666666666666,
    "mean": 0.6666666666666666,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "prefix_exact_match@5",
      "split": "valid",
      "perturbation": {
        "name": "robustness",
        "robustness": true,
        "fairness": false,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.6666666666666666,
    "sum_squared": 0.4444444444444444,
    "min": 0.6666666666666666,
    "max": 0.6666666666666666,
    "mean": 0.6666666666666666,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "prefix_exact_match@5",
      "split": "valid",
      "perturbation": {
        "name": "fairness",
        "robustness": false,
        "fairness": true,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.6666666666666666,
    "sum_squared": 0.4444444444444444,
    "min": 0.6666666666666666,
    "max": 0.6666666666666666,
    "mean": 0.6666666666666666,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "quasi_prefix_exact_match",
      "split": "valid",
      "perturbation": {
        "name": "robustness",
        "robustness": true,
        "fairness": false,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.6666666666666666,
    "sum_squared": 0.4444444444444444,
    "min": 0.6666666666666666,
    "max": 0.6666666666666666,
    "mean": 0.6666666666666666,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "quasi_prefix_exact_match",
      "split": "valid",
      "perturbation": {
        "name": "fairness",
        "robustness": false,
        "fairness": true,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.6666666666666666,
    "sum_squared": 0.4444444444444444,
    "min": 0.6666666666666666,
    "max": 0.6666666666666666,
    "mean": 0.6666666666666666,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "quasi_prefix_exact_match@5",
      "split": "valid",
      "perturbation": {
        "name": "robustness",
        "robustness": true,
        "fairness": false,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.6666666666666666,
    "sum_squared": 0.4444444444444444,
    "min": 0.6666666666666666,
    "max": 0.6666666666666666,
    "mean": 0.6666666666666666,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "quasi_prefix_exact_match@5",
      "split": "valid",
      "perturbation": {
        "name": "fairness",
        "robustness": false,
        "fairness": true,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.6666666666666666,
    "sum_squared": 0.4444444444444444,
    "min": 0.6666666666666666,
    "max": 0.6666666666666666,
    "mean": 0.6666666666666666,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "logprob",
      "split": "valid",
      "perturbation": {
        "name": "robustness",
        "robustness": true,
        "fairness": false,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.0,
    "sum_squared": 0.0,
    "min": 0.0,
    "max": 0.0,
    "mean": 0.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "logprob",
      "split": "valid",
      "perturbation": {
        "name": "fairness",
        "robustness": false,
        "fairness": true,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 0.0,
    "sum_squared": 0.0,
    "min": 0.0,
    "max": 0.0,
    "mean": 0.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "num_perplexity_tokens",
      "split": "valid",
      "perturbation": {
        "name": "robustness",
        "robustness": true,
        "fairness": false,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 1.0,
    "sum_squared": 1.0,
    "min": 1.0,
    "max": 1.0,
    "mean": 1.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "num_perplexity_tokens",
      "split": "valid",
      "perturbation": {
        "name": "fairness",
        "robustness": false,
        "fairness": true,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 1.0,
    "sum_squared": 1.0,
    "min": 1.0,
    "max": 1.0,
    "mean": 1.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "num_bytes",
      "split": "valid",
      "perturbation": {
        "name": "robustness",
        "robustness": true,
        "fairness": false,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 1.6666666666666667,
    "sum_squared": 2.777777777777778,
    "min": 1.6666666666666667,
    "max": 1.6666666666666667,
    "mean": 1.6666666666666667,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "num_bytes",
      "split": "valid",
      "perturbation": {
        "name": "fairness",
        "robustness": false,
        "fairness": true,
        "computed_on": "worst"
      }
    },
    "count": 1,
    "sum": 1.6666666666666667,
    "sum_squared": 2.777777777777778,
    "min": 1.6666666666666667,
    "max": 1.6666666666666667,
    "mean": 1.6666666666666667,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "num_instances",
      "split": "test"
    },
    "count": 1,
    "sum": 47.0,
    "sum_squared": 2209.0,
    "min": 47.0,
    "max": 47.0,
    "mean": 47.0,
    "variance": 0.0,
    "stddev": 0.0
  },
  {
    "name": {
      "name": "num_instances",
      "split": "valid"
    },
    "count": 1,
    "sum": 3.0,
    "sum_squared": 9.0,
    "min": 3.0,
    "max": 3.0,
    "mean": 3.0,
    "variance": 0.0,
    "stddev": 0.0
  }
]