[
  {
    "instance_id": "id1413",
    "train_trial_index": 0,
    "stats": [
      {
        "name": {
          "name": "num_references",
          "split": "test"
        },
        "count": 1,
        "sum": 2,
        "sum_squared": 4,
        "min": 2,
        "max": 2,
        "mean": 2.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_trials",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_prompt_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 3464,
        "sum_squared": 11999296,
        "min": 3464,
        "max": 3464,
        "mean": 3464.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_completion_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_output_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "training_co2_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "training_energy_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "inference_runtime",
          "split": "test"
        },
        "count": 1,
        "sum": 0.7125389575958252,
        "sum_squared": 0.5077117660917452,
        "min": 0.7125389575958252,
        "max": 0.7125389575958252,
        "mean": 0.7125389575958252,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "batch_size",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_length",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_stop",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_endoftext",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_unknown",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_instances",
          "split": "test"
        },
        "count": 1,
        "sum": 5,
        "sum_squared": 25,
        "min": 5,
        "max": 5,
        "mean": 5.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "prompt_truncated",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "max_prob",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "quasi_exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "f1_score",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "rouge_l",
          "split": "test"
        },
        "count": 1,
        "sum": 0.8571428571428571,
        "sum_squared": 0.7346938775510203,
        "min": 0.8571428571428571,
        "max": 0.8571428571428571,
        "mean": 0.8571428571428571,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_1",
          "split": "test"
        },
        "count": 1,
        "sum": 0.5,
        "sum_squared": 0.25,
        "min": 0.5,
        "max": 0.5,
        "mean": 0.5,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_4",
          "split": "test"
        },
        "count": 1,
        "sum": 2.2250738585072626e-308,
        "sum_squared": 0.0,
        "min": 2.2250738585072626e-308,
        "max": 2.2250738585072626e-308,
        "mean": 2.2250738585072626e-308,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "logprob",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_perplexity_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_bytes",
          "split": "test"
        },
        "count": 1,
        "sum": 21,
        "sum_squared": 441,
        "min": 21,
        "max": 21,
        "mean": 21.0,
        "variance": 0.0,
        "stddev": 0.0
      }
    ]
  },
  {
    "instance_id": "id1332",
    "train_trial_index": 0,
    "stats": [
      {
        "name": {
          "name": "num_references",
          "split": "test"
        },
        "count": 1,
        "sum": 2,
        "sum_squared": 4,
        "min": 2,
        "max": 2,
        "mean": 2.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_trials",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_prompt_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 3323,
        "sum_squared": 11042329,
        "min": 3323,
        "max": 3323,
        "mean": 3323.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_completion_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_output_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "training_co2_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "training_energy_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "inference_runtime",
          "split": "test"
        },
        "count": 1,
        "sum": 0.7003147602081299,
        "sum_squared": 0.49044076336537046,
        "min": 0.7003147602081299,
        "max": 0.7003147602081299,
        "mean": 0.7003147602081299,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "batch_size",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_length",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_stop",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_endoftext",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_unknown",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_instances",
          "split": "test"
        },
        "count": 1,
        "sum": 5,
        "sum_squared": 25,
        "min": 5,
        "max": 5,
        "mean": 5.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "prompt_truncated",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "max_prob",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "quasi_exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "f1_score",
          "split": "test"
        },
        "count": 1,
        "sum": 0.6666666666666666,
        "sum_squared": 0.4444444444444444,
        "min": 0.6666666666666666,
        "max": 0.6666666666666666,
        "mean": 0.6666666666666666,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "rouge_l",
          "split": "test"
        },
        "count": 1,
        "sum": 0.6666666666666666,
        "sum_squared": 0.4444444444444444,
        "min": 0.6666666666666666,
        "max": 0.6666666666666666,
        "mean": 0.6666666666666666,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_1",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_4",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "logprob",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_perplexity_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_bytes",
          "split": "test"
        },
        "count": 1,
        "sum": 7,
        "sum_squared": 49,
        "min": 7,
        "max": 7,
        "mean": 7.0,
        "variance": 0.0,
        "stddev": 0.0
      }
    ]
  },
  {
    "instance_id": "id1123",
    "train_trial_index": 0,
    "stats": [
      {
        "name": {
          "name": "num_references",
          "split": "valid"
        },
        "count": 1,
        "sum": 2,
        "sum_squared": 4,
        "min": 2,
        "max": 2,
        "mean": 2.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_trials",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_prompt_tokens",
          "split": "valid"
        },
        "count": 1,
        "sum": 3320,
        "sum_squared": 11022400,
        "min": 3320,
        "max": 3320,
        "mean": 3320.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_completion_tokens",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_output_tokens",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "training_co2_cost",
          "split": "valid"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "training_energy_cost",
          "split": "valid"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "inference_runtime",
          "split": "valid"
        },
        "count": 1,
        "sum": 0.6937730312347412,
        "sum_squared": 0.4813210188686412,
        "min": 0.6937730312347412,
        "max": 0.6937730312347412,
        "mean": 0.6937730312347412,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "batch_size",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_length",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_stop",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_endoftext",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_unknown",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_instances",
          "split": "valid"
        },
        "count": 1,
        "sum": 5,
        "sum_squared": 25,
        "min": 5,
        "max": 5,
        "mean": 5.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "prompt_truncated",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "max_prob",
          "split": "valid"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "exact_match",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "quasi_exact_match",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "f1_score",
          "split": "valid"
        },
        "count": 1,
        "sum": 0.6666666666666666,
        "sum_squared": 0.4444444444444444,
        "min": 0.6666666666666666,
        "max": 0.6666666666666666,
        "mean": 0.6666666666666666,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "rouge_l",
          "split": "valid"
        },
        "count": 1,
        "sum": 0.6666666666666666,
        "sum_squared": 0.4444444444444444,
        "min": 0.6666666666666666,
        "max": 0.6666666666666666,
        "mean": 0.6666666666666666,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_1",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_4",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "logprob",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_perplexity_tokens",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_bytes",
          "split": "valid"
        },
        "count": 1,
        "sum": 11,
        "sum_squared": 121,
        "min": 11,
        "max": 11,
        "mean": 11.0,
        "variance": 0.0,
        "stddev": 0.0
      }
    ]
  },
  {
    "instance_id": "id1514",
    "train_trial_index": 0,
    "stats": [
      {
        "name": {
          "name": "num_references",
          "split": "test"
        },
        "count": 1,
        "sum": 2,
        "sum_squared": 4,
        "min": 2,
        "max": 2,
        "mean": 2.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_trials",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_prompt_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 3455,
        "sum_squared": 11937025,
        "min": 3455,
        "max": 3455,
        "mean": 3455.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_completion_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_output_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "training_co2_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "training_energy_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "inference_runtime",
          "split": "test"
        },
        "count": 1,
        "sum": 0.6071457862854004,
        "sum_squared": 0.3686260058041171,
        "min": 0.6071457862854004,
        "max": 0.6071457862854004,
        "mean": 0.6071457862854004,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "batch_size",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_length",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_stop",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_endoftext",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_unknown",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_instances",
          "split": "test"
        },
        "count": 1,
        "sum": 5,
        "sum_squared": 25,
        "min": 5,
        "max": 5,
        "mean": 5.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "prompt_truncated",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "max_prob",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "quasi_exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "f1_score",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "rouge_l",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_1",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_4",
          "split": "test"
        },
        "count": 1,
        "sum": 2.2250738585072626e-308,
        "sum_squared": 0.0,
        "min": 2.2250738585072626e-308,
        "max": 2.2250738585072626e-308,
        "mean": 2.2250738585072626e-308,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "logprob",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_perplexity_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_bytes",
          "split": "test"
        },
        "count": 1,
        "sum": 13,
        "sum_squared": 169,
        "min": 13,
        "max": 13,
        "mean": 13.0,
        "variance": 0.0,
        "stddev": 0.0
      }
    ]
  },
  {
    "instance_id": "id1340",
    "train_trial_index": 0,
    "stats": [
      {
        "name": {
          "name": "num_references",
          "split": "test"
        },
        "count": 1,
        "sum": 2,
        "sum_squared": 4,
        "min": 2,
        "max": 2,
        "mean": 2.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_trials",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_prompt_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 2995,
        "sum_squared": 8970025,
        "min": 2995,
        "max": 2995,
        "mean": 2995.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_completion_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_output_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "training_co2_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "training_energy_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "inference_runtime",
          "split": "test"
        },
        "count": 1,
        "sum": 0.7272942066192627,
        "sum_squared": 0.5289568629819428,
        "min": 0.7272942066192627,
        "max": 0.7272942066192627,
        "mean": 0.7272942066192627,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "batch_size",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_length",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_stop",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_endoftext",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_unknown",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_instances",
          "split": "test"
        },
        "count": 1,
        "sum": 5,
        "sum_squared": 25,
        "min": 5,
        "max": 5,
        "mean": 5.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "prompt_truncated",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "max_prob",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "quasi_exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "f1_score",
          "split": "test"
        },
        "count": 1,
        "sum": 0.6666666666666666,
        "sum_squared": 0.4444444444444444,
        "min": 0.6666666666666666,
        "max": 0.6666666666666666,
        "mean": 0.6666666666666666,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "rouge_l",
          "split": "test"
        },
        "count": 1,
        "sum": 0.5882352941176471,
        "sum_squared": 0.34602076124567477,
        "min": 0.5882352941176471,
        "max": 0.5882352941176471,
        "mean": 0.5882352941176471,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_1",
          "split": "test"
        },
        "count": 1,
        "sum": 0.4,
        "sum_squared": 0.16000000000000003,
        "min": 0.4,
        "max": 0.4,
        "mean": 0.4,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_4",
          "split": "test"
        },
        "count": 1,
        "sum": 2.2250738585072626e-308,
        "sum_squared": 0.0,
        "min": 2.2250738585072626e-308,
        "max": 2.2250738585072626e-308,
        "mean": 2.2250738585072626e-308,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "logprob",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_perplexity_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_bytes",
          "split": "test"
        },
        "count": 1,
        "sum": 28,
        "sum_squared": 784,
        "min": 28,
        "max": 28,
        "mean": 28.0,
        "variance": 0.0,
        "stddev": 0.0
      }
    ]
  },
  {
    "instance_id": "id1281",
    "train_trial_index": 0,
    "stats": [
      {
        "name": {
          "name": "num_references",
          "split": "test"
        },
        "count": 1,
        "sum": 2,
        "sum_squared": 4,
        "min": 2,
        "max": 2,
        "mean": 2.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_trials",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_prompt_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 3571,
        "sum_squared": 12752041,
        "min": 3571,
        "max": 3571,
        "mean": 3571.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_completion_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_output_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "training_co2_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "training_energy_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "inference_runtime",
          "split": "test"
        },
        "count": 1,
        "sum": 0.6679620742797852,
        "sum_squared": 0.4461733326761532,
        "min": 0.6679620742797852,
        "max": 0.6679620742797852,
        "mean": 0.6679620742797852,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "batch_size",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_length",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_stop",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_endoftext",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_unknown",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_instances",
          "split": "test"
        },
        "count": 1,
        "sum": 5,
        "sum_squared": 25,
        "min": 5,
        "max": 5,
        "mean": 5.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "prompt_truncated",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "max_prob",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "quasi_exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "f1_score",
          "split": "test"
        },
        "count": 1,
        "sum": 0.15384615384615385,
        "sum_squared": 0.02366863905325444,
        "min": 0.15384615384615385,
        "max": 0.15384615384615385,
        "mean": 0.15384615384615385,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "rouge_l",
          "split": "test"
        },
        "count": 1,
        "sum": 0.13333333333333333,
        "sum_squared": 0.017777777777777778,
        "min": 0.13333333333333333,
        "max": 0.13333333333333333,
        "mean": 0.13333333333333333,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_1",
          "split": "test"
        },
        "count": 1,
        "sum": 0.08333333333333333,
        "sum_squared": 0.006944444444444444,
        "min": 0.08333333333333333,
        "max": 0.08333333333333333,
        "mean": 0.08333333333333333,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_4",
          "split": "test"
        },
        "count": 1,
        "sum": 2.2250738585072626e-308,
        "sum_squared": 0.0,
        "min": 2.2250738585072626e-308,
        "max": 2.2250738585072626e-308,
        "mean": 2.2250738585072626e-308,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "logprob",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_perplexity_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_bytes",
          "split": "test"
        },
        "count": 1,
        "sum": 70,
        "sum_squared": 4900,
        "min": 70,
        "max": 70,
        "mean": 70.0,
        "variance": 0.0,
        "stddev": 0.0
      }
    ]
  },
  {
    "instance_id": "id1234",
    "train_trial_index": 0,
    "stats": [
      {
        "name": {
          "name": "num_references",
          "split": "test"
        },
        "count": 1,
        "sum": 2,
        "sum_squared": 4,
        "min": 2,
        "max": 2,
        "mean": 2.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_trials",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_prompt_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 3293,
        "sum_squared": 10843849,
        "min": 3293,
        "max": 3293,
        "mean": 3293.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_completion_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_output_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "training_co2_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "training_energy_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "inference_runtime",
          "split": "test"
        },
        "count": 1,
        "sum": 0.5743286609649658,
        "sum_squared": 0.32985341080581065,
        "min": 0.5743286609649658,
        "max": 0.5743286609649658,
        "mean": 0.5743286609649658,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "batch_size",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_length",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_stop",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_endoftext",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_unknown",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_instances",
          "split": "test"
        },
        "count": 1,
        "sum": 5,
        "sum_squared": 25,
        "min": 5,
        "max": 5,
        "mean": 5.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "prompt_truncated",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "max_prob",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "quasi_exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "f1_score",
          "split": "test"
        },
        "count": 1,
        "sum": 0.5,
        "sum_squared": 0.25,
        "min": 0.5,
        "max": 0.5,
        "mean": 0.5,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "rouge_l",
          "split": "test"
        },
        "count": 1,
        "sum": 0.4,
        "sum_squared": 0.16000000000000003,
        "min": 0.4,
        "max": 0.4,
        "mean": 0.4,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_1",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_4",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "logprob",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_perplexity_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_bytes",
          "split": "test"
        },
        "count": 1,
        "sum": 11,
        "sum_squared": 121,
        "min": 11,
        "max": 11,
        "mean": 11.0,
        "variance": 0.0,
        "stddev": 0.0
      }
    ]
  },
  {
    "instance_id": "id1237",
    "train_trial_index": 0,
    "stats": [
      {
        "name": {
          "name": "num_references",
          "split": "test"
        },
        "count": 1,
        "sum": 2,
        "sum_squared": 4,
        "min": 2,
        "max": 2,
        "mean": 2.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_trials",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_prompt_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 3614,
        "sum_squared": 13060996,
        "min": 3614,
        "max": 3614,
        "mean": 3614.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_completion_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_output_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "training_co2_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "training_energy_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "inference_runtime",
          "split": "test"
        },
        "count": 1,
        "sum": 0.4558103084564209,
        "sum_squared": 0.20776303729513756,
        "min": 0.4558103084564209,
        "max": 0.4558103084564209,
        "mean": 0.4558103084564209,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "batch_size",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_length",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_stop",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_endoftext",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_unknown",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_instances",
          "split": "test"
        },
        "count": 1,
        "sum": 5,
        "sum_squared": 25,
        "min": 5,
        "max": 5,
        "mean": 5.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "prompt_truncated",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "max_prob",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "quasi_exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "f1_score",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "rouge_l",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_1",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_4",
          "split": "test"
        },
        "count": 1,
        "sum": 2.2250738585072626e-308,
        "sum_squared": 0.0,
        "min": 2.2250738585072626e-308,
        "max": 2.2250738585072626e-308,
        "mean": 2.2250738585072626e-308,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "logprob",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_perplexity_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_bytes",
          "split": "test"
        },
        "count": 1,
        "sum": 9,
        "sum_squared": 81,
        "min": 9,
        "max": 9,
        "mean": 9.0,
        "variance": 0.0,
        "stddev": 0.0
      }
    ]
  },
  {
    "instance_id": "id1173",
    "train_trial_index": 0,
    "stats": [
      {
        "name": {
          "name": "num_references",
          "split": "valid"
        },
        "count": 1,
        "sum": 2,
        "sum_squared": 4,
        "min": 2,
        "max": 2,
        "mean": 2.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_trials",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_prompt_tokens",
          "split": "valid"
        },
        "count": 1,
        "sum": 3381,
        "sum_squared": 11431161,
        "min": 3381,
        "max": 3381,
        "mean": 3381.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_completion_tokens",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_output_tokens",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "training_co2_cost",
          "split": "valid"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "training_energy_cost",
          "split": "valid"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "inference_runtime",
          "split": "valid"
        },
        "count": 1,
        "sum": 0.7605588436126709,
        "sum_squared": 0.5784497545974432,
        "min": 0.7605588436126709,
        "max": 0.7605588436126709,
        "mean": 0.7605588436126709,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "batch_size",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_length",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_stop",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_endoftext",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_unknown",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_instances",
          "split": "valid"
        },
        "count": 1,
        "sum": 5,
        "sum_squared": 25,
        "min": 5,
        "max": 5,
        "mean": 5.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "prompt_truncated",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "max_prob",
          "split": "valid"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "exact_match",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "quasi_exact_match",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "f1_score",
          "split": "valid"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "rouge_l",
          "split": "valid"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_1",
          "split": "valid"
        },
        "count": 1,
        "sum": 0.7788007830714049,
        "sum_squared": 0.6065306597126334,
        "min": 0.7788007830714049,
        "max": 0.7788007830714049,
        "mean": 0.7788007830714049,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_4",
          "split": "valid"
        },
        "count": 1,
        "sum": 0.7788007830714049,
        "sum_squared": 0.6065306597126334,
        "min": 0.7788007830714049,
        "max": 0.7788007830714049,
        "mean": 0.7788007830714049,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "logprob",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_perplexity_tokens",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_bytes",
          "split": "valid"
        },
        "count": 1,
        "sum": 29,
        "sum_squared": 841,
        "min": 29,
        "max": 29,
        "mean": 29.0,
        "variance": 0.0,
        "stddev": 0.0
      }
    ]
  },
  {
    "instance_id": "id1483",
    "train_trial_index": 0,
    "stats": [
      {
        "name": {
          "name": "num_references",
          "split": "test"
        },
        "count": 1,
        "sum": 2,
        "sum_squared": 4,
        "min": 2,
        "max": 2,
        "mean": 2.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_trials",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_prompt_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 3191,
        "sum_squared": 10182481,
        "min": 3191,
        "max": 3191,
        "mean": 3191.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_completion_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_output_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "training_co2_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "training_energy_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "inference_runtime",
          "split": "test"
        },
        "count": 1,
        "sum": 0.5537986755371094,
        "sum_squared": 0.30669297302665655,
        "min": 0.5537986755371094,
        "max": 0.5537986755371094,
        "mean": 0.5537986755371094,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "batch_size",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_length",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_stop",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_endoftext",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_unknown",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_instances",
          "split": "test"
        },
        "count": 1,
        "sum": 5,
        "sum_squared": 25,
        "min": 5,
        "max": 5,
        "mean": 5.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "prompt_truncated",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "max_prob",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "quasi_exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "f1_score",
          "split": "test"
        },
        "count": 1,
        "sum": 0.5,
        "sum_squared": 0.25,
        "min": 0.5,
        "max": 0.5,
        "mean": 0.5,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "rouge_l",
          "split": "test"
        },
        "count": 1,
        "sum": 0.5,
        "sum_squared": 0.25,
        "min": 0.5,
        "max": 0.5,
        "mean": 0.5,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_1",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_4",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "logprob",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_perplexity_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_bytes",
          "split": "test"
        },
        "count": 1,
        "sum": 26,
        "sum_squared": 676,
        "min": 26,
        "max": 26,
        "mean": 26.0,
        "variance": 0.0,
        "stddev": 0.0
      }
    ]
  },
  {
    "instance_id": "id1474",
    "train_trial_index": 0,
    "stats": [
      {
        "name": {
          "name": "num_references",
          "split": "test"
        },
        "count": 1,
        "sum": 2,
        "sum_squared": 4,
        "min": 2,
        "max": 2,
        "mean": 2.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_trials",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_prompt_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 3496,
        "sum_squared": 12222016,
        "min": 3496,
        "max": 3496,
        "mean": 3496.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_completion_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_output_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "training_co2_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "training_energy_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "inference_runtime",
          "split": "test"
        },
        "count": 1,
        "sum": 0.6231951713562012,
        "sum_squared": 0.38837222160168494,
        "min": 0.6231951713562012,
        "max": 0.6231951713562012,
        "mean": 0.6231951713562012,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "batch_size",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_length",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_stop",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_endoftext",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_unknown",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_instances",
          "split": "test"
        },
        "count": 1,
        "sum": 5,
        "sum_squared": 25,
        "min": 5,
        "max": 5,
        "mean": 5.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "prompt_truncated",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "max_prob",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "quasi_exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "f1_score",
          "split": "test"
        },
        "count": 1,
        "sum": 0.7499999999999999,
        "sum_squared": 0.5624999999999999,
        "min": 0.7499999999999999,
        "max": 0.7499999999999999,
        "mean": 0.7499999999999999,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "rouge_l",
          "split": "test"
        },
        "count": 1,
        "sum": 0.8,
        "sum_squared": 0.6400000000000001,
        "min": 0.8,
        "max": 0.8,
        "mean": 0.8,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_1",
          "split": "test"
        },
        "count": 1,
        "sum": 0.6703200460356393,
        "sum_squared": 0.4493289641172216,
        "min": 0.6703200460356393,
        "max": 0.6703200460356393,
        "mean": 0.6703200460356393,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_4",
          "split": "test"
        },
        "count": 1,
        "sum": 1.491511611267286e-308,
        "sum_squared": 0.0,
        "min": 1.491511611267286e-308,
        "max": 1.491511611267286e-308,
        "mean": 1.491511611267286e-308,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "logprob",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_perplexity_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_bytes",
          "split": "test"
        },
        "count": 1,
        "sum": 20,
        "sum_squared": 400,
        "min": 20,
        "max": 20,
        "mean": 20.0,
        "variance": 0.0,
        "stddev": 0.0
      }
    ]
  },
  {
    "instance_id": "id1571",
    "train_trial_index": 0,
    "stats": [
      {
        "name": {
          "name": "num_references",
          "split": "test"
        },
        "count": 1,
        "sum": 2,
        "sum_squared": 4,
        "min": 2,
        "max": 2,
        "mean": 2.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_trials",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_prompt_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 3636,
        "sum_squared": 13220496,
        "min": 3636,
        "max": 3636,
        "mean": 3636.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_completion_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_output_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "training_co2_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "training_energy_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "inference_runtime",
          "split": "test"
        },
        "count": 1,
        "sum": 0.6136291027069092,
        "sum_squared": 0.3765406756888865,
        "min": 0.6136291027069092,
        "max": 0.6136291027069092,
        "mean": 0.6136291027069092,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "batch_size",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_length",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_stop",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_endoftext",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_unknown",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_instances",
          "split": "test"
        },
        "count": 1,
        "sum": 5,
        "sum_squared": 25,
        "min": 5,
        "max": 5,
        "mean": 5.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "prompt_truncated",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "max_prob",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "quasi_exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "f1_score",
          "split": "test"
        },
        "count": 1,
        "sum": 0.5,
        "sum_squared": 0.25,
        "min": 0.5,
        "max": 0.5,
        "mean": 0.5,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "rouge_l",
          "split": "test"
        },
        "count": 1,
        "sum": 0.42857142857142855,
        "sum_squared": 0.18367346938775508,
        "min": 0.42857142857142855,
        "max": 0.42857142857142855,
        "mean": 0.42857142857142855,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_1",
          "split": "test"
        },
        "count": 1,
        "sum": 0.3333333333333333,
        "sum_squared": 0.1111111111111111,
        "min": 0.3333333333333333,
        "max": 0.3333333333333333,
        "mean": 0.3333333333333333,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_4",
          "split": "test"
        },
        "count": 1,
        "sum": 2.2250738585072626e-308,
        "sum_squared": 0.0,
        "min": 2.2250738585072626e-308,
        "max": 2.2250738585072626e-308,
        "mean": 2.2250738585072626e-308,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "logprob",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_perplexity_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_bytes",
          "split": "test"
        },
        "count": 1,
        "sum": 40,
        "sum_squared": 1600,
        "min": 40,
        "max": 40,
        "mean": 40.0,
        "variance": 0.0,
        "stddev": 0.0
      }
    ]
  },
  {
    "instance_id": "id1366",
    "train_trial_index": 0,
    "stats": [
      {
        "name": {
          "name": "num_references",
          "split": "test"
        },
        "count": 1,
        "sum": 2,
        "sum_squared": 4,
        "min": 2,
        "max": 2,
        "mean": 2.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_trials",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_prompt_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 3723,
        "sum_squared": 13860729,
        "min": 3723,
        "max": 3723,
        "mean": 3723.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_completion_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_output_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "training_co2_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "training_energy_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "inference_runtime",
          "split": "test"
        },
        "count": 1,
        "sum": 0.44627857208251953,
        "sum_squared": 0.19916456390001258,
        "min": 0.44627857208251953,
        "max": 0.44627857208251953,
        "mean": 0.44627857208251953,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "batch_size",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_length",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_stop",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_endoftext",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_unknown",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_instances",
          "split": "test"
        },
        "count": 1,
        "sum": 5,
        "sum_squared": 25,
        "min": 5,
        "max": 5,
        "mean": 5.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "prompt_truncated",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "max_prob",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "quasi_exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "f1_score",
          "split": "test"
        },
        "count": 1,
        "sum": 0.8571428571428572,
        "sum_squared": 0.7346938775510206,
        "min": 0.8571428571428572,
        "max": 0.8571428571428572,
        "mean": 0.8571428571428572,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "rouge_l",
          "split": "test"
        },
        "count": 1,
        "sum": 0.782608695652174,
        "sum_squared": 0.612476370510397,
        "min": 0.782608695652174,
        "max": 0.782608695652174,
        "mean": 0.782608695652174,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_1",
          "split": "test"
        },
        "count": 1,
        "sum": 0.7,
        "sum_squared": 0.48999999999999994,
        "min": 0.7,
        "max": 0.7,
        "mean": 0.7,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_4",
          "split": "test"
        },
        "count": 1,
        "sum": 0.5714285714285714,
        "sum_squared": 0.32653061224489793,
        "min": 0.5714285714285714,
        "max": 0.5714285714285714,
        "mean": 0.5714285714285714,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "logprob",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_perplexity_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_bytes",
          "split": "test"
        },
        "count": 1,
        "sum": 43,
        "sum_squared": 1849,
        "min": 43,
        "max": 43,
        "mean": 43.0,
        "variance": 0.0,
        "stddev": 0.0
      }
    ]
  },
  {
    "instance_id": "id1442",
    "train_trial_index": 0,
    "stats": [
      {
        "name": {
          "name": "num_references",
          "split": "test"
        },
        "count": 1,
        "sum": 2,
        "sum_squared": 4,
        "min": 2,
        "max": 2,
        "mean": 2.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_trials",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_prompt_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 3495,
        "sum_squared": 12215025,
        "min": 3495,
        "max": 3495,
        "mean": 3495.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_completion_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_output_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "training_co2_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "training_energy_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "inference_runtime",
          "split": "test"
        },
        "count": 1,
        "sum": 0.5825526714324951,
        "sum_squared": 0.3393676149931366,
        "min": 0.5825526714324951,
        "max": 0.5825526714324951,
        "mean": 0.5825526714324951,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "batch_size",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_length",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_stop",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_endoftext",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_unknown",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_instances",
          "split": "test"
        },
        "count": 1,
        "sum": 5,
        "sum_squared": 25,
        "min": 5,
        "max": 5,
        "mean": 5.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "prompt_truncated",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "max_prob",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "quasi_exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "f1_score",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "rouge_l",
          "split": "test"
        },
        "count": 1,
        "sum": 0.0,
        "sum_squared": 0.0,
        "min": 0.0,
        "max": 0.0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_1",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_4",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "logprob",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_perplexity_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_bytes",
          "split": "test"
        },
        "count": 1,
        "sum": 13,
        "sum_squared": 169,
        "min": 13,
        "max": 13,
        "mean": 13.0,
        "variance": 0.0,
        "stddev": 0.0
      }
    ]
  },
  {
    "instance_id": "id1529",
    "train_trial_index": 0,
    "stats": [
      {
        "name": {
          "name": "num_references",
          "split": "test"
        },
        "count": 1,
        "sum": 2,
        "sum_squared": 4,
        "min": 2,
        "max": 2,
        "mean": 2.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_trials",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_prompt_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 3263,
        "sum_squared": 10647169,
        "min": 3263,
        "max": 3263,
        "mean": 3263.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_completion_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_output_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "training_co2_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "training_energy_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "inference_runtime",
          "split": "test"
        },
        "count": 1,
        "sum": 0.4336731433868408,
        "sum_squared": 0.1880723952950234,
        "min": 0.4336731433868408,
        "max": 0.4336731433868408,
        "mean": 0.4336731433868408,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "batch_size",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_length",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_stop",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_endoftext",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_unknown",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_instances",
          "split": "test"
        },
        "count": 1,
        "sum": 5,
        "sum_squared": 25,
        "min": 5,
        "max": 5,
        "mean": 5.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "prompt_truncated",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "max_prob",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "quasi_exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "f1_score",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "rouge_l",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_1",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_4",
          "split": "test"
        },
        "count": 1,
        "sum": 2.2250738585072626e-308,
        "sum_squared": 0.0,
        "min": 2.2250738585072626e-308,
        "max": 2.2250738585072626e-308,
        "mean": 2.2250738585072626e-308,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "logprob",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_perplexity_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_bytes",
          "split": "test"
        },
        "count": 1,
        "sum": 9,
        "sum_squared": 81,
        "min": 9,
        "max": 9,
        "mean": 9.0,
        "variance": 0.0,
        "stddev": 0.0
      }
    ]
  },
  {
    "instance_id": "id1209",
    "train_trial_index": 0,
    "stats": [
      {
        "name": {
          "name": "num_references",
          "split": "valid"
        },
        "count": 1,
        "sum": 2,
        "sum_squared": 4,
        "min": 2,
        "max": 2,
        "mean": 2.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_trials",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_prompt_tokens",
          "split": "valid"
        },
        "count": 1,
        "sum": 3485,
        "sum_squared": 12145225,
        "min": 3485,
        "max": 3485,
        "mean": 3485.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_completion_tokens",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_output_tokens",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "training_co2_cost",
          "split": "valid"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "training_energy_cost",
          "split": "valid"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "inference_runtime",
          "split": "valid"
        },
        "count": 1,
        "sum": 0.5985329151153564,
        "sum_squared": 0.3582416504764865,
        "min": 0.5985329151153564,
        "max": 0.5985329151153564,
        "mean": 0.5985329151153564,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "batch_size",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_length",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_stop",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_endoftext",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_unknown",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_instances",
          "split": "valid"
        },
        "count": 1,
        "sum": 5,
        "sum_squared": 25,
        "min": 5,
        "max": 5,
        "mean": 5.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "prompt_truncated",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "max_prob",
          "split": "valid"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "exact_match",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "quasi_exact_match",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "f1_score",
          "split": "valid"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "rouge_l",
          "split": "valid"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_1",
          "split": "valid"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_4",
          "split": "valid"
        },
        "count": 1,
        "sum": 2.2250738585072626e-308,
        "sum_squared": 0.0,
        "min": 2.2250738585072626e-308,
        "max": 2.2250738585072626e-308,
        "mean": 2.2250738585072626e-308,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "logprob",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_perplexity_tokens",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_bytes",
          "split": "valid"
        },
        "count": 1,
        "sum": 20,
        "sum_squared": 400,
        "min": 20,
        "max": 20,
        "mean": 20.0,
        "variance": 0.0,
        "stddev": 0.0
      }
    ]
  },
  {
    "instance_id": "id1408",
    "train_trial_index": 0,
    "stats": [
      {
        "name": {
          "name": "num_references",
          "split": "test"
        },
        "count": 1,
        "sum": 2,
        "sum_squared": 4,
        "min": 2,
        "max": 2,
        "mean": 2.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_trials",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_prompt_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 3239,
        "sum_squared": 10491121,
        "min": 3239,
        "max": 3239,
        "mean": 3239.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_completion_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_output_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "training_co2_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "training_energy_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "inference_runtime",
          "split": "test"
        },
        "count": 1,
        "sum": 0.6681976318359375,
        "sum_squared": 0.4464880751911551,
        "min": 0.6681976318359375,
        "max": 0.6681976318359375,
        "mean": 0.6681976318359375,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "batch_size",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_length",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_stop",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_endoftext",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_unknown",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_instances",
          "split": "test"
        },
        "count": 1,
        "sum": 5,
        "sum_squared": 25,
        "min": 5,
        "max": 5,
        "mean": 5.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "prompt_truncated",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "max_prob",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "quasi_exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "f1_score",
          "split": "test"
        },
        "count": 1,
        "sum": 0.2,
        "sum_squared": 0.04000000000000001,
        "min": 0.2,
        "max": 0.2,
        "mean": 0.2,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "rouge_l",
          "split": "test"
        },
        "count": 1,
        "sum": 0.08695652173913043,
        "sum_squared": 0.007561436672967863,
        "min": 0.08695652173913043,
        "max": 0.08695652173913043,
        "mean": 0.08695652173913043,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_1",
          "split": "test"
        },
        "count": 1,
        "sum": 0.17647058823529413,
        "sum_squared": 0.031141868512110732,
        "min": 0.17647058823529413,
        "max": 0.17647058823529413,
        "mean": 0.17647058823529413,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_4",
          "split": "test"
        },
        "count": 1,
        "sum": 2.2250738585072626e-308,
        "sum_squared": 0.0,
        "min": 2.2250738585072626e-308,
        "max": 2.2250738585072626e-308,
        "mean": 2.2250738585072626e-308,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "logprob",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_perplexity_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_bytes",
          "split": "test"
        },
        "count": 1,
        "sum": 90,
        "sum_squared": 8100,
        "min": 90,
        "max": 90,
        "mean": 90.0,
        "variance": 0.0,
        "stddev": 0.0
      }
    ]
  },
  {
    "instance_id": "id1315",
    "train_trial_index": 0,
    "stats": [
      {
        "name": {
          "name": "num_references",
          "split": "test"
        },
        "count": 1,
        "sum": 2,
        "sum_squared": 4,
        "min": 2,
        "max": 2,
        "mean": 2.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_trials",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_prompt_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 3140,
        "sum_squared": 9859600,
        "min": 3140,
        "max": 3140,
        "mean": 3140.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_completion_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_output_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "training_co2_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "training_energy_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "inference_runtime",
          "split": "test"
        },
        "count": 1,
        "sum": 0.6611320972442627,
        "sum_squared": 0.4370956500065972,
        "min": 0.6611320972442627,
        "max": 0.6611320972442627,
        "mean": 0.6611320972442627,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "batch_size",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_length",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_stop",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_endoftext",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_unknown",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_instances",
          "split": "test"
        },
        "count": 1,
        "sum": 5,
        "sum_squared": 25,
        "min": 5,
        "max": 5,
        "mean": 5.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "prompt_truncated",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "max_prob",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "quasi_exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "f1_score",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "rouge_l",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_1",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_4",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "logprob",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_perplexity_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_bytes",
          "split": "test"
        },
        "count": 1,
        "sum": 21,
        "sum_squared": 441,
        "min": 21,
        "max": 21,
        "mean": 21.0,
        "variance": 0.0,
        "stddev": 0.0
      }
    ]
  },
  {
    "instance_id": "id1421",
    "train_trial_index": 0,
    "stats": [
      {
        "name": {
          "name": "num_references",
          "split": "test"
        },
        "count": 1,
        "sum": 2,
        "sum_squared": 4,
        "min": 2,
        "max": 2,
        "mean": 2.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_trials",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_prompt_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 3721,
        "sum_squared": 13845841,
        "min": 3721,
        "max": 3721,
        "mean": 3721.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_completion_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_output_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "training_co2_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "training_energy_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "inference_runtime",
          "split": "test"
        },
        "count": 1,
        "sum": 0.6954751014709473,
        "sum_squared": 0.4836856167660244,
        "min": 0.6954751014709473,
        "max": 0.6954751014709473,
        "mean": 0.6954751014709473,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "batch_size",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_length",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_stop",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_endoftext",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_unknown",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_instances",
          "split": "test"
        },
        "count": 1,
        "sum": 5,
        "sum_squared": 25,
        "min": 5,
        "max": 5,
        "mean": 5.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "prompt_truncated",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "max_prob",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "quasi_exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "f1_score",
          "split": "test"
        },
        "count": 1,
        "sum": 0.5882352941176471,
        "sum_squared": 0.34602076124567477,
        "min": 0.5882352941176471,
        "max": 0.5882352941176471,
        "mean": 0.5882352941176471,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "rouge_l",
          "split": "test"
        },
        "count": 1,
        "sum": 0.6,
        "sum_squared": 0.36,
        "min": 0.6,
        "max": 0.6,
        "mean": 0.6,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_1",
          "split": "test"
        },
        "count": 1,
        "sum": 0.4375,
        "sum_squared": 0.19140625,
        "min": 0.4375,
        "max": 0.4375,
        "mean": 0.4375,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_4",
          "split": "test"
        },
        "count": 1,
        "sum": 2.2250738585072626e-308,
        "sum_squared": 0.0,
        "min": 2.2250738585072626e-308,
        "max": 2.2250738585072626e-308,
        "mean": 2.2250738585072626e-308,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "logprob",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_perplexity_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_bytes",
          "split": "test"
        },
        "count": 1,
        "sum": 69,
        "sum_squared": 4761,
        "min": 69,
        "max": 69,
        "mean": 69.0,
        "variance": 0.0,
        "stddev": 0.0
      }
    ]
  },
  {
    "instance_id": "id1308",
    "train_trial_index": 0,
    "stats": [
      {
        "name": {
          "name": "num_references",
          "split": "test"
        },
        "count": 1,
        "sum": 2,
        "sum_squared": 4,
        "min": 2,
        "max": 2,
        "mean": 2.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_trials",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_prompt_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 3588,
        "sum_squared": 12873744,
        "min": 3588,
        "max": 3588,
        "mean": 3588.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_completion_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_output_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "training_co2_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "training_energy_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "inference_runtime",
          "split": "test"
        },
        "count": 1,
        "sum": 0.5277736186981201,
        "sum_squared": 0.2785449925937087,
        "min": 0.5277736186981201,
        "max": 0.5277736186981201,
        "mean": 0.5277736186981201,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "batch_size",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_length",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_stop",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_endoftext",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_unknown",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_instances",
          "split": "test"
        },
        "count": 1,
        "sum": 5,
        "sum_squared": 25,
        "min": 5,
        "max": 5,
        "mean": 5.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "prompt_truncated",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "max_prob",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "quasi_exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "f1_score",
          "split": "test"
        },
        "count": 1,
        "sum": 0.6666666666666666,
        "sum_squared": 0.4444444444444444,
        "min": 0.6666666666666666,
        "max": 0.6666666666666666,
        "mean": 0.6666666666666666,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "rouge_l",
          "split": "test"
        },
        "count": 1,
        "sum": 0.6666666666666666,
        "sum_squared": 0.4444444444444444,
        "min": 0.6666666666666666,
        "max": 0.6666666666666666,
        "mean": 0.6666666666666666,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_1",
          "split": "test"
        },
        "count": 1,
        "sum": 0.5,
        "sum_squared": 0.25,
        "min": 0.5,
        "max": 0.5,
        "mean": 0.5,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_4",
          "split": "test"
        },
        "count": 1,
        "sum": 2.2250738585072626e-308,
        "sum_squared": 0.0,
        "min": 2.2250738585072626e-308,
        "max": 2.2250738585072626e-308,
        "mean": 2.2250738585072626e-308,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "logprob",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_perplexity_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_bytes",
          "split": "test"
        },
        "count": 1,
        "sum": 17,
        "sum_squared": 289,
        "min": 17,
        "max": 17,
        "mean": 17.0,
        "variance": 0.0,
        "stddev": 0.0
      }
    ]
  },
  {
    "instance_id": "id1456",
    "train_trial_index": 0,
    "stats": [
      {
        "name": {
          "name": "num_references",
          "split": "test"
        },
        "count": 1,
        "sum": 2,
        "sum_squared": 4,
        "min": 2,
        "max": 2,
        "mean": 2.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_trials",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_prompt_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 3404,
        "sum_squared": 11587216,
        "min": 3404,
        "max": 3404,
        "mean": 3404.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_completion_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_output_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "training_co2_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "training_energy_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "inference_runtime",
          "split": "test"
        },
        "count": 1,
        "sum": 0.3675065040588379,
        "sum_squared": 0.13506103052554863,
        "min": 0.3675065040588379,
        "max": 0.3675065040588379,
        "mean": 0.3675065040588379,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "batch_size",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_length",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_stop",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_endoftext",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_unknown",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_instances",
          "split": "test"
        },
        "count": 1,
        "sum": 5,
        "sum_squared": 25,
        "min": 5,
        "max": 5,
        "mean": 5.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "prompt_truncated",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "max_prob",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "quasi_exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "f1_score",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "rouge_l",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_1",
          "split": "test"
        },
        "count": 1,
        "sum": 0.6666666666666666,
        "sum_squared": 0.4444444444444444,
        "min": 0.6666666666666666,
        "max": 0.6666666666666666,
        "mean": 0.6666666666666666,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_4",
          "split": "test"
        },
        "count": 1,
        "sum": 2.2250738585072626e-308,
        "sum_squared": 0.0,
        "min": 2.2250738585072626e-308,
        "max": 2.2250738585072626e-308,
        "mean": 2.2250738585072626e-308,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "logprob",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_perplexity_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_bytes",
          "split": "test"
        },
        "count": 1,
        "sum": 31,
        "sum_squared": 961,
        "min": 31,
        "max": 31,
        "mean": 31.0,
        "variance": 0.0,
        "stddev": 0.0
      }
    ]
  },
  {
    "instance_id": "id1335",
    "train_trial_index": 0,
    "stats": [
      {
        "name": {
          "name": "num_references",
          "split": "test"
        },
        "count": 1,
        "sum": 2,
        "sum_squared": 4,
        "min": 2,
        "max": 2,
        "mean": 2.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_trials",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_prompt_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 3612,
        "sum_squared": 13046544,
        "min": 3612,
        "max": 3612,
        "mean": 3612.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_completion_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_output_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "training_co2_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "training_energy_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "inference_runtime",
          "split": "test"
        },
        "count": 1,
        "sum": 0.5181593894958496,
        "sum_squared": 0.2684891529227116,
        "min": 0.5181593894958496,
        "max": 0.5181593894958496,
        "mean": 0.5181593894958496,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "batch_size",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_length",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_stop",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_endoftext",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_unknown",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_instances",
          "split": "test"
        },
        "count": 1,
        "sum": 5,
        "sum_squared": 25,
        "min": 5,
        "max": 5,
        "mean": 5.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "prompt_truncated",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "max_prob",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "quasi_exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "f1_score",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "rouge_l",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_1",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_4",
          "split": "test"
        },
        "count": 1,
        "sum": 2.2250738585072626e-308,
        "sum_squared": 0.0,
        "min": 2.2250738585072626e-308,
        "max": 2.2250738585072626e-308,
        "mean": 2.2250738585072626e-308,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "logprob",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_perplexity_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_bytes",
          "split": "test"
        },
        "count": 1,
        "sum": 10,
        "sum_squared": 100,
        "min": 10,
        "max": 10,
        "mean": 10.0,
        "variance": 0.0,
        "stddev": 0.0
      }
    ]
  },
  {
    "instance_id": "id1337",
    "train_trial_index": 0,
    "stats": [
      {
        "name": {
          "name": "num_references",
          "split": "test"
        },
        "count": 1,
        "sum": 2,
        "sum_squared": 4,
        "min": 2,
        "max": 2,
        "mean": 2.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_trials",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_prompt_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 3339,
        "sum_squared": 11148921,
        "min": 3339,
        "max": 3339,
        "mean": 3339.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_completion_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_output_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "training_co2_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "training_energy_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "inference_runtime",
          "split": "test"
        },
        "count": 1,
        "sum": 0.5959987640380859,
        "sum_squared": 0.35521452673492604,
        "min": 0.5959987640380859,
        "max": 0.5959987640380859,
        "mean": 0.5959987640380859,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "batch_size",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_length",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_stop",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_endoftext",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_unknown",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_instances",
          "split": "test"
        },
        "count": 1,
        "sum": 5,
        "sum_squared": 25,
        "min": 5,
        "max": 5,
        "mean": 5.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "prompt_truncated",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "max_prob",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "quasi_exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "f1_score",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "rouge_l",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_1",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_4",
          "split": "test"
        },
        "count": 1,
        "sum": 2.2250738585072626e-308,
        "sum_squared": 0.0,
        "min": 2.2250738585072626e-308,
        "max": 2.2250738585072626e-308,
        "mean": 2.2250738585072626e-308,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "logprob",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_perplexity_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_bytes",
          "split": "test"
        },
        "count": 1,
        "sum": 16,
        "sum_squared": 256,
        "min": 16,
        "max": 16,
        "mean": 16.0,
        "variance": 0.0,
        "stddev": 0.0
      }
    ]
  },
  {
    "instance_id": "id1114",
    "train_trial_index": 0,
    "stats": [
      {
        "name": {
          "name": "num_references",
          "split": "valid"
        },
        "count": 1,
        "sum": 2,
        "sum_squared": 4,
        "min": 2,
        "max": 2,
        "mean": 2.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_trials",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_prompt_tokens",
          "split": "valid"
        },
        "count": 1,
        "sum": 3132,
        "sum_squared": 9809424,
        "min": 3132,
        "max": 3132,
        "mean": 3132.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_completion_tokens",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_output_tokens",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "training_co2_cost",
          "split": "valid"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "training_energy_cost",
          "split": "valid"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "inference_runtime",
          "split": "valid"
        },
        "count": 1,
        "sum": 0.4272313117980957,
        "sum_squared": 0.18252659378072167,
        "min": 0.4272313117980957,
        "max": 0.4272313117980957,
        "mean": 0.4272313117980957,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "batch_size",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_length",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_stop",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_endoftext",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_unknown",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_instances",
          "split": "valid"
        },
        "count": 1,
        "sum": 5,
        "sum_squared": 25,
        "min": 5,
        "max": 5,
        "mean": 5.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "prompt_truncated",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "max_prob",
          "split": "valid"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "exact_match",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "quasi_exact_match",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "f1_score",
          "split": "valid"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "rouge_l",
          "split": "valid"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_1",
          "split": "valid"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_4",
          "split": "valid"
        },
        "count": 1,
        "sum": 2.2250738585072626e-308,
        "sum_squared": 0.0,
        "min": 2.2250738585072626e-308,
        "max": 2.2250738585072626e-308,
        "mean": 2.2250738585072626e-308,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "logprob",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_perplexity_tokens",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_bytes",
          "split": "valid"
        },
        "count": 1,
        "sum": 9,
        "sum_squared": 81,
        "min": 9,
        "max": 9,
        "mean": 9.0,
        "variance": 0.0,
        "stddev": 0.0
      }
    ]
  },
  {
    "instance_id": "id1198",
    "train_trial_index": 0,
    "stats": [
      {
        "name": {
          "name": "num_references",
          "split": "valid"
        },
        "count": 1,
        "sum": 2,
        "sum_squared": 4,
        "min": 2,
        "max": 2,
        "mean": 2.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_trials",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_prompt_tokens",
          "split": "valid"
        },
        "count": 1,
        "sum": 3495,
        "sum_squared": 12215025,
        "min": 3495,
        "max": 3495,
        "mean": 3495.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_completion_tokens",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_output_tokens",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "training_co2_cost",
          "split": "valid"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "training_energy_cost",
          "split": "valid"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "inference_runtime",
          "split": "valid"
        },
        "count": 1,
        "sum": 0.4658520221710205,
        "sum_squared": 0.21701810656082898,
        "min": 0.4658520221710205,
        "max": 0.4658520221710205,
        "mean": 0.4658520221710205,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "batch_size",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_length",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_stop",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_endoftext",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_unknown",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_instances",
          "split": "valid"
        },
        "count": 1,
        "sum": 5,
        "sum_squared": 25,
        "min": 5,
        "max": 5,
        "mean": 5.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "prompt_truncated",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "max_prob",
          "split": "valid"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "exact_match",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "quasi_exact_match",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "f1_score",
          "split": "valid"
        },
        "count": 1,
        "sum": 0.5,
        "sum_squared": 0.25,
        "min": 0.5,
        "max": 0.5,
        "mean": 0.5,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "rouge_l",
          "split": "valid"
        },
        "count": 1,
        "sum": 0.2222222222222222,
        "sum_squared": 0.04938271604938271,
        "min": 0.2222222222222222,
        "max": 0.2222222222222222,
        "mean": 0.2222222222222222,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_1",
          "split": "valid"
        },
        "count": 1,
        "sum": 0.2857142857142857,
        "sum_squared": 0.08163265306122448,
        "min": 0.2857142857142857,
        "max": 0.2857142857142857,
        "mean": 0.2857142857142857,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_4",
          "split": "valid"
        },
        "count": 1,
        "sum": 2.2250738585072626e-308,
        "sum_squared": 0.0,
        "min": 2.2250738585072626e-308,
        "max": 2.2250738585072626e-308,
        "mean": 2.2250738585072626e-308,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "logprob",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_perplexity_tokens",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_bytes",
          "split": "valid"
        },
        "count": 1,
        "sum": 29,
        "sum_squared": 841,
        "min": 29,
        "max": 29,
        "mean": 29.0,
        "variance": 0.0,
        "stddev": 0.0
      }
    ]
  },
  {
    "instance_id": "id1178",
    "train_trial_index": 0,
    "stats": [
      {
        "name": {
          "name": "num_references",
          "split": "valid"
        },
        "count": 1,
        "sum": 2,
        "sum_squared": 4,
        "min": 2,
        "max": 2,
        "mean": 2.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_trials",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_prompt_tokens",
          "split": "valid"
        },
        "count": 1,
        "sum": 3060,
        "sum_squared": 9363600,
        "min": 3060,
        "max": 3060,
        "mean": 3060.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_completion_tokens",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_output_tokens",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "training_co2_cost",
          "split": "valid"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "training_energy_cost",
          "split": "valid"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "inference_runtime",
          "split": "valid"
        },
        "count": 1,
        "sum": 0.485506534576416,
        "sum_squared": 0.23571659511640064,
        "min": 0.485506534576416,
        "max": 0.485506534576416,
        "mean": 0.485506534576416,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "batch_size",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_length",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_stop",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_endoftext",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_unknown",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_instances",
          "split": "valid"
        },
        "count": 1,
        "sum": 5,
        "sum_squared": 25,
        "min": 5,
        "max": 5,
        "mean": 5.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "prompt_truncated",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "max_prob",
          "split": "valid"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "exact_match",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "quasi_exact_match",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "f1_score",
          "split": "valid"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "rouge_l",
          "split": "valid"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_1",
          "split": "valid"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_4",
          "split": "valid"
        },
        "count": 1,
        "sum": 2.2250738585072626e-308,
        "sum_squared": 0.0,
        "min": 2.2250738585072626e-308,
        "max": 2.2250738585072626e-308,
        "mean": 2.2250738585072626e-308,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "logprob",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_perplexity_tokens",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_bytes",
          "split": "valid"
        },
        "count": 1,
        "sum": 20,
        "sum_squared": 400,
        "min": 20,
        "max": 20,
        "mean": 20.0,
        "variance": 0.0,
        "stddev": 0.0
      }
    ]
  },
  {
    "instance_id": "id1117",
    "train_trial_index": 0,
    "stats": [
      {
        "name": {
          "name": "num_references",
          "split": "valid"
        },
        "count": 1,
        "sum": 2,
        "sum_squared": 4,
        "min": 2,
        "max": 2,
        "mean": 2.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_trials",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_prompt_tokens",
          "split": "valid"
        },
        "count": 1,
        "sum": 3451,
        "sum_squared": 11909401,
        "min": 3451,
        "max": 3451,
        "mean": 3451.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_completion_tokens",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_output_tokens",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "training_co2_cost",
          "split": "valid"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "training_energy_cost",
          "split": "valid"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "inference_runtime",
          "split": "valid"
        },
        "count": 1,
        "sum": 0.4716372489929199,
        "sum_squared": 0.22244169463760954,
        "min": 0.4716372489929199,
        "max": 0.4716372489929199,
        "mean": 0.4716372489929199,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "batch_size",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_length",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_stop",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_endoftext",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_unknown",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_instances",
          "split": "valid"
        },
        "count": 1,
        "sum": 5,
        "sum_squared": 25,
        "min": 5,
        "max": 5,
        "mean": 5.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "prompt_truncated",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "max_prob",
          "split": "valid"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "exact_match",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "quasi_exact_match",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "f1_score",
          "split": "valid"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "rouge_l",
          "split": "valid"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_1",
          "split": "valid"
        },
        "count": 1,
        "sum": 0.5,
        "sum_squared": 0.25,
        "min": 0.5,
        "max": 0.5,
        "mean": 0.5,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_4",
          "split": "valid"
        },
        "count": 1,
        "sum": 2.2250738585072626e-308,
        "sum_squared": 0.0,
        "min": 2.2250738585072626e-308,
        "max": 2.2250738585072626e-308,
        "mean": 2.2250738585072626e-308,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "logprob",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_perplexity_tokens",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_bytes",
          "split": "valid"
        },
        "count": 1,
        "sum": 14,
        "sum_squared": 196,
        "min": 14,
        "max": 14,
        "mean": 14.0,
        "variance": 0.0,
        "stddev": 0.0
      }
    ]
  },
  {
    "instance_id": "id1273",
    "train_trial_index": 0,
    "stats": [
      {
        "name": {
          "name": "num_references",
          "split": "test"
        },
        "count": 1,
        "sum": 2,
        "sum_squared": 4,
        "min": 2,
        "max": 2,
        "mean": 2.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_trials",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_prompt_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 3719,
        "sum_squared": 13830961,
        "min": 3719,
        "max": 3719,
        "mean": 3719.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_completion_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_output_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "training_co2_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "training_energy_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "inference_runtime",
          "split": "test"
        },
        "count": 1,
        "sum": 0.8274936676025391,
        "sum_squared": 0.6847457699223014,
        "min": 0.8274936676025391,
        "max": 0.8274936676025391,
        "mean": 0.8274936676025391,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "batch_size",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_length",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_stop",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_endoftext",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_unknown",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_instances",
          "split": "test"
        },
        "count": 1,
        "sum": 5,
        "sum_squared": 25,
        "min": 5,
        "max": 5,
        "mean": 5.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "prompt_truncated",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "max_prob",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "quasi_exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "f1_score",
          "split": "test"
        },
        "count": 1,
        "sum": 0.8,
        "sum_squared": 0.6400000000000001,
        "min": 0.8,
        "max": 0.8,
        "mean": 0.8,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "rouge_l",
          "split": "test"
        },
        "count": 1,
        "sum": 0.8571428571428571,
        "sum_squared": 0.7346938775510203,
        "min": 0.8571428571428571,
        "max": 0.8571428571428571,
        "mean": 0.8571428571428571,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_1",
          "split": "test"
        },
        "count": 1,
        "sum": 0.8,
        "sum_squared": 0.6400000000000001,
        "min": 0.8,
        "max": 0.8,
        "mean": 0.8,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_4",
          "split": "test"
        },
        "count": 1,
        "sum": 0.4166666666666667,
        "sum_squared": 0.17361111111111113,
        "min": 0.4166666666666667,
        "max": 0.4166666666666667,
        "mean": 0.4166666666666667,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "logprob",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_perplexity_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_bytes",
          "split": "test"
        },
        "count": 1,
        "sum": 85,
        "sum_squared": 7225,
        "min": 85,
        "max": 85,
        "mean": 85.0,
        "variance": 0.0,
        "stddev": 0.0
      }
    ]
  },
  {
    "instance_id": "id1180",
    "train_trial_index": 0,
    "stats": [
      {
        "name": {
          "name": "num_references",
          "split": "valid"
        },
        "count": 1,
        "sum": 2,
        "sum_squared": 4,
        "min": 2,
        "max": 2,
        "mean": 2.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_trials",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_prompt_tokens",
          "split": "valid"
        },
        "count": 1,
        "sum": 3735,
        "sum_squared": 13950225,
        "min": 3735,
        "max": 3735,
        "mean": 3735.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_completion_tokens",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_output_tokens",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "training_co2_cost",
          "split": "valid"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "training_energy_cost",
          "split": "valid"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "inference_runtime",
          "split": "valid"
        },
        "count": 1,
        "sum": 0.6176438331604004,
        "sum_squared": 0.3814839046410725,
        "min": 0.6176438331604004,
        "max": 0.6176438331604004,
        "mean": 0.6176438331604004,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "batch_size",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_length",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_stop",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_endoftext",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_unknown",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_instances",
          "split": "valid"
        },
        "count": 1,
        "sum": 5,
        "sum_squared": 25,
        "min": 5,
        "max": 5,
        "mean": 5.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "prompt_truncated",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "max_prob",
          "split": "valid"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "exact_match",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "quasi_exact_match",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "f1_score",
          "split": "valid"
        },
        "count": 1,
        "sum": 0.5,
        "sum_squared": 0.25,
        "min": 0.5,
        "max": 0.5,
        "mean": 0.5,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "rouge_l",
          "split": "valid"
        },
        "count": 1,
        "sum": 0.5,
        "sum_squared": 0.25,
        "min": 0.5,
        "max": 0.5,
        "mean": 0.5,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_1",
          "split": "valid"
        },
        "count": 1,
        "sum": 0.5,
        "sum_squared": 0.25,
        "min": 0.5,
        "max": 0.5,
        "mean": 0.5,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_4",
          "split": "valid"
        },
        "count": 1,
        "sum": 2.2250738585072626e-308,
        "sum_squared": 0.0,
        "min": 2.2250738585072626e-308,
        "max": 2.2250738585072626e-308,
        "mean": 2.2250738585072626e-308,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "logprob",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_perplexity_tokens",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_bytes",
          "split": "valid"
        },
        "count": 1,
        "sum": 16,
        "sum_squared": 256,
        "min": 16,
        "max": 16,
        "mean": 16.0,
        "variance": 0.0,
        "stddev": 0.0
      }
    ]
  },
  {
    "instance_id": "id1261",
    "train_trial_index": 0,
    "stats": [
      {
        "name": {
          "name": "num_references",
          "split": "test"
        },
        "count": 1,
        "sum": 2,
        "sum_squared": 4,
        "min": 2,
        "max": 2,
        "mean": 2.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_trials",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_prompt_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 3719,
        "sum_squared": 13830961,
        "min": 3719,
        "max": 3719,
        "mean": 3719.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_completion_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_output_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "training_co2_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "training_energy_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "inference_runtime",
          "split": "test"
        },
        "count": 1,
        "sum": 0.5868656635284424,
        "sum_squared": 0.34441130702867895,
        "min": 0.5868656635284424,
        "max": 0.5868656635284424,
        "mean": 0.5868656635284424,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "batch_size",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_length",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_stop",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_endoftext",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_unknown",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_instances",
          "split": "test"
        },
        "count": 1,
        "sum": 5,
        "sum_squared": 25,
        "min": 5,
        "max": 5,
        "mean": 5.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "prompt_truncated",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "max_prob",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "quasi_exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "f1_score",
          "split": "test"
        },
        "count": 1,
        "sum": 0.7142857142857143,
        "sum_squared": 0.5102040816326531,
        "min": 0.7142857142857143,
        "max": 0.7142857142857143,
        "mean": 0.7142857142857143,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "rouge_l",
          "split": "test"
        },
        "count": 1,
        "sum": 0.4444444444444445,
        "sum_squared": 0.19753086419753088,
        "min": 0.4444444444444445,
        "max": 0.4444444444444445,
        "mean": 0.4444444444444445,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_1",
          "split": "test"
        },
        "count": 1,
        "sum": 0.5,
        "sum_squared": 0.25,
        "min": 0.5,
        "max": 0.5,
        "mean": 0.5,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_4",
          "split": "test"
        },
        "count": 1,
        "sum": 2.2250738585072626e-308,
        "sum_squared": 0.0,
        "min": 2.2250738585072626e-308,
        "max": 2.2250738585072626e-308,
        "mean": 2.2250738585072626e-308,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "logprob",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_perplexity_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_bytes",
          "split": "test"
        },
        "count": 1,
        "sum": 42,
        "sum_squared": 1764,
        "min": 42,
        "max": 42,
        "mean": 42.0,
        "variance": 0.0,
        "stddev": 0.0
      }
    ]
  },
  {
    "instance_id": "id1290",
    "train_trial_index": 0,
    "stats": [
      {
        "name": {
          "name": "num_references",
          "split": "test"
        },
        "count": 1,
        "sum": 2,
        "sum_squared": 4,
        "min": 2,
        "max": 2,
        "mean": 2.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_trials",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_prompt_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 3580,
        "sum_squared": 12816400,
        "min": 3580,
        "max": 3580,
        "mean": 3580.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_completion_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_output_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "training_co2_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "training_energy_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "inference_runtime",
          "split": "test"
        },
        "count": 1,
        "sum": 0.5990800857543945,
        "sum_squared": 0.3588969491474927,
        "min": 0.5990800857543945,
        "max": 0.5990800857543945,
        "mean": 0.5990800857543945,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "batch_size",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_length",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_stop",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_endoftext",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_unknown",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_instances",
          "split": "test"
        },
        "count": 1,
        "sum": 5,
        "sum_squared": 25,
        "min": 5,
        "max": 5,
        "mean": 5.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "prompt_truncated",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "max_prob",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "quasi_exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "f1_score",
          "split": "test"
        },
        "count": 1,
        "sum": 0.5882352941176471,
        "sum_squared": 0.34602076124567477,
        "min": 0.5882352941176471,
        "max": 0.5882352941176471,
        "mean": 0.5882352941176471,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "rouge_l",
          "split": "test"
        },
        "count": 1,
        "sum": 0.5714285714285715,
        "sum_squared": 0.32653061224489804,
        "min": 0.5714285714285715,
        "max": 0.5714285714285715,
        "mean": 0.5714285714285715,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_1",
          "split": "test"
        },
        "count": 1,
        "sum": 0.375,
        "sum_squared": 0.140625,
        "min": 0.375,
        "max": 0.375,
        "mean": 0.375,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_4",
          "split": "test"
        },
        "count": 1,
        "sum": 0.07692307692307693,
        "sum_squared": 0.00591715976331361,
        "min": 0.07692307692307693,
        "max": 0.07692307692307693,
        "mean": 0.07692307692307693,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "logprob",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_perplexity_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_bytes",
          "split": "test"
        },
        "count": 1,
        "sum": 78,
        "sum_squared": 6084,
        "min": 78,
        "max": 78,
        "mean": 78.0,
        "variance": 0.0,
        "stddev": 0.0
      }
    ]
  },
  {
    "instance_id": "id1202",
    "train_trial_index": 0,
    "stats": [
      {
        "name": {
          "name": "num_references",
          "split": "valid"
        },
        "count": 1,
        "sum": 2,
        "sum_squared": 4,
        "min": 2,
        "max": 2,
        "mean": 2.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_trials",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_prompt_tokens",
          "split": "valid"
        },
        "count": 1,
        "sum": 3553,
        "sum_squared": 12623809,
        "min": 3553,
        "max": 3553,
        "mean": 3553.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_completion_tokens",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_output_tokens",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "training_co2_cost",
          "split": "valid"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "training_energy_cost",
          "split": "valid"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "inference_runtime",
          "split": "valid"
        },
        "count": 1,
        "sum": 0.5991933345794678,
        "sum_squared": 0.359032652204462,
        "min": 0.5991933345794678,
        "max": 0.5991933345794678,
        "mean": 0.5991933345794678,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "batch_size",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_length",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_stop",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_endoftext",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_unknown",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_instances",
          "split": "valid"
        },
        "count": 1,
        "sum": 5,
        "sum_squared": 25,
        "min": 5,
        "max": 5,
        "mean": 5.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "prompt_truncated",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "max_prob",
          "split": "valid"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "exact_match",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "quasi_exact_match",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "f1_score",
          "split": "valid"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "rouge_l",
          "split": "valid"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_1",
          "split": "valid"
        },
        "count": 1,
        "sum": 0.36787944117144233,
        "sum_squared": 0.1353352832366127,
        "min": 0.36787944117144233,
        "max": 0.36787944117144233,
        "mean": 0.36787944117144233,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_4",
          "split": "valid"
        },
        "count": 1,
        "sum": 8.18558927632837e-309,
        "sum_squared": 0.0,
        "min": 8.18558927632837e-309,
        "max": 8.18558927632837e-309,
        "mean": 8.18558927632837e-309,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "logprob",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_perplexity_tokens",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_bytes",
          "split": "valid"
        },
        "count": 1,
        "sum": 11,
        "sum_squared": 121,
        "min": 11,
        "max": 11,
        "mean": 11.0,
        "variance": 0.0,
        "stddev": 0.0
      }
    ]
  },
  {
    "instance_id": "id1463",
    "train_trial_index": 0,
    "stats": [
      {
        "name": {
          "name": "num_references",
          "split": "test"
        },
        "count": 1,
        "sum": 2,
        "sum_squared": 4,
        "min": 2,
        "max": 2,
        "mean": 2.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_trials",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_prompt_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 3580,
        "sum_squared": 12816400,
        "min": 3580,
        "max": 3580,
        "mean": 3580.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_completion_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_output_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "training_co2_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "training_energy_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "inference_runtime",
          "split": "test"
        },
        "count": 1,
        "sum": 0.4251828193664551,
        "sum_squared": 0.18078042988440757,
        "min": 0.4251828193664551,
        "max": 0.4251828193664551,
        "mean": 0.4251828193664551,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "batch_size",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_length",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_stop",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_endoftext",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_unknown",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_instances",
          "split": "test"
        },
        "count": 1,
        "sum": 5,
        "sum_squared": 25,
        "min": 5,
        "max": 5,
        "mean": 5.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "prompt_truncated",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "max_prob",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "quasi_exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "f1_score",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "rouge_l",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_1",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_4",
          "split": "test"
        },
        "count": 1,
        "sum": 2.2250738585072626e-308,
        "sum_squared": 0.0,
        "min": 2.2250738585072626e-308,
        "max": 2.2250738585072626e-308,
        "mean": 2.2250738585072626e-308,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "logprob",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_perplexity_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_bytes",
          "split": "test"
        },
        "count": 1,
        "sum": 16,
        "sum_squared": 256,
        "min": 16,
        "max": 16,
        "mean": 16.0,
        "variance": 0.0,
        "stddev": 0.0
      }
    ]
  },
  {
    "instance_id": "id1112",
    "train_trial_index": 0,
    "stats": [
      {
        "name": {
          "name": "num_references",
          "split": "valid"
        },
        "count": 1,
        "sum": 2,
        "sum_squared": 4,
        "min": 2,
        "max": 2,
        "mean": 2.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_trials",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_prompt_tokens",
          "split": "valid"
        },
        "count": 1,
        "sum": 3497,
        "sum_squared": 12229009,
        "min": 3497,
        "max": 3497,
        "mean": 3497.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_completion_tokens",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_output_tokens",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "training_co2_cost",
          "split": "valid"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "training_energy_cost",
          "split": "valid"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "inference_runtime",
          "split": "valid"
        },
        "count": 1,
        "sum": 0.826244592666626,
        "sum_squared": 0.6826801269108387,
        "min": 0.826244592666626,
        "max": 0.826244592666626,
        "mean": 0.826244592666626,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "batch_size",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_length",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_stop",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_endoftext",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_unknown",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_instances",
          "split": "valid"
        },
        "count": 1,
        "sum": 5,
        "sum_squared": 25,
        "min": 5,
        "max": 5,
        "mean": 5.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "prompt_truncated",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "max_prob",
          "split": "valid"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "exact_match",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "quasi_exact_match",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "f1_score",
          "split": "valid"
        },
        "count": 1,
        "sum": 0.8333333333333334,
        "sum_squared": 0.6944444444444445,
        "min": 0.8333333333333334,
        "max": 0.8333333333333334,
        "mean": 0.8333333333333334,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "rouge_l",
          "split": "valid"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_1",
          "split": "valid"
        },
        "count": 1,
        "sum": 0.875,
        "sum_squared": 0.765625,
        "min": 0.875,
        "max": 0.875,
        "mean": 0.875,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_4",
          "split": "valid"
        },
        "count": 1,
        "sum": 0.6,
        "sum_squared": 0.36,
        "min": 0.6,
        "max": 0.6,
        "mean": 0.6,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "logprob",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_perplexity_tokens",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_bytes",
          "split": "valid"
        },
        "count": 1,
        "sum": 39,
        "sum_squared": 1521,
        "min": 39,
        "max": 39,
        "mean": 39.0,
        "variance": 0.0,
        "stddev": 0.0
      }
    ]
  },
  {
    "instance_id": "id1293",
    "train_trial_index": 0,
    "stats": [
      {
        "name": {
          "name": "num_references",
          "split": "test"
        },
        "count": 1,
        "sum": 2,
        "sum_squared": 4,
        "min": 2,
        "max": 2,
        "mean": 2.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_trials",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_prompt_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 3487,
        "sum_squared": 12159169,
        "min": 3487,
        "max": 3487,
        "mean": 3487.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_completion_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_output_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "training_co2_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "training_energy_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "inference_runtime",
          "split": "test"
        },
        "count": 1,
        "sum": 0.3892490863800049,
        "sum_squared": 0.1515148512476685,
        "min": 0.3892490863800049,
        "max": 0.3892490863800049,
        "mean": 0.3892490863800049,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "batch_size",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_length",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_stop",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_endoftext",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_unknown",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_instances",
          "split": "test"
        },
        "count": 1,
        "sum": 5,
        "sum_squared": 25,
        "min": 5,
        "max": 5,
        "mean": 5.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "prompt_truncated",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "max_prob",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "quasi_exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "f1_score",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "rouge_l",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_1",
          "split": "test"
        },
        "count": 1,
        "sum": 0.36787944117144233,
        "sum_squared": 0.1353352832366127,
        "min": 0.36787944117144233,
        "max": 0.36787944117144233,
        "mean": 0.36787944117144233,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_4",
          "split": "test"
        },
        "count": 1,
        "sum": 8.18558927632837e-309,
        "sum_squared": 0.0,
        "min": 8.18558927632837e-309,
        "max": 8.18558927632837e-309,
        "mean": 8.18558927632837e-309,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "logprob",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_perplexity_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_bytes",
          "split": "test"
        },
        "count": 1,
        "sum": 9,
        "sum_squared": 81,
        "min": 9,
        "max": 9,
        "mean": 9.0,
        "variance": 0.0,
        "stddev": 0.0
      }
    ]
  },
  {
    "instance_id": "id1256",
    "train_trial_index": 0,
    "stats": [
      {
        "name": {
          "name": "num_references",
          "split": "test"
        },
        "count": 1,
        "sum": 2,
        "sum_squared": 4,
        "min": 2,
        "max": 2,
        "mean": 2.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_trials",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_prompt_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 3159,
        "sum_squared": 9979281,
        "min": 3159,
        "max": 3159,
        "mean": 3159.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_completion_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_output_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "training_co2_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "training_energy_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "inference_runtime",
          "split": "test"
        },
        "count": 1,
        "sum": 0.4164438247680664,
        "sum_squared": 0.173425459187456,
        "min": 0.4164438247680664,
        "max": 0.4164438247680664,
        "mean": 0.4164438247680664,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "batch_size",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_length",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_stop",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_endoftext",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_unknown",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_instances",
          "split": "test"
        },
        "count": 1,
        "sum": 5,
        "sum_squared": 25,
        "min": 5,
        "max": 5,
        "mean": 5.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "prompt_truncated",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "max_prob",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "quasi_exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "f1_score",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "rouge_l",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_1",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_4",
          "split": "test"
        },
        "count": 1,
        "sum": 2.2250738585072626e-308,
        "sum_squared": 0.0,
        "min": 2.2250738585072626e-308,
        "max": 2.2250738585072626e-308,
        "mean": 2.2250738585072626e-308,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "logprob",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_perplexity_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_bytes",
          "split": "test"
        },
        "count": 1,
        "sum": 17,
        "sum_squared": 289,
        "min": 17,
        "max": 17,
        "mean": 17.0,
        "variance": 0.0,
        "stddev": 0.0
      }
    ]
  },
  {
    "instance_id": "id1499",
    "train_trial_index": 0,
    "stats": [
      {
        "name": {
          "name": "num_references",
          "split": "test"
        },
        "count": 1,
        "sum": 2,
        "sum_squared": 4,
        "min": 2,
        "max": 2,
        "mean": 2.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_trials",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_prompt_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 3525,
        "sum_squared": 12425625,
        "min": 3525,
        "max": 3525,
        "mean": 3525.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_completion_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_output_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "training_co2_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "training_energy_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "inference_runtime",
          "split": "test"
        },
        "count": 1,
        "sum": 0.42165184020996094,
        "sum_squared": 0.17779027435244643,
        "min": 0.42165184020996094,
        "max": 0.42165184020996094,
        "mean": 0.42165184020996094,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "batch_size",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_length",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_stop",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_endoftext",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_unknown",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_instances",
          "split": "test"
        },
        "count": 1,
        "sum": 5,
        "sum_squared": 25,
        "min": 5,
        "max": 5,
        "mean": 5.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "prompt_truncated",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "max_prob",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "quasi_exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "f1_score",
          "split": "test"
        },
        "count": 1,
        "sum": 0.7272727272727273,
        "sum_squared": 0.5289256198347108,
        "min": 0.7272727272727273,
        "max": 0.7272727272727273,
        "mean": 0.7272727272727273,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "rouge_l",
          "split": "test"
        },
        "count": 1,
        "sum": 0.7272727272727272,
        "sum_squared": 0.5289256198347106,
        "min": 0.7272727272727272,
        "max": 0.7272727272727272,
        "mean": 0.7272727272727272,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_1",
          "split": "test"
        },
        "count": 1,
        "sum": 0.5362560368285115,
        "sum_squared": 0.2875705370350219,
        "min": 0.5362560368285115,
        "max": 0.5362560368285115,
        "mean": 0.5362560368285115,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_4",
          "split": "test"
        },
        "count": 1,
        "sum": 0.33516002301781966,
        "sum_squared": 0.1123322410293054,
        "min": 0.33516002301781966,
        "max": 0.33516002301781966,
        "mean": 0.33516002301781966,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "logprob",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_perplexity_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_bytes",
          "split": "test"
        },
        "count": 1,
        "sum": 37,
        "sum_squared": 1369,
        "min": 37,
        "max": 37,
        "mean": 37.0,
        "variance": 0.0,
        "stddev": 0.0
      }
    ]
  },
  {
    "instance_id": "id1419",
    "train_trial_index": 0,
    "stats": [
      {
        "name": {
          "name": "num_references",
          "split": "test"
        },
        "count": 1,
        "sum": 2,
        "sum_squared": 4,
        "min": 2,
        "max": 2,
        "mean": 2.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_trials",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_prompt_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 3072,
        "sum_squared": 9437184,
        "min": 3072,
        "max": 3072,
        "mean": 3072.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_completion_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_output_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "training_co2_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "training_energy_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "inference_runtime",
          "split": "test"
        },
        "count": 1,
        "sum": 0.36020684242248535,
        "sum_squared": 0.1297489693279772,
        "min": 0.36020684242248535,
        "max": 0.36020684242248535,
        "mean": 0.36020684242248535,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "batch_size",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_length",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_stop",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_endoftext",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_unknown",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_instances",
          "split": "test"
        },
        "count": 1,
        "sum": 5,
        "sum_squared": 25,
        "min": 5,
        "max": 5,
        "mean": 5.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "prompt_truncated",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "max_prob",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "quasi_exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "f1_score",
          "split": "test"
        },
        "count": 1,
        "sum": 0.5,
        "sum_squared": 0.25,
        "min": 0.5,
        "max": 0.5,
        "mean": 0.5,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "rouge_l",
          "split": "test"
        },
        "count": 1,
        "sum": 0.6666666666666666,
        "sum_squared": 0.4444444444444444,
        "min": 0.6666666666666666,
        "max": 0.6666666666666666,
        "mean": 0.6666666666666666,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_1",
          "split": "test"
        },
        "count": 1,
        "sum": 0.3333333333333333,
        "sum_squared": 0.1111111111111111,
        "min": 0.3333333333333333,
        "max": 0.3333333333333333,
        "mean": 0.3333333333333333,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_4",
          "split": "test"
        },
        "count": 1,
        "sum": 2.2250738585072626e-308,
        "sum_squared": 0.0,
        "min": 2.2250738585072626e-308,
        "max": 2.2250738585072626e-308,
        "mean": 2.2250738585072626e-308,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "logprob",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_perplexity_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_bytes",
          "split": "test"
        },
        "count": 1,
        "sum": 17,
        "sum_squared": 289,
        "min": 17,
        "max": 17,
        "mean": 17.0,
        "variance": 0.0,
        "stddev": 0.0
      }
    ]
  },
  {
    "instance_id": "id1103",
    "train_trial_index": 0,
    "stats": [
      {
        "name": {
          "name": "num_references",
          "split": "valid"
        },
        "count": 1,
        "sum": 2,
        "sum_squared": 4,
        "min": 2,
        "max": 2,
        "mean": 2.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_trials",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_prompt_tokens",
          "split": "valid"
        },
        "count": 1,
        "sum": 3457,
        "sum_squared": 11950849,
        "min": 3457,
        "max": 3457,
        "mean": 3457.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_completion_tokens",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_output_tokens",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "training_co2_cost",
          "split": "valid"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "training_energy_cost",
          "split": "valid"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "inference_runtime",
          "split": "valid"
        },
        "count": 1,
        "sum": 0.614283561706543,
        "sum_squared": 0.3773442941828762,
        "min": 0.614283561706543,
        "max": 0.614283561706543,
        "mean": 0.614283561706543,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "batch_size",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_length",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_stop",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_endoftext",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_unknown",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_instances",
          "split": "valid"
        },
        "count": 1,
        "sum": 5,
        "sum_squared": 25,
        "min": 5,
        "max": 5,
        "mean": 5.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "prompt_truncated",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "max_prob",
          "split": "valid"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "exact_match",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "quasi_exact_match",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "f1_score",
          "split": "valid"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "rouge_l",
          "split": "valid"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_1",
          "split": "valid"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_4",
          "split": "valid"
        },
        "count": 1,
        "sum": 2.2250738585072626e-308,
        "sum_squared": 0.0,
        "min": 2.2250738585072626e-308,
        "max": 2.2250738585072626e-308,
        "mean": 2.2250738585072626e-308,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "logprob",
          "split": "valid"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_perplexity_tokens",
          "split": "valid"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_bytes",
          "split": "valid"
        },
        "count": 1,
        "sum": 7,
        "sum_squared": 49,
        "min": 7,
        "max": 7,
        "mean": 7.0,
        "variance": 0.0,
        "stddev": 0.0
      }
    ]
  },
  {
    "instance_id": "id1331",
    "train_trial_index": 0,
    "stats": [
      {
        "name": {
          "name": "num_references",
          "split": "test"
        },
        "count": 1,
        "sum": 2,
        "sum_squared": 4,
        "min": 2,
        "max": 2,
        "mean": 2.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_trials",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_prompt_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 3225,
        "sum_squared": 10400625,
        "min": 3225,
        "max": 3225,
        "mean": 3225.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_completion_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_output_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "training_co2_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "training_energy_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "inference_runtime",
          "split": "test"
        },
        "count": 1,
        "sum": 0.7753558158874512,
        "sum_squared": 0.6011766412304951,
        "min": 0.7753558158874512,
        "max": 0.7753558158874512,
        "mean": 0.7753558158874512,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "batch_size",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_length",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_stop",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_endoftext",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_unknown",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_instances",
          "split": "test"
        },
        "count": 1,
        "sum": 5,
        "sum_squared": 25,
        "min": 5,
        "max": 5,
        "mean": 5.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "prompt_truncated",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "max_prob",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "quasi_exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "f1_score",
          "split": "test"
        },
        "count": 1,
        "sum": 0.5454545454545454,
        "sum_squared": 0.29752066115702475,
        "min": 0.5454545454545454,
        "max": 0.5454545454545454,
        "mean": 0.5454545454545454,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "rouge_l",
          "split": "test"
        },
        "count": 1,
        "sum": 0.5454545454545454,
        "sum_squared": 0.29752066115702475,
        "min": 0.5454545454545454,
        "max": 0.5454545454545454,
        "mean": 0.5454545454545454,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_1",
          "split": "test"
        },
        "count": 1,
        "sum": 0.42857142857142855,
        "sum_squared": 0.18367346938775508,
        "min": 0.42857142857142855,
        "max": 0.42857142857142855,
        "mean": 0.42857142857142855,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_4",
          "split": "test"
        },
        "count": 1,
        "sum": 2.2250738585072626e-308,
        "sum_squared": 0.0,
        "min": 2.2250738585072626e-308,
        "max": 2.2250738585072626e-308,
        "mean": 2.2250738585072626e-308,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "logprob",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_perplexity_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_bytes",
          "split": "test"
        },
        "count": 1,
        "sum": 38,
        "sum_squared": 1444,
        "min": 38,
        "max": 38,
        "mean": 38.0,
        "variance": 0.0,
        "stddev": 0.0
      }
    ]
  },
  {
    "instance_id": "id1410",
    "train_trial_index": 0,
    "stats": [
      {
        "name": {
          "name": "num_references",
          "split": "test"
        },
        "count": 1,
        "sum": 2,
        "sum_squared": 4,
        "min": 2,
        "max": 2,
        "mean": 2.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_trials",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_prompt_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 3137,
        "sum_squared": 9840769,
        "min": 3137,
        "max": 3137,
        "mean": 3137.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_completion_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_output_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "training_co2_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "training_energy_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "inference_runtime",
          "split": "test"
        },
        "count": 1,
        "sum": 0.6295897960662842,
        "sum_squared": 0.3963833113107853,
        "min": 0.6295897960662842,
        "max": 0.6295897960662842,
        "mean": 0.6295897960662842,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "batch_size",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_length",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_stop",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_endoftext",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_unknown",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_instances",
          "split": "test"
        },
        "count": 1,
        "sum": 5,
        "sum_squared": 25,
        "min": 5,
        "max": 5,
        "mean": 5.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "prompt_truncated",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "max_prob",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "quasi_exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "f1_score",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "rouge_l",
          "split": "test"
        },
        "count": 1,
        "sum": 0.6666666666666666,
        "sum_squared": 0.4444444444444444,
        "min": 0.6666666666666666,
        "max": 0.6666666666666666,
        "mean": 0.6666666666666666,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_1",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_4",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "logprob",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_perplexity_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_bytes",
          "split": "test"
        },
        "count": 1,
        "sum": 9,
        "sum_squared": 81,
        "min": 9,
        "max": 9,
        "mean": 9.0,
        "variance": 0.0,
        "stddev": 0.0
      }
    ]
  },
  {
    "instance_id": "id1516",
    "train_trial_index": 0,
    "stats": [
      {
        "name": {
          "name": "num_references",
          "split": "test"
        },
        "count": 1,
        "sum": 2,
        "sum_squared": 4,
        "min": 2,
        "max": 2,
        "mean": 2.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_trials",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_prompt_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 3461,
        "sum_squared": 11978521,
        "min": 3461,
        "max": 3461,
        "mean": 3461.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_completion_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_output_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "training_co2_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "training_energy_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "inference_runtime",
          "split": "test"
        },
        "count": 1,
        "sum": 0.6306917667388916,
        "sum_squared": 0.39777210463222445,
        "min": 0.6306917667388916,
        "max": 0.6306917667388916,
        "mean": 0.6306917667388916,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "batch_size",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_length",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_stop",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_endoftext",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_unknown",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_instances",
          "split": "test"
        },
        "count": 1,
        "sum": 5,
        "sum_squared": 25,
        "min": 5,
        "max": 5,
        "mean": 5.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "prompt_truncated",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "max_prob",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "quasi_exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "f1_score",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "rouge_l",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_1",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_4",
          "split": "test"
        },
        "count": 1,
        "sum": 2.2250738585072626e-308,
        "sum_squared": 0.0,
        "min": 2.2250738585072626e-308,
        "max": 2.2250738585072626e-308,
        "mean": 2.2250738585072626e-308,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "logprob",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_perplexity_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_bytes",
          "split": "test"
        },
        "count": 1,
        "sum": 8,
        "sum_squared": 64,
        "min": 8,
        "max": 8,
        "mean": 8.0,
        "variance": 0.0,
        "stddev": 0.0
      }
    ]
  },
  {
    "instance_id": "id1449",
    "train_trial_index": 0,
    "stats": [
      {
        "name": {
          "name": "num_references",
          "split": "test"
        },
        "count": 1,
        "sum": 2,
        "sum_squared": 4,
        "min": 2,
        "max": 2,
        "mean": 2.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_trials",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_prompt_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 3129,
        "sum_squared": 9790641,
        "min": 3129,
        "max": 3129,
        "mean": 3129.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_completion_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_output_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "training_co2_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "training_energy_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "inference_runtime",
          "split": "test"
        },
        "count": 1,
        "sum": 0.37206339836120605,
        "sum_squared": 0.1384311724000895,
        "min": 0.37206339836120605,
        "max": 0.37206339836120605,
        "mean": 0.37206339836120605,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "batch_size",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_length",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_stop",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_endoftext",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_unknown",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_instances",
          "split": "test"
        },
        "count": 1,
        "sum": 5,
        "sum_squared": 25,
        "min": 5,
        "max": 5,
        "mean": 5.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "prompt_truncated",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "max_prob",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "quasi_exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "f1_score",
          "split": "test"
        },
        "count": 1,
        "sum": 0.5,
        "sum_squared": 0.25,
        "min": 0.5,
        "max": 0.5,
        "mean": 0.5,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "rouge_l",
          "split": "test"
        },
        "count": 1,
        "sum": 0.4,
        "sum_squared": 0.16000000000000003,
        "min": 0.4,
        "max": 0.4,
        "mean": 0.4,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_1",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_4",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "logprob",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_perplexity_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_bytes",
          "split": "test"
        },
        "count": 1,
        "sum": 9,
        "sum_squared": 81,
        "min": 9,
        "max": 9,
        "mean": 9.0,
        "variance": 0.0,
        "stddev": 0.0
      }
    ]
  },
  {
    "instance_id": "id1411",
    "train_trial_index": 0,
    "stats": [
      {
        "name": {
          "name": "num_references",
          "split": "test"
        },
        "count": 1,
        "sum": 2,
        "sum_squared": 4,
        "min": 2,
        "max": 2,
        "mean": 2.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_trials",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_prompt_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 3536,
        "sum_squared": 12503296,
        "min": 3536,
        "max": 3536,
        "mean": 3536.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_completion_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_output_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "training_co2_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "training_energy_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "inference_runtime",
          "split": "test"
        },
        "count": 1,
        "sum": 0.4775688648223877,
        "sum_squared": 0.228072020647744,
        "min": 0.4775688648223877,
        "max": 0.4775688648223877,
        "mean": 0.4775688648223877,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "batch_size",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_length",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_stop",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_endoftext",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_unknown",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_instances",
          "split": "test"
        },
        "count": 1,
        "sum": 5,
        "sum_squared": 25,
        "min": 5,
        "max": 5,
        "mean": 5.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "prompt_truncated",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "max_prob",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "quasi_exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "f1_score",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "rouge_l",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_1",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_4",
          "split": "test"
        },
        "count": 1,
        "sum": 2.2250738585072626e-308,
        "sum_squared": 0.0,
        "min": 2.2250738585072626e-308,
        "max": 2.2250738585072626e-308,
        "mean": 2.2250738585072626e-308,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "logprob",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_perplexity_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_bytes",
          "split": "test"
        },
        "count": 1,
        "sum": 17,
        "sum_squared": 289,
        "min": 17,
        "max": 17,
        "mean": 17.0,
        "variance": 0.0,
        "stddev": 0.0
      }
    ]
  },
  {
    "instance_id": "id1495",
    "train_trial_index": 0,
    "stats": [
      {
        "name": {
          "name": "num_references",
          "split": "test"
        },
        "count": 1,
        "sum": 2,
        "sum_squared": 4,
        "min": 2,
        "max": 2,
        "mean": 2.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_trials",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_prompt_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 3522,
        "sum_squared": 12404484,
        "min": 3522,
        "max": 3522,
        "mean": 3522.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_completion_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_output_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "training_co2_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "training_energy_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "inference_runtime",
          "split": "test"
        },
        "count": 1,
        "sum": 0.42740893363952637,
        "sum_squared": 0.18267839655487705,
        "min": 0.42740893363952637,
        "max": 0.42740893363952637,
        "mean": 0.42740893363952637,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "batch_size",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_length",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_stop",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_endoftext",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_unknown",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_instances",
          "split": "test"
        },
        "count": 1,
        "sum": 5,
        "sum_squared": 25,
        "min": 5,
        "max": 5,
        "mean": 5.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "prompt_truncated",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "max_prob",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "quasi_exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "f1_score",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "rouge_l",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_1",
          "split": "test"
        },
        "count": 1,
        "sum": 0.36787944117144233,
        "sum_squared": 0.1353352832366127,
        "min": 0.36787944117144233,
        "max": 0.36787944117144233,
        "mean": 0.36787944117144233,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_4",
          "split": "test"
        },
        "count": 1,
        "sum": 8.18558927632837e-309,
        "sum_squared": 0.0,
        "min": 8.18558927632837e-309,
        "max": 8.18558927632837e-309,
        "mean": 8.18558927632837e-309,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "logprob",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_perplexity_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_bytes",
          "split": "test"
        },
        "count": 1,
        "sum": 4,
        "sum_squared": 16,
        "min": 4,
        "max": 4,
        "mean": 4.0,
        "variance": 0.0,
        "stddev": 0.0
      }
    ]
  },
  {
    "instance_id": "id1445",
    "train_trial_index": 0,
    "stats": [
      {
        "name": {
          "name": "num_references",
          "split": "test"
        },
        "count": 1,
        "sum": 2,
        "sum_squared": 4,
        "min": 2,
        "max": 2,
        "mean": 2.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_trials",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_prompt_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 3002,
        "sum_squared": 9012004,
        "min": 3002,
        "max": 3002,
        "mean": 3002.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_completion_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_output_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "training_co2_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "training_energy_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "inference_runtime",
          "split": "test"
        },
        "count": 1,
        "sum": 0.5897533893585205,
        "sum_squared": 0.3478090602598627,
        "min": 0.5897533893585205,
        "max": 0.5897533893585205,
        "mean": 0.5897533893585205,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "batch_size",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_length",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_stop",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_endoftext",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_unknown",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_instances",
          "split": "test"
        },
        "count": 1,
        "sum": 5,
        "sum_squared": 25,
        "min": 5,
        "max": 5,
        "mean": 5.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "prompt_truncated",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "max_prob",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "quasi_exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "f1_score",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "rouge_l",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_1",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_4",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "logprob",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_perplexity_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_bytes",
          "split": "test"
        },
        "count": 1,
        "sum": 9,
        "sum_squared": 81,
        "min": 9,
        "max": 9,
        "mean": 9.0,
        "variance": 0.0,
        "stddev": 0.0
      }
    ]
  },
  {
    "instance_id": "id1507",
    "train_trial_index": 0,
    "stats": [
      {
        "name": {
          "name": "num_references",
          "split": "test"
        },
        "count": 1,
        "sum": 2,
        "sum_squared": 4,
        "min": 2,
        "max": 2,
        "mean": 2.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_trials",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_prompt_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 4017,
        "sum_squared": 16136289,
        "min": 4017,
        "max": 4017,
        "mean": 4017.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_completion_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_output_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "training_co2_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "training_energy_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "inference_runtime",
          "split": "test"
        },
        "count": 1,
        "sum": 0.6103475093841553,
        "sum_squared": 0.3725240822114415,
        "min": 0.6103475093841553,
        "max": 0.6103475093841553,
        "mean": 0.6103475093841553,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "batch_size",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_length",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_stop",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_endoftext",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_unknown",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_instances",
          "split": "test"
        },
        "count": 1,
        "sum": 5,
        "sum_squared": 25,
        "min": 5,
        "max": 5,
        "mean": 5.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "prompt_truncated",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "max_prob",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "quasi_exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "f1_score",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "rouge_l",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_1",
          "split": "test"
        },
        "count": 1,
        "sum": 0.36787944117144233,
        "sum_squared": 0.1353352832366127,
        "min": 0.36787944117144233,
        "max": 0.36787944117144233,
        "mean": 0.36787944117144233,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_4",
          "split": "test"
        },
        "count": 1,
        "sum": 8.18558927632837e-309,
        "sum_squared": 0.0,
        "min": 8.18558927632837e-309,
        "max": 8.18558927632837e-309,
        "mean": 8.18558927632837e-309,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "logprob",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_perplexity_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_bytes",
          "split": "test"
        },
        "count": 1,
        "sum": 9,
        "sum_squared": 81,
        "min": 9,
        "max": 9,
        "mean": 9.0,
        "variance": 0.0,
        "stddev": 0.0
      }
    ]
  },
  {
    "instance_id": "id1414",
    "train_trial_index": 0,
    "stats": [
      {
        "name": {
          "name": "num_references",
          "split": "test"
        },
        "count": 1,
        "sum": 2,
        "sum_squared": 4,
        "min": 2,
        "max": 2,
        "mean": 2.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_trials",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_prompt_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 3900,
        "sum_squared": 15210000,
        "min": 3900,
        "max": 3900,
        "mean": 3900.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_completion_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_output_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "training_co2_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "training_energy_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "inference_runtime",
          "split": "test"
        },
        "count": 1,
        "sum": 0.6751255989074707,
        "sum_squared": 0.455794574300171,
        "min": 0.6751255989074707,
        "max": 0.6751255989074707,
        "mean": 0.6751255989074707,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "batch_size",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_length",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_stop",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_endoftext",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_unknown",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_instances",
          "split": "test"
        },
        "count": 1,
        "sum": 5,
        "sum_squared": 25,
        "min": 5,
        "max": 5,
        "mean": 5.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "prompt_truncated",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "max_prob",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "quasi_exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "f1_score",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "rouge_l",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_1",
          "split": "test"
        },
        "count": 1,
        "sum": 0.36787944117144233,
        "sum_squared": 0.1353352832366127,
        "min": 0.36787944117144233,
        "max": 0.36787944117144233,
        "mean": 0.36787944117144233,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_4",
          "split": "test"
        },
        "count": 1,
        "sum": 8.18558927632837e-309,
        "sum_squared": 0.0,
        "min": 8.18558927632837e-309,
        "max": 8.18558927632837e-309,
        "mean": 8.18558927632837e-309,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "logprob",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_perplexity_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_bytes",
          "split": "test"
        },
        "count": 1,
        "sum": 9,
        "sum_squared": 81,
        "min": 9,
        "max": 9,
        "mean": 9.0,
        "variance": 0.0,
        "stddev": 0.0
      }
    ]
  },
  {
    "instance_id": "id1246",
    "train_trial_index": 0,
    "stats": [
      {
        "name": {
          "name": "num_references",
          "split": "test"
        },
        "count": 1,
        "sum": 2,
        "sum_squared": 4,
        "min": 2,
        "max": 2,
        "mean": 2.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_trials",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_prompt_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 3795,
        "sum_squared": 14402025,
        "min": 3795,
        "max": 3795,
        "mean": 3795.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_completion_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_output_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "training_co2_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "training_energy_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "inference_runtime",
          "split": "test"
        },
        "count": 1,
        "sum": 0.6423261165618896,
        "sum_squared": 0.41258284001747825,
        "min": 0.6423261165618896,
        "max": 0.6423261165618896,
        "mean": 0.6423261165618896,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "batch_size",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_length",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_stop",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_endoftext",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_unknown",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_instances",
          "split": "test"
        },
        "count": 1,
        "sum": 5,
        "sum_squared": 25,
        "min": 5,
        "max": 5,
        "mean": 5.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "prompt_truncated",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "max_prob",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "quasi_exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "f1_score",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "rouge_l",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_1",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_4",
          "split": "test"
        },
        "count": 1,
        "sum": 2.2250738585072626e-308,
        "sum_squared": 0.0,
        "min": 2.2250738585072626e-308,
        "max": 2.2250738585072626e-308,
        "mean": 2.2250738585072626e-308,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "logprob",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_perplexity_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_bytes",
          "split": "test"
        },
        "count": 1,
        "sum": 7,
        "sum_squared": 49,
        "min": 7,
        "max": 7,
        "mean": 7.0,
        "variance": 0.0,
        "stddev": 0.0
      }
    ]
  },
  {
    "instance_id": "id1555",
    "train_trial_index": 0,
    "stats": [
      {
        "name": {
          "name": "num_references",
          "split": "test"
        },
        "count": 1,
        "sum": 2,
        "sum_squared": 4,
        "min": 2,
        "max": 2,
        "mean": 2.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_trials",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_prompt_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 3082,
        "sum_squared": 9498724,
        "min": 3082,
        "max": 3082,
        "mean": 3082.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_completion_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_output_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "training_co2_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "training_energy_cost",
          "split": "test"
        },
        "count": 0,
        "sum": 0,
        "sum_squared": 0
      },
      {
        "name": {
          "name": "inference_runtime",
          "split": "test"
        },
        "count": 1,
        "sum": 0.5439956188201904,
        "sum_squared": 0.2959312332955619,
        "min": 0.5439956188201904,
        "max": 0.5439956188201904,
        "mean": 0.5439956188201904,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "batch_size",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_length",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_stop",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_endoftext",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "finish_reason_unknown",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_train_instances",
          "split": "test"
        },
        "count": 1,
        "sum": 5,
        "sum_squared": 25,
        "min": 5,
        "max": 5,
        "mean": 5.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "prompt_truncated",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "max_prob",
          "split": "test"
        },
        "count": 1,
        "sum": 1.0,
        "sum_squared": 1.0,
        "min": 1.0,
        "max": 1.0,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "quasi_exact_match",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "f1_score",
          "split": "test"
        },
        "count": 1,
        "sum": 0.15384615384615385,
        "sum_squared": 0.02366863905325444,
        "min": 0.15384615384615385,
        "max": 0.15384615384615385,
        "mean": 0.15384615384615385,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "rouge_l",
          "split": "test"
        },
        "count": 1,
        "sum": 0.20689655172413793,
        "sum_squared": 0.04280618311533888,
        "min": 0.20689655172413793,
        "max": 0.20689655172413793,
        "mean": 0.20689655172413793,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_1",
          "split": "test"
        },
        "count": 1,
        "sum": 0.05075073121372976,
        "sum_squared": 0.0025756367187282445,
        "min": 0.05075073121372976,
        "max": 0.05075073121372976,
        "mean": 0.05075073121372976,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "bleu_4",
          "split": "test"
        },
        "count": 1,
        "sum": 3.01131000863463e-309,
        "sum_squared": 0.0,
        "min": 3.01131000863463e-309,
        "max": 3.01131000863463e-309,
        "mean": 3.01131000863463e-309,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "logprob",
          "split": "test"
        },
        "count": 1,
        "sum": 0,
        "sum_squared": 0,
        "min": 0,
        "max": 0,
        "mean": 0.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_perplexity_tokens",
          "split": "test"
        },
        "count": 1,
        "sum": 1,
        "sum_squared": 1,
        "min": 1,
        "max": 1,
        "mean": 1.0,
        "variance": 0.0,
        "stddev": 0.0
      },
      {
        "name": {
          "name": "num_bytes",
          "split": "test"
        },
        "count": 1,
        "sum": 45,
        "sum_squared": 2025,
        "min": 45,
        "max": 45,
        "mean": 45.0,
        "variance": 0.0,
        "stddev": 0.0
      }
    ]
  }
]