{
  "best_metric": 0.38773971796035767,
  "best_model_checkpoint": "./vit-base-brain-tumor-detection2/checkpoint-1500",
  "epoch": 30.0,
  "eval_steps": 500,
  "global_step": 1920,
  "is_hyper_param_search": false,
  "is_local_process_zero": true,
  "is_world_process_zero": true,
  "log_history": [
    {
      "epoch": 0.78125,
      "grad_norm": 1.7783442735671997,
      "learning_rate": 2.5000000000000004e-07,
      "loss": 1.3686,
      "step": 50
    },
    {
      "epoch": 1.5625,
      "grad_norm": 1.8243844509124756,
      "learning_rate": 5.000000000000001e-07,
      "loss": 1.3468,
      "step": 100
    },
    {
      "epoch": 2.34375,
      "grad_norm": 2.272806167602539,
      "learning_rate": 7.5e-07,
      "loss": 1.2931,
      "step": 150
    },
    {
      "epoch": 3.125,
      "grad_norm": 1.0346544981002808,
      "learning_rate": 1.0000000000000002e-06,
      "loss": 1.1861,
      "step": 200
    },
    {
      "epoch": 3.90625,
      "grad_norm": 0.897363007068634,
      "learning_rate": 1.25e-06,
      "loss": 1.092,
      "step": 250
    },
    {
      "epoch": 4.6875,
      "grad_norm": 1.0376484394073486,
      "learning_rate": 1.5e-06,
      "loss": 1.0504,
      "step": 300
    },
    {
      "epoch": 5.46875,
      "grad_norm": 1.2069748640060425,
      "learning_rate": 1.75e-06,
      "loss": 0.993,
      "step": 350
    },
    {
      "epoch": 6.25,
      "grad_norm": 1.41449773311615,
      "learning_rate": 2.0000000000000003e-06,
      "loss": 0.9428,
      "step": 400
    },
    {
      "epoch": 7.03125,
      "grad_norm": 3.5506372451782227,
      "learning_rate": 2.25e-06,
      "loss": 0.9065,
      "step": 450
    },
    {
      "epoch": 7.8125,
      "grad_norm": 2.408358573913574,
      "learning_rate": 2.5e-06,
      "loss": 0.8758,
      "step": 500
    },
    {
      "epoch": 7.8125,
      "eval_accuracy": 0.6181640625,
      "eval_loss": 0.891155481338501,
      "eval_runtime": 5.9944,
      "eval_samples_per_second": 170.826,
      "eval_steps_per_second": 21.353,
      "step": 500
    },
    {
      "epoch": 8.59375,
      "grad_norm": 4.127248764038086,
      "learning_rate": 2.7500000000000004e-06,
      "loss": 0.8371,
      "step": 550
    },
    {
      "epoch": 9.375,
      "grad_norm": 4.548064231872559,
      "learning_rate": 3e-06,
      "loss": 0.7951,
      "step": 600
    },
    {
      "epoch": 10.15625,
      "grad_norm": 7.226322174072266,
      "learning_rate": 3.2500000000000002e-06,
      "loss": 0.7666,
      "step": 650
    },
    {
      "epoch": 10.9375,
      "grad_norm": 4.653890132904053,
      "learning_rate": 3.5e-06,
      "loss": 0.7219,
      "step": 700
    },
    {
      "epoch": 11.71875,
      "grad_norm": 3.7779295444488525,
      "learning_rate": 3.7500000000000005e-06,
      "loss": 0.6926,
      "step": 750
    },
    {
      "epoch": 12.5,
      "grad_norm": 3.6519362926483154,
      "learning_rate": 4.000000000000001e-06,
      "loss": 0.646,
      "step": 800
    },
    {
      "epoch": 13.28125,
      "grad_norm": 24.227773666381836,
      "learning_rate": 4.25e-06,
      "loss": 0.6269,
      "step": 850
    },
    {
      "epoch": 14.0625,
      "grad_norm": 8.960350036621094,
      "learning_rate": 4.5e-06,
      "loss": 0.5882,
      "step": 900
    },
    {
      "epoch": 14.84375,
      "grad_norm": 6.60162878036499,
      "learning_rate": 4.75e-06,
      "loss": 0.544,
      "step": 950
    },
    {
      "epoch": 15.625,
      "grad_norm": 10.583850860595703,
      "learning_rate": 5e-06,
      "loss": 0.5256,
      "step": 1000
    },
    {
      "epoch": 15.625,
      "eval_accuracy": 0.7607421875,
      "eval_loss": 0.6331567764282227,
      "eval_runtime": 5.4782,
      "eval_samples_per_second": 186.924,
      "eval_steps_per_second": 23.365,
      "step": 1000
    },
    {
      "epoch": 16.40625,
      "grad_norm": 3.9983010292053223,
      "learning_rate": 4.999850432733413e-06,
      "loss": 0.4768,
      "step": 1050
    },
    {
      "epoch": 17.1875,
      "grad_norm": 12.768200874328613,
      "learning_rate": 4.999401748829942e-06,
      "loss": 0.4863,
      "step": 1100
    },
    {
      "epoch": 17.96875,
      "grad_norm": 14.71330451965332,
      "learning_rate": 4.9986540019763296e-06,
      "loss": 0.4181,
      "step": 1150
    },
    {
      "epoch": 18.75,
      "grad_norm": 9.602484703063965,
      "learning_rate": 4.997607281643338e-06,
      "loss": 0.3901,
      "step": 1200
    },
    {
      "epoch": 19.53125,
      "grad_norm": 27.293039321899414,
      "learning_rate": 4.996261713075046e-06,
      "loss": 0.3496,
      "step": 1250
    },
    {
      "epoch": 20.3125,
      "grad_norm": 3.6233201026916504,
      "learning_rate": 4.994617457273862e-06,
      "loss": 0.3312,
      "step": 1300
    },
    {
      "epoch": 21.09375,
      "grad_norm": 11.52304458618164,
      "learning_rate": 4.992674710981266e-06,
      "loss": 0.2929,
      "step": 1350
    },
    {
      "epoch": 21.875,
      "grad_norm": 6.805290222167969,
      "learning_rate": 4.990433706654258e-06,
      "loss": 0.2653,
      "step": 1400
    },
    {
      "epoch": 22.65625,
      "grad_norm": 15.234956741333008,
      "learning_rate": 4.987894712437552e-06,
      "loss": 0.2635,
      "step": 1450
    },
    {
      "epoch": 23.4375,
      "grad_norm": 3.9582715034484863,
      "learning_rate": 4.985058032131488e-06,
      "loss": 0.2247,
      "step": 1500
    },
    {
      "epoch": 23.4375,
      "eval_accuracy": 0.8935546875,
      "eval_loss": 0.38773971796035767,
      "eval_runtime": 5.9931,
      "eval_samples_per_second": 170.863,
      "eval_steps_per_second": 21.358,
      "step": 1500
    },
    {
      "epoch": 24.21875,
      "grad_norm": 3.0134124755859375,
      "learning_rate": 4.98192400515568e-06,
      "loss": 0.1965,
      "step": 1550
    },
    {
      "epoch": 25.0,
      "grad_norm": 5.4471540451049805,
      "learning_rate": 4.978564534206973e-06,
      "loss": 0.193,
      "step": 1600
    },
    {
      "epoch": 25.78125,
      "grad_norm": 11.847530364990234,
      "learning_rate": 4.974842901390282e-06,
      "loss": 0.1709,
      "step": 1650
    },
    {
      "epoch": 26.5625,
      "grad_norm": 4.015501022338867,
      "learning_rate": 4.970825144183195e-06,
      "loss": 0.158,
      "step": 1700
    },
    {
      "epoch": 27.34375,
      "grad_norm": 4.216943264007568,
      "learning_rate": 4.966511743325682e-06,
      "loss": 0.1452,
      "step": 1750
    },
    {
      "epoch": 28.125,
      "grad_norm": 23.560443878173828,
      "learning_rate": 4.961903214932604e-06,
      "loss": 0.1288,
      "step": 1800
    },
    {
      "epoch": 28.90625,
      "grad_norm": 0.9162831902503967,
      "learning_rate": 4.957000110431956e-06,
      "loss": 0.1195,
      "step": 1850
    },
    {
      "epoch": 29.6875,
      "grad_norm": 2.046557664871216,
      "learning_rate": 4.95180301649889e-06,
      "loss": 0.1002,
      "step": 1900
    },
    {
      "epoch": 30.0,
      "step": 1920,
      "total_flos": 9.52238637305561e+18,
      "train_loss": 0.5872499863306682,
      "train_runtime": 1494.2494,
      "train_samples_per_second": 82.235,
      "train_steps_per_second": 1.285
    }
  ],
  "logging_steps": 50,
  "max_steps": 1920,
  "num_input_tokens_seen": 0,
  "num_train_epochs": 30,
  "save_steps": 500,
  "stateful_callbacks": {
    "EarlyStoppingCallback": {
      "args": {
        "early_stopping_patience": 5,
        "early_stopping_threshold": 0.0
      },
      "attributes": {
        "early_stopping_patience_counter": 0
      }
    },
    "TrainerControl": {
      "args": {
        "should_epoch_stop": false,
        "should_evaluate": false,
        "should_log": false,
        "should_save": true,
        "should_training_stop": true
      },
      "attributes": {}
    }
  },
  "total_flos": 9.52238637305561e+18,
  "train_batch_size": 8,
  "trial_name": null,
  "trial_params": null
}