# onnxruntime/orttraining/tools/ci_test/compare_huggingface.py

import sys
import json

# Command line: <script> <actual.json> <expected.json>
actual, expect = sys.argv[1], sys.argv[2]

# Parse the results produced by the run under test.
with open(actual) as file_actual:
  json_actual = json.load(file_actual)

# Parse the reference results the run is compared against.
with open(expect) as file_expect:
  json_expect = json.load(file_expect)

# loss curve match
def almost_equal(x, y, threshold=0.0001):
  """Return True when x and y differ by strictly less than threshold.

  The comparison is absolute (not relative). A difference exactly equal to
  threshold is treated as a mismatch, and a NaN difference never matches.
  """
  difference = abs(x - y)
  return difference < threshold

# Compare the two loss curves step by step.
# Failures are raised explicitly (rather than via `assert` statements) so the
# checks still run when Python is started with -O, which strips asserts.
steps_actual = json_actual['steps']
steps_expect = json_expect['steps']

for step_actual, step_expect in zip(steps_actual, steps_expect):
  print('step {} loss actual {:.6f} expected {:.6f}'.format(step_actual['step'], step_actual['loss'], step_expect['loss']))
  if step_actual['step'] != step_expect['step']:
    raise AssertionError('step index mismatch: actual {} expected {}'.format(step_actual['step'], step_expect['step']))
  if not almost_equal(step_actual['loss'], step_expect['loss']):
    raise AssertionError('loss mismatch at step {}: actual {:.6f} expected {:.6f}'.format(step_actual['step'], step_actual['loss'], step_expect['loss']))

# zip() stops at the shorter list, so verify the lengths separately. Checking
# after the loop keeps the per-step output for the common prefix visible. A run
# that recorded fewer (or more) steps than the reference must not pass.
if len(steps_actual) != len(steps_expect):
  raise AssertionError('step count mismatch: actual {} expected {}'.format(len(steps_actual), len(steps_expect)))

# perf match
# The measured throughput must reach at least 95% of the expected value.
# The failure is raised explicitly (rather than via an `assert` statement) so
# the check still runs when Python is started with -O, which strips asserts.
samples_per_second_actual = json_actual['samples_per_second']
samples_per_second_expect = json_expect['samples_per_second']
print('samples_per_second actual {:.3f} expected {:.3f}'.format(samples_per_second_actual, samples_per_second_expect))
# Written as `not (a >= b)` instead of `a < b` so a NaN measurement still fails.
if not (samples_per_second_actual >= 0.95*samples_per_second_expect):
  raise AssertionError('samples_per_second regression: actual {:.3f} is below 95% of expected {:.3f}'.format(samples_per_second_actual, samples_per_second_expect))