# Fixture data: every entry bundles a list of predictions, a parallel list of
# reference-answer lists, and the metric values stored under "result".
test_cases = [
    {
        "predictions": ["New York City", "Albert Einstein"],
        # One inner list per prediction (same order); each inner list here
        # contains its prediction verbatim alongside an alternative answer.
        "references": [
            ["New York City", "NYC"],
            ["Einstein", "Albert Einstein"],
        ],
        # NOTE(review): presumably the scores the metric under test should
        # produce for the inputs above -- confirm against the consumer.
        "result": {"exact_match": 1.0, "f1": 1.0},
    },
]