# Fixture table: every entry of ``test_cases`` is a dict holding a list of
# prediction strings, an equally long list of reference strings, and a
# ``result`` dict with a single ``metric_score`` value.
# NOTE(review): ``result`` is presumably the output expected from the metric
# under test for that input pair -- confirm against the consuming test harness.
test_cases = [
    {
        "predictions": predicted,
        "references": reference,
        "result": {"metric_score": score},
    }
    for predicted, reference, score in (
        # Predictions and references have no word in common.
        (
            ["blu red yellow", "green orange violet"],
            ["pizza spaghetti mandolino", "piplup prinplup empoleon"],
            0,
        ),
        # Each prediction shares words with its reference but is not the
        # same string.
        (
            ["a random string", "another string maybe"],
            ["random random string", "string string maybe"],
            1,
        ),
        # First pair is identical; second pair differs after "conda".
        (
            ["conda search evaluate", "conda search transformers"],
            ["conda search evaluate", "conda install pytorch"],
            0.5,
        ),
    )
]