# Example: score the same prediction against its references several times
# with BLEUScore and plot the collected values.
from torchmetrics.text import BLEUScore

metric = BLEUScore()

# One candidate sentence, and for that candidate a list of reference sentences.
preds = ['the cat is on the mat']
target = [['there is a cat on the mat', 'a cat is on the mat']]

# Call the metric ten times on the same inputs, keeping each returned value.
# The calls stay sequential and in order, exactly as in the explicit loop form.
values = [metric(preds, target) for _ in range(10)]

# `plot` is given the list of collected values; its result is unpacked as a
# pair (presumably a matplotlib figure and axes -- confirm against the
# torchmetrics plotting docs).
fig_, ax_ = metric.plot(values)