import torch
from torchmetrics.multimodal import CLIPScore

# Example: evaluate CLIPScore several times and plot the resulting values.

# Build the metric from the named pretrained CLIP checkpoint.
metric = CLIPScore(model_name_or_path="openai/clip-vit-base-patch16")

# Call the metric 10 times, each time on a fresh random integer tensor of
# shape (3, 224, 224) paired with the same caption, and keep every result.
# NOTE: the upper bound of torch.randint is exclusive, so the sampled values
# lie in [0, 254].
values = [
    metric(torch.randint(255, (3, 224, 224)), "a photo of a cat")
    for _ in range(10)
]

# Plot the collected values; the call returns a pair, unpacked here as
# (fig_, ax_) -- presumably the figure and axes objects of the plot.
fig_, ax_ = metric.plot(values)