diff --git a/README.md b/README.md index c1e4639..a5bcb2b 100644 --- a/README.md +++ b/README.md @@ -33,7 +33,7 @@ model = AlignModel.from_pretrained("kakaobrain/align-base") url = "http://images.cocodataset.org/val2017/000000039769.jpg" image = Image.open(requests.get(url, stream=True).raw) -inputs = processor(text=["a photo of a cat", "a photo of a dog"], images=image, return_tensors="pt", padding=True) +inputs = processor(text=["a photo of a cat", "a photo of a dog"], images=image, return_tensors="pt") outputs = model(**inputs) logits_per_image = outputs.logits_per_image # this is the image-text similarity score