import gradio as gr from transformers import AutoProcessor, AutoModelForCausalLM, AutoConfig def inference(img): pretrained_model_path = "git-large-coco" processor = AutoProcessor.from_pretrained(pretrained_model_path) model = AutoModelForCausalLM.from_pretrained(pretrained_model_path) pixel_values = processor(images=img, return_tensors="pt").pixel_values generated_ids = model.generate(pixel_values=pixel_values, max_length=50) generated_caption = processor.batch_decode(generated_ids, skip_special_tokens=True)[0] return generated_caption title = "Image to text:git-large-coco" article = "