from transformers import TrOCRProcessor, VisionEncoderDecoderModel from PIL import Image import requests import gradio as gr processor = TrOCRProcessor.from_pretrained('microsoft/trocr-base-printed') model = VisionEncoderDecoderModel.from_pretrained('microsoft/trocr-base-printed') def ocr(image): pixel_values = processor(images=image, return_tensors="pt").pixel_values generated_ids = model.generate(pixel_values) generated_text = processor.batch_decode(generated_ids, skip_special_tokens=True)[0] return generated_text demo = gr.Interface(fn=ocr, inputs='image', outputs='text', title = "ocr", examples = ['printed.jpg']) if __name__ == "__main__": demo.queue(concurrency_count=3).launch(server_name = "0.0.0.0", server_port = 7011)