"""Create a Transformers pipeline for the GLM-OCR image-text-to-text model."""

from transformers import pipeline

# Module-level pipeline object for the "image-text-to-text" task, backed by
# the "zai-org/GLM-OCR" checkpoint. The model id is resolved by transformers
# (typically fetched from the Hugging Face Hub on first use, then cached).
pipe = pipeline("image-text-to-text", model="zai-org/GLM-OCR")