"""Encode a text prompt with CLIP and print its normalized embedding.

CLIP is a contrastive text/image encoder: it maps text and images into a
shared embedding space so they can be compared. It does not generate images.
This script therefore produces the text embedding for a prompt, which can be
compared (e.g. by cosine similarity) against image embeddings obtained from
``model.get_image_features``.
"""
import torch
from transformers import CLIPModel, CLIPProcessor

# Load the pre-trained model and processor
model = CLIPModel.from_pretrained("openai/clip-vit-base-patch32")
processor = CLIPProcessor.from_pretrained("openai/clip-vit-base-patch32")

# Define the text prompt
text_prompt = "a futuristic city at sunset"

# Tokenize the text prompt (no image is supplied, so only text tensors exist)
inputs = processor(text=[text_prompt], return_tensors="pt", padding=True)

# Encode the text only. Calling ``model(**inputs)`` here would fail because the
# joint forward pass also requires ``pixel_values``; ``get_text_features`` runs
# just the text tower and its projection head.
with torch.no_grad():
    text_features = model.get_text_features(**inputs)

# L2-normalize so that dot products with (normalized) image embeddings are
# cosine similarities.
text_features = text_features / text_features.norm(dim=-1, keepdim=True)

# Display the embedding (this is just an example; adjust as necessary for your
# chatbot framework)
print(text_features)