Last active
January 2, 2025 05:21
-
-
Save conanak99/970857292f603781363b99dbbf20fabb to your computer and use it in GitHub Desktop.
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
# Install the dependencies first:
#   pip install transformers torch gradio Pillow requests
# (torch backs the return_tensors="pt" call below; requests is used by the
# download demo at the bottom of the file.)
from PIL import Image
from transformers import BlipProcessor, BlipForConditionalGeneration

# The processor and the model are both loaded from the same checkpoint name.
_BLIP_CHECKPOINT = "Salesforce/blip-image-captioning-base"
processor = BlipProcessor.from_pretrained(_BLIP_CHECKPOINT)
model = BlipForConditionalGeneration.from_pretrained(_BLIP_CHECKPOINT)
def generate_caption(raw_image: Image.Image) -> str:
    """Generate a text caption for an image using the module-level BLIP model.

    Args:
        raw_image: The PIL image to describe.

    Returns:
        The decoded caption, with special tokens stripped.
    """
    # "pt" asks the processor to return PyTorch tensors.
    inputs = processor(raw_image, return_tensors="pt")
    outputs = model.generate(**inputs)
    # A single image was passed in, so decode the first generated sequence.
    return processor.decode(outputs[0], skip_special_tokens=True)
# Download a sample image and try the captioner on it.
import requests

# Fetch the image. The timeout keeps the script from hanging forever on a
# stalled connection, and raise_for_status() surfaces HTTP errors directly
# instead of letting PIL fail on an error page it cannot parse as an image.
image_url = 'https://storage.googleapis.com/petbacker/images/blog/2017/dog-and-cat-cover.jpg'
response = requests.get(image_url, stream=True, timeout=30)
response.raise_for_status()
image = Image.open(response.raw)

# Run generate_caption and print the resulting caption.
caption = generate_caption(image)
# Example output: "a cat and dog are looking over a white sign"
print(caption)
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment