# 使用 BLIP 为图像生成描述 (Generate image captions with BLIP)

import gc
import os
from PIL import Image
from transformers import BlipProcessor, BlipForConditionalGeneration
# Batch-caption every image in `path` with BLIP and write one caption file
# per image into `out_path` (same base name, ".txt" extension).

# Load the BLIP processor and captioning model from the local checkpoint folder.
processor = BlipProcessor.from_pretrained("./checkpoints/Salesforceblip-image-captioning-large")
model = BlipForConditionalGeneration.from_pretrained("./checkpoints/Salesforceblip-image-captioning-large")

path = r"C:\Users\pc\Desktop\sd_train\images"
out_path = r"C:\Users\pc\Desktop\sd_train\labels"
# Make sure the label directory exists so the first write cannot fail.
os.makedirs(out_path, exist_ok=True)
images = os.listdir(path)

# Text prefix passed to the processor for conditional image captioning.
# It is the same for every image, so it is defined once outside the loop.
# (For unconditional captioning, call `processor(raw_image, return_tensors="pt")`
# without the text argument instead.)
text = "a gdgzcj style photography of"

for i in images:
    # splitext handles extensions of any length (".jpeg", ".webp", ...);
    # slicing off a fixed four characters only works for three-letter ones.
    txt_name = os.path.join(out_path, os.path.splitext(i)[0] + ".txt")
    image = os.path.join(path, i)

    # Skip entries that cannot be opened as images (sub-directories, stray
    # text files, corrupt downloads) rather than aborting the whole batch.
    # Pillow's UnidentifiedImageError is a subclass of OSError.
    try:
        with Image.open(image) as opened:
            # convert() returns a new, fully loaded image, so the file
            # handle can be released as soon as the `with` block ends.
            raw_image = opened.convert('RGB')
    except OSError as err:
        print(f"skipping {image}: {err}")
        continue

    inputs = processor(raw_image, text, return_tensors="pt")
    out = model.generate(**inputs)
    txt_prompts = processor.decode(out[0], skip_special_tokens=True)
    print(txt_prompts)

    # Write with an explicit encoding so the result does not depend on the
    # platform's default code page.
    with open(txt_name, 'w', encoding="utf-8") as file:
        file.write(txt_prompts)
gc.collect()


  • 8
    点赞
  • 11
    收藏
    觉得还不错? 一键收藏
  • 0
    评论

“相关推荐”对你有帮助么?

  • 非常没帮助
  • 没帮助
  • 一般
  • 有帮助
  • 非常有帮助
提交
评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值