Python基于百度API 图片识别+文字转语音

最新推荐文章于 2024-06-13 16:50:23 发布

不知火猪

最新推荐文章于 2024-06-13 16:50:23 发布

阅读量793

点赞数 2

分类专栏： python 文章标签： python 图文识别语音合成

本文链接：https://blog.csdn.net/qq_21405949/article/details/99687897

版权

python 专栏收录该内容

5 篇文章 0 订阅

订阅专栏

#!/usr/bin/env python3
# -*- coding: utf-8 -*-

'''
    功能：利用百度官方api，读取图片中的文字，同时将文字转换成语音
    官方地址：http://ai.baidu.com/docs#/OCR-Python-SDK/top
'''


import os

from aip import AipOcr, AipSpeech


""" 你的 APPID AK SK """
# Baidu AI platform credentials (APP ID / API key / secret key).
# They are read from environment variables so that real secrets never have to
# be written into the source file. The placeholder defaults only keep the
# names defined (so the client constructors below do not fail with NameError);
# they must be replaced with real values before the Baidu services will
# accept any request.
APP_ID = os.environ.get('BAIDU_APP_ID', 'your-app-id')
API_KEY = os.environ.get('BAIDU_API_KEY', 'your-api-key')
SECRET_KEY = os.environ.get('BAIDU_SECRET_KEY', 'your-secret-key')

# One SDK client per Baidu service, both built from the same credentials.
clientAipOcr = AipOcr(APP_ID, API_KEY, SECRET_KEY)
clientAipSpeech = AipSpeech(APP_ID, API_KEY, SECRET_KEY)

# Test image
picture_url = "http://image.bug2048.com/mongo20180906.jpg"


""" 读取图片 """
def get_file_content(filePath):
    """Return the raw bytes of the file located at ``filePath``.

    The file is opened in binary mode, so the content is returned as
    ``bytes`` without any text decoding.
    """
    with open(filePath, mode='rb') as image_file:
        payload = image_file.read()
    return payload

"""
    1.调用文字识别API识别图片上的文字
    2.拼接文字后调用语音合成API转换成语音
"""

def convert_picture_words():
    """Recognize the text in the test image and save it as spoken audio.

    Steps:
      1. Send ``picture_url`` to the OCR client (``basicGeneralUrl``).
      2. Join the recognized text fragments with commas and pass the result
         to the speech client (``synthesis``).
      3. On success, write the returned audio bytes to ``result.mp3`` in the
         current working directory.

    Returns:
        None. Progress and failures are reported with ``print``; nothing is
        written when OCR fails, when no text is recognized, or when speech
        synthesis returns an error.
    """
    ocr_result = clientAipOcr.basicGeneralUrl(picture_url)

    # A failed OCR request does not carry a 'words_result' key (the Baidu
    # docs describe an error payload instead), so report it rather than
    # crashing with KeyError.
    if not isinstance(ocr_result, dict) or 'words_result' not in ocr_result:
        print('ocr failed', ocr_result)
        return

    words = ','.join(item['words'] for item in ocr_result['words_result'])
    if not words:
        # Nothing recognized: there is no text to synthesize.
        return
    print('words-', words)

    # 'vol' and 'per' are synthesis options (volume and voice selection in
    # the Baidu speech API); the values are the ones this demo ships with.
    speech_result = clientAipSpeech.synthesis(words, 'zh', 1, {
        'vol': 5,
        'per': 3,
    })

    # On success the SDK returns the audio as binary data; on failure it
    # returns a dict describing the error.
    if isinstance(speech_result, dict):
        print('result', speech_result)
        return

    with open('result.mp3', 'wb') as f:
        f.write(speech_result)
    # Report success only after the file has been closed (and flushed).
    print('oook')


# Script entry point: run the OCR-to-speech demo only when this file is
# executed directly, not when it is imported as a module.
if __name__ == "__main__":
    convert_picture_words()