TensorFlow Lite模型量化方法

Replete

于 2021-04-19 09:35:08 发布

阅读量219

点赞数

文章标签： tensorflow python 深度学习 机器学习 人工智能

本文链接：https://blog.csdn.net/weixin_38906715/article/details/125675915

版权

## CUDA_VISIBLE_DEVICES=-1 tflite_convert --saved_model_dir ./sfz1model/ --output_file ./tflite/sfz1.tflite
def convert2f16(modeldir='./sfz1model', tfdir='./tflite/float16.tflite'):
    """Convert a SavedModel to a float16-quantized TensorFlow Lite file.

    Args:
        modeldir: Directory of the SavedModel to convert.
        tfdir: Path of the ``.tflite`` file to write. Missing parent
            directories are created.
    """
    import os

    # Create the output directory up front so a missing folder is not
    # discovered only after the conversion has already been done.
    outdir = os.path.dirname(tfdir)
    if outdir:
        os.makedirs(outdir, exist_ok=True)

    tfconverter = tf.lite.TFLiteConverter.from_saved_model(modeldir)
    # float16 quantization
    tfconverter.optimizations = [tf.lite.Optimize.DEFAULT]
    tfconverter.target_spec.supported_types = [tf.float16]
    saved_model_tflite = tfconverter.convert()

    with open(tfdir, 'wb') as f:
        f.write(saved_model_tflite)

def convert2f8if32(modeldir='./sfz1model', tfdir='./tflite/i8f32.tflite'):
    """Convert a SavedModel to a TensorFlow Lite file with default optimization.

    Only ``tf.lite.Optimize.DEFAULT`` is enabled; no supported types, op set
    or representative dataset is configured.

    Args:
        modeldir: Directory of the SavedModel to convert.
        tfdir: Path of the ``.tflite`` file to write. Missing parent
            directories are created.
    """
    import os

    # Create the output directory up front so a missing folder is not
    # discovered only after the conversion has already been done.
    outdir = os.path.dirname(tfdir)
    if outdir:
        os.makedirs(outdir, exist_ok=True)

    tfconverter = tf.lite.TFLiteConverter.from_saved_model(modeldir)
    # int8 / float32 hybrid quantization
    # NOTE(review): presumably what the TF Lite docs call dynamic range
    # quantization -- confirm against the installed TensorFlow version.
    tfconverter.optimizations = [tf.lite.Optimize.DEFAULT]
    saved_model_tflite = tfconverter.convert()

    with open(tfdir, 'wb') as f:
        f.write(saved_model_tflite)


from nets.resnetsfz import *
# Height and width handed to the SfzGen data generator below.
h = 135
w = 240
BATCH_SIZE = 1
val_split = 0.1
# Module-level generator that data_gen() draws its samples from.
# The last argument is an empty list.
gen = SfzGen(BATCH_SIZE, w, h, val_split, [])
def data_gen():
    """Yield 100 samples drawn from the module-level ``gen``.

    Each item produced by ``gen.generate(True)`` is unpacked as a pair; the
    first element is yielded wrapped in a one-item list and the second is
    discarded.
    """
    data = gen.generate(True)
    for _ in range(100):
        x, _unused = next(data)
        # Model has only one input so each data point has one element.
        yield [x]
# mnist_train, _ = tf.keras.datasets.mnist.load_data()
# images = tf.cast(mnist_train[0], tf.float32) / 255.0
# mnist_ds = tf.data.Dataset.from_tensor_slices((images)).batch(1)
# def representative_data_gen():
#   for input_value in mnist_ds.take(100):
#     # Model has only one input so each data point has one element.
#     yield [input_value]

def convert2int8(modeldir='./sfz1model', tfdir='./tflite/int8.tflite',
                 representative_dataset=None):
    """Convert a SavedModel to an integer-quantized TensorFlow Lite file.

    The converter is restricted to the ``TFLITE_BUILTINS_INT8`` op set and
    the model's input and output types are set to ``tf.uint8``.

    Args:
        modeldir: Directory of the SavedModel to convert.
        tfdir: Path of the ``.tflite`` file to write. Missing parent
            directories are created.
        representative_dataset: Callable handed to the converter as its
            representative dataset. Defaults to the module-level
            ``data_gen``.
    """
    import os

    if representative_dataset is None:
        representative_dataset = data_gen

    # Create the output directory up front so a missing folder is not
    # discovered only after the conversion has already been done.
    outdir = os.path.dirname(tfdir)
    if outdir:
        os.makedirs(outdir, exist_ok=True)

    tfconverter = tf.lite.TFLiteConverter.from_saved_model(modeldir)
    # Integer quantization: only int8 builtin ops, uint8 input and output.
    tfconverter.optimizations = [tf.lite.Optimize.DEFAULT]
    tfconverter.target_spec.supported_ops = [
        tf.lite.OpsSet.TFLITE_BUILTINS_INT8,
    ]
    tfconverter.inference_input_type = tf.uint8
    tfconverter.inference_output_type = tf.uint8
    tfconverter.representative_dataset = representative_dataset

    saved_model_tflite = tfconverter.convert()

    with open(tfdir, 'wb') as f:
        f.write(saved_model_tflite)

Frank Wang：TensorFlow Lite量化方法介绍

Replete

关注

0
点赞
踩
0

收藏

觉得还不错? 一键收藏
0
评论
TensorFlow Lite模型量化方法

##CUDA_VISIBLE_DEVICES=-1& tflite_convert --saved_model_dir ./sfz1model/ --output_file ./tflite/sfz1.tflitdef convert2f16(): modeldir='./sfz1model' tfdir='./tflite/float16.tflite' tf...
复制链接

扫一扫