tf AlexNet

# encoding:utf-8
# author:wht@92
from datetime import datetime
import math
import time
import tensorflow as tf
 
def print_activations(t):
 print(t.op.name, ' ', t.get_shape().as_list())
 
def inference(images):
 parameters = []
 with tf.name_scope('conv1') as scope:
  kernel = tf.Variable(tf.truncated_normal([11,11,3,64],dtype=tf.float32,stddev=1e-1),name='weights')
  conv = tf.nn.conv2d(images, kernel, [1,4,4,1], padding='SAME')
  biases = tf.Variable(tf.constant(0.0, shape=[64], dtype=tf.float32),trainable=True, name='biases')
  bias = tf.nn.bias_add(conv, biases)
  conv1 = tf.nn.relu(bias, name=scope)
  print_activations(conv1)
  parameters += [kernel,biases]
 lrn1 = tf.nn.lrn(conv1, 4, bias=1.0, alpha=0.001/9, beta=0.75, name='lrn1')
 pool1 = tf.nn.max_pool(lrn1, ksize=[1,3,3,1], strides=[1,2,2,1], padding='VALID', name='pool1')
 print_activations(pool1)
 with tf.name_scope('conv2') as scope:
  kernel = tf.Variable(tf.truncated_normal([5,5,64,192],dtype=tf.float32, stddev=1e-1), name='weights')
  conv = tf.nn.conv2d(pool1, kernel, [1,1,1,1],padding='SAME')
  biases = tf.Variable(tf.constant(0.0,shape=[192],dtype=tf.float32), trainable=True, name='biases')
  bias = tf.nn.bias_add(conv, biases)
  conv2 = tf.nn.relu(bias, name=scope)
  parameters += [kernel, biases]
  print_activations(conv2)
 lrn2 = tf.nn.lrn(conv2, 4, bias=1.0, alpha=0.001/9, beta=0.75, name='lrn2')
 pool2 = tf.nn.max_pool(lrn2, ksize=[1,3,3,1], strides=[1,2,2,1], padding='VALID',name='pool2')
 print_activations(pool2)
 with tf.name_scope('conv3') as scope:
  kernel = tf.Variable(tf.truncated_normal([3,3,192,384], dtype=tf.float32, stddev=1e-1), name='weights')
  conv = tf.nn.conv2d(pool2, kernel, [1,1,1,1], padding='SAME')
  biases = tf.Variable(tf.constant(0.0, shape=[384], dtype=tf.float32), trainable=True, name='biases')
  bias = tf.nn.bias_add(conv, biases)
  conv3 = tf.nn.relu(bias, name=scope)
  parameters += [kernel, biases]
  print_activations(conv3)
 with tf.name_scope('conv4') as scope:
  kernel = tf.Variable(tf.truncated_normal([3,3,384,256], dtype=tf.float32, stddev=1e-1), name='weights')
  conv = tf.nn.conv2d(conv3, kernel, [1,1,1,1], padding='SAME')
  biases = tf.Variable(tf.constant(0.0, shape=[256], dtype=tf.float32), trainable=True, name='biases')
  bias = tf.nn.bias_add(conv,biases)
  conv4 = tf.nn.relu(bias, name=scope)
  parameters += [kernel, biases]
  print_activations(conv4)
 with tf.name_scope('conv5') as scope:
  kernel = tf.Variable(tf.truncated_normal([3,3,256,256],dtype=tf.float32,stddev=1e-1), name='weights')
  conv = tf.nn.conv2d(conv4,kernel, [1,1,1,1], padding='SAME')
  biases = tf.Variable(tf.constant(0.0, shape=[256], dtype=tf.float32), trainable=True, name='biases')
  bias = tf.nn.bias_add(conv,biases)
  conv5 = tf.nn.relu(bias, name=scope)
  parameters += [kernel, biases]
  print_activations(conv5)
 pool5 = tf.nn.max_pool(conv5, ksize=[1,3,3,1], strides=[1,2,2,1], padding='VALID', name='pool5')
 print_activations(pool5)
 return pool5, parameters
 def time_tensorflow_run(session, target, info_string):
 num_steps_burn_in = 10
 total_duration = 0.0 
 total_duration_squared = 0.0
 for i in range(num_batches + num_steps_burn_in):
  start_time = time.time()
  _ = session.run(target)
  duration = time.time() - start_time
  if i >= num_steps_burn_in:
   if not i% 10 :
    print('%s: step %d, duration= %.3f' % (datetime.now(), i - num_steps_burn_in, duration))
   total_duration += duration
   total_duration_squared += duration *duration
 mn = total_duration / num_batches
 vr = total_duration_squared / num_batches - mn*mn
 sd = math.sqrt(vr)
 print('%s : %s across %d steps, %.3f +/- %.3f sec/batch' %(datetime.now(), info_string, num_batches, mn, sd))
def run_benchmark():
 with tf.Graph().as_default():
  image_size = 224 
  images = tf.Variable(tf.random_normal([batch_size,
                                      image_size,
                                      image_size, 3],
                                      dtype=tf.float32,
                                      stddev=1e-1))
  pool5, parameters = inference(images)
  init = tf.global_variables_initializer()
  sess = tf.Session()
  sess.run(init)
  time_tensorflow_run(sess, pool5, "Forward")
  objective = tf.nn.l2_loss(pool5)
  grad = tf.gradients(objective, parameters)
  time_tensorflow_run(sess, grad, "Forward-backward")
  
run_benchmark()
AlexNet是由Alex Krizhevsky等人在2012年提出的一个深度卷积神经网络(Convolutional Neural Network,CNN),它在ImageNet图像识别挑战赛中取得了显著突破,首次击败了传统的计算机视觉方法。这标志着深度学习在计算机视觉领域的重大进展。 在TensorFlow框架中,AlexNet可以被用来作为预训练模型,用于迁移学习任务,即在一个大型数据集(如ImageNet)上训练好的模型,在新的、具有相似任务的小规模数据集上进行微调。TensorFlow库提供了方便的接口,如`tf.keras.applications.AlexNet()`,可以直接加载预训练的AlexNet模型,并允许用户进行前向传播或对某些层进行修改和训练。 以下是使用AlexNet的基本步骤: 1. **导入模型**: ```python from tensorflow.keras.applications import AlexNet model = AlexNet(weights='imagenet') # 加载预训练权重 ``` 2. **冻结层**(如果不需要训练整个网络): ```python for layer in model.layers[:-10]: # 冻结除最后几层之外的层 layer.trainable = False ``` 3. **添加新层**(如果需要自定义输出): ```python new_output_layer = tf.keras.layers.Dense(units=...)(model.output) model = tf.keras.Model(inputs=model.input, outputs=new_output_layer) ``` 4. **编译和训练**(替换为新数据集): ```python model.compile(optimizer='adam', loss='categorical_crossentropy', metrics=['accuracy']) model.fit(x_train, y_train, epochs=..., validation_data=(x_val, y_val)) ```
评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值