uberscientist · July 3, 2015 19:56
diff --git a/gistfile1.py b/gistfile1.py
 # could be a lot more readable if I just broke the deepdream out into a module...
 import os

 #Copied from deepdream iPython notebook
 # imports and basic notebook setup
 from cStringIO import StringIO
 import numpy as np
 import scipy.ndimage as nd
 import PIL.Image
 from google.protobuf import text_format

 import caffe

 model_path = '/opt/caffe/models/bvlc_googlenet/' # substitute your path here
 net_fn   = model_path + 'deploy.prototxt'
 param_fn = model_path + 'bvlc_googlenet.caffemodel'

 # Patching model to be able to compute gradients.
 # Note that you can also manually add "force_backward: true" line to "deploy.prototxt".
 model = caffe.io.caffe_pb2.NetParameter()
 text_format.Merge(open(net_fn).read(), model)
 model.force_backward = True
 open('tmp.prototxt', 'w').write(str(model))

 net = caffe.Classifier('tmp.prototxt', param_fn,
                       mean = np.float32([104.0, 116.0, 122.0]), # ImageNet mean, training set dependent
                       channel_swap = (2,1,0)) # the reference model has channels in BGR order instead of RGB

 # a couple of utility functions for converting to and from Caffe's input image layout
 def preprocess(net, img):
    return np.float32(np.rollaxis(img, 2)[::-1]) - net.transformer.mean['data']

 def deprocess(net, img):
    return np.dstack((img + net.transformer.mean['data'])[::-1])

 def make_step(net, step_size=1.5, end='inception_4c/output', jitter=32, clip=True):
    '''Basic gradient ascent step.'''

    src = net.blobs['data'] # input image is storred in Net's 'data' blob
    dst = net.blobs[end]

    ox, oy = np.random.randint(-jitter, jitter+1, 2)
    src.data[0] = np.roll(np.roll(src.data[0], ox, -1), oy, -2) # apply jitter shift
            
    net.forward(end=end)
    dst.diff[:] = dst.data  # specify the optimiation objective
    net.backward(start=end)
    g = src.diff[0]
    # apply normaized ascent step to the input image
    src.data[:] += step_size/np.abs(g).mean() * g

    src.data[0] = np.roll(np.roll(src.data[0], -ox, -1), -oy, -2) # unshift image
            
    if clip:
        bias = net.transformer.mean['data']
        src.data[:] = np.clip(src.data, -bias, 255-bias)

 def deepdream(net, base_img, iter_n=10, octave_n=4, octave_scale=1.4, end='inception_4c/output', clip=True, **step_params):
    # prepare base images for all octaves
    octaves = [preprocess(net, base_img)]
    for i in xrange(octave_n-1):
        octaves.append(nd.zoom(octaves[-1], (1, 1.0/octave_scale,1.0/octave_scale), order=1))
    
    src = net.blobs['data']
    detail = np.zeros_like(octaves[-1]) # allocate image for network-produced details
    for octave, octave_base in enumerate(octaves[::-1]):
        h, w = octave_base.shape[-2:]
        if octave > 0:
            # upscale details from the previous octave
            h1, w1 = detail.shape[-2:]
            detail = nd.zoom(detail, (1, 1.0*h/h1,1.0*w/w1), order=1)

        src.reshape(1,3,h,w) # resize the network's input image size
        src.data[0] = octave_base+detail
        for i in xrange(iter_n):
            make_step(net, end=end, clip=clip, **step_params)
            
            # visualization
            vis = deprocess(net, src.data[0])
            if not clip: # adjust image contrast if clipping is disabled
                vis = vis*(255.0/np.percentile(vis, 99.98))
            print octave, i, end, vis.shape
            #clear_output(wait=True)
            
        # extract details produced on the current octave
        detail = src.data[0]-octave_base
    # returning the resulting image
    return deprocess(net, src.data[0])

 #This is where we process the video
 #/frames directory contains frames extracted from the original video
 frame_files = os.listdir('frames/')
 frame_files.sort()

 prev_frame = False
 frame_i = 1

 for file in frame_files:
    print file
    pil_img = PIL.Image.open('frames/' + file)

    if prev_frame: #if prev_frame, combine images
        pil_img = PIL.Image.blend(pil_img, prev_frame, 0.15)

    img = np.float32(pil_img)

    pframe = deepdream(net, img, iter_n=10, octave_n=2, end='inception_4b/3x3_reduce')

    prev_frame = PIL.Image.fromarray(np.uint8(pframe))
    prev_frame.save("pframes/%04d.jpg"%frame_i)
    frame_i += 1
	# could be a lot more readable if I just broke the deepdream out into a module...
	import os

	#Copied from deepdream iPython notebook
	# imports and basic notebook setup
	from cStringIO import StringIO
	import numpy as np
	import scipy.ndimage as nd
	import PIL.Image
	from google.protobuf import text_format

	import caffe

	model_path = '/opt/caffe/models/bvlc_googlenet/' # substitute your path here
	net_fn = model_path + 'deploy.prototxt'
	param_fn = model_path + 'bvlc_googlenet.caffemodel'

	# Patching model to be able to compute gradients.
	# Note that you can also manually add "force_backward: true" line to "deploy.prototxt".
	model = caffe.io.caffe_pb2.NetParameter()
	text_format.Merge(open(net_fn).read(), model)
	model.force_backward = True
	open('tmp.prototxt', 'w').write(str(model))

	net = caffe.Classifier('tmp.prototxt', param_fn,
	mean = np.float32([104.0, 116.0, 122.0]), # ImageNet mean, training set dependent
	channel_swap = (2,1,0)) # the reference model has channels in BGR order instead of RGB

	# a couple of utility functions for converting to and from Caffe's input image layout
	def preprocess(net, img):
	return np.float32(np.rollaxis(img, 2)[::-1]) - net.transformer.mean['data']

	def deprocess(net, img):
	return np.dstack((img + net.transformer.mean['data'])[::-1])

	def make_step(net, step_size=1.5, end='inception_4c/output', jitter=32, clip=True):
	'''Basic gradient ascent step.'''

	src = net.blobs['data'] # input image is storred in Net's 'data' blob
	dst = net.blobs[end]

	ox, oy = np.random.randint(-jitter, jitter+1, 2)
	src.data[0] = np.roll(np.roll(src.data[0], ox, -1), oy, -2) # apply jitter shift

	net.forward(end=end)
	dst.diff[:] = dst.data # specify the optimiation objective
	net.backward(start=end)
	g = src.diff[0]
	# apply normaized ascent step to the input image
	src.data[:] += step_size/np.abs(g).mean() * g

	src.data[0] = np.roll(np.roll(src.data[0], -ox, -1), -oy, -2) # unshift image

	if clip:
	bias = net.transformer.mean['data']
	src.data[:] = np.clip(src.data, -bias, 255-bias)

	def deepdream(net, base_img, iter_n=10, octave_n=4, octave_scale=1.4, end='inception_4c/output', clip=True, **step_params):
	# prepare base images for all octaves
	octaves = [preprocess(net, base_img)]
	for i in xrange(octave_n-1):
	octaves.append(nd.zoom(octaves[-1], (1, 1.0/octave_scale,1.0/octave_scale), order=1))

	src = net.blobs['data']
	detail = np.zeros_like(octaves[-1]) # allocate image for network-produced details
	for octave, octave_base in enumerate(octaves[::-1]):
	h, w = octave_base.shape[-2:]
	if octave > 0:
	# upscale details from the previous octave
	h1, w1 = detail.shape[-2:]
	detail = nd.zoom(detail, (1, 1.0h/h1,1.0w/w1), order=1)

	src.reshape(1,3,h,w) # resize the network's input image size
	src.data[0] = octave_base+detail
	for i in xrange(iter_n):
	make_step(net, end=end, clip=clip, **step_params)

	# visualization
	vis = deprocess(net, src.data[0])
	if not clip: # adjust image contrast if clipping is disabled
	vis = vis*(255.0/np.percentile(vis, 99.98))
	print octave, i, end, vis.shape
	#clear_output(wait=True)

	# extract details produced on the current octave
	detail = src.data[0]-octave_base
	# returning the resulting image
	return deprocess(net, src.data[0])

	#This is where we process the video
	#/frames directory contains frames extracted from the original video
	frame_files = os.listdir('frames/')
	frame_files.sort()

	prev_frame = False
	frame_i = 1

	for file in frame_files:
	print file
	pil_img = PIL.Image.open('frames/' + file)

	if prev_frame: #if prev_frame, combine images
	pil_img = PIL.Image.blend(pil_img, prev_frame, 0.15)

	img = np.float32(pil_img)

	pframe = deepdream(net, img, iter_n=10, octave_n=2, end='inception_4b/3x3_reduce')

	prev_frame = PIL.Image.fromarray(np.uint8(pframe))
	prev_frame.save("pframes/%04d.jpg"%frame_i)
	frame_i += 1
No results found