Created
July 22, 2011 06:10
-
-
Save cncuckoo/1098968 to your computer and use it in GitHub Desktop.
Wote用python语言写的imgHash.py
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
#!/usr/bin/python | |
import glob | |
import os | |
import sys | |
from PIL import Image | |
# File extensions treated as images when scanning a directory. Both lower-
# and upper-case spellings are listed because the names are used as glob
# patterns.
EXTS = ('jpg', 'jpeg', 'JPG', 'JPEG', 'gif', 'GIF', 'png', 'PNG')
def avhash(im):
    """Return the 64-bit average hash of an image as an integer.

    The image is shrunk to 8x8 pixels and converted to greyscale. Bit ``k``
    of the result is 1 when the ``k``-th pixel (in ``getdata()`` order) is
    greater than or equal to the mean of all 64 pixels, and 0 otherwise.

    im -- either an already opened ``PIL.Image.Image`` or anything that
          ``Image.open`` accepts (for example a file path).
    """
    if not isinstance(im, Image.Image):
        im = Image.open(im)

    # Image.ANTIALIAS was removed in Pillow 10; LANCZOS is the current name
    # of the same filter. Fall back to the old name for installations that
    # predate LANCZOS.
    resample = getattr(Image, 'LANCZOS', None)
    if resample is None:
        resample = Image.ANTIALIAS

    # Materialise the pixels once: they are needed for the mean and again
    # for the per-pixel comparison.
    pixels = list(im.resize((8, 8), resample).convert('L').getdata())
    avg = sum(pixels) / 64.

    bits = 0
    for pos, value in enumerate(pixels):
        if value >= avg:
            bits |= 1 << pos
    return bits
def hamming(h1, h2):
    """Return the Hamming distance between two integer hashes.

    The distance is the number of bit positions in which ``h1`` and ``h2``
    differ, i.e. the number of 1 bits in ``h1 ^ h2``.

    Raises ValueError when ``h1 ^ h2`` is negative (the operands have
    different signs): such a value has no finite count of set bits.
    """
    diff = h1 ^ h2
    if diff < 0:
        raise ValueError("hamming() needs hashes of the same sign")
    # bin() yields '0b...' for non-negative ints, so counting the '1'
    # characters counts exactly the set bits.
    return bin(diff).count('1')
if __name__ == '__main__':
    # Command-line entry point: rank the images found in a directory by how
    # close their average hash is to that of a reference image.
    #
    #   argv[1]  reference image
    #   argv[2]  optional directory to scan (defaults to the current one)
    if len(sys.argv) <= 1 or len(sys.argv) > 3:
        # sys.exit(message) prints to stderr and exits with status 1, so a
        # bad invocation is not mistaken for a successful run.
        sys.exit("Usage: %s image.jpg [dir]" % sys.argv[0])

    im = sys.argv[1]
    wd = '.' if len(sys.argv) < 3 else sys.argv[2]

    # Hash the reference image before changing directory so that a relative
    # path to it is resolved against the directory the script started in.
    h = avhash(im)
    os.chdir(wd)

    # Where glob matching is case-insensitive, '*.jpg' and '*.JPG' return
    # the same files; keep only the first occurrence of each name so that
    # no image is hashed and reported twice.
    images = []
    seen = set()
    for ext in EXTS:
        for name in glob.glob('*.%s' % ext):
            if name not in seen:
                seen.add(name)
                images.append(name)

    total = len(images)
    # Draw a progress bar only for larger batches on an interactive terminal.
    show_progress = total > 50 and sys.stdout.isatty()

    seq = []
    for done, f in enumerate(images, 1):
        seq.append((f, hamming(avhash(f), h)))
        if show_progress:
            perc = 100. * done / total
            x = int(2 * perc / 5)  # 40-character bar, one '#' per 2.5%
            # '\r' returns to the start of the line so the bar is redrawn
            # in place.
            sys.stdout.write('\rCalculating... [%s%s] %.2f%% (%d/%d)'
                             % ('#' * x, ' ' * (40 - x), perc, done, total))
            sys.stdout.flush()
    if show_progress:
        # Finish the progress line before printing the results.
        sys.stdout.write('\n')

    # Smallest distance (most similar image) first.
    for f, ham in sorted(seq, key=lambda i: i[1]):
        sys.stdout.write("%d\t%s\n" % (ham, f))
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment
摘自:http://www.ruanyifeng.com/blog/2011/07/principle_of_similar_image_search.html