按日期对照片进行分类整理

清华大佬耗费三个月吐血整理的几百G的资源,免费分享!....>>>

# -*- coding:utf-8 -*-
__author__ = 'Barry'


from PIL import Image
from PIL.ExifTags import TAGS
from datetime import datetime
from hashlib import md5
import time
import os
import shutil
import fnmatch
import random


def IterFindFiles(path, fnexp):
    for root, dirs, files in os.walk(path):
        for filename in fnmatch.filter(files, fnexp):
            yield os.path.join(root, filename)

def GenRandomStr():
    str = ''
    chars = 'ABCDEFGHIJKLMNOPQRSTUVWXYZ01234567890'
    for num in range(10):
        str += random.choice(chars)
    return str

def GetPicPath():
    pic_full_path = []
    if os.path.isdir(input_path):
        for i in os.listdir(input_path):
            sub_dir = input_path + '/' + i
            if os.path.isdir(sub_dir):
                for n in os.listdir(sub_dir):
                    pic_full_path.append(sub_dir + '/' + n)
    return pic_full_path


def print_all_know_exif_tags():
	for k in sorted(TAGS):
		print k, TAGS[k]

def FormatTime(date):
    try:
        ts = time.mktime(time.strptime(date,'%Y:%m:%d %H:%M:%S'))
        return time.strftime('%Y-%m-%d %H:%M:%S',time.localtime(ts))
    except Exception, e:
        return False

def TrimTime(mtime):
    ts = time.mktime(time.strptime(mtime,'%Y-%m-%d %H:%M:%S'))
    return time.strftime('%Y%m%d',time.localtime(ts))

def CalcDays(mtime,birth_day):
    time_fmt = '%Y%m%d'
    days_born = (datetime.strptime(mtime,time_fmt) - datetime.strptime(birth_day,time_fmt)).days
    return str(days_born + 1)

def GenMd5(filename):
    file_tmp = open(filename,'rb')
    md5_value = md5(file_tmp.read())
    file_tmp.close()
    return md5_value.hexdigest()

def GetPicExif():
    pic_date = {}
    #pic_path = GetPicPath()
    for filename in IterFindFiles(input_path,fnexp):
        mtime = time.strftime('%Y-%m-%d %H:%M:%S',time.localtime(os.stat(filename).st_mtime))
    	try:
            img = Image.open(filename)
    	except Exception, e:
    		print filename,"skipping due to ",e
        try:
            exif_data = img._getexif()
        except Exception, e:
            print filename,"skipping due to ",e
        finally:
            if exif_data:
                if exif_data.has_key(36867):
                    pic_date[filename] = FormatTime(exif_data[36867]) and FormatTime(exif_data[36867])  or mtime
                elif exif_data.has_key(36868):
                    pic_date[filename] = FormatTime(exif_data[36868]) and FormatTime(exif_data[36868])  or mtime
                elif exif_data.has_key(306):
                    pic_date[filename] = FormatTime(exif_data[306]) and FormatTime(exif_data[306]) or mtime
                else:
                    pic_date[filename] = mtime
            else:
                pic_date[filename] = mtime

    return pic_date

def ArchivePic():
    pic_date = GetPicExif()
    new_dir_file_md5_list = []
    for pic,mtime in pic_date.items():
        std_out = "\033[1;33mAdd new picture \033[1;31m%s\033[0m\033[1;33m to dest path:%s\033[0m"%(os.path.split(pic)[1],output_path)
        new_dir = "%s/%s-(%sdays)"%(output_path,TrimTime(mtime),CalcDays(TrimTime(mtime),birth_day))
        if not os.path.exists(new_dir):
            os.mkdir(new_dir)
        new_file_name = '%s-%s-%s%s'%(pic_prefix,TrimTime(mtime),GenRandomStr(),pic_suffix)
        new_file_path = '%s/%s'%(new_dir,new_file_name)
        if not os.path.exists(new_file_path):
            try:
                if os.listdir(new_dir):
                    for i in os.listdir(new_dir):
                        hashvalue = GenMd5(os.path.join(new_dir,i))
                        new_dir_file_md5_list.append(hashvalue)
                    if GenMd5(pic) not in new_dir_file_md5_list:
                        shutil.copy2(pic,new_file_path)
                        print std_out
                else:
                    shutil.copy2(pic,new_file_path)
                    print std_out
            except Exception, e:
                print e
        else:
            while True:
                new_file_name = '%s-%s-%s%s'%(pic_prefix,TrimTime(mtime),GenRandomStr(),pic_suffix)
                if new_file_name not in os.lisdir(new_dir):
                    break
                else:
                    continue
            new_file_path = '%s/%s'%(new_dir,new_file_name)
            for i in os.listdir(new_dir):
                hashvalue = GenMd5(os.path.join(new_dir,i))
                new_dir_file_md5_list.append(hashvalue)
            if GenMd5(pic) not in new_dir_file_md5_list:
                try:
                    shutil.copy2(pic,new_file_path)
                    print std_out
                except Exception, e:
                    print e
    return 


if __name__ == "__main__":
    #input_path = r"D:\baby/"
    input_path = r"C:\users\xxr12\onedrive\pictures"
    #input_path = r"E:\MemArchPic"
    output_path = r"E:\Mybaby"
    fnexp = "*.jpg"
    pic_suffix = ".jpg"   #如果查找的是jpg文件,那文件后缀名也要匹配
    pic_prefix = "MYBABY"
    birth_day = '20150621'
    if not os.path.exists(output_path): 
        os.mkdir(output_path)
    if not os.path.exists(input_path):
        print "some of path not found!"
    else:
        ArchivePic()
    #print_all_know_exif_tags()