In [1]:
import sklearn
import numpy as np
In [2]:
import os
import re
In [3]:
# Index every image under dataset/lfw/ by (person folder name, image number).
# The image number is the first run of four digits in the file name, stored as
# an int. Example entry:
#   dataset[('Mehdi_Ghanimifard', 1)] == 'dataset/lfw/Mehdi_Ghanimifard/Mehdi_Ghanimifard_0001.jpg'
dataset = {
    (folder_name, int(image_number)): "dataset/lfw/%s/%s" % (folder_name, file_name)
    for folder_name in os.listdir("dataset/lfw/")
    # Ignore stray files that sit next to the per-person folders.
    if os.path.isdir("dataset/lfw/" + folder_name)
    for file_name in os.listdir("dataset/lfw/" + folder_name)
    # `[:1]` yields the first four-digit match, or nothing at all when the file
    # name has none (hidden/system files), so such files are skipped instead of
    # raising IndexError.
    for image_number in re.findall(r"\d\d\d\d", file_name)[:1]
}
In [ ]:
In [4]:
# Parse the tab-separated attribute file into:
#   attributes  - list of column names taken from the second line (index 1)
#   dataset_att - dict mapping the first two fields of each data row (as a
#                 tuple of strings) to a float64 array of the remaining fields
# The first line (index 0) is ignored.
# NOTE(review): `attributes` and the value arrays are both sliced with [2:];
# if the header line starts with an extra marker column (e.g. "#"), the names
# would be shifted by one relative to the values - confirm against the file.
dataset_att = dict()
with open('dataset/pubfig_attributes.txt') as att_file:
    for index, line in enumerate(att_file):
        # Drop the line terminator so it does not end up glued to the last field.
        line = line.rstrip('\r\n')
        if not line:
            # Blank lines carry no record; skipping avoids a junk ('',) key.
            continue
        items = line.split('\t')
        if index == 1:
            attributes = items[2:]
        if index > 1:
            # np.float was removed in NumPy 1.24; np.float64 is the same dtype.
            dataset_att[tuple(items[:2])] = np.array(items[2:]).astype(np.float64)
In [ ]: