In [8]:
import pandas as pd
import numpy as np
import unicodedata
%matplotlib inline
In [9]:
# Relative path to the JSON file that holds the snippet records
SNIPPET_FILEPATH = "data/snippet-data.json"
In [10]:
# Read the snippet JSON file and keep only its 'data' column,
# which is what the later cells iterate over as snippet records.
data = pd.read_json(
    path_or_buf=SNIPPET_FILEPATH,
    orient='values',
)['data']
In [11]:
# Group snippets by museum art collection
def group_by_collection(data_set):
    """Map each snippet id to the name of its first listed art collection.

    Parameters
    ----------
    data_set : iterable of dict-like records
        Each record must provide an ``'id'`` entry (a missing ``'id'`` still
        raises ``KeyError``). The collection name is read from
        ``record['ocobjects'][0]['collections'][0]['name']``.

    Returns
    -------
    dict
        ``{snippet id: collection name}``. Each name is NFKD-normalized and
        then encoded to ASCII with unencodable characters dropped. Records
        whose collection name cannot be read (empty list, missing key,
        ``None`` or other non-text value) are reported on stdout and left
        out of the result.
    """
    names_by_id = {}
    for item in data_set:
        snippet_id = item['id']  # named so the built-in id() is not shadowed
        try:
            u_c_name = item['ocobjects'][0]['collections'][0]['name']
            # Decompose accented characters, then drop whatever is not ASCII
            c_name = unicodedata.normalize('NFKD', u_c_name).encode('ascii', 'ignore')
            names_by_id[snippet_id] = c_name
        except (IndexError, KeyError, TypeError):
            # IndexError: empty list; KeyError: field absent from the record;
            # TypeError: None / non-text value somewhere along the path.
            # Single-argument print() emits the same bytes as the original
            # comma-separated print statement on both Python 2 and Python 3.
            print("ID:  %s  | COLLECTION FIELD IS EMPTY." % (snippet_id,))
    return names_by_id
In [12]:
# Build the snippet-id -> collection-name mapping. Note that some snippets have
# empty collection fields; those are reported below and left out of the mapping.
collections = group_by_collection(data)
ID: 439 | COLLECTION FIELD IS EMPTY.
ID: 445 | COLLECTION FIELD IS EMPTY.
ID: 451 | COLLECTION FIELD IS EMPTY.
ID: 462 | COLLECTION FIELD IS EMPTY.
ID: 486 | COLLECTION FIELD IS EMPTY.
ID: 491 | COLLECTION FIELD IS EMPTY.
ID: 493 | COLLECTION FIELD IS EMPTY.
ID: 496 | COLLECTION FIELD IS EMPTY.
ID: 507 | COLLECTION FIELD IS EMPTY.
ID: 518 | COLLECTION FIELD IS EMPTY.
ID: 521 | COLLECTION FIELD IS EMPTY.
ID: 524 | COLLECTION FIELD IS EMPTY.
ID: 525 | COLLECTION FIELD IS EMPTY.
ID: 536 | COLLECTION FIELD IS EMPTY.
ID: 580 | COLLECTION FIELD IS EMPTY.
ID: 581 | COLLECTION FIELD IS EMPTY.
ID: 589 | COLLECTION FIELD IS EMPTY.
ID: 592 | COLLECTION FIELD IS EMPTY.
ID: 605 | COLLECTION FIELD IS EMPTY.
ID: 631 | COLLECTION FIELD IS EMPTY.
ID: 642 | COLLECTION FIELD IS EMPTY.
ID: 650 | COLLECTION FIELD IS EMPTY.
ID: 660 | COLLECTION FIELD IS EMPTY.
ID: 672 | COLLECTION FIELD IS EMPTY.
ID: 678 | COLLECTION FIELD IS EMPTY.
ID: 683 | COLLECTION FIELD IS EMPTY.
ID: 697 | COLLECTION FIELD IS EMPTY.
ID: 707 | COLLECTION FIELD IS EMPTY.
ID: 710 | COLLECTION FIELD IS EMPTY.
ID: 711 | COLLECTION FIELD IS EMPTY.
ID: 730 | COLLECTION FIELD IS EMPTY.
ID: 742 | COLLECTION FIELD IS EMPTY.
ID: 744 | COLLECTION FIELD IS EMPTY.
ID: 753 | COLLECTION FIELD IS EMPTY.
ID: 779 | COLLECTION FIELD IS EMPTY.
ID: 780 | COLLECTION FIELD IS EMPTY.
ID: 781 | COLLECTION FIELD IS EMPTY.
ID: 796 | COLLECTION FIELD IS EMPTY.
ID: 825 | COLLECTION FIELD IS EMPTY.
ID: 832 | COLLECTION FIELD IS EMPTY.
ID: 840 | COLLECTION FIELD IS EMPTY.
ID: 841 | COLLECTION FIELD IS EMPTY.
ID: 842 | COLLECTION FIELD IS EMPTY.
ID: 843 | COLLECTION FIELD IS EMPTY.
ID: 844 | COLLECTION FIELD IS EMPTY.
ID: 845 | COLLECTION FIELD IS EMPTY.
ID: 846 | COLLECTION FIELD IS EMPTY.
ID: 847 | COLLECTION FIELD IS EMPTY.
ID: 848 | COLLECTION FIELD IS EMPTY.
ID: 849 | COLLECTION FIELD IS EMPTY.
ID: 861 | COLLECTION FIELD IS EMPTY.
ID: 868 | COLLECTION FIELD IS EMPTY.
ID: 884 | COLLECTION FIELD IS EMPTY.
ID: 888 | COLLECTION FIELD IS EMPTY.
ID: 895 | COLLECTION FIELD IS EMPTY.
ID: 896 | COLLECTION FIELD IS EMPTY.
ID: 904 | COLLECTION FIELD IS EMPTY.
ID: 907 | COLLECTION FIELD IS EMPTY.
ID: 916 | COLLECTION FIELD IS EMPTY.
ID: 933 | COLLECTION FIELD IS EMPTY.
ID: 951 | COLLECTION FIELD IS EMPTY.
ID: 961 | COLLECTION FIELD IS EMPTY.
ID: 962 | COLLECTION FIELD IS EMPTY.
ID: 971 | COLLECTION FIELD IS EMPTY.
ID: 972 | COLLECTION FIELD IS EMPTY.
ID: 978 | COLLECTION FIELD IS EMPTY.
ID: 980 | COLLECTION FIELD IS EMPTY.
ID: 981 | COLLECTION FIELD IS EMPTY.
ID: 982 | COLLECTION FIELD IS EMPTY.
ID: 984 | COLLECTION FIELD IS EMPTY.
ID: 987 | COLLECTION FIELD IS EMPTY.
ID: 988 | COLLECTION FIELD IS EMPTY.
ID: 1000 | COLLECTION FIELD IS EMPTY.
ID: 1001 | COLLECTION FIELD IS EMPTY.
ID: 1003 | COLLECTION FIELD IS EMPTY.
ID: 1004 | COLLECTION FIELD IS EMPTY.
ID: 1007 | COLLECTION FIELD IS EMPTY.
ID: 1010 | COLLECTION FIELD IS EMPTY.
ID: 1016 | COLLECTION FIELD IS EMPTY.
ID: 1017 | COLLECTION FIELD IS EMPTY.
ID: 1019 | COLLECTION FIELD IS EMPTY.
ID: 1020 | COLLECTION FIELD IS EMPTY.
ID: 1021 | COLLECTION FIELD IS EMPTY.
ID: 1022 | COLLECTION FIELD IS EMPTY.
ID: 1023 | COLLECTION FIELD IS EMPTY.
ID: 1024 | COLLECTION FIELD IS EMPTY.
ID: 1025 | COLLECTION FIELD IS EMPTY.
ID: 1026 | COLLECTION FIELD IS EMPTY.
ID: 1033 | COLLECTION FIELD IS EMPTY.
ID: 1035 | COLLECTION FIELD IS EMPTY.
ID: 1042 | COLLECTION FIELD IS EMPTY.
ID: 1045 | COLLECTION FIELD IS EMPTY.
ID: 1050 | COLLECTION FIELD IS EMPTY.
ID: 1052 | COLLECTION FIELD IS EMPTY.
ID: 1057 | COLLECTION FIELD IS EMPTY.
ID: 1058 | COLLECTION FIELD IS EMPTY.
ID: 1061 | COLLECTION FIELD IS EMPTY.
ID: 1062 | COLLECTION FIELD IS EMPTY.
ID: 1066 | COLLECTION FIELD IS EMPTY.
ID: 1068 | COLLECTION FIELD IS EMPTY.
ID: 1069 | COLLECTION FIELD IS EMPTY.
ID: 1070 | COLLECTION FIELD IS EMPTY.
ID: 1071 | COLLECTION FIELD IS EMPTY.
ID: 1072 | COLLECTION FIELD IS EMPTY.
ID: 1074 | COLLECTION FIELD IS EMPTY.
ID: 1077 | COLLECTION FIELD IS EMPTY.
ID: 1082 | COLLECTION FIELD IS EMPTY.
ID: 1083 | COLLECTION FIELD IS EMPTY.
ID: 1084 | COLLECTION FIELD IS EMPTY.
ID: 1085 | COLLECTION FIELD IS EMPTY.
ID: 1089 | COLLECTION FIELD IS EMPTY.
ID: 1093 | COLLECTION FIELD IS EMPTY.
ID: 1094 | COLLECTION FIELD IS EMPTY.
ID: 1095 | COLLECTION FIELD IS EMPTY.
ID: 1096 | COLLECTION FIELD IS EMPTY.
ID: 1097 | COLLECTION FIELD IS EMPTY.
ID: 1099 | COLLECTION FIELD IS EMPTY.
ID: 1100 | COLLECTION FIELD IS EMPTY.
ID: 1101 | COLLECTION FIELD IS EMPTY.
ID: 1102 | COLLECTION FIELD IS EMPTY.
ID: 1103 | COLLECTION FIELD IS EMPTY.
ID: 1112 | COLLECTION FIELD IS EMPTY.
ID: 1114 | COLLECTION FIELD IS EMPTY.
ID: 1115 | COLLECTION FIELD IS EMPTY.
ID: 1121 | COLLECTION FIELD IS EMPTY.
ID: 1125 | COLLECTION FIELD IS EMPTY.
ID: 1128 | COLLECTION FIELD IS EMPTY.
ID: 1130 | COLLECTION FIELD IS EMPTY.
ID: 1134 | COLLECTION FIELD IS EMPTY.
ID: 1136 | COLLECTION FIELD IS EMPTY.
ID: 1141 | COLLECTION FIELD IS EMPTY.
ID: 1144 | COLLECTION FIELD IS EMPTY.
ID: 1154 | COLLECTION FIELD IS EMPTY.
ID: 1160 | COLLECTION FIELD IS EMPTY.
ID: 1165 | COLLECTION FIELD IS EMPTY.
ID: 1166 | COLLECTION FIELD IS EMPTY.
ID: 1167 | COLLECTION FIELD IS EMPTY.
ID: 1168 | COLLECTION FIELD IS EMPTY.
ID: 1169 | COLLECTION FIELD IS EMPTY.
ID: 1178 | COLLECTION FIELD IS EMPTY.
ID: 1183 | COLLECTION FIELD IS EMPTY.
ID: 1186 | COLLECTION FIELD IS EMPTY.
ID: 1187 | COLLECTION FIELD IS EMPTY.
ID: 1189 | COLLECTION FIELD IS EMPTY.
ID: 1190 | COLLECTION FIELD IS EMPTY.
ID: 1194 | COLLECTION FIELD IS EMPTY.
ID: 1196 | COLLECTION FIELD IS EMPTY.
ID: 1198 | COLLECTION FIELD IS EMPTY.
ID: 1205 | COLLECTION FIELD IS EMPTY.
ID: 1210 | COLLECTION FIELD IS EMPTY.
ID: 1212 | COLLECTION FIELD IS EMPTY.
ID: 1219 | COLLECTION FIELD IS EMPTY.
ID: 1220 | COLLECTION FIELD IS EMPTY.
ID: 1223 | COLLECTION FIELD IS EMPTY.
ID: 1224 | COLLECTION FIELD IS EMPTY.
ID: 1226 | COLLECTION FIELD IS EMPTY.
ID: 1232 | COLLECTION FIELD IS EMPTY.
ID: 1234 | COLLECTION FIELD IS EMPTY.
ID: 1235 | COLLECTION FIELD IS EMPTY.
ID: 1246 | COLLECTION FIELD IS EMPTY.
ID: 1247 | COLLECTION FIELD IS EMPTY.
ID: 1253 | COLLECTION FIELD IS EMPTY.
ID: 1260 | COLLECTION FIELD IS EMPTY.
ID: 1262 | COLLECTION FIELD IS EMPTY.
ID: 1263 | COLLECTION FIELD IS EMPTY.
ID: 1264 | COLLECTION FIELD IS EMPTY.
ID: 1265 | COLLECTION FIELD IS EMPTY.
ID: 1269 | COLLECTION FIELD IS EMPTY.
ID: 1270 | COLLECTION FIELD IS EMPTY.
ID: 1271 | COLLECTION FIELD IS EMPTY.
ID: 1274 | COLLECTION FIELD IS EMPTY.
ID: 1276 | COLLECTION FIELD IS EMPTY.
ID: 1278 | COLLECTION FIELD IS EMPTY.
ID: 1291 | COLLECTION FIELD IS EMPTY.
ID: 1304 | COLLECTION FIELD IS EMPTY.
ID: 1305 | COLLECTION FIELD IS EMPTY.
ID: 1339 | COLLECTION FIELD IS EMPTY.
ID: 1340 | COLLECTION FIELD IS EMPTY.
ID: 1346 | COLLECTION FIELD IS EMPTY.
ID: 1349 | COLLECTION FIELD IS EMPTY.
ID: 1355 | COLLECTION FIELD IS EMPTY.
ID: 1356 | COLLECTION FIELD IS EMPTY.
ID: 1357 | COLLECTION FIELD IS EMPTY.
ID: 1358 | COLLECTION FIELD IS EMPTY.
ID: 1364 | COLLECTION FIELD IS EMPTY.
ID: 1366 | COLLECTION FIELD IS EMPTY.
ID: 1367 | COLLECTION FIELD IS EMPTY.
ID: 1370 | COLLECTION FIELD IS EMPTY.
ID: 1371 | COLLECTION FIELD IS EMPTY.
ID: 1372 | COLLECTION FIELD IS EMPTY.
ID: 1373 | COLLECTION FIELD IS EMPTY.
ID: 1374 | COLLECTION FIELD IS EMPTY.
ID: 1377 | COLLECTION FIELD IS EMPTY.
ID: 1378 | COLLECTION FIELD IS EMPTY.
ID: 1379 | COLLECTION FIELD IS EMPTY.
ID: 1382 | COLLECTION FIELD IS EMPTY.
ID: 1389 | COLLECTION FIELD IS EMPTY.
ID: 1390 | COLLECTION FIELD IS EMPTY.
ID: 1400 | COLLECTION FIELD IS EMPTY.
ID: 1404 | COLLECTION FIELD IS EMPTY.
ID: 1407 | COLLECTION FIELD IS EMPTY.
ID: 1408 | COLLECTION FIELD IS EMPTY.
ID: 1409 | COLLECTION FIELD IS EMPTY.
ID: 1413 | COLLECTION FIELD IS EMPTY.
ID: 1419 | COLLECTION FIELD IS EMPTY.
ID: 1422 | COLLECTION FIELD IS EMPTY.
ID: 1425 | COLLECTION FIELD IS EMPTY.
ID: 1442 | COLLECTION FIELD IS EMPTY.
ID: 1443 | COLLECTION FIELD IS EMPTY.
ID: 1450 | COLLECTION FIELD IS EMPTY.
ID: 1451 | COLLECTION FIELD IS EMPTY.
ID: 1453 | COLLECTION FIELD IS EMPTY.
ID: 1456 | COLLECTION FIELD IS EMPTY.
ID: 1461 | COLLECTION FIELD IS EMPTY.
ID: 1462 | COLLECTION FIELD IS EMPTY.
ID: 1463 | COLLECTION FIELD IS EMPTY.
ID: 1464 | COLLECTION FIELD IS EMPTY.
ID: 1465 | COLLECTION FIELD IS EMPTY.
ID: 1466 | COLLECTION FIELD IS EMPTY.
ID: 1467 | COLLECTION FIELD IS EMPTY.
ID: 1475 | COLLECTION FIELD IS EMPTY.
ID: 1476 | COLLECTION FIELD IS EMPTY.
ID: 1477 | COLLECTION FIELD IS EMPTY.
ID: 1478 | COLLECTION FIELD IS EMPTY.
ID: 1480 | COLLECTION FIELD IS EMPTY.
ID: 1485 | COLLECTION FIELD IS EMPTY.
ID: 1486 | COLLECTION FIELD IS EMPTY.
ID: 1487 | COLLECTION FIELD IS EMPTY.
ID: 1492 | COLLECTION FIELD IS EMPTY.
ID: 1493 | COLLECTION FIELD IS EMPTY.
ID: 1503 | COLLECTION FIELD IS EMPTY.
ID: 1504 | COLLECTION FIELD IS EMPTY.
ID: 1507 | COLLECTION FIELD IS EMPTY.
ID: 1509 | COLLECTION FIELD IS EMPTY.
ID: 1511 | COLLECTION FIELD IS EMPTY.
ID: 1515 | COLLECTION FIELD IS EMPTY.
ID: 1523 | COLLECTION FIELD IS EMPTY.
ID: 1524 | COLLECTION FIELD IS EMPTY.
ID: 1531 | COLLECTION FIELD IS EMPTY.
ID: 1532 | COLLECTION FIELD IS EMPTY.
ID: 1533 | COLLECTION FIELD IS EMPTY.
ID: 1535 | COLLECTION FIELD IS EMPTY.
ID: 1540 | COLLECTION FIELD IS EMPTY.
ID: 1542 | COLLECTION FIELD IS EMPTY.
ID: 1543 | COLLECTION FIELD IS EMPTY.
ID: 1544 | COLLECTION FIELD IS EMPTY.
ID: 1548 | COLLECTION FIELD IS EMPTY.
ID: 1551 | COLLECTION FIELD IS EMPTY.
ID: 1555 | COLLECTION FIELD IS EMPTY.
ID: 1561 | COLLECTION FIELD IS EMPTY.
ID: 1563 | COLLECTION FIELD IS EMPTY.
ID: 1564 | COLLECTION FIELD IS EMPTY.
ID: 1565 | COLLECTION FIELD IS EMPTY.
ID: 1567 | COLLECTION FIELD IS EMPTY.
ID: 1568 | COLLECTION FIELD IS EMPTY.
ID: 1571 | COLLECTION FIELD IS EMPTY.
ID: 1577 | COLLECTION FIELD IS EMPTY.
ID: 1584 | COLLECTION FIELD IS EMPTY.
ID: 1592 | COLLECTION FIELD IS EMPTY.
ID: 1595 | COLLECTION FIELD IS EMPTY.
ID: 1599 | COLLECTION FIELD IS EMPTY.
ID: 1601 | COLLECTION FIELD IS EMPTY.
ID: 1602 | COLLECTION FIELD IS EMPTY.
ID: 1605 | COLLECTION FIELD IS EMPTY.
ID: 1607 | COLLECTION FIELD IS EMPTY.
ID: 1615 | COLLECTION FIELD IS EMPTY.
ID: 1618 | COLLECTION FIELD IS EMPTY.
ID: 1620 | COLLECTION FIELD IS EMPTY.
ID: 1622 | COLLECTION FIELD IS EMPTY.
ID: 1625 | COLLECTION FIELD IS EMPTY.
ID: 1633 | COLLECTION FIELD IS EMPTY.
ID: 1643 | COLLECTION FIELD IS EMPTY.
ID: 1645 | COLLECTION FIELD IS EMPTY.
ID: 1646 | COLLECTION FIELD IS EMPTY.
ID: 1649 | COLLECTION FIELD IS EMPTY.
ID: 1652 | COLLECTION FIELD IS EMPTY.
ID: 1658 | COLLECTION FIELD IS EMPTY.
ID: 1663 | COLLECTION FIELD IS EMPTY.
ID: 1664 | COLLECTION FIELD IS EMPTY.
ID: 1665 | COLLECTION FIELD IS EMPTY.
ID: 1668 | COLLECTION FIELD IS EMPTY.
ID: 1671 | COLLECTION FIELD IS EMPTY.
ID: 1673 | COLLECTION FIELD IS EMPTY.
ID: 1674 | COLLECTION FIELD IS EMPTY.
ID: 1679 | COLLECTION FIELD IS EMPTY.
ID: 1680 | COLLECTION FIELD IS EMPTY.
ID: 1681 | COLLECTION FIELD IS EMPTY.
ID: 1682 | COLLECTION FIELD IS EMPTY.
ID: 1684 | COLLECTION FIELD IS EMPTY.
ID: 1692 | COLLECTION FIELD IS EMPTY.
ID: 1694 | COLLECTION FIELD IS EMPTY.
ID: 1707 | COLLECTION FIELD IS EMPTY.
ID: 1708 | COLLECTION FIELD IS EMPTY.
ID: 1713 | COLLECTION FIELD IS EMPTY.
ID: 1715 | COLLECTION FIELD IS EMPTY.
ID: 1716 | COLLECTION FIELD IS EMPTY.
ID: 1718 | COLLECTION FIELD IS EMPTY.
ID: 1724 | COLLECTION FIELD IS EMPTY.
ID: 1725 | COLLECTION FIELD IS EMPTY.
ID: 1726 | COLLECTION FIELD IS EMPTY.
ID: 1727 | COLLECTION FIELD IS EMPTY.
ID: 1728 | COLLECTION FIELD IS EMPTY.
ID: 1732 | COLLECTION FIELD IS EMPTY.
ID: 1736 | COLLECTION FIELD IS EMPTY.
ID: 1741 | COLLECTION FIELD IS EMPTY.
ID: 1747 | COLLECTION FIELD IS EMPTY.
ID: 1751 | COLLECTION FIELD IS EMPTY.
ID: 1753 | COLLECTION FIELD IS EMPTY.
ID: 1755 | COLLECTION FIELD IS EMPTY.
ID: 1757 | COLLECTION FIELD IS EMPTY.
ID: 1759 | COLLECTION FIELD IS EMPTY.
ID: 1781 | COLLECTION FIELD IS EMPTY.
ID: 1785 | COLLECTION FIELD IS EMPTY.
ID: 1793 | COLLECTION FIELD IS EMPTY.
ID: 1808 | COLLECTION FIELD IS EMPTY.
ID: 1817 | COLLECTION FIELD IS EMPTY.
ID: 1821 | COLLECTION FIELD IS EMPTY.
ID: 1823 | COLLECTION FIELD IS EMPTY.
ID: 1829 | COLLECTION FIELD IS EMPTY.
ID: 1834 | COLLECTION FIELD IS EMPTY.
ID: 1838 | COLLECTION FIELD IS EMPTY.
ID: 1839 | COLLECTION FIELD IS EMPTY.
ID: 1840 | COLLECTION FIELD IS EMPTY.
ID: 1841 | COLLECTION FIELD IS EMPTY.
ID: 1842 | COLLECTION FIELD IS EMPTY.
ID: 1843 | COLLECTION FIELD IS EMPTY.
ID: 1844 | COLLECTION FIELD IS EMPTY.
ID: 1845 | COLLECTION FIELD IS EMPTY.
ID: 1846 | COLLECTION FIELD IS EMPTY.
ID: 1847 | COLLECTION FIELD IS EMPTY.
ID: 1848 | COLLECTION FIELD IS EMPTY.
ID: 1852 | COLLECTION FIELD IS EMPTY.
ID: 1855 | COLLECTION FIELD IS EMPTY.
ID: 1885 | COLLECTION FIELD IS EMPTY.
ID: 1887 | COLLECTION FIELD IS EMPTY.
ID: 1888 | COLLECTION FIELD IS EMPTY.
ID: 1890 | COLLECTION FIELD IS EMPTY.
ID: 1893 | COLLECTION FIELD IS EMPTY.
ID: 1895 | COLLECTION FIELD IS EMPTY.
ID: 1898 | COLLECTION FIELD IS EMPTY.
ID: 1913 | COLLECTION FIELD IS EMPTY.
ID: 1915 | COLLECTION FIELD IS EMPTY.
ID: 1916 | COLLECTION FIELD IS EMPTY.
ID: 1917 | COLLECTION FIELD IS EMPTY.
ID: 1919 | COLLECTION FIELD IS EMPTY.
ID: 1932 | COLLECTION FIELD IS EMPTY.
ID: 1933 | COLLECTION FIELD IS EMPTY.
ID: 1937 | COLLECTION FIELD IS EMPTY.
ID: 1948 | COLLECTION FIELD IS EMPTY.
ID: 1950 | COLLECTION FIELD IS EMPTY.
ID: 1956 | COLLECTION FIELD IS EMPTY.
ID: 1959 | COLLECTION FIELD IS EMPTY.
ID: 1960 | COLLECTION FIELD IS EMPTY.
ID: 1962 | COLLECTION FIELD IS EMPTY.
ID: 1963 | COLLECTION FIELD IS EMPTY.
ID: 1964 | COLLECTION FIELD IS EMPTY.
ID: 1965 | COLLECTION FIELD IS EMPTY.
ID: 1966 | COLLECTION FIELD IS EMPTY.
ID: 1968 | COLLECTION FIELD IS EMPTY.
ID: 1974 | COLLECTION FIELD IS EMPTY.
ID: 1976 | COLLECTION FIELD IS EMPTY.
ID: 1977 | COLLECTION FIELD IS EMPTY.
ID: 1978 | COLLECTION FIELD IS EMPTY.
ID: 1979 | COLLECTION FIELD IS EMPTY.
ID: 1981 | COLLECTION FIELD IS EMPTY.
ID: 1990 | COLLECTION FIELD IS EMPTY.
ID: 1999 | COLLECTION FIELD IS EMPTY.
ID: 2000 | COLLECTION FIELD IS EMPTY.
ID: 2003 | COLLECTION FIELD IS EMPTY.
ID: 2028 | COLLECTION FIELD IS EMPTY.
ID: 2031 | COLLECTION FIELD IS EMPTY.
ID: 2033 | COLLECTION FIELD IS EMPTY.
ID: 2034 | COLLECTION FIELD IS EMPTY.
ID: 2038 | COLLECTION FIELD IS EMPTY.
ID: 2041 | COLLECTION FIELD IS EMPTY.
ID: 2044 | COLLECTION FIELD IS EMPTY.
ID: 2060 | COLLECTION FIELD IS EMPTY.
ID: 2073 | COLLECTION FIELD IS EMPTY.
ID: 2075 | COLLECTION FIELD IS EMPTY.
ID: 2076 | COLLECTION FIELD IS EMPTY.
ID: 2088 | COLLECTION FIELD IS EMPTY.
ID: 2089 | COLLECTION FIELD IS EMPTY.
ID: 2090 | COLLECTION FIELD IS EMPTY.
ID: 2094 | COLLECTION FIELD IS EMPTY.
ID: 2100 | COLLECTION FIELD IS EMPTY.
ID: 2101 | COLLECTION FIELD IS EMPTY.
ID: 2103 | COLLECTION FIELD IS EMPTY.
ID: 2107 | COLLECTION FIELD IS EMPTY.
ID: 2109 | COLLECTION FIELD IS EMPTY.
ID: 2111 | COLLECTION FIELD IS EMPTY.
ID: 2116 | COLLECTION FIELD IS EMPTY.
ID: 2117 | COLLECTION FIELD IS EMPTY.
ID: 2118 | COLLECTION FIELD IS EMPTY.
ID: 2119 | COLLECTION FIELD IS EMPTY.
ID: 2121 | COLLECTION FIELD IS EMPTY.
ID: 2122 | COLLECTION FIELD IS EMPTY.
ID: 2126 | COLLECTION FIELD IS EMPTY.
ID: 2128 | COLLECTION FIELD IS EMPTY.
ID: 2132 | COLLECTION FIELD IS EMPTY.
ID: 2136 | COLLECTION FIELD IS EMPTY.
ID: 2140 | COLLECTION FIELD IS EMPTY.
ID: 2141 | COLLECTION FIELD IS EMPTY.
ID: 2143 | COLLECTION FIELD IS EMPTY.
ID: 2147 | COLLECTION FIELD IS EMPTY.
ID: 2152 | COLLECTION FIELD IS EMPTY.
ID: 2155 | COLLECTION FIELD IS EMPTY.
ID: 2157 | COLLECTION FIELD IS EMPTY.
ID: 2159 | COLLECTION FIELD IS EMPTY.
In [13]:
# Distinct art collection names that appear in the snippet mapping
c_set = {collection_name for collection_name in collections.values()}
In [14]:
print "COLLECTION FREQUENCIES:\n"
values = collections.values()
total = len(values)
for c in c_set:
freq = values.count(c)
percent = (freq/float(total))*100
print c, "\n", freq, "snippets ask about this collection."
print '%0.2f'% percent, "percent of total snippets\n"
COLLECTION FREQUENCIES:
American Art
177 snippets ask about this collection.
14.92 percent of total snippets
Arts of the Americas
61 snippets ask about this collection.
5.14 percent of total snippets
Egyptian, Classical, Ancient Near Eastern Art
129 snippets ask about this collection.
10.88 percent of total snippets
Decorative Arts
125 snippets ask about this collection.
10.54 percent of total snippets
Arts of the Pacific Islands
7 snippets ask about this collection.
0.59 percent of total snippets
European Art
109 snippets ask about this collection.
9.19 percent of total snippets
Arts of Africa
139 snippets ask about this collection.
11.72 percent of total snippets
Elizabeth A. Sackler Center for Feminist Art
48 snippets ask about this collection.
4.05 percent of total snippets
Contemporary Art
365 snippets ask about this collection.
30.78 percent of total snippets
Arts of the Islamic World
5 snippets ask about this collection.
0.42 percent of total snippets
Asian Art
21 snippets ask about this collection.
1.77 percent of total snippets
Content source: seanjh/bkm-ask
Similar notebooks: