In [24]:
import pandas as pd
import pandas_profiling as pp
import numpy as np

In [9]:
# Load the commit table from the Feather file under povray-data/.
commit_frame = pd.read_feather(
    path='povray-data/commit_frame.feather',
)

In [10]:
# Preview the first five rows; kept as the last expression so the
# notebook renders the frame.
commit_frame.head(n=5)


Out[10]:
hexsha name_rev size author_name author_email authored_datetime author_tz_offset committer_name committer_email committed_datetime committer_tz_offset stats_total_files stats_total_lines stats_total_insertions stats_total_deletions encoding message
0 ea3d549a0c27c0dfb5c51e9fcd980866cfaf654b remotes/origin/release/v3.7.1 370 Anshu Arya github@anshuarya.com 2017-04-13 21:21:44 25200 Christoph Lipka c-lipka@users.noreply.github.com 2017-04-13 21:21:44 -7200 1 598 156 442 UTF-8 Update AVXFMA4 noise implementation (#268)\n\n...
1 8a8c73e2edc8d55ff3e9e6762eefccf19ae07914 remotes/origin/release/v3.7.1~1 710 Anshu Arya github@anshuarya.com 2017-04-13 21:19:21 25200 Christoph Lipka c-lipka@users.noreply.github.com 2017-04-13 21:19:21 -7200 9 357 352 5 UTF-8 Add alternative AVX-optimized noise implementa...
2 3adbf759bf0b6be311dfe4d9b75c781bb8208999 remotes/origin/release/v3.7.1~2 333 wfpokorny wfpokorny@yahoo.com 2017-04-12 20:41:44 14400 Christoph Lipka c-lipka@users.noreply.github.com 2017-04-12 20:41:44 -7200 1 5 2 3 UTF-8 Improve AA performance. (#270)\n\nEspecially h...
3 2be22dd2068c7e1bacf134b788775ca4579ef664 remotes/origin/release/v3.7.1~3 291 wfpokorny wfpokorny@yahoo.com 2017-04-06 11:18:13 14400 Christoph Lipka c-lipka@users.noreply.github.com 2017-04-06 11:18:13 -7200 1 18 15 3 UTF-8 Relax Parse_Lathe point checking for versions ...
4 59ab7f260bc1250591cc6b5e8f544ac53f134039 remotes/origin/release/v3.7.1~4 317 Christoph Lipka c-lipka@users.noreply.github.com 2017-04-04 14:16:39 -7200 Christoph Lipka c-lipka@users.noreply.github.com 2017-04-04 14:16:39 -7200 2 24 18 6 UTF-8 Fix optional parameters of command-line-style ...

In [29]:
# Cast both timezone-offset columns to int in place before profiling.
# NOTE(review): the stored dtype of these columns is not visible here --
# confirm the cast is still required.
for tz_column in ('author_tz_offset', 'committer_tz_offset'):
    commit_frame[tz_column] = commit_frame[tz_column].astype('int')

# Profile every column of the frame and write the report to an HTML file.
# To profile only selected columns, pass a column subset of commit_frame
# to pp.ProfileReport instead.
report = pp.ProfileReport(commit_frame)
report.to_file('povray-commits-profile.html')

In [ ]: