In [11]:
import pandas as pd

# Load the machine-readable git log with one text line per row.
# The separator is the control character U+0012, which presumably never occurs
# in the log, so pandas keeps each line in the single column "raw"
# (NOTE(review): the content looks like `git blame --porcelain` output — confirm).
git_log_raw = pd.read_csv(
    "../../buschmais-spring-petclinic/git_log_machine.log",
    names=["raw"],
    sep="\u0012",
)
# Preview the first rows to check that the file was parsed as expected.
git_log_raw.head()


Out[11]:
raw
0 521d01db950e357cf81ef78c50daf290e92b309c 1 1 1
1 author Costin Leau
2 author-mail <cleau@vmware.com>
3 author-time 1259174752
4 author-tz +0000

In [15]:
# Tag every log line with its leading token, i.e. the text before the first
# space. Metadata lines yield their key ("author", "summary", "filename", ...);
# lines that start with a commit SHA or with a tab-prefixed source line yield
# that first token instead, so those rows still need separate handling later.
git_log_raw['type'] = git_log_raw['raw'].str.split(" ", n=1).str[0]
# End the cell on the frame itself so the notebook renders the table.
# A bare `git_log_raw.melt` (without parentheses) only evaluates to the bound
# method object, not to a DataFrame.
git_log_raw


Out[15]:
raw type
0 521d01db950e357cf81ef78c50daf290e92b309c 1 1 1 521d01db950e357cf81ef78c50daf290e92b309c
1 author Costin Leau author
2 author-mail <cleau@vmware.com> author-mail
3 author-time 1259174752 author-time
4 author-tz +0000 author-tz
5 committer Michael Isvy committer
6 committer-mail <misvy@vmware.com> committer-mail
7 committer-time 1357722797 committer-time
8 committer-tz +0800 committer-tz
9 summary SPR-6447 summary
10 filename pom.xml filename
11 \t<?xml version="1.0" encoding="UTF-8"?> \t<?xml
12 09ed33a5fc01209b4190c74f405b2b1e523b739c 2 2 5 09ed33a5fc01209b4190c74f405b2b1e523b739c
13 author Antoine Rey author
14 author-mail <antoine.rey@free.fr> author-mail
15 author-time 1444980786 author-time
16 author-tz +0200 author-tz
17 committer Antoine Rey committer
18 committer-mail <antoine.rey@free.fr> committer-mail
19 committer-time 1444980808 committer-time
20 committer-tz +0200 committer-tz
21 summary #96 Reformat code with EditorConfig summary
22 previous 1aef94d6a86634f810b1eae448d4e2594eac5... previous
23 filename pom.xml filename
24 \t<project xmlns:xsi="http://www.w3.org/2001/X... \t<project
25 09ed33a5fc01209b4190c74f405b2b1e523b739c 3 3 09ed33a5fc01209b4190c74f405b2b1e523b739c
26 \t xsi:schemaLocation="http://maven.ap... \t
27 09ed33a5fc01209b4190c74f405b2b1e523b739c 4 4 09ed33a5fc01209b4190c74f405b2b1e523b739c
28 \t <modelVersion>4.0.0</modelVersion> \t
29 09ed33a5fc01209b4190c74f405b2b1e523b739c 5 5 09ed33a5fc01209b4190c74f405b2b1e523b739c
... ... ...
1446 \t </profile> \t
1447 540d31ed217c8ab36dcceda0ee72da7009c72ad7 419 5... 540d31ed217c8ab36dcceda0ee72da7009c72ad7
1448 \t </profiles> \t
1449 57e17d32b285d63c96747e5fed059ef1ea4cb529 226 5... 57e17d32b285d63c96747e5fed059ef1ea4cb529
1450 author Keith Donald author
1451 author-mail <kdonald@vmware.com> author-mail
1452 author-time 1261075904 author-time
1453 author-tz +0000 author-tz
1454 committer Michael Isvy committer
1455 committer-mail <misvy@vmware.com> committer-mail
1456 committer-time 1357722804 committer-time
1457 committer-tz +0800 committer-tz
1458 summary finally got rid of commons logging summary
1459 previous 905d9824b012ee6eceb8305cd15d521c3b4d1... previous
1460 filename pom.xml filename
1461 09ed33a5fc01209b4190c74f405b2b1e523b739c 406 5... 09ed33a5fc01209b4190c74f405b2b1e523b739c
1462 \t <url>demopetclinic</url> \t
1463 1741e85044b6378ec5d16f49ac9f85d918c2dd2a 488 5... 1741e85044b6378ec5d16f49ac9f85d918c2dd2a
1464 author Michael Isvy author
1465 author-mail <misvy@vmware.com> author-mail
1466 author-time 1366851620 author-time
1467 author-tz +0800 author-tz
1468 committer Michael Isvy committer
1469 committer-mail <misvy@vmware.com> committer-mail
1470 committer-time 1366851620 committer-time
1471 committer-tz +0800 committer-tz
1472 summary migrated to Hibernate-Validator 5.0.0.... summary
1473 previous 94109017dec44bb34ea7b2034d0ef6ba00760... previous
1474 filename pom.xml filename
1475 \t</project> \t</project>

1476 rows × 2 columns