In [1]:
%%time
import pandas as pd
dfs = pd.read_csv(
"../../linux/git_diff.log",
skip_blank_lines=False,
sep="\n",
encoding="latin-1",
chunksize=100000,
names=["raw"])
df = pd.concat(dfs)
df.tail()
In [2]:
# Print a concise summary of df: index range, per-column non-null counts
# and dtypes, and memory usage.
df.info()