In [0]:
import json
import pandas as pd
import great_expectations as ge
In [0]:
# The example data is defined inline; the CSV loader is kept commented out for reference.
# df = ge.read_csv("data/broken_timestamp_example.csv")
df_as_json = dict(
    other_var=[13, 14, 10, 13, 14],
    date_var=[
        "2014-09-01",
        "2014-10-30",
        "2014-07-31",
        "2014-09-01",
        "2014-10-30",
    ],
)
# Wrap the plain pandas frame in a Great Expectations PandasDataset.
df = ge.dataset.pandas_dataset.PandasDataset(pd.DataFrame(df_as_json))
df.head()
In [0]:
# Expectation on the string column `date_var`: values should be dateutil-parseable.
df.expect_column_values_to_be_dateutil_parseable("date_var")
In [0]:
# Show the dtype of each column in the dataset.
df.dtypes
In [0]:
# Display the entry of `date_var` at index label 0.
df["date_var"][0]
In [0]:
# Store a pandas-datetime conversion of `date_var` in a new column, `date_var_dt`.
df["date_var_dt"] = pd.to_datetime(df["date_var"])
In [0]:
# Run the same dateutil-parseable expectation against the converted column.
# NOTE(review): `date_var_dt` comes from pd.to_datetime, so its values are not
# strings; this expectation may report failures or raise depending on the
# installed Great Expectations version — confirm the intended outcome.
df.expect_column_values_to_be_dateutil_parseable("date_var_dt")
In [0]:
# Show the column dtypes again (the dataset now also has `date_var_dt`).
df.dtypes
In [0]:
?df.expect_column_value_lengths_to_be_between
In [0]:
# The original call passed only an undefined name (`min_`), which raises
# NameError before the expectation runs, and it omitted the column argument.
# Completed here with a column and explicit bounds; the bounds match the
# smallest and largest values in `other_var` as defined in this notebook.
# NOTE(review): the intended column and bounds are a guess — adjust if the
# original intent was to range-check one of the date columns instead.
df.expect_column_values_to_be_between("other_var", min_value=10, max_value=14)