notebook.community

Edit and run



In [5]:

    
%matplotlib inline
import pandas as pd
import numpy as np
import seaborn as sb
import matplotlib.pyplot as plt
import pulp
# Switch on seaborn's default plot styling for figures drawn later in the notebook.
sb.set()

# Show floats with two decimals in pandas output.
# The full option key is spelled out: the short pattern 'precision' matches more
# than one option in recent pandas releases and is rejected there, while
# 'display.precision' is accepted by old and new versions alike.
pd.set_option('display.precision', 2)

# Macro-nutrient column names. The first entry (energy of the ready-to-eat
# food) is the one the rest of the notebook addresses as nutrient_list[0].
macro_nutrients = [
    'kcal per 100 g ready to eat',
    'Protein_(g)',
    'Lipid_Tot_(g)',
    'FA_Sat_(g)',
    'Carbohydrt_(g)',
]

# Remaining nutrient column names tracked by the analysis.
micro_nutrients = [
    'Fiber_TD_(g)',
    'Vit_A_RAE',
    'Vit_B6_(mg)',
    'Vit_B12_(mcg)',
    'Vit_C_(mg)',
    'Vit_E_(mg)',
    'Folate_DFE_(mcg)',
    'Vit_K_(mcg)',
    'Riboflavin_(mg)',
    'Calcium_(mg)',
    'Niacin_(mg)',
    'Cholestrl_(mg)',
    'FA_Mono_(g)',
    'FA_Poly_(g)',
    'Sugar_Tot_(g)',
    'soluble fiber',
    'total Flavonoid',
    'Iron_(mg)',
    'Alpha_Carot_(mcg)',
    'Beta_Carot_(mcg)',
    'Lycopene_(mcg)',
    'Lut+Zea_(mcg)',
    'Beta_Crypt_(mcg)',
    'Sodium_(mg)',
    'Selenium_(mcg)',
    'Potassium_(mg)',
    'Phytosterols(mg)Per 100 g',
]

# Full ordered list: macro-nutrients first, then the rest.
nutrient_list = list(macro_nutrients)
nutrient_list.extend(micro_nutrients)

# Short display names for the foods. They are zipped positionally against the
# row index of the CSV further down, so the order of this list matters.
food_abbrev = [
    'almond',
    'apples',
    'apricot',
    'asparagus',
    'avocado',
    'banana',
    'barley',
    'kidney bean',
    'snap bean',
    'blueberry',
    'broccoli',
    'cabbage',
    'canola oil',
    'cantaloupe',
    'carrots',
    'cauliflower',
    'celery',
    'cherry',
    'collard',
    'corn flr',
    'corn starch',
    'corn grits',
    'swt corn',
    'cucumber',
    'garlic',
    'grapefruit',
    'grapes',
    'hazelnuts',
    'honeydew',
    'kiwi',
    'lemon',
    'lettuce',
    'macadamia',
    'oats',
    'olive oil',
    'onions',
    'orange',
    'peach',
    'peanut',
    'pear',
    'peas',
    'grn pepper',
    'pineapple',
    'pistachio',
    'potato',
    'pumpkin',
    'raspberry',
    'rice',
    'soy oil',
    'spinach',
    'squash',
    'strawberry',
    'sweet potato',
    'tomato',
    'walnut',
    'watermelon',
    'wheat',
    'chickpea',
    'lentil',
    'soybean',
    'tofu',
    'buckwheat',
    'sorghum',
    'rye',
    'spelt',
    'saflwer oil',
    'syrup cane',
    'hfcs',
]

# Animal-based foods; these are appended after the foods listed above.
ANIMALS = [
    'beef',
    'dairy',
    'egg',
    'chicken',
    'pork',
    'salmon',
    'tuna',
]

food_abbrev += ANIMALS

# Scenarios to solve: each animal food on its own, then all of them together.
# Built with a list comprehension rather than `map(...) + [...]`, because on
# Python 3 `map` returns an iterator that cannot be concatenated with a list.
SUBSETS_TO_REPLACE = [[animal] for animal in ANIMALS] + [ANIMALS]

# Headers of the plVals.csv columns that the notebook reads by name.
UDSA_COLNAME = 'USDA groups'
MAD_COLNAME = 'MAD (kcal/cap/d)'
ENERGY_COLNAME = 'Energ_Kcal'

# Load the table with its first column as the row index.
# `pd.DataFrame.from_csv` was deprecated and later removed from pandas;
# `pd.read_csv(..., index_col=0)` is the supported replacement. `from_csv` also
# tried to parse the index as dates, which is irrelevant here because every row
# label is replaced immediately below.
data_frame = pd.read_csv('plVals.csv', index_col=0)

# Relabel the rows with the short food names. The pairing is positional
# (i-th row <-> i-th abbreviation), so the CSV row order has to agree with the
# order of food_abbrev.
index2abbrev = dict(zip(data_frame.index, food_abbrev))
data_frame = data_frame.rename(index=index2abbrev)

# Find, for every entry of the nutrient list, the corresponding column of the
# dataframe. A column matches when the shorter of the two names is a prefix of
# the longer one, so an abbreviated nutrient name picks up the full column header.
col_names = list(data_frame.columns)
col_ind_order = np.zeros((1, len(nutrient_list)))
nutrient_list_updated = [''] * len(nutrient_list)
unmatched_nutrients = []
for i, nutr in enumerate(nutrient_list):
    found = False
    for j, col in enumerate(col_names):
        if col.startswith(nutr) or nutr.startswith(col):
            # The scan deliberately keeps going: when several columns match,
            # the last one wins, exactly as before (the former trailing
            # `continue` had no effect on the loop).
            col_ind_order[0, i] = j
            nutrient_list_updated[i] = col
            found = True
    if not found:
        unmatched_nutrients.append(nutr)

# Fail here with a readable message instead of letting the empty placeholder
# reach the column selection below and surface as an obscure KeyError.
if unmatched_nutrients:
    raise KeyError('no column of the data table matches nutrient(s): %s'
                   % ', '.join(unmatched_nutrients))

# From here on nutrient_list holds the exact column headers of the table.
nutrient_list = nutrient_list_updated
data = data_frame[nutrient_list].copy()
usda_group = data_frame[UDSA_COLNAME]

# Re-express every nutrient per gram of ready-to-eat food.
kcal_col = nutrient_list[0]

# Energy column first: kcal per 100 g ready-to-eat -> kcal per g ready-to-eat.
data.loc[:, kcal_col] = data[[kcal_col]] * 0.01

# Every other column is scaled by (kcal per g ready-to-eat) / (ENERGY_COLNAME value),
# i.e. by the ratio between the rescaled energy column and the table's energy column.
for nutr in nutrient_list[1:]:
    ready2eat_ratio = data.loc[:, kcal_col] / data_frame.loc[:, ENERGY_COLNAME]
    data.loc[:, nutr] = data.loc[:, nutr] * ready2eat_ratio

# The energy column is simply called 'kcal' from now on, in the table and in the list.
data = data.rename(columns={kcal_col: 'kcal'})
nutrient_list[0] = 'kcal'

# Missing entries count as zero content.
data[data.isnull()] = 0



In [63]:

    
# For each subset of animal-based foods, look for the lightest plant-only basket
# (minimum total mass) that supplies the same calories and at least the same
# amount of the constrained nutrients as the animal foods it replaces.
#
# Everything that does not depend on the subset is prepared once, before the loop.
# print(...) is used with a single pre-formatted string so the cell runs on both
# Python 2 and Python 3.

# grams of every food consumed in MAD: kcal/cap/d divided by kcal per g ready-to-eat
MAD = pd.Series(data_frame.loc[:, MAD_COLNAME] / data.loc[:, 'kcal'], food_abbrev)
MAD[pd.isnull(MAD)] = 0

# total MAD energy over all foods, as a plain float
MAD_total_kcal = float(data_frame[MAD_COLNAME].sum())

# how each nutrient enters the LP
FREE_NUTRIENTS = ['FA_Sat_(g)', 'Cholestrl_(mg)', 'Sugar_Tot_(g)', 'Sodium_(mg)']  # not constrained
EQUAL_NUTRIENTS = ['kcal']                                                         # matched exactly
UPPER_BOUND_NUTRIENTS = []                                                         # at most the target

# Not used by the LP below; kept in case another cell refers to it.
C = -np.ones((1, data.shape[1]))

# Nutrients in their listed order, each once. Iterating a set() here would add
# the constraints in an arbitrary order that can differ between runs.
unique_nutrients = []
for nutr in nutrient_list:
    if nutr not in unique_nutrients:
        unique_nutrients.append(nutr)

# generally set the upper bound on mass of a single food to 50
# unless it is in the "hated foods" category
upper_bounds = dict([(f, 50) for f in food_abbrev])
upper_bounds['garlic'] = 5
upper_bounds['asparagus'] = 20
upper_bounds['broccoli'] = 20
upper_bounds['collard'] = 20
upper_bounds['macadamia'] = 20
upper_bounds['spinach'] = 20
upper_bounds['tofu'] = 20
upper_bounds['soybean'] = 20

for a in ANIMALS:  # set all animal-based foods to 0 (i.e. don't allow any)
    upper_bounds[a] = 0

for food_subset in SUBSETS_TO_REPLACE:
    # grams of the animal-based food(s) in this subset that are consumed in MAD
    MAD_to_replace = MAD[food_subset]
    print('*** Attempting to replace:')
    print(MAD_to_replace.to_string())

    # fraction of the total MAD energy contributed by this subset; computed as a
    # scalar so that it can be stored in single entries of b_const below
    MAD_fraction = float(data_frame.loc[food_subset, MAD_COLNAME].sum()) / MAD_total_kcal

    # nutrients delivered by the foods being replaced, then adjusted to more realistic values
    b_MAD_to_replace = data.loc[food_subset, :].transpose().dot(MAD_to_replace)
    b_const = b_MAD_to_replace.copy()
    b_const['Sugar_Tot_(g)'] = 90.0                  # set a more realistic sugar  upper bound
    b_const['Sodium_(mg)'] = 600.0                   # set a more realistic sodium upper bound (note that the rightful by-mass portion of the total 2300 mg/d of MAD_a is 790 mg/d)
    b_const['Calcium_(mg)'] = 1100.0 * MAD_fraction  # Calcium, see https://www.nlm.nih.gov/medlineplus/magazine/issues/winter11/articles/winter11pg12.html
    b_const['Niacin_(mg)'] = 15.0 * MAD_fraction     # niacin,  see https://www.nlm.nih.gov/medlineplus/ency/article/002409.htm
    b_const['Selenium_(mcg)'] = 55.0 * MAD_fraction  # set a more realistic selenium lower bound, see https://ods.od.nih.gov/factsheets/Selenium-HealthProfessional/

    b_const['Lipid_Tot_(g)'] = 0                     # we don't care about fat specifically, just calories
    b_const['Fiber_TD_(g)'] = 0                      # doesn't exist in animals anyway
    b_const['Vit_B12_(mcg)'] = 0                     # impossible to get from plants

    # create the LP using PuLP: one mass variable per food
    lp = pulp.LpProblem('replace_animal_diet', pulp.LpMinimize)
    x = pulp.LpVariable.dicts('mass', food_abbrev)
    x_vec = [x[f] for f in food_abbrev]  # a real list: it is consumed more than once

    # Ax[nutr] is the linear expression for the amount of nutr in the candidate basket
    Ax = data.transpose().dot(x_vec)
    constraints = {}
    for nutr in unique_nutrients:
        if nutr in UPPER_BOUND_NUTRIENTS:
            constraints[nutr] = pulp.lpSum(Ax[nutr]) <= b_const[nutr]
            lp += constraints[nutr], nutr
        elif nutr in EQUAL_NUTRIENTS:
            constraints[nutr] = pulp.lpSum(Ax[nutr]) == b_const[nutr]
            lp += constraints[nutr], nutr
        elif nutr in FREE_NUTRIENTS:
            # built but intentionally NOT added to the problem; it is stored only
            # so that the shadow-price report below can look every nutrient up
            constraints[nutr] = pulp.lpSum(Ax[nutr]) == b_const[nutr]
        else:
            constraints[nutr] = pulp.lpSum(Ax[nutr]) >= b_const[nutr]
            lp += constraints[nutr], nutr

    # Per-food bounds are added as explicit constraints so that their shadow
    # prices can be read back after solving. Foods are visited in list order.
    for f in food_abbrev:
        constraints[f] = x[f] <= upper_bounds[f]
        lp += constraints[f], '%s_ub' % f
        lp += x[f] >= 0, '%s_lb' % f

    # objective: total mass of the basket
    lp.setObjective(pulp.lpSum(x_vec))
    pulp_solver = pulp.PULP_CBC_CMD(msg=0, dual=1)
    lp.solve(pulp_solver)
    if lp.status != pulp.LpStatusOptimal:
        print("*** Found no solutions")
    else:
        SANE = pd.Series([pulp.value(x[f]) for f in food_abbrev], food_abbrev)
        print("*** Alternative plant-based diet with total of %.1f (g): " % SANE.sum())
        print(SANE[SANE > 0].to_string())
        # report only non-zero shadow prices; constraints that were never added
        # to the problem have no price and are skipped by the truthiness test
        for nutr in nutrient_list:
            if constraints[nutr].pi:
                print('shadow price for %s: %.2f' % (nutr, constraints[nutr].pi))
        for f in food_abbrev:
            if f in ANIMALS:
                continue
            if constraints[f].pi:
                print('shadow price for %s: %.2f' % (f, constraints[f].pi))
    print('=' * 50)









    



*** Attempting to replace:
beef    65.5
*** Alternative plant-based diet with total of 114.0 (g): 
asparagus    20.0
barley        3.1
broccoli      7.2
garlic        5.0
hazelnuts     7.4
peanut       11.4
spinach      20.0
soybean      20.0
tofu         20.0
shadow price for kcal: -7.02
shadow price for Protein_(g): 77.98
shadow price for FA_Mono_(g): 70.70
shadow price for Selenium_(mcg): 47.16
shadow price for tofu: -2.49
shadow price for soybean: -2.66
shadow price for spinach: -0.10
shadow price for asparagus: -0.40
shadow price for garlic: -0.21
==================================================
*** Attempting to replace:
dairy    219.5
*** Alternative plant-based diet with total of 145.8 (g): 
barley         13.2
kidney bean     1.1
carrots         3.7
garlic          5.0
grapes         34.0
peanut          9.2
pistachio      19.7
spinach        20.0
soybean        20.0
tofu           20.0
shadow price for kcal: -0.48
shadow price for Protein_(g): 8.41
shadow price for Vit_A_RAE_(mcg)_: 0.08
shadow price for Riboflavin_(mg): 62.22
shadow price for Selenium_(mcg): 7.28
shadow price for Potassium_(mg): 0.13
shadow price for tofu: -0.05
shadow price for soybean: -0.52
shadow price for spinach: -0.43
shadow price for garlic: -0.46
==================================================
*** Attempting to replace:
egg    24.3
*** Found no solutions
==================================================
*** Attempting to replace:
chicken    74.3
*** Found no solutions
==================================================
*** Attempting to replace:
pork    29.8
*** Alternative plant-based diet with total of 28.9 (g): 
almond       13.2
barley        7.3
garlic        5.0
peanut        0.7
pistachio     2.7
shadow price for kcal: 0.07
shadow price for Vit_A_RAE_(mcg)_: 0.01
shadow price for Calcium_(mg): 0.12
shadow price for Selenium_(mcg): 6.87
shadow price for garlic: -0.29
==================================================
*** Attempting to replace:
salmon    7.2
*** Found no solutions
==================================================
*** Attempting to replace:
tuna    4
*** Found no solutions
==================================================
*** Attempting to replace:
beef        65.5
dairy      219.5
egg         24.3
chicken     74.3
pork        29.8
salmon       7.2
tuna         4.0
*** Found no solutions
==================================================