In [32]:
import pandas as pd               # work with data as tables
import numpy as np                # work with numeric matrices
import matplotlib.pyplot as plt   # visualize results
import tensorflow as tf           # build and train the model

In [33]:
# step 1 - load the data from CSV
dataframe = pd.read_csv('data.csv')

In [34]:
dataframe.head()

dataframe = dataframe[0:10]  # keep only the first 10 rows
dataframe


Out[34]:
index area bathrooms price sq_price
0 0 2104.0 3.0 399900.0 190.066540
1 1 1600.0 3.0 329900.0 206.187500
2 2 2400.0 3.0 369000.0 153.750000
3 3 1416.0 2.0 232000.0 163.841808
4 4 3000.0 4.0 539900.0 179.966667
5 5 1985.0 4.0 299900.0 151.083123
6 6 1534.0 3.0 314900.0 205.280313
7 7 1427.0 3.0 198999.0 139.452698
8 8 1380.0 3.0 212000.0 153.623188
9 9 1494.0 3.0 242500.0 162.315930

In [35]:
dataframe = dataframe.drop(['index', 'price', 'sq_price'], axis=1)  # drop the columns we won't use as features

In [36]:
dataframe.head()


Out[36]:
area bathrooms
0 2104.0 3.0
1 1600.0 3.0
2 2400.0 3.0
3 1416.0 2.0
4 3000.0 4.0

In [41]:
# step 2 - add labels
# y1: 1 is a good buy and 0 is a bad buy
dataframe.loc[:, 'y1'] = [1, 1, 1, 0, 0, 1, 0, 1, 1, 1]
# y2 is the negation of y1 (one-hot encoding)
dataframe.loc[:, 'y2'] = dataframe['y1'] == 0
dataframe.loc[:, 'y2'] = dataframe['y2'].astype(int)  # turn True/False into 1/0
dataframe


Out[41]:
area bathrooms y1 y2
0 2104.0 3.0 1 0
1 1600.0 3.0 1 0
2 2400.0 3.0 1 0
3 1416.0 2.0 0 1
4 3000.0 4.0 0 1
5 1985.0 4.0 1 0
6 1534.0 3.0 0 1
7 1427.0 3.0 1 0
8 1380.0 3.0 1 0
9 1494.0 3.0 1 0
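
Aside: since y2 is just the complement of y1, the two y2 lines above could be collapsed into one vectorized step; a minimal equivalent sketch (same dataframe assumed):

dataframe.loc[:, 'y2'] = 1 - dataframe['y1']  # flips 0s and 1s in one step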

In [43]:
# step 3 - prepare data for tensorflow (tensors)
# tensors are a generic version of vectors and matrices
# a vector is a list of numbers (1D tensor)
# a matrix is a list of lists of numbers (2D tensor)
# a list of lists of lists of numbers is a 3D tensor
# ...
# convert features to an input tensor
inputX = dataframe.loc[:, ['area', 'bathrooms']].values
# convert labels to an input tensor
inputY = dataframe.loc[:, ['y1', 'y2']].values
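
It's worth sanity-checking that the conversion produced the 2D shapes TensorFlow expects (a quick check of my own, not part of the original notebook):

print(inputX.shape)  # (10, 2) -- 10 examples, 2 features
print(inputY.shape)  # (10, 2) -- 10 examples, 2 one-hot label columns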

In [57]:
# step 4 - write out our hyperparameters
learning_rate = 0.000001
training_epochs = 2000
display_step = 50
n_samples = inputY.size  # .size counts every element: 10 rows x 2 columns = 20
n_samples


Out[57]:
20

In [55]:
# step 5 - create our computation graph/neural network
x = tf.placeholder(tf.float32, [None, 2])   # input features: area and bathrooms
W = tf.Variable(tf.zeros([2, 2]))           # weights: 2 features mapped to 2 output classes
b = tf.Variable(tf.zeros([2]))              # biases, one per output class
y_values = tf.add(tf.matmul(x, W), b)       # linear model: xW + b
y = tf.nn.softmax(y_values)                 # softmax converts scores into probabilities
y_ = tf.placeholder(tf.float32, [None, 2])  # placeholder for the true labels
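
To make the softmax step concrete, here is a hand-computed NumPy sketch of what tf.nn.softmax does to a single row of scores (illustrative values of my own, not from the model):

scores = np.array([2.0, 1.0])
probs = np.exp(scores) / np.sum(np.exp(scores))  # exponentiate, then normalize to sum to 1
print(probs)  # ~[0.731, 0.269] -- positive probabilities that sum to 1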

In [56]:
# step 6 - perform training
# cost function: mean squared error
cost = tf.reduce_sum(tf.pow(y_ - y, 2)) / (2 * n_samples)
# gradient descent
optimizer = tf.train.GradientDescentOptimizer(learning_rate).minimize(cost)
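
The same cost can be reproduced by hand with NumPy, which makes the formula explicit; a sketch using made-up uniform predictions of 0.5 (my own illustration, not part of the notebook):

preds = np.full_like(inputY, 0.5, dtype=np.float64)           # hypothetical predictions, all 0.5
manual_cost = np.sum((inputY - preds) ** 2) / (2 * n_samples)
print(manual_cost)  # 0.125: 20 elements, each with squared error 0.25, divided by 2*20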

In [58]:
# Initialize variables and tensorflow session
init = tf.global_variables_initializer()  # initialize_all_variables() is deprecated
sess = tf.Session()
sess.run(init)

In [61]:
for i in range(training_epochs):
    sess.run(optimizer, feed_dict={x: inputX, y_: inputY})  # take a gradient descent step using our inputs and labels

    # That's all! The rest of the cell just outputs debug messages.
    # Display logs every display_step epochs
    if i % display_step == 0:
        cc = sess.run(cost, feed_dict={x: inputX, y_: inputY})
        print("Training step:", '%04d' % i, "cost=", "{:.9f}".format(cc))

print("Optimization Finished!")
training_cost = sess.run(cost, feed_dict={x: inputX, y_: inputY})
print("Training cost=", training_cost, "W=", sess.run(W), "b=", sess.run(b), '\n')


Training step: 0000 cost= 0.114958666
Training step: 0050 cost= 0.109539941
Training step: 0100 cost= 0.109539866
Training step: 0150 cost= 0.109539807
Training step: 0200 cost= 0.109539732
Training step: 0250 cost= 0.109539673
Training step: 0300 cost= 0.109539606
Training step: 0350 cost= 0.109539531
Training step: 0400 cost= 0.109539464
Training step: 0450 cost= 0.109539405
Training step: 0500 cost= 0.109539315
Training step: 0550 cost= 0.109539248
Training step: 0600 cost= 0.109539196
Training step: 0650 cost= 0.109539129
Training step: 0700 cost= 0.109539054
Training step: 0750 cost= 0.109538987
Training step: 0800 cost= 0.109538913
Training step: 0850 cost= 0.109538853
Training step: 0900 cost= 0.109538779
Training step: 0950 cost= 0.109538712
Training step: 1000 cost= 0.109538652
Training step: 1050 cost= 0.109538577
Training step: 1100 cost= 0.109538510
Training step: 1150 cost= 0.109538436
Training step: 1200 cost= 0.109538361
Training step: 1250 cost= 0.109538302
Training step: 1300 cost= 0.109538235
Training step: 1350 cost= 0.109538175
Training step: 1400 cost= 0.109538101
Training step: 1450 cost= 0.109538034
Training step: 1500 cost= 0.109537959
Training step: 1550 cost= 0.109537885
Training step: 1600 cost= 0.109537825
Training step: 1650 cost= 0.109537765
Training step: 1700 cost= 0.109537683
Training step: 1750 cost= 0.109537624
Training step: 1800 cost= 0.109537557
Training step: 1850 cost= 0.109537482
Training step: 1900 cost= 0.109537408
Training step: 1950 cost= 0.109537348
Optimization Finished!
Training cost= 0.109537 W= [[  2.14149564e-04  -2.14149914e-04]
 [  5.12748193e-05  -5.12747974e-05]] b= [  1.19155184e-05  -1.19155284e-05] 
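
The cost plateaus almost immediately because the learning rate is so small. matplotlib is imported at the top but never used; a quick sketch (my addition) that re-runs training from scratch, records the cost each epoch, and plots the curve:

sess.run(init)  # reset the variables so the curve shows the full descent
costs = []
for i in range(training_epochs):
    sess.run(optimizer, feed_dict={x: inputX, y_: inputY})
    costs.append(sess.run(cost, feed_dict={x: inputX, y_: inputY}))

plt.plot(costs)  # expect a sharp initial drop, then a long flat tail
plt.xlabel('epoch')
plt.ylabel('cost')
plt.show()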


In [62]:
sess.run(y, feed_dict={x: inputX})  # run the trained network on the training features


Out[62]:
array([[ 0.71125221,  0.28874779],
       [ 0.66498977,  0.33501023],
       [ 0.73657656,  0.26342347],
       [ 0.64718789,  0.35281211],
       [ 0.78335613,  0.2166439 ],
       [ 0.70069474,  0.29930523],
       [ 0.65866327,  0.34133676],
       [ 0.64828628,  0.35171372],
       [ 0.64368278,  0.35631716],
       [ 0.65480113,  0.3451989 ]], dtype=float32)
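
Each row above is a [good buy, bad buy] probability pair for one house. To turn these into hard predictions and score them against the labels, a minimal sketch (my own, using the session from above):

probs = sess.run(y, feed_dict={x: inputX})
predicted = np.argmax(probs, axis=1)   # 0 = good buy, 1 = bad buy
actual = np.argmax(inputY, axis=1)
print(predicted)                       # all zeros here: the model calls every house a good buy
print(np.mean(predicted == actual))    # 0.7 -- 7 of the 10 labels are 'good buy'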
