In [1]:

    
%matplotlib inline
%config InlineBackend.figure_format='retina'

# import everything we need first
from tensorflow.keras import utils
import numpy as np
from sklearn.model_selection import train_test_split
import pylab as plt

from astroNN.models import Galaxy10CNN
from astroNN.datasets import galaxy10
from astroNN.datasets.galaxy10 import galaxy10cls_lookup, galaxy10_confusion

# Fetch the Galaxy10 images and their class labels.
# On first use the dataset is downloaded and stored under ~/.astroNN/datasets/
images, labels = galaxy10.load_data()

# One-hot encode the labels over the 10 Galaxy10 classes
labels = utils.to_categorical(labels, num_classes=10)

# Select 10 random images to inspect
img = None
plt.ion()
print('===================Data Inspection===================')
# Draw the random sample indices once and iterate over the indices themselves.
# Looping over range(<array>.shape[0]) would only yield 0..9 and therefore
# always display the first ten images instead of a random selection.
demo_indices = np.random.randint(0, labels.shape[0], size=10)
for counter, i in enumerate(demo_indices):
    img = plt.imshow(images[i])
    # labels are one-hot encoded at this point, so argmax recovers the class number
    plt.title('Class {}: {} \n Random Demo images {} of 10'.format(np.argmax(labels[i]), galaxy10cls_lookup(labels[i]), counter+1))
    plt.draw()
    plt.pause(2.)
plt.close('all')
print('===============Data Inspection Finished===============')

# Cast both arrays to 32-bit floats before handing them to the network
labels = labels.astype(np.float32)
images = images.astype(np.float32)

# Randomly hold out 10% of the sample indices as the testing set
train_idx, test_idx = train_test_split(np.arange(labels.shape[0]), test_size=0.1)

# Index the images and labels with the same index arrays so they stay aligned
train_images = images[train_idx]
train_labels = labels[train_idx]
test_images = images[test_idx]
test_labels = labels[test_idx]

# To create a neural network instance
galaxy10net = Galaxy10CNN()

# Set the maximum number of epochs the neural network can run; 5 gives a quick result
galaxy10net.max_epochs = 5

# To train the neural net
# astroNN will normalize the data by default
galaxy10net.train(train_images, train_labels)

# Print the model summary (note: this runs after training has completed)
galaxy10net.keras_model.summary()

# Evaluate the trained network on the held-out images.
# predicted_labels are the network's outputs; test_labels are the ground truth from the dataset.
predicted_labels = galaxy10net.test(test_images)

# Collapse the per-class network outputs to a single predicted class index per image
prediction_class = np.asarray(predicted_labels).argmax(axis=1)

# Collapse the one-hot ground-truth labels to class indices the same way
test_class = np.asarray(test_labels).argmax(axis=1)

# Start from an empty 10x10 count matrix (rows: predicted class, columns: true class)
confusion_matrix = np.zeros((10,10))

# Tally every (predicted, true) pair; np.add.at accumulates repeated index
# pairs one by one, which a plain fancy-indexed "+=" would not do
np.add.at(confusion_matrix, (prediction_class, test_class), 1)

# Plot the confusion matrix
galaxy10_confusion(confusion_matrix)









    



WARNING:tensorflow:From c:\users\henry\documents\github\astronn\astroNN\models\base_master_nn.py:22: The name tf.keras.backend.get_session is deprecated. Please use tf.compat.v1.keras.backend.get_session instead.

WARNING! Gaia environment variable GAIA_TOOLS_DATA not set
C:\Users\Henry\.astroNN\datasets\Galaxy10.h5 was found!
===================Data Inspection===================






    












    












    












    












    












    












    












    












    












    












    



===============Data Inspection Finished===============
Number of Training Data: 17646, Number of Validation Data: 1960
====Message from Normalizer====
You selected mode: 255
Featurewise Center: False
Datawise Center: False
Featurewise std Center: False
Datawise std Center: False
====Message ends====
====Message from Normalizer====
You selected mode: 0
Featurewise Center: False
Datawise Center: False
Featurewise std Center: False
Datawise std Center: False
====Message ends====
WARNING:tensorflow:From C:\Users\Henry\Miniconda3\lib\site-packages\tensorflow_core\python\ops\resource_variable_ops.py:1635: calling BaseResourceVariable.__init__ (from tensorflow.python.ops.resource_variable_ops) with constraint is deprecated and will be removed in a future version.
Instructions for updating:
If using Keras pass *_constraint arguments to layers.
WARNING:tensorflow:From c:\users\henry\documents\github\astronn\astroNN\models\base_cnn.py:274: Model.fit_generator (from tensorflow.python.keras.engine.training) is deprecated and will be removed in a future version.
Instructions for updating:
Please use Model.fit, which supports generators.
Epoch 1/5
Epoch 1/5
275/275 - 8s - loss: 11.5597 - categorical_accuracy: 0.2862 - val_loss: 11.3466 - val_categorical_accuracy: 0.3010
Epoch 2/5
Epoch 1/5

Epoch 00002: ReduceLROnPlateau reducing learning rate to 0.0024999999441206455.
275/275 - 5s - loss: 11.5033 - categorical_accuracy: 0.2905 - val_loss: 11.3966 - val_categorical_accuracy: 0.2964
Epoch 3/5
Epoch 1/5
275/275 - 5s - loss: 8.1051 - categorical_accuracy: 0.3028 - val_loss: 1.6873 - val_categorical_accuracy: 0.3375
Epoch 4/5
Epoch 1/5
275/275 - 5s - loss: 1.6628 - categorical_accuracy: 0.3686 - val_loss: 1.5186 - val_categorical_accuracy: 0.4073
Epoch 5/5
Epoch 1/5
275/275 - 5s - loss: 1.5436 - categorical_accuracy: 0.3981 - val_loss: 1.4887 - val_categorical_accuracy: 0.4125
Completed Training, 26.66s in total
Model: "model"
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
=================================================================
input (InputLayer)           [(None, 69, 69, 3)]       0         
_________________________________________________________________
conv2d (Conv2D)              (None, 69, 69, 8)         224       
_________________________________________________________________
activation (Activation)      (None, 69, 69, 8)         0         
_________________________________________________________________
conv2d_1 (Conv2D)            (None, 69, 69, 16)        1168      
_________________________________________________________________
activation_1 (Activation)    (None, 69, 69, 16)        0         
_________________________________________________________________
max_pooling2d (MaxPooling2D) (None, 17, 17, 16)        0         
_________________________________________________________________
flatten (Flatten)            (None, 4624)              0         
_________________________________________________________________
dropout (Dropout)            (None, 4624)              0         
_________________________________________________________________
dense (Dense)                (None, 256)               1184000   
_________________________________________________________________
activation_2 (Activation)    (None, 256)               0         
_________________________________________________________________
dropout_1 (Dropout)          (None, 256)               0         
_________________________________________________________________
dense_1 (Dense)              (None, 128)               32896     
_________________________________________________________________
activation_3 (Activation)    (None, 128)               0         
_________________________________________________________________
dense_2 (Dense)              (None, 10)                1290      
_________________________________________________________________
output (Activation)          (None, 10)                0         
=================================================================
Total params: 1,219,578
Trainable params: 1,219,578
Non-trainable params: 0
_________________________________________________________________
Starting Inference
WARNING:tensorflow:From c:\users\henry\documents\github\astronn\astroNN\models\base_cnn.py:405: Model.predict_generator (from tensorflow.python.keras.engine.training) is deprecated and will be removed in a future version.
Instructions for updating:
Please use Model.predict, which supports generators.
Completed Inference, 0.38s elapsed






    



c:\users\henry\documents\github\astronn\astroNN\datasets\galaxy10.py:143: UserWarning: Matplotlib is currently using module://ipykernel.pylab.backend_inline, which is a non-GUI backend, so cannot show the figure.
  fig.show()

Galaxy10 Tutorial

Introduction

Authors and Basic Information

This tutorial will be using astroNN

Acknowledgments