Binary Classification with TensorFlow

tensorflow

Binary Classification for Simple Data

import tensorflow as tf
import matplotlib.pyplot as plt

# Logistic-regression demo (TensorFlow 1.x graph API): fit a single sigmoid
# unit to six hand-written 2-D points, print the per-sample hypothesis and
# prediction plus the training accuracy, then plot the cost per step.

# Simple input data, 6 x 2 (six samples, two features each)
x_data = [[1, 2], [2, 3], [3, 1], [4, 3], [5, 3], [6, 2]]
# Answer (binary labels), 6 x 1
y_data = [[0], [0], [0], [1], [1], [1]]

# Number of gradient-descent steps. Defined once so the training loop and the
# x-axis of the cost plot can never get out of sync.
num_steps = 10001

# Placeholders for tensors that are always fed through feed_dict.
X = tf.placeholder(tf.float32, shape=[None, 2])
Y = tf.placeholder(tf.float32, shape=[None, 1])
# Weight, 2 x 1
W = tf.Variable(tf.random_normal([2, 1]), name='weight')
# Bias, 1
b = tf.Variable(tf.random_normal([1]), name='bias')

# Linear score that is fed to the sigmoid.
logits = tf.matmul(X, W) + b
# Hypothesis using sigmoid: 1 / (1 + exp(-(XW + b)))
hypothesis = tf.sigmoid(logits)

# Cost function: mean binary cross-entropy,
#   -mean(Y * log(h) + (1 - Y) * log(1 - h)).
# It is computed from the logits rather than from `hypothesis` because the
# literal formula evaluates log(0) once the sigmoid saturates to exactly 0 or
# 1 in float32, which turns the cost (and the gradients) into NaN/inf.
cost = tf.reduce_mean(
    tf.nn.sigmoid_cross_entropy_with_logits(labels=Y, logits=logits))
# Gradient descent optimizer
train = tf.train.GradientDescentOptimizer(learning_rate=0.01).minimize(cost)

# Output function: 1.0 if hypothesis > 0.5 else 0.0
predicted = tf.cast(hypothesis > 0.5, dtype=tf.float32)
# Accuracy computation: fraction of predictions equal to the labels
accuracy = tf.reduce_mean(tf.cast(tf.equal(predicted, Y), dtype=tf.float32))

trials = list(range(num_steps))
costs = []
feed = {X: x_data, Y: y_data}
# Launch graph
with tf.Session() as sess:
    # Initialize TensorFlow variables
    sess.run(tf.global_variables_initializer())

    for _ in trials:
        # One training step; keep the cost for the plot below.
        cost_val, _ = sess.run([cost, train], feed_dict=feed)
        costs.append(cost_val)

    # Accuracy check on the same data the model was trained on
    h, p, a = sess.run([hypothesis, predicted, accuracy], feed_dict=feed)

print("Hypothesis, Prediction")
for h_i, p_i in zip(h, p):
    print("{0} {1}".format(h_i, p_i))
print("Accuracy: {0}".format(a))

# Plot after the session is closed: plt.show() blocks until the window is
# dismissed and nothing here needs the session any more.
plt.plot(trials, costs)
plt.title("Costs")
plt.xlabel("trial")
plt.ylabel("costs")
plt.grid()
plt.show()

Hypothesis, Prediction
[ 0.041998] [ 0.]
[ 0.17176442] [ 0.]
[ 0.35488054] [ 0.]
[ 0.75937283] [ 1.]
[ 0.92487144] [ 1.]
[ 0.97536916] [ 1.]
Accuracy: 1.0

Image 1. Binary classification for simple data

Classifying diabetes

Data for diabetes
Each X_n is an input feature (a risk factor) for diabetes.
Y is the label: Y = 1 means the patient has diabetes, and Y = 0 means the patient does not.

Image 2. Input & output for diabetes

import numpy as np
import tensorflow as tf
import matplotlib.pyplot as plt

# Logistic-regression demo (TensorFlow 1.x graph API): fit a single sigmoid
# unit to the diabetes CSV, print the training accuracy, then plot the cost
# per step.

# Load data from file
xy = np.loadtxt("data-03-diabetes.csv", delimiter=",", dtype=np.float32)
# Input, all rows and every column except the last
x_data = xy[:, :-1]
# Answer, all rows and last column (kept 2-D, n x 1, by indexing with a list)
y_data = xy[:, [-1]]

# Derive the feature count from the file instead of hard-coding it, so the
# placeholder and weight shapes always agree with the loaded data.
n_features = x_data.shape[1]

# Placeholders for tensors that are always fed through feed_dict.
X = tf.placeholder(tf.float32, shape=[None, n_features])
Y = tf.placeholder(tf.float32, shape=[None, 1])
# Weight, n_features x 1
W = tf.Variable(tf.random_normal([n_features, 1]), name='weight')
# Bias, 1
b = tf.Variable(tf.random_normal([1]), name='bias')

# Linear score that is fed to the sigmoid.
logits = tf.matmul(X, W) + b
# Hypothesis using sigmoid: 1 / (1 + exp(-(XW + b)))
hypothesis = tf.sigmoid(logits)

# Cost function: mean binary cross-entropy,
#   -mean(Y * log(h) + (1 - Y) * log(1 - h)).
# It is computed from the logits rather than from `hypothesis` because the
# literal formula evaluates log(0) once the sigmoid saturates to exactly 0 or
# 1 in float32, which turns the cost (and the gradients) into NaN/inf.
cost = tf.reduce_mean(
    tf.nn.sigmoid_cross_entropy_with_logits(labels=Y, logits=logits))
# Gradient descent optimizer
train = tf.train.GradientDescentOptimizer(learning_rate=0.01).minimize(cost)

# Output function: 1.0 if hypothesis > 0.5 else 0.0
predicted = tf.cast(hypothesis > 0.5, dtype=tf.float32)
# Accuracy computation: fraction of predictions equal to the labels
accuracy = tf.reduce_mean(tf.cast(tf.equal(predicted, Y), dtype=tf.float32))

# Number of gradient-descent steps; also the length of the plot's x-axis.
max_trials = 20001
trials = list(range(max_trials))
costs = []
feed = {X: x_data, Y: y_data}
# Launch graph
with tf.Session() as sess:
    # Initialize TensorFlow variables
    sess.run(tf.global_variables_initializer())

    for _ in trials:
        # One training step; keep the cost for the plot below.
        cost_val, _ = sess.run([cost, train], feed_dict=feed)
        costs.append(cost_val)

    # Accuracy check on the same data the model was trained on. Only the
    # accuracy is fetched because nothing else is reported for this dataset.
    a = sess.run(accuracy, feed_dict=feed)

print("Accuracy: {0}".format(a))

# Plot after the session is closed: plt.show() blocks until the window is
# dismissed and nothing here needs the session any more.
plt.plot(trials, costs)
plt.title("Costs")
plt.xlabel("trial")
plt.ylabel("costs")
plt.grid()
plt.show()

Accuracy: 0.7694334387779236

Image 3. Binary classification for diabetes

Universe In Computer

Header$type=social_icons

$type=grid$count=3$meta=0$sn=0$rm=0

11. Binary Classification with TensorFlow

TOC

Binary Classification for Simple Data

Classifying diabetes

라벨:

COMMENTS

Labels

RECENT$type=list-tab$date=0$au=0$c=5

REPLIES$type=list-tab$com=0$c=4$src=recent-comments

RANDOM$type=list-tab$date=0$au=0$c=5$src=random-posts

$type=grid$count=3$meta=0$sn=0$rm=0

11. Binary Classification with TensorFlow

TOC

Binary Classification for Simple Data

Classifying diabetes

라벨:

SHARE:

COMMENTS

Labels

RECENT$type=list-tab$date=0$au=0$c=5

REPLIES$type=list-tab$com=0$c=4$src=recent-comments

RANDOM$type=list-tab$date=0$au=0$c=5$src=random-posts