```python
import tensorflow as tf
import numpy as np


def get_one_hot(targets, nb_classes):
    # Index into an identity matrix to one-hot encode integer class labels.
    res = np.eye(nb_classes)[np.array(targets).reshape(-1)]
    return res.reshape(list(targets.shape) + [nb_classes])


def load(file):
    # Each row of the SPECT files is: label, then 22 binary features.
    raw_data = np.loadtxt(file, delimiter=',')
    np.random.shuffle(raw_data)
    # Split into [labels (N,1), features (N,22)] along the column axis.
    return np.split(raw_data, [1], axis=1)


train_label, train_data = load('SPECT.train')
train_label = train_label.flatten().astype(int)
train_label = get_one_hot(train_label, 2)

val_label, val_data = load('SPECT.test')
val_label_int = val_label.flatten().astype(int)  # kept as class indices for P/R/F1
val_label = get_one_hot(val_label_int, 2)

# learning params
learning_rate = 0.005
training_epochs = 200
batch_size = 16

# network params
n_hidden_1 = 32
n_hidden_2 = 8
n_input = 22
n_classes = 2

# model
x = tf.placeholder("float", [None, n_input])
y = tf.placeholder("float", [None, n_classes])


def mlp(_X, _weights, _biases):
    # Two sigmoid hidden layers; the output layer returns raw logits,
    # since softmax is applied inside the cross-entropy op below.
    layer1 = tf.nn.sigmoid(tf.add(tf.matmul(_X, _weights['h1']), _biases['b1']))
    layer2 = tf.nn.sigmoid(tf.add(tf.matmul(layer1, _weights['h2']), _biases['b2']))
    return tf.matmul(layer2, _weights['out']) + _biases['out']


weights = {
    'h1': tf.Variable(tf.random_normal([n_input, n_hidden_1])),
    'h2': tf.Variable(tf.random_normal([n_hidden_1, n_hidden_2])),
    'out': tf.Variable(tf.random_normal([n_hidden_2, n_classes]))
}
biases = {
    'b1': tf.Variable(tf.random_normal([n_hidden_1])),
    'b2': tf.Variable(tf.random_normal([n_hidden_2])),
    'out': tf.Variable(tf.random_normal([n_classes]))
}

pred = mlp(x, weights, biases)
cost = tf.reduce_mean(tf.nn.softmax_cross_entropy_with_logits_v2(labels=y, logits=pred))
optimizer = tf.train.AdamOptimizer(learning_rate=learning_rate).minimize(cost)
init = tf.global_variables_initializer()

train_data_batches = np.array_split(train_data, len(train_data) // batch_size)
train_label_batches = np.array_split(train_label, len(train_label) // batch_size)

correct_prediction = tf.equal(tf.argmax(pred, 1), tf.argmax(y, 1))
accuracy = tf.reduce_mean(tf.cast(correct_prediction, "float"))
pred_label = tf.argmax(pred, 1)

with tf.Session() as sess:
    sess.run(init)
    # Training cycle
    for epoch in range(training_epochs):
        for batch_x, batch_y in zip(train_data_batches, train_label_batches):
            sess.run(optimizer, feed_dict={x: batch_x, y: batch_y})

    # Evaluate on the held-out set. Note this assumes at least one positive
    # prediction and one positive label, otherwise P or R divides by zero.
    pl = pred_label.eval({x: val_data})
    TP = sum(pl[i] == 1 and val_label_int[i] == 1 for i in range(len(val_label_int)))
    FP = sum(pl[i] == 1 and val_label_int[i] == 0 for i in range(len(val_label_int)))
    FN = sum(pl[i] == 0 and val_label_int[i] == 1 for i in range(len(val_label_int)))
    P = TP / (TP + FP)
    R = TP / (TP + FN)
    print("Train Accuracy:", accuracy.eval({x: train_data, y: train_label}))
    print("Val Accuracy:", accuracy.eval({x: val_data, y: val_label}))
    print("F1:", 2 * P * R / (P + R))
```
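This script uses the TensorFlow 1.x graph API (`tf.placeholder`, `tf.Session`, `tf.random_normal`, `tf.train.AdamOptimizer`), which is no longer exposed in the default namespace of TensorFlow 2.x. A minimal sketch of how to run it unchanged on a 2.x install, assuming you use the bundled v1 compatibility module rather than porting the code:

```python
# Replace the plain `import tensorflow as tf` at the top with:
import tensorflow.compat.v1 as tf

tf.disable_v2_behavior()  # restore graph mode, placeholders, and sessions
```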
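The hand-rolled precision/recall raises `ZeroDivisionError` whenever the model predicts no positives (TP + FP == 0). If scikit-learn is available (an assumption; the original script does not use it), the same metrics can be computed more defensively from `pl` and `val_label_int`:

```python
# Alternative metric computation using scikit-learn; `pl` and `val_label_int`
# are the predicted and true class indices from the script above.
from sklearn.metrics import precision_recall_fscore_support

P, R, F1, _ = precision_recall_fscore_support(
    val_label_int, pl, average='binary', zero_division=0)
print("F1:", F1)
```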