Skip to content

Commit 1252ebc

Browse files
committed
lot of stuff
1 parent b1a8ef8 commit 1252ebc

20 files changed

+534520
-52
lines changed

Diff for: features.txt

+57
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,57 @@
1+
word_freq_make: continuous.
2+
word_freq_address: continuous.
3+
word_freq_all: continuous.
4+
word_freq_3d: continuous.
5+
word_freq_our: continuous.
6+
word_freq_over: continuous.
7+
word_freq_remove: continuous.
8+
word_freq_internet: continuous.
9+
word_freq_order: continuous.
10+
word_freq_mail: continuous.
11+
word_freq_receive: continuous.
12+
word_freq_will: continuous.
13+
word_freq_people: continuous.
14+
word_freq_report: continuous.
15+
word_freq_addresses: continuous.
16+
word_freq_free: continuous.
17+
word_freq_business: continuous.
18+
word_freq_email: continuous.
19+
word_freq_you: continuous.
20+
word_freq_credit: continuous.
21+
word_freq_your: continuous.
22+
word_freq_font: continuous.
23+
word_freq_000: continuous.
24+
word_freq_money: continuous.
25+
word_freq_hp: continuous.
26+
word_freq_hpl: continuous.
27+
word_freq_george: continuous.
28+
word_freq_650: continuous.
29+
word_freq_lab: continuous.
30+
word_freq_labs: continuous.
31+
word_freq_telnet: continuous.
32+
word_freq_857: continuous.
33+
word_freq_data: continuous.
34+
word_freq_415: continuous.
35+
word_freq_85: continuous.
36+
word_freq_technology: continuous.
37+
word_freq_1999: continuous.
38+
word_freq_parts: continuous.
39+
word_freq_pm: continuous.
40+
word_freq_direct: continuous.
41+
word_freq_cs: continuous.
42+
word_freq_meeting: continuous.
43+
word_freq_original: continuous.
44+
word_freq_project: continuous.
45+
word_freq_re: continuous.
46+
word_freq_edu: continuous.
47+
word_freq_table: continuous.
48+
word_freq_conference: continuous.
49+
char_freq_;: continuous.
50+
char_freq_(: continuous.
51+
char_freq_[: continuous.
52+
char_freq_!: continuous.
53+
char_freq_$: continuous.
54+
char_freq_#: continuous.
55+
capital_run_length_average: continuous.
56+
capital_run_length_longest: continuous.
57+
capital_run_length_total: continuous.

Diff for: get_data.py

+50
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,50 @@
# Script to read in the comma-separated spambase training file and pickle it
# as two lists: one of per-example attribute vectors and one of labels.

import pickle
import csv
import svmlight_loader  # NOTE(review): not referenced below; kept as in the original

filename = 'spambase.train'

# There are 58 columns in the data...
# 57 are attributes
#   48 are frequency of a word
#   6 are frequency of a punctuation mark
#   3 are data on sequences of characters
# Last is label
num_attributes = 57

# Read every record. csv.reader yields an empty list for a blank line, so
# those are dropped here; otherwise the label lookup below would raise
# IndexError on, e.g., a trailing empty line.
with open(filename, 'r') as f:
    data = [row for row in csv.reader(f, delimiter=',') if row]

# Split each record into its leading attribute columns and the label column,
# converting the strings to numbers as we go.
attributes = [[float(value) for value in example[:num_attributes]]
              for example in data]
labels = [float(example[num_attributes]) for example in data]

# Quick sanity check of the first parsed example (form valid on Python 2 and 3).
print(attributes[0])

# Pickle streams are bytes, so the outputs are opened in binary mode; text
# mode can corrupt the data on Windows and fails outright on Python 3.
# The with-blocks close the files even if dumping raises.
with open('train_data.pickle', 'wb') as attr_out:
    pickle.dump(attributes, attr_out)

with open('train_label.pickle', 'wb') as label_out:
    pickle.dump(labels, label_out)

Diff for: get_data_reduced.py

+51
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,51 @@
# Script to read in the comma-separated spambase test file and pickle it as
# two lists: one of reduced per-example attribute vectors (only the leading
# columns are kept) and one of labels.

import pickle
import csv
import svmlight_loader  # NOTE(review): not referenced below; kept as in the original

filename = 'spambase.test'

# There are 58 columns in the data...
# 57 are attributes
#   48 are frequency of a word
#   6 are frequency of a punctuation mark
#   3 are data on sequences of characters
# Last is label
num_attributes = 57

# Only the first 54 attribute columns are kept in the reduced data set.
# Going by the layout above that is the 48 word + 6 punctuation frequencies,
# i.e. the 3 character-sequence columns are dropped -- TODO confirm the
# column order against the data file.
num_kept_attributes = 54

# Read every record. csv.reader yields an empty list for a blank line, so
# those are dropped here; otherwise the label lookup below would raise
# IndexError on, e.g., a trailing empty line.
with open(filename, 'r') as f:
    data = [row for row in csv.reader(f, delimiter=',') if row]

# Keep the leading attribute columns and the label column (which still sits
# at index num_attributes in the full row), converting strings to numbers.
attributes = [[float(value) for value in example[:num_kept_attributes]]
              for example in data]
labels = [float(example[num_attributes]) for example in data]

# Quick sanity check of the first parsed example (form valid on Python 2 and 3).
print(attributes[0])

# Pickle streams are bytes, so the outputs are opened in binary mode; text
# mode can corrupt the data on Windows and fails outright on Python 3.
# The with-blocks close the files even if dumping raises.
with open('test_data_reduced.pickle', 'wb') as attr_out:
    pickle.dump(attributes, attr_out)

with open('test_label.pickle', 'wb') as label_out:
    pickle.dump(labels, label_out)

Diff for: neural_network_1_hidden.py

+13-13
Original file line numberDiff line numberDiff line change
@@ -12,7 +12,7 @@ def sigmoid(x):
1212
def sigmoid_derivative(x):
1313
return sigmoid(x) * (1 - sigmoid(x))
1414

15-
class NeuralNetwork:
15+
class NeuralNetwork_1HL:
1616

1717
def __init__(self, num_inputs, num_hidden_neurons, num_outputs):
1818
self.num_inputs = num_inputs
@@ -81,17 +81,17 @@ def get_output(self, inputs):
8181
return self.feed_forward(inputs)[1][1]
8282

8383
# main program ##########################################################################
84-
xor_net = NeuralNetwork(2, 3, 1)
85-
a = np.array([1.,1.])
86-
b = np.array([1.,0.])
87-
c = np.array([0.,1.])
88-
d = np.array([0.,0.])
89-
examples = [a, b, c, d]
90-
labels = [np.array([0.]), np.array([1.]), np.array([1.]), np.array([0.])]
84+
# xor_net = NeuralNetwork_1HL(2, 3, 1)
85+
# a = np.array([1.,1.])
86+
# b = np.array([1.,0.])
87+
# c = np.array([0.,1.])
88+
# d = np.array([0.,0.])
89+
# examples = [a, b, c, d]
90+
# labels = [np.array([0.]), np.array([1.]), np.array([1.]), np.array([0.])]
9191

92-
xor_net.train_network(4, examples, labels, 5000, 0.3)
92+
# xor_net.train_network(4, examples, labels, 5000, 0.3)
9393

94-
print xor_net.get_output(a)
95-
print xor_net.get_output(b)
96-
print xor_net.get_output(c)
97-
print xor_net.get_output(d)
94+
# print xor_net.get_output(a)
95+
# print xor_net.get_output(b)
96+
# print xor_net.get_output(c)
97+
# print xor_net.get_output(d)

Diff for: neural_network_2_hidden.py

+13-13
Original file line numberDiff line numberDiff line change
@@ -11,7 +11,7 @@ def sigmoid(x):
1111
def sigmoid_derivative(x):
1212
return sigmoid(x) * (1 - sigmoid(x))
1313

14-
class NeuralNetwork:
14+
class NeuralNetwork_2HL:
1515

1616
def __init__(self, num_inputs, num_hidden_first, num_hidden_second, num_outputs):
1717
self.num_inputs = num_inputs
@@ -98,17 +98,17 @@ def get_output(self, inputs):
9898
return self.feed_forward(inputs)[1][2]
9999

100100
# main program ##########################################################################
101-
xor_net = NeuralNetwork(2, 3, 3, 1)
102-
a = np.array([1.,1.])
103-
b = np.array([1.,0.])
104-
c = np.array([0.,1.])
105-
d = np.array([0.,0.])
106-
examples = [a, b, c, d]
107-
labels = [np.array([0.]), np.array([1.]), np.array([1.]), np.array([0.])]
101+
# xor_net = NeuralNetwork_2HL(2, 3, 3, 1)
102+
# a = np.array([1.,1.])
103+
# b = np.array([1.,0.])
104+
# c = np.array([0.,1.])
105+
# d = np.array([0.,0.])
106+
# examples = [a, b, c, d]
107+
# labels = [np.array([0.]), np.array([1.]), np.array([1.]), np.array([0.])]
108108

109-
xor_net.train_network(4, examples, labels, 5000, 0.3)
109+
# xor_net.train_network(4, examples, labels, 5000, 0.3)
110110

111-
print xor_net.get_output(a)
112-
print xor_net.get_output(b)
113-
print xor_net.get_output(c)
114-
print xor_net.get_output(d)
111+
# print xor_net.get_output(a)
112+
# print xor_net.get_output(b)
113+
# print xor_net.get_output(c)
114+
# print xor_net.get_output(d)

0 commit comments

Comments
 (0)