|
12 | 12 | "sys.path.append(\"../../../\")\n",
|
13 | 13 | "from Util.Util import DataUtil\n",
|
14 | 14 | "\n",
|
15 |
| - "(x_train, y_train), (x_test, y_test) = DataUtil.gen_noisy_linear()" |
| 15 | + "(x_train, y_train), (x_test, y_test) = DataUtil.gen_noisy_linear()\n", |
| 16 | + "idx = [True] * 100 + [False]\n", |
| 17 | + "features_lists = [set() for _ in range(100)] + [{0, 1}]" |
16 | 18 | ]
|
17 | 19 | },
|
18 | 20 | {
|
|
27 | 29 | "name": "stdout",
|
28 | 30 | "output_type": "stream",
|
29 | 31 | "text": [
|
30 |
| - "Shuffling data...\n", |
31 |
| - "Generating data info...\n", |
32 |
| - "Transforming data...\n", |
33 | 32 | "============================================================\n",
|
34 | 33 | "Decision tree performance\n",
|
35 | 34 | "------------------------------------------------------------\n",
|
|
41 | 40 | "------------------------------------------------------------\n",
|
42 | 41 | "Data : 10000 training samples, 1500 test samples\n",
|
43 | 42 | "Features : 0 categorical, 100 numerical\n",
|
44 |
| - "-> No pre-processing methods were applied\n", |
45 | 43 | "============================================================\n",
|
46 | 44 | "Deep model input: Continuous features only\n",
|
47 | 45 | "------------------------------------------------------------\n",
|
|
55 | 53 | "------------------------------------------------------------\n",
|
56 | 54 | "Activation : ['step', 'one_hot']\n",
|
57 | 55 | "Batch size : 128\n",
|
58 |
| - "Epoch num : 20\n", |
| 56 | + "Epoch num : 5\n", |
59 | 57 | "Optimizer : Adam\n",
|
60 | 58 | "Metric : acc\n",
|
61 | 59 | "Loss : cross_entropy\n",
|
62 | 60 | "lr : 0.001\n",
|
63 | 61 | "lb : 0.0\n",
|
64 | 62 | "------------------------------------------------------------\n",
|
65 |
| - "Noises : None\n", |
66 |
| - "------------------------------------------------------------\n", |
67 | 63 | "============================================================\n",
|
68 | 64 | "Initial performance\n",
|
69 | 65 | "------------------------------------------------------------\n",
|
70 | 66 | "Train acc: 1.0\n",
|
71 | 67 | "Test acc: 0.815333\n",
|
72 | 68 | "------------------------------------------------------------\n",
|
73 | 69 | "\n",
|
74 |
| - "## # Main # Progress bar initialized ##" |
75 |
| - ] |
76 |
| - }, |
77 |
| - { |
78 |
| - "name": "stderr", |
79 |
| - "output_type": "stream", |
80 |
| - "text": [ |
81 |
| - "../../../_Dist/NeuralNetworks/c_NeuralNetwork/NNCore.py:1015: UserWarning: Early stopped at n_epoch=1 due to 'Over-fitting'\n", |
82 |
| - " warnings.warn(warn_msg)\n" |
83 |
| - ] |
84 |
| - }, |
85 |
| - { |
86 |
| - "name": "stdout", |
87 |
| - "output_type": "stream", |
88 |
| - "text": [ |
89 |
| - "## # Main # (20 : 0 -> 1) Task Finished. Time Cost: 0 h 0 min 9.004 s; Average: 0 h 0 min 9.004 s ##\n", |
90 |
| - "============================================================\n", |
91 |
| - "History score summary of NoisyLinear (test) - snapshot 0\n", |
92 |
| - "------------------------------------------------------------\n", |
93 |
| - "Mean : Train - 0.9318; Test - 0.7562\n", |
94 |
| - "Std : Train - 0.0685; Test - 0.5302\n", |
95 |
| - "------------------------------------------------------------\n", |
96 |
| - "============================================================\n", |
97 |
| - "Model performance on test set\n", |
98 |
| - "------------------------------------------------------------\n", |
99 |
| - "acc: 0.686667\n", |
100 |
| - "------------------------------------------------------------\n", |
101 |
| - "Shuffling data...\n", |
102 |
| - "Generating data info...\n", |
103 |
| - "Transforming data...\n", |
| 70 | + "## # Main # (5 : 0 -> 5) Task Finished. Time Cost: 0 h 0 min 29.29 s; Average: 0 h 0 min 5.857 s ##\n", |
| 71 | + "Test acc: 0.724\n", |
104 | 72 | "============================================================\n",
|
105 | 73 | "Decision tree performance\n",
|
106 | 74 | "------------------------------------------------------------\n",
|
107 | 75 | "Train : 1.0\n",
|
108 |
| - "Test : 0.814666666667\n", |
| 76 | + "Test : 0.811333333333\n", |
109 | 77 | "------------------------------------------------------------\n",
|
110 | 78 | "============================================================\n",
|
111 | 79 | "This is a 2-classes problem\n",
|
112 | 80 | "------------------------------------------------------------\n",
|
113 | 81 | "Data : 10000 training samples, 1500 test samples\n",
|
114 | 82 | "Features : 0 categorical, 100 numerical\n",
|
115 |
| - "-> No pre-processing methods were applied\n", |
116 | 83 | "============================================================\n",
|
117 | 84 | "Deep model input: Continuous features only\n",
|
118 | 85 | "------------------------------------------------------------\n",
|
119 | 86 | "Using raw values in categorical columns without embedding\n",
|
120 | 87 | "------------------------------------------------------------\n",
|
121 | 88 | "Using dropout with keep_prob = 0.5\n",
|
122 | 89 | "Training without batch norm\n",
|
123 |
| - "Hidden units: [862, 863]\n", |
| 90 | + "Hidden units: [860, 861]\n", |
124 | 91 | "============================================================\n",
|
125 | 92 | "Hyper parameters\n",
|
126 | 93 | "------------------------------------------------------------\n",
|
127 | 94 | "Activation : ['step', 'softmax']\n",
|
128 | 95 | "Batch size : 128\n",
|
129 |
| - "Epoch num : 20\n", |
| 96 | + "Epoch num : 5\n", |
130 | 97 | "Optimizer : Adam\n",
|
131 | 98 | "Metric : acc\n",
|
132 | 99 | "Loss : cross_entropy\n",
|
133 | 100 | "lr : 0.001\n",
|
134 | 101 | "lb : 0.0\n",
|
135 | 102 | "------------------------------------------------------------\n",
|
136 |
| - "Noises : None\n", |
137 |
| - "------------------------------------------------------------\n", |
138 | 103 | "============================================================\n",
|
139 | 104 | "Initial performance\n",
|
140 | 105 | "------------------------------------------------------------\n",
|
141 | 106 | "Train acc: 1.0\n",
|
142 |
| - "Test acc: 0.814667\n", |
| 107 | + "Test acc: 0.811333\n", |
143 | 108 | "------------------------------------------------------------\n",
|
144 | 109 | "\n",
|
145 |
| - "## # Main # [--- ] : 2 / 20 ## Time Cost: 0 h 0 min 16.72 s; Average: 0 h 0 min 8.362 s " |
146 |
| - ] |
147 |
| - }, |
148 |
| - { |
149 |
| - "name": "stderr", |
150 |
| - "output_type": "stream", |
151 |
| - "text": [ |
152 |
| - "../../../_Dist/NeuralNetworks/c_NeuralNetwork/NNCore.py:1015: UserWarning: Early stopped at n_epoch=3 due to 'Over-fitting'\n", |
153 |
| - " warnings.warn(warn_msg)\n" |
154 |
| - ] |
155 |
| - }, |
156 |
| - { |
157 |
| - "name": "stdout", |
158 |
| - "output_type": "stream", |
159 |
| - "text": [ |
160 |
| - "## # Main # (20 : 0 -> 2) Task Finished. Time Cost: 0 h 0 min 18.39 s; Average: 0 h 0 min 9.196 s ##\n", |
161 |
| - "============================================================\n", |
162 |
| - "History score summary of NoisyLinear (test) - snapshot 0\n", |
163 |
| - "------------------------------------------------------------\n", |
164 |
| - "Mean : Train - 0.8101; Test - 0.8433\n", |
165 |
| - "Std : Train - 0.0128; Test - 0.2110\n", |
166 |
| - "------------------------------------------------------------\n", |
167 |
| - "============================================================\n", |
168 |
| - "Model performance on test set\n", |
169 |
| - "------------------------------------------------------------\n", |
170 |
| - "acc: 0.810667\n", |
171 |
| - "------------------------------------------------------------\n", |
172 |
| - "Shuffling data...\n", |
173 |
| - "Generating data info...\n", |
174 |
| - "Transforming data...\n", |
| 110 | + "## # Main # (5 : 0 -> 5) Task Finished. Time Cost: 0 h 0 min 25.96 s; Average: 0 h 0 min 5.192 s ##\n", |
| 111 | + "Test acc: 0.887333\n", |
175 | 112 | "============================================================\n",
|
176 | 113 | "Decision tree performance\n",
|
177 | 114 | "------------------------------------------------------------\n",
|
|
183 | 120 | "------------------------------------------------------------\n",
|
184 | 121 | "Data : 10000 training samples, 1500 test samples\n",
|
185 | 122 | "Features : 0 categorical, 100 numerical\n",
|
186 |
| - "-> No pre-processing methods were applied\n", |
187 | 123 | "============================================================\n",
|
188 | 124 | "Deep model input: Continuous features only\n",
|
189 | 125 | "------------------------------------------------------------\n",
|
190 | 126 | "Using raw values in categorical columns without embedding\n",
|
191 | 127 | "------------------------------------------------------------\n",
|
192 | 128 | "Using dropout with keep_prob = 0.5\n",
|
193 | 129 | "Training without batch norm\n",
|
194 |
| - "Hidden units: [873, 874]\n", |
| 130 | + "Hidden units: [867, 868]\n", |
195 | 131 | "============================================================\n",
|
196 | 132 | "Hyper parameters\n",
|
197 | 133 | "------------------------------------------------------------\n",
|
198 | 134 | "Activation : ['tanh', 'softmax']\n",
|
199 | 135 | "Batch size : 128\n",
|
200 |
| - "Epoch num : 20\n", |
| 136 | + "Epoch num : 5\n", |
201 | 137 | "Optimizer : Adam\n",
|
202 | 138 | "Metric : acc\n",
|
203 | 139 | "Loss : cross_entropy\n",
|
204 | 140 | "lr : 0.001\n",
|
205 | 141 | "lb : 0.0\n",
|
206 | 142 | "------------------------------------------------------------\n",
|
207 |
| - "Noises : None\n", |
208 |
| - "------------------------------------------------------------\n", |
209 | 143 | "============================================================\n",
|
210 | 144 | "Initial performance\n",
|
211 | 145 | "------------------------------------------------------------\n",
|
212 |
| - "Train acc: 0.787\n", |
213 |
| - "Test acc: 0.820667\n", |
| 146 | + "Train acc: 0.8104\n", |
| 147 | + "Test acc: 0.855333\n", |
214 | 148 | "------------------------------------------------------------\n",
|
215 | 149 | "\n",
|
216 |
| - "## # Main # (20 : 0 -> 1) Task Finished. Time Cost: 0 h 0 min 7.939 s; Average: 0 h 0 min 7.939 s ##\n", |
217 |
| - "============================================================\n", |
218 |
| - "History score summary of NoisyLinear (test) - snapshot 0\n", |
219 |
| - "------------------------------------------------------------\n", |
220 |
| - "Mean : Train - 0.7920; Test - 0.8280\n", |
221 |
| - "Std : Train - 0.0113; Test - 0.2904\n", |
222 |
| - "------------------------------------------------------------\n", |
223 |
| - "============================================================\n", |
224 |
| - "Model performance on test set\n", |
225 |
| - "------------------------------------------------------------\n", |
226 |
| - "acc: 0.796667\n", |
227 |
| - "------------------------------------------------------------\n" |
| 150 | + "## # Main # (5 : 0 -> 5) Task Finished. Time Cost: 0 h 0 min 29.02 s; Average: 0 h 0 min 5.804 s ##\n", |
| 151 | + "Test acc: 0.95\n" |
228 | 152 | ]
|
229 | 153 | }
|
230 | 154 | ],
|
231 | 155 | "source": [
|
232 | 156 | "from Toolbox import DT2NNWrapper\n",
|
233 | 157 | "\n",
|
234 | 158 | "nn = DT2NNWrapper(\n",
|
235 |
| - " \"NoisyLinear\",\n", |
236 |
| - " model_param_settings={\"activations\": [\"step\", \"one_hot\"]},\n", |
| 159 | + " \"NoisyLinear\", idx, features_lists,\n", |
| 160 | + " model_param_settings={\n", |
| 161 | + " \"activations\": [\"step\", \"one_hot\"],\n", |
| 162 | + " \"n_epoch\": 5\n", |
| 163 | + " },\n", |
237 | 164 | " verbose_settings={\"metric\": \"acc\"}\n",
|
238 | 165 | ").fit(x_train, y_train, x_test, y_test)\n",
|
239 | 166 | "\n",
|
240 | 167 | "nn = DT2NNWrapper(\n",
|
241 |
| - " \"NoisyLinear\",\n", |
242 |
| - " model_param_settings={\"activations\": [\"step\", \"softmax\"]},\n", |
| 168 | + " \"NoisyLinear\", idx, features_lists,\n", |
| 169 | + " model_param_settings={\n", |
| 170 | + " \"activations\": [\"step\", \"softmax\"],\n", |
| 171 | + " \"n_epoch\": 5\n", |
| 172 | + " },\n", |
243 | 173 | " verbose_settings={\"metric\": \"acc\"}\n",
|
244 | 174 | ").fit(x_train, y_train, x_test, y_test)\n",
|
245 | 175 | "\n",
|
246 | 176 | "nn = DT2NNWrapper(\n",
|
247 |
| - " \"NoisyLinear\",\n", |
248 |
| - " model_param_settings={\"activations\": [\"tanh\", \"softmax\"]},\n", |
| 177 | + " \"NoisyLinear\", idx, features_lists,\n", |
| 178 | + " model_param_settings={\n", |
| 179 | + " \"activations\": [\"tanh\", \"softmax\"],\n", |
| 180 | + " \"n_epoch\": 5\n", |
| 181 | + " },\n", |
249 | 182 | " verbose_settings={\"metric\": \"acc\"}\n",
|
250 | 183 | ").fit(x_train, y_train, x_test, y_test)"
|
251 | 184 | ]
|
|
272 | 205 | }
|
273 | 206 | },
|
274 | 207 | "nbformat": 4,
|
275 |
| - "nbformat_minor": 1 |
| 208 | + "nbformat_minor": 0 |
276 | 209 | }
|
0 commit comments