Upload P2 - Secom Notebook - Mercury.ipynb
Browse files
P2 - Secom Notebook - Mercury.ipynb
CHANGED
@@ -26,7 +26,7 @@
|
|
26 |
},
|
27 |
{
|
28 |
"cell_type": "code",
|
29 |
-
"execution_count":
|
30 |
"metadata": {
|
31 |
"slideshow": {
|
32 |
"slide_type": "skip"
|
@@ -53,7 +53,7 @@
|
|
53 |
},
|
54 |
{
|
55 |
"cell_type": "code",
|
56 |
-
"execution_count":
|
57 |
"metadata": {
|
58 |
"slideshow": {
|
59 |
"slide_type": "skip"
|
@@ -64,7 +64,7 @@
|
|
64 |
"data": {
|
65 |
"application/mercury+json": {
|
66 |
"allow_download": true,
|
67 |
-
"code_uid": "App.0.40.24.1-
|
68 |
"continuous_update": false,
|
69 |
"description": "Recumpute everything dynamically",
|
70 |
"full_screen": true,
|
@@ -96,7 +96,7 @@
|
|
96 |
},
|
97 |
{
|
98 |
"cell_type": "code",
|
99 |
-
"execution_count":
|
100 |
"metadata": {
|
101 |
"slideshow": {
|
102 |
"slide_type": "skip"
|
@@ -138,7 +138,7 @@
|
|
138 |
},
|
139 |
{
|
140 |
"cell_type": "code",
|
141 |
-
"execution_count":
|
142 |
"metadata": {
|
143 |
"slideshow": {
|
144 |
"slide_type": "skip"
|
@@ -195,7 +195,7 @@
|
|
195 |
},
|
196 |
{
|
197 |
"cell_type": "code",
|
198 |
-
"execution_count":
|
199 |
"metadata": {
|
200 |
"slideshow": {
|
201 |
"slide_type": "skip"
|
@@ -290,7 +290,7 @@
|
|
290 |
},
|
291 |
{
|
292 |
"cell_type": "code",
|
293 |
-
"execution_count":
|
294 |
"metadata": {
|
295 |
"slideshow": {
|
296 |
"slide_type": "skip"
|
@@ -341,7 +341,7 @@
|
|
341 |
},
|
342 |
{
|
343 |
"cell_type": "code",
|
344 |
-
"execution_count":
|
345 |
"metadata": {
|
346 |
"slideshow": {
|
347 |
"slide_type": "skip"
|
@@ -419,7 +419,7 @@
|
|
419 |
},
|
420 |
{
|
421 |
"cell_type": "code",
|
422 |
-
"execution_count":
|
423 |
"metadata": {
|
424 |
"slideshow": {
|
425 |
"slide_type": "skip"
|
@@ -499,7 +499,7 @@
|
|
499 |
},
|
500 |
{
|
501 |
"cell_type": "code",
|
502 |
-
"execution_count":
|
503 |
"metadata": {
|
504 |
"slideshow": {
|
505 |
"slide_type": "skip"
|
@@ -585,7 +585,7 @@
|
|
585 |
},
|
586 |
{
|
587 |
"cell_type": "code",
|
588 |
-
"execution_count":
|
589 |
"metadata": {
|
590 |
"slideshow": {
|
591 |
"slide_type": "skip"
|
@@ -648,7 +648,7 @@
|
|
648 |
},
|
649 |
{
|
650 |
"cell_type": "code",
|
651 |
-
"execution_count":
|
652 |
"metadata": {
|
653 |
"slideshow": {
|
654 |
"slide_type": "skip"
|
@@ -737,7 +737,7 @@
|
|
737 |
},
|
738 |
{
|
739 |
"cell_type": "code",
|
740 |
-
"execution_count":
|
741 |
"metadata": {
|
742 |
"slideshow": {
|
743 |
"slide_type": "skip"
|
@@ -818,7 +818,7 @@
|
|
818 |
},
|
819 |
{
|
820 |
"cell_type": "code",
|
821 |
-
"execution_count":
|
822 |
"metadata": {
|
823 |
"slideshow": {
|
824 |
"slide_type": "skip"
|
@@ -832,17 +832,17 @@
|
|
832 |
"yes",
|
833 |
"no"
|
834 |
],
|
835 |
-
"code_uid": "Select.0.40.16.25-
|
836 |
"disabled": false,
|
837 |
"hidden": false,
|
838 |
"label": "Drop Duplicates",
|
839 |
-
"model_id": "
|
840 |
"url_key": "",
|
841 |
"value": "yes",
|
842 |
"widget": "Select"
|
843 |
},
|
844 |
"application/vnd.jupyter.widget-view+json": {
|
845 |
-
"model_id": "
|
846 |
"version_major": 2,
|
847 |
"version_minor": 0
|
848 |
},
|
@@ -856,18 +856,18 @@
|
|
856 |
{
|
857 |
"data": {
|
858 |
"application/mercury+json": {
|
859 |
-
"code_uid": "Text.0.40.15.28-
|
860 |
"disabled": false,
|
861 |
"hidden": false,
|
862 |
"label": "Missing Value Threeshold",
|
863 |
-
"model_id": "
|
864 |
"rows": 1,
|
865 |
"url_key": "",
|
866 |
"value": "80",
|
867 |
"widget": "Text"
|
868 |
},
|
869 |
"application/vnd.jupyter.widget-view+json": {
|
870 |
-
"model_id": "
|
871 |
"version_major": 2,
|
872 |
"version_minor": 0
|
873 |
},
|
@@ -881,18 +881,18 @@
|
|
881 |
{
|
882 |
"data": {
|
883 |
"application/mercury+json": {
|
884 |
-
"code_uid": "Text.0.40.15.31-
|
885 |
"disabled": false,
|
886 |
"hidden": false,
|
887 |
"label": "Variance Threshold",
|
888 |
-
"model_id": "
|
889 |
"rows": 1,
|
890 |
"url_key": "",
|
891 |
"value": "0",
|
892 |
"widget": "Text"
|
893 |
},
|
894 |
"application/vnd.jupyter.widget-view+json": {
|
895 |
-
"model_id": "
|
896 |
"version_major": 2,
|
897 |
"version_minor": 0
|
898 |
},
|
@@ -906,18 +906,18 @@
|
|
906 |
{
|
907 |
"data": {
|
908 |
"application/mercury+json": {
|
909 |
-
"code_uid": "Text.0.40.15.34-
|
910 |
"disabled": false,
|
911 |
"hidden": false,
|
912 |
"label": "Correlation Threshold",
|
913 |
-
"model_id": "
|
914 |
"rows": 1,
|
915 |
"url_key": "",
|
916 |
"value": "1",
|
917 |
"widget": "Text"
|
918 |
},
|
919 |
"application/vnd.jupyter.widget-view+json": {
|
920 |
-
"model_id": "
|
921 |
"version_major": 2,
|
922 |
"version_minor": 0
|
923 |
},
|
@@ -937,17 +937,17 @@
|
|
937 |
4,
|
938 |
5
|
939 |
],
|
940 |
-
"code_uid": "Select.0.40.16.38-
|
941 |
"disabled": false,
|
942 |
"hidden": false,
|
943 |
"label": "Outlier Removal Threshold",
|
944 |
-
"model_id": "
|
945 |
"url_key": "",
|
946 |
"value": "none",
|
947 |
"widget": "Select"
|
948 |
},
|
949 |
"application/vnd.jupyter.widget-view+json": {
|
950 |
-
"model_id": "
|
951 |
"version_major": 2,
|
952 |
"version_minor": 0
|
953 |
},
|
@@ -967,17 +967,17 @@
|
|
967 |
"minmax",
|
968 |
"robust"
|
969 |
],
|
970 |
-
"code_uid": "Select.0.40.16.46-
|
971 |
"disabled": false,
|
972 |
"hidden": false,
|
973 |
"label": "Scaling Variables",
|
974 |
-
"model_id": "
|
975 |
"url_key": "",
|
976 |
"value": "none",
|
977 |
"widget": "Select"
|
978 |
},
|
979 |
"application/vnd.jupyter.widget-view+json": {
|
980 |
-
"model_id": "
|
981 |
"version_major": 2,
|
982 |
"version_minor": 0
|
983 |
},
|
@@ -997,17 +997,17 @@
|
|
997 |
"knn",
|
998 |
"most_frequent"
|
999 |
],
|
1000 |
-
"code_uid": "Select.0.40.16.50-
|
1001 |
"disabled": false,
|
1002 |
"hidden": false,
|
1003 |
"label": "Imputation Methods",
|
1004 |
-
"model_id": "
|
1005 |
"url_key": "",
|
1006 |
"value": "mean",
|
1007 |
"widget": "Select"
|
1008 |
},
|
1009 |
"application/vnd.jupyter.widget-view+json": {
|
1010 |
-
"model_id": "
|
1011 |
"version_major": 2,
|
1012 |
"version_minor": 0
|
1013 |
},
|
@@ -1028,17 +1028,17 @@
|
|
1028 |
"pca",
|
1029 |
"boruta"
|
1030 |
],
|
1031 |
-
"code_uid": "Select.0.40.16.55-
|
1032 |
"disabled": false,
|
1033 |
"hidden": false,
|
1034 |
"label": "Feature Selection",
|
1035 |
-
"model_id": "
|
1036 |
"url_key": "",
|
1037 |
"value": "none",
|
1038 |
"widget": "Select"
|
1039 |
},
|
1040 |
"application/vnd.jupyter.widget-view+json": {
|
1041 |
-
"model_id": "
|
1042 |
"version_major": 2,
|
1043 |
"version_minor": 0
|
1044 |
},
|
@@ -1058,17 +1058,17 @@
|
|
1058 |
"undersampling",
|
1059 |
"rose"
|
1060 |
],
|
1061 |
-
"code_uid": "Select.0.40.16.59-
|
1062 |
"disabled": false,
|
1063 |
"hidden": false,
|
1064 |
"label": "Imbalance Treatment",
|
1065 |
-
"model_id": "
|
1066 |
"url_key": "",
|
1067 |
"value": "none",
|
1068 |
"widget": "Select"
|
1069 |
},
|
1070 |
"application/vnd.jupyter.widget-view+json": {
|
1071 |
-
"model_id": "
|
1072 |
"version_major": 2,
|
1073 |
"version_minor": 0
|
1074 |
},
|
@@ -1091,17 +1091,17 @@
|
|
1091 |
"decision_tree",
|
1092 |
"xgboost"
|
1093 |
],
|
1094 |
-
"code_uid": "Select.0.40.16.64-
|
1095 |
"disabled": false,
|
1096 |
"hidden": false,
|
1097 |
"label": "Model Selection",
|
1098 |
-
"model_id": "
|
1099 |
"url_key": "",
|
1100 |
"value": "xgboost",
|
1101 |
"widget": "Select"
|
1102 |
},
|
1103 |
"application/vnd.jupyter.widget-view+json": {
|
1104 |
-
"model_id": "
|
1105 |
"version_major": 2,
|
1106 |
"version_minor": 0
|
1107 |
},
|
@@ -1209,7 +1209,7 @@
|
|
1209 |
},
|
1210 |
{
|
1211 |
"cell_type": "code",
|
1212 |
-
"execution_count":
|
1213 |
"metadata": {
|
1214 |
"slideshow": {
|
1215 |
"slide_type": "skip"
|
@@ -1290,7 +1290,7 @@
|
|
1290 |
},
|
1291 |
{
|
1292 |
"cell_type": "code",
|
1293 |
-
"execution_count":
|
1294 |
"metadata": {
|
1295 |
"slideshow": {
|
1296 |
"slide_type": "skip"
|
@@ -1328,7 +1328,7 @@
|
|
1328 |
},
|
1329 |
{
|
1330 |
"cell_type": "code",
|
1331 |
-
"execution_count":
|
1332 |
"metadata": {
|
1333 |
"slideshow": {
|
1334 |
"slide_type": "slide"
|
@@ -1481,7 +1481,7 @@
|
|
1481 |
},
|
1482 |
{
|
1483 |
"cell_type": "code",
|
1484 |
-
"execution_count":
|
1485 |
"metadata": {
|
1486 |
"slideshow": {
|
1487 |
"slide_type": "slide"
|
|
|
26 |
},
|
27 |
{
|
28 |
"cell_type": "code",
|
29 |
+
"execution_count": 18,
|
30 |
"metadata": {
|
31 |
"slideshow": {
|
32 |
"slide_type": "skip"
|
|
|
53 |
},
|
54 |
{
|
55 |
"cell_type": "code",
|
56 |
+
"execution_count": 19,
|
57 |
"metadata": {
|
58 |
"slideshow": {
|
59 |
"slide_type": "skip"
|
|
|
64 |
"data": {
|
65 |
"application/mercury+json": {
|
66 |
"allow_download": true,
|
67 |
+
"code_uid": "App.0.40.24.1-rand2c9ab9e7",
|
68 |
"continuous_update": false,
|
69 |
"description": "Recumpute everything dynamically",
|
70 |
"full_screen": true,
|
|
|
96 |
},
|
97 |
{
|
98 |
"cell_type": "code",
|
99 |
+
"execution_count": 20,
|
100 |
"metadata": {
|
101 |
"slideshow": {
|
102 |
"slide_type": "skip"
|
|
|
138 |
},
|
139 |
{
|
140 |
"cell_type": "code",
|
141 |
+
"execution_count": 21,
|
142 |
"metadata": {
|
143 |
"slideshow": {
|
144 |
"slide_type": "skip"
|
|
|
195 |
},
|
196 |
{
|
197 |
"cell_type": "code",
|
198 |
+
"execution_count": 22,
|
199 |
"metadata": {
|
200 |
"slideshow": {
|
201 |
"slide_type": "skip"
|
|
|
290 |
},
|
291 |
{
|
292 |
"cell_type": "code",
|
293 |
+
"execution_count": 23,
|
294 |
"metadata": {
|
295 |
"slideshow": {
|
296 |
"slide_type": "skip"
|
|
|
341 |
},
|
342 |
{
|
343 |
"cell_type": "code",
|
344 |
+
"execution_count": 24,
|
345 |
"metadata": {
|
346 |
"slideshow": {
|
347 |
"slide_type": "skip"
|
|
|
419 |
},
|
420 |
{
|
421 |
"cell_type": "code",
|
422 |
+
"execution_count": 25,
|
423 |
"metadata": {
|
424 |
"slideshow": {
|
425 |
"slide_type": "skip"
|
|
|
499 |
},
|
500 |
{
|
501 |
"cell_type": "code",
|
502 |
+
"execution_count": 26,
|
503 |
"metadata": {
|
504 |
"slideshow": {
|
505 |
"slide_type": "skip"
|
|
|
585 |
},
|
586 |
{
|
587 |
"cell_type": "code",
|
588 |
+
"execution_count": 27,
|
589 |
"metadata": {
|
590 |
"slideshow": {
|
591 |
"slide_type": "skip"
|
|
|
648 |
},
|
649 |
{
|
650 |
"cell_type": "code",
|
651 |
+
"execution_count": 28,
|
652 |
"metadata": {
|
653 |
"slideshow": {
|
654 |
"slide_type": "skip"
|
|
|
737 |
},
|
738 |
{
|
739 |
"cell_type": "code",
|
740 |
+
"execution_count": 29,
|
741 |
"metadata": {
|
742 |
"slideshow": {
|
743 |
"slide_type": "skip"
|
|
|
818 |
},
|
819 |
{
|
820 |
"cell_type": "code",
|
821 |
+
"execution_count": 30,
|
822 |
"metadata": {
|
823 |
"slideshow": {
|
824 |
"slide_type": "skip"
|
|
|
832 |
"yes",
|
833 |
"no"
|
834 |
],
|
835 |
+
"code_uid": "Select.0.40.16.25-randb785d2a5",
|
836 |
"disabled": false,
|
837 |
"hidden": false,
|
838 |
"label": "Drop Duplicates",
|
839 |
+
"model_id": "f5c9c8b77b8a4b92bfeaebfd09688f8a",
|
840 |
"url_key": "",
|
841 |
"value": "yes",
|
842 |
"widget": "Select"
|
843 |
},
|
844 |
"application/vnd.jupyter.widget-view+json": {
|
845 |
+
"model_id": "f5c9c8b77b8a4b92bfeaebfd09688f8a",
|
846 |
"version_major": 2,
|
847 |
"version_minor": 0
|
848 |
},
|
|
|
856 |
{
|
857 |
"data": {
|
858 |
"application/mercury+json": {
|
859 |
+
"code_uid": "Text.0.40.15.28-rand76290b78",
|
860 |
"disabled": false,
|
861 |
"hidden": false,
|
862 |
"label": "Missing Value Threeshold",
|
863 |
+
"model_id": "2a1d81490e1e439ba214219a0bfa56b3",
|
864 |
"rows": 1,
|
865 |
"url_key": "",
|
866 |
"value": "80",
|
867 |
"widget": "Text"
|
868 |
},
|
869 |
"application/vnd.jupyter.widget-view+json": {
|
870 |
+
"model_id": "2a1d81490e1e439ba214219a0bfa56b3",
|
871 |
"version_major": 2,
|
872 |
"version_minor": 0
|
873 |
},
|
|
|
881 |
{
|
882 |
"data": {
|
883 |
"application/mercury+json": {
|
884 |
+
"code_uid": "Text.0.40.15.31-rand3a34547a",
|
885 |
"disabled": false,
|
886 |
"hidden": false,
|
887 |
"label": "Variance Threshold",
|
888 |
+
"model_id": "e0e229e9864545099ba169ad272273f5",
|
889 |
"rows": 1,
|
890 |
"url_key": "",
|
891 |
"value": "0",
|
892 |
"widget": "Text"
|
893 |
},
|
894 |
"application/vnd.jupyter.widget-view+json": {
|
895 |
+
"model_id": "e0e229e9864545099ba169ad272273f5",
|
896 |
"version_major": 2,
|
897 |
"version_minor": 0
|
898 |
},
|
|
|
906 |
{
|
907 |
"data": {
|
908 |
"application/mercury+json": {
|
909 |
+
"code_uid": "Text.0.40.15.34-rand79b594f6",
|
910 |
"disabled": false,
|
911 |
"hidden": false,
|
912 |
"label": "Correlation Threshold",
|
913 |
+
"model_id": "3c42c9d218934722a7c2ebcaa9715d34",
|
914 |
"rows": 1,
|
915 |
"url_key": "",
|
916 |
"value": "1",
|
917 |
"widget": "Text"
|
918 |
},
|
919 |
"application/vnd.jupyter.widget-view+json": {
|
920 |
+
"model_id": "3c42c9d218934722a7c2ebcaa9715d34",
|
921 |
"version_major": 2,
|
922 |
"version_minor": 0
|
923 |
},
|
|
|
937 |
4,
|
938 |
5
|
939 |
],
|
940 |
+
"code_uid": "Select.0.40.16.38-randb65fcc34",
|
941 |
"disabled": false,
|
942 |
"hidden": false,
|
943 |
"label": "Outlier Removal Threshold",
|
944 |
+
"model_id": "577bf130efe0427f82fbb99a6e6f8796",
|
945 |
"url_key": "",
|
946 |
"value": "none",
|
947 |
"widget": "Select"
|
948 |
},
|
949 |
"application/vnd.jupyter.widget-view+json": {
|
950 |
+
"model_id": "577bf130efe0427f82fbb99a6e6f8796",
|
951 |
"version_major": 2,
|
952 |
"version_minor": 0
|
953 |
},
|
|
|
967 |
"minmax",
|
968 |
"robust"
|
969 |
],
|
970 |
+
"code_uid": "Select.0.40.16.46-rand2e347045",
|
971 |
"disabled": false,
|
972 |
"hidden": false,
|
973 |
"label": "Scaling Variables",
|
974 |
+
"model_id": "1775424536e64ff899ca0d6ec93ea978",
|
975 |
"url_key": "",
|
976 |
"value": "none",
|
977 |
"widget": "Select"
|
978 |
},
|
979 |
"application/vnd.jupyter.widget-view+json": {
|
980 |
+
"model_id": "1775424536e64ff899ca0d6ec93ea978",
|
981 |
"version_major": 2,
|
982 |
"version_minor": 0
|
983 |
},
|
|
|
997 |
"knn",
|
998 |
"most_frequent"
|
999 |
],
|
1000 |
+
"code_uid": "Select.0.40.16.50-randa094eed0",
|
1001 |
"disabled": false,
|
1002 |
"hidden": false,
|
1003 |
"label": "Imputation Methods",
|
1004 |
+
"model_id": "a35dad0324ce44578f8ce2609662f4ec",
|
1005 |
"url_key": "",
|
1006 |
"value": "mean",
|
1007 |
"widget": "Select"
|
1008 |
},
|
1009 |
"application/vnd.jupyter.widget-view+json": {
|
1010 |
+
"model_id": "a35dad0324ce44578f8ce2609662f4ec",
|
1011 |
"version_major": 2,
|
1012 |
"version_minor": 0
|
1013 |
},
|
|
|
1028 |
"pca",
|
1029 |
"boruta"
|
1030 |
],
|
1031 |
+
"code_uid": "Select.0.40.16.55-rande9681438",
|
1032 |
"disabled": false,
|
1033 |
"hidden": false,
|
1034 |
"label": "Feature Selection",
|
1035 |
+
"model_id": "ee69abf9627d44c09da90a79fe98c447",
|
1036 |
"url_key": "",
|
1037 |
"value": "none",
|
1038 |
"widget": "Select"
|
1039 |
},
|
1040 |
"application/vnd.jupyter.widget-view+json": {
|
1041 |
+
"model_id": "ee69abf9627d44c09da90a79fe98c447",
|
1042 |
"version_major": 2,
|
1043 |
"version_minor": 0
|
1044 |
},
|
|
|
1058 |
"undersampling",
|
1059 |
"rose"
|
1060 |
],
|
1061 |
+
"code_uid": "Select.0.40.16.59-randc218b629",
|
1062 |
"disabled": false,
|
1063 |
"hidden": false,
|
1064 |
"label": "Imbalance Treatment",
|
1065 |
+
"model_id": "d2da0edfb49d45e680d72f1cd59b956d",
|
1066 |
"url_key": "",
|
1067 |
"value": "none",
|
1068 |
"widget": "Select"
|
1069 |
},
|
1070 |
"application/vnd.jupyter.widget-view+json": {
|
1071 |
+
"model_id": "d2da0edfb49d45e680d72f1cd59b956d",
|
1072 |
"version_major": 2,
|
1073 |
"version_minor": 0
|
1074 |
},
|
|
|
1091 |
"decision_tree",
|
1092 |
"xgboost"
|
1093 |
],
|
1094 |
+
"code_uid": "Select.0.40.16.64-rand3f39df1a",
|
1095 |
"disabled": false,
|
1096 |
"hidden": false,
|
1097 |
"label": "Model Selection",
|
1098 |
+
"model_id": "c277aac8be5a4a21a048ea6cab3b9501",
|
1099 |
"url_key": "",
|
1100 |
"value": "xgboost",
|
1101 |
"widget": "Select"
|
1102 |
},
|
1103 |
"application/vnd.jupyter.widget-view+json": {
|
1104 |
+
"model_id": "c277aac8be5a4a21a048ea6cab3b9501",
|
1105 |
"version_major": 2,
|
1106 |
"version_minor": 0
|
1107 |
},
|
|
|
1209 |
},
|
1210 |
{
|
1211 |
"cell_type": "code",
|
1212 |
+
"execution_count": 31,
|
1213 |
"metadata": {
|
1214 |
"slideshow": {
|
1215 |
"slide_type": "skip"
|
|
|
1290 |
},
|
1291 |
{
|
1292 |
"cell_type": "code",
|
1293 |
+
"execution_count": 32,
|
1294 |
"metadata": {
|
1295 |
"slideshow": {
|
1296 |
"slide_type": "skip"
|
|
|
1328 |
},
|
1329 |
{
|
1330 |
"cell_type": "code",
|
1331 |
+
"execution_count": 33,
|
1332 |
"metadata": {
|
1333 |
"slideshow": {
|
1334 |
"slide_type": "slide"
|
|
|
1481 |
},
|
1482 |
{
|
1483 |
"cell_type": "code",
|
1484 |
+
"execution_count": 34,
|
1485 |
"metadata": {
|
1486 |
"slideshow": {
|
1487 |
"slide_type": "slide"
|