diff --git a/machine_learning/NaiveBayes.ipynb b/machine_learning/NaiveBayes.ipynb
index 5a427c5cb965..0d3142efc68f 100644
--- a/machine_learning/NaiveBayes.ipynb
+++ b/machine_learning/NaiveBayes.ipynb
@@ -3,9 +3,7 @@
{
"cell_type": "code",
"execution_count": 1,
- "metadata": {
- "collapsed": true
- },
+ "metadata": {},
"outputs": [],
"source": [
"from sklearn import datasets\n",
@@ -15,9 +13,7 @@
{
"cell_type": "code",
"execution_count": 2,
- "metadata": {
- "collapsed": true
- },
+ "metadata": {},
"outputs": [],
"source": [
"iris = datasets.load_iris()"
@@ -26,9 +22,7 @@
{
"cell_type": "code",
"execution_count": 3,
- "metadata": {
- "collapsed": true
- },
+ "metadata": {},
"outputs": [],
"source": [
"df = pd.DataFrame(iris.data)\n",
@@ -38,9 +32,7 @@
{
"cell_type": "code",
"execution_count": 4,
- "metadata": {
- "collapsed": true
- },
+ "metadata": {},
"outputs": [],
"source": [
"def abc(k, *val):\n",
@@ -58,67 +50,11 @@
{
"data": {
"text/plain": [
- "0 1\n",
- "1 0\n",
- "2 0\n",
- "3 0\n",
- "4 1\n",
- "5 1\n",
- "6 0\n",
- "7 1\n",
- "8 0\n",
- "9 0\n",
- "10 1\n",
- "11 0\n",
- "12 0\n",
- "13 0\n",
- "14 1\n",
- "15 1\n",
- "16 1\n",
- "17 1\n",
- "18 1\n",
- "19 1\n",
- "20 1\n",
- "21 1\n",
- "22 0\n",
- "23 1\n",
- "24 0\n",
- "25 1\n",
- "26 1\n",
- "27 1\n",
- "28 1\n",
- "29 0\n",
- " ..\n",
- "120 1\n",
- "121 1\n",
- "122 1\n",
- "123 1\n",
- "124 1\n",
- "125 1\n",
- "126 1\n",
- "127 1\n",
- "128 1\n",
- "129 1\n",
- "130 1\n",
- "131 1\n",
- "132 1\n",
- "133 1\n",
- "134 1\n",
- "135 1\n",
- "136 1\n",
- "137 1\n",
- "138 1\n",
- "139 1\n",
- "140 1\n",
- "141 1\n",
- "142 1\n",
- "143 1\n",
- "144 1\n",
- "145 1\n",
- "146 1\n",
- "147 1\n",
- "148 1\n",
- "149 1\n",
+ "0 1\n",
+ "1 0\n",
+ "2 0\n",
+ "3 0\n",
+ "4 1\n",
"Name: sl, dtype: int64"
]
},
@@ -128,15 +64,13 @@
}
],
"source": [
- "df.sl.apply(abc, args=(5,))"
+ "df.sl.apply(abc, args=(5,)).head()"
]
},
{
"cell_type": "code",
"execution_count": null,
- "metadata": {
- "collapsed": true
- },
+ "metadata": {},
"outputs": [],
"source": []
},
@@ -174,6 +108,19 @@
"data": {
"text/html": [
"
\n",
+ "\n",
"
\n",
" \n",
" \n",
@@ -244,1341 +191,170 @@
" | a | \n",
" a | \n",
"
\n",
- " \n",
- " | 5 | \n",
- " 5.4 | \n",
- " 3.9 | \n",
- " 1.7 | \n",
- " 0.4 | \n",
- " b | \n",
- " d | \n",
- " a | \n",
- " a | \n",
- "
\n",
- " \n",
- " | 6 | \n",
- " 4.6 | \n",
- " 3.4 | \n",
- " 1.4 | \n",
- " 0.3 | \n",
- " a | \n",
- " c | \n",
- " a | \n",
- " a | \n",
- "
\n",
- " \n",
- " | 7 | \n",
- " 5.0 | \n",
- " 3.4 | \n",
- " 1.5 | \n",
- " 0.2 | \n",
- " a | \n",
- " c | \n",
- " a | \n",
- " a | \n",
- "
\n",
- " \n",
- " | 8 | \n",
- " 4.4 | \n",
- " 2.9 | \n",
- " 1.4 | \n",
- " 0.2 | \n",
- " a | \n",
- " b | \n",
- " a | \n",
- " a | \n",
- "
\n",
- " \n",
- " | 9 | \n",
- " 4.9 | \n",
- " 3.1 | \n",
- " 1.5 | \n",
- " 0.1 | \n",
- " a | \n",
- " c | \n",
- " a | \n",
- " a | \n",
- "
\n",
- " \n",
- " | 10 | \n",
- " 5.4 | \n",
- " 3.7 | \n",
- " 1.5 | \n",
- " 0.2 | \n",
- " b | \n",
- " c | \n",
- " a | \n",
- " a | \n",
- "
\n",
- " \n",
- " | 11 | \n",
- " 4.8 | \n",
- " 3.4 | \n",
- " 1.6 | \n",
- " 0.2 | \n",
- " a | \n",
- " c | \n",
- " a | \n",
- " a | \n",
- "
\n",
- " \n",
- " | 12 | \n",
- " 4.8 | \n",
- " 3.0 | \n",
- " 1.4 | \n",
- " 0.1 | \n",
- " a | \n",
- " b | \n",
- " a | \n",
- " a | \n",
- "
\n",
- " \n",
- " | 13 | \n",
- " 4.3 | \n",
- " 3.0 | \n",
- " 1.1 | \n",
- " 0.1 | \n",
- " a | \n",
- " b | \n",
- " a | \n",
- " a | \n",
- "
\n",
- " \n",
- " | 14 | \n",
- " 5.8 | \n",
- " 4.0 | \n",
- " 1.2 | \n",
- " 0.2 | \n",
- " b | \n",
- " d | \n",
- " a | \n",
- " a | \n",
- "
\n",
- " \n",
- " | 15 | \n",
- " 5.7 | \n",
- " 4.4 | \n",
- " 1.5 | \n",
- " 0.4 | \n",
- " b | \n",
- " d | \n",
- " a | \n",
- " a | \n",
- "
\n",
- " \n",
- " | 16 | \n",
- " 5.4 | \n",
- " 3.9 | \n",
- " 1.3 | \n",
- " 0.4 | \n",
- " b | \n",
- " d | \n",
- " a | \n",
- " a | \n",
- "
\n",
- " \n",
- " | 17 | \n",
- " 5.1 | \n",
- " 3.5 | \n",
- " 1.4 | \n",
- " 0.3 | \n",
- " b | \n",
- " c | \n",
- " a | \n",
- " a | \n",
- "
\n",
- " \n",
- " | 18 | \n",
- " 5.7 | \n",
- " 3.8 | \n",
- " 1.7 | \n",
- " 0.3 | \n",
- " b | \n",
- " d | \n",
- " a | \n",
- " a | \n",
- "
\n",
- " \n",
- " | 19 | \n",
- " 5.1 | \n",
- " 3.8 | \n",
- " 1.5 | \n",
- " 0.3 | \n",
- " b | \n",
- " d | \n",
- " a | \n",
- " a | \n",
- "
\n",
- " \n",
- " | 20 | \n",
- " 5.4 | \n",
- " 3.4 | \n",
- " 1.7 | \n",
- " 0.2 | \n",
- " b | \n",
- " c | \n",
- " a | \n",
- " a | \n",
- "
\n",
- " \n",
- " | 21 | \n",
- " 5.1 | \n",
- " 3.7 | \n",
- " 1.5 | \n",
- " 0.4 | \n",
- " b | \n",
- " c | \n",
- " a | \n",
- " a | \n",
- "
\n",
- " \n",
- " | 22 | \n",
- " 4.6 | \n",
- " 3.6 | \n",
- " 1.0 | \n",
- " 0.2 | \n",
- " a | \n",
- " c | \n",
- " a | \n",
- " a | \n",
+ " \n",
+ "
\n",
+ "
"
+ ],
+ "text/plain": [
+ " sl sw pl pw sl_labeled sw_labeled pl_labeled pw_labeled\n",
+ "0 5.1 3.5 1.4 0.2 b c a a\n",
+ "1 4.9 3.0 1.4 0.2 a b a a\n",
+ "2 4.7 3.2 1.3 0.2 a c a a\n",
+ "3 4.6 3.1 1.5 0.2 a c a a\n",
+ "4 5.0 3.6 1.4 0.2 a c a a"
+ ]
+ },
+ "execution_count": 7,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "df['sl_labeled'] = toLabel(df, 'sl')\n",
+ "df['sw_labeled'] = toLabel(df, 'sw')\n",
+ "df['pl_labeled'] = toLabel(df, 'pl')\n",
+ "df['pw_labeled'] = toLabel(df, 'pw')\n",
+ "df.head()"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 8,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "df.drop(['sl', 'sw', 'pl', 'pw'], axis = 1, inplace = True)"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 9,
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "{'a', 'b', 'c', 'd'}"
+ ]
+ },
+ "execution_count": 9,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "set(df['sl_labeled'])"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 10,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "df[\"output\"] = iris.target"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 11,
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " sl_labeled | \n",
+ " sw_labeled | \n",
+ " pl_labeled | \n",
+ " pw_labeled | \n",
+ " output | \n",
"
\n",
+ " \n",
+ " \n",
" \n",
- " | 23 | \n",
- " 5.1 | \n",
- " 3.3 | \n",
- " 1.7 | \n",
- " 0.5 | \n",
+ " 0 | \n",
" b | \n",
" c | \n",
" a | \n",
" a | \n",
+ " 0 | \n",
"
\n",
" \n",
- " | 24 | \n",
- " 4.8 | \n",
- " 3.4 | \n",
- " 1.9 | \n",
- " 0.2 | \n",
- " a | \n",
- " c | \n",
- " a | \n",
- " a | \n",
- "
\n",
- " \n",
- " | 25 | \n",
- " 5.0 | \n",
- " 3.0 | \n",
- " 1.6 | \n",
- " 0.2 | \n",
+ " 1 | \n",
" a | \n",
" b | \n",
" a | \n",
" a | \n",
+ " 0 | \n",
"
\n",
" \n",
- " | 26 | \n",
- " 5.0 | \n",
- " 3.4 | \n",
- " 1.6 | \n",
- " 0.4 | \n",
+ " 2 | \n",
" a | \n",
" c | \n",
" a | \n",
" a | \n",
+ " 0 | \n",
"
\n",
" \n",
- " | 27 | \n",
- " 5.2 | \n",
- " 3.5 | \n",
- " 1.5 | \n",
- " 0.2 | \n",
- " b | \n",
- " c | \n",
- " a | \n",
+ " 3 | \n",
" a | \n",
- "
\n",
- " \n",
- " | 28 | \n",
- " 5.2 | \n",
- " 3.4 | \n",
- " 1.4 | \n",
- " 0.2 | \n",
- " b | \n",
" c | \n",
" a | \n",
" a | \n",
+ " 0 | \n",
"
\n",
" \n",
- " | 29 | \n",
- " 4.7 | \n",
- " 3.2 | \n",
- " 1.6 | \n",
- " 0.2 | \n",
+ " 4 | \n",
" a | \n",
" c | \n",
" a | \n",
" a | \n",
- "
\n",
- " \n",
- " | ... | \n",
- " ... | \n",
- " ... | \n",
- " ... | \n",
- " ... | \n",
- " ... | \n",
- " ... | \n",
- " ... | \n",
- " ... | \n",
- "
\n",
- " \n",
- " | 120 | \n",
- " 6.9 | \n",
- " 3.2 | \n",
- " 5.7 | \n",
- " 2.3 | \n",
- " d | \n",
- " c | \n",
- " d | \n",
- " d | \n",
- "
\n",
- " \n",
- " | 121 | \n",
- " 5.6 | \n",
- " 2.8 | \n",
- " 4.9 | \n",
- " 2.0 | \n",
- " b | \n",
- " b | \n",
- " c | \n",
- " d | \n",
- "
\n",
- " \n",
- " | 122 | \n",
- " 7.7 | \n",
- " 2.8 | \n",
- " 6.7 | \n",
- " 2.0 | \n",
- " d | \n",
- " b | \n",
- " d | \n",
- " d | \n",
- "
\n",
- " \n",
- " | 123 | \n",
- " 6.3 | \n",
- " 2.7 | \n",
- " 4.9 | \n",
- " 1.8 | \n",
- " c | \n",
- " b | \n",
- " c | \n",
- " c | \n",
- "
\n",
- " \n",
- " | 124 | \n",
- " 6.7 | \n",
- " 3.3 | \n",
- " 5.7 | \n",
- " 2.1 | \n",
- " c | \n",
- " c | \n",
- " d | \n",
- " d | \n",
- "
\n",
- " \n",
- " | 125 | \n",
- " 7.2 | \n",
- " 3.2 | \n",
- " 6.0 | \n",
- " 1.8 | \n",
- " d | \n",
- " c | \n",
- " d | \n",
- " c | \n",
- "
\n",
- " \n",
- " | 126 | \n",
- " 6.2 | \n",
- " 2.8 | \n",
- " 4.8 | \n",
- " 1.8 | \n",
- " c | \n",
- " b | \n",
- " c | \n",
- " c | \n",
- "
\n",
- " \n",
- " | 127 | \n",
- " 6.1 | \n",
- " 3.0 | \n",
- " 4.9 | \n",
- " 1.8 | \n",
- " c | \n",
- " b | \n",
- " c | \n",
- " c | \n",
- "
\n",
- " \n",
- " | 128 | \n",
- " 6.4 | \n",
- " 2.8 | \n",
- " 5.6 | \n",
- " 2.1 | \n",
- " c | \n",
- " b | \n",
- " d | \n",
- " d | \n",
- "
\n",
- " \n",
- " | 129 | \n",
- " 7.2 | \n",
- " 3.0 | \n",
- " 5.8 | \n",
- " 1.6 | \n",
- " d | \n",
- " b | \n",
- " d | \n",
- " c | \n",
- "
\n",
- " \n",
- " | 130 | \n",
- " 7.4 | \n",
- " 2.8 | \n",
- " 6.1 | \n",
- " 1.9 | \n",
- " d | \n",
- " b | \n",
- " d | \n",
- " d | \n",
- "
\n",
- " \n",
- " | 131 | \n",
- " 7.9 | \n",
- " 3.8 | \n",
- " 6.4 | \n",
- " 2.0 | \n",
- " d | \n",
- " d | \n",
- " d | \n",
- " d | \n",
- "
\n",
- " \n",
- " | 132 | \n",
- " 6.4 | \n",
- " 2.8 | \n",
- " 5.6 | \n",
- " 2.2 | \n",
- " c | \n",
- " b | \n",
- " d | \n",
- " d | \n",
- "
\n",
- " \n",
- " | 133 | \n",
- " 6.3 | \n",
- " 2.8 | \n",
- " 5.1 | \n",
- " 1.5 | \n",
- " c | \n",
- " b | \n",
- " c | \n",
- " c | \n",
- "
\n",
- " \n",
- " | 134 | \n",
- " 6.1 | \n",
- " 2.6 | \n",
- " 5.6 | \n",
- " 1.4 | \n",
- " c | \n",
- " b | \n",
- " d | \n",
- " c | \n",
- "
\n",
- " \n",
- " | 135 | \n",
- " 7.7 | \n",
- " 3.0 | \n",
- " 6.1 | \n",
- " 2.3 | \n",
- " d | \n",
- " b | \n",
- " d | \n",
- " d | \n",
- "
\n",
- " \n",
- " | 136 | \n",
- " 6.3 | \n",
- " 3.4 | \n",
- " 5.6 | \n",
- " 2.4 | \n",
- " c | \n",
- " c | \n",
- " d | \n",
- " d | \n",
- "
\n",
- " \n",
- " | 137 | \n",
- " 6.4 | \n",
- " 3.1 | \n",
- " 5.5 | \n",
- " 1.8 | \n",
- " c | \n",
- " c | \n",
- " d | \n",
- " c | \n",
- "
\n",
- " \n",
- " | 138 | \n",
- " 6.0 | \n",
- " 3.0 | \n",
- " 4.8 | \n",
- " 1.8 | \n",
- " c | \n",
- " b | \n",
- " c | \n",
- " c | \n",
- "
\n",
- " \n",
- " | 139 | \n",
- " 6.9 | \n",
- " 3.1 | \n",
- " 5.4 | \n",
- " 2.1 | \n",
- " d | \n",
- " c | \n",
- " d | \n",
- " d | \n",
- "
\n",
- " \n",
- " | 140 | \n",
- " 6.7 | \n",
- " 3.1 | \n",
- " 5.6 | \n",
- " 2.4 | \n",
- " c | \n",
- " c | \n",
- " d | \n",
- " d | \n",
- "
\n",
- " \n",
- " | 141 | \n",
- " 6.9 | \n",
- " 3.1 | \n",
- " 5.1 | \n",
- " 2.3 | \n",
- " d | \n",
- " c | \n",
- " c | \n",
- " d | \n",
- "
\n",
- " \n",
- " | 142 | \n",
- " 5.8 | \n",
- " 2.7 | \n",
- " 5.1 | \n",
- " 1.9 | \n",
- " b | \n",
- " b | \n",
- " c | \n",
- " d | \n",
- "
\n",
- " \n",
- " | 143 | \n",
- " 6.8 | \n",
- " 3.2 | \n",
- " 5.9 | \n",
- " 2.3 | \n",
- " c | \n",
- " c | \n",
- " d | \n",
- " d | \n",
- "
\n",
- " \n",
- " | 144 | \n",
- " 6.7 | \n",
- " 3.3 | \n",
- " 5.7 | \n",
- " 2.5 | \n",
- " c | \n",
- " c | \n",
- " d | \n",
- " d | \n",
- "
\n",
- " \n",
- " | 145 | \n",
- " 6.7 | \n",
- " 3.0 | \n",
- " 5.2 | \n",
- " 2.3 | \n",
- " c | \n",
- " b | \n",
- " c | \n",
- " d | \n",
- "
\n",
- " \n",
- " | 146 | \n",
- " 6.3 | \n",
- " 2.5 | \n",
- " 5.0 | \n",
- " 1.9 | \n",
- " c | \n",
- " a | \n",
- " c | \n",
- " d | \n",
- "
\n",
- " \n",
- " | 147 | \n",
- " 6.5 | \n",
- " 3.0 | \n",
- " 5.2 | \n",
- " 2.0 | \n",
- " c | \n",
- " b | \n",
- " c | \n",
- " d | \n",
- "
\n",
- " \n",
- " | 148 | \n",
- " 6.2 | \n",
- " 3.4 | \n",
- " 5.4 | \n",
- " 2.3 | \n",
- " c | \n",
- " c | \n",
- " d | \n",
- " d | \n",
- "
\n",
- " \n",
- " | 149 | \n",
- " 5.9 | \n",
- " 3.0 | \n",
- " 5.1 | \n",
- " 1.8 | \n",
- " c | \n",
- " b | \n",
- " c | \n",
- " c | \n",
- "
\n",
- " \n",
- "
\n",
- "
150 rows × 8 columns
\n",
- "
"
- ],
- "text/plain": [
- " sl sw pl pw sl_labeled sw_labeled pl_labeled pw_labeled\n",
- "0 5.1 3.5 1.4 0.2 b c a a\n",
- "1 4.9 3.0 1.4 0.2 a b a a\n",
- "2 4.7 3.2 1.3 0.2 a c a a\n",
- "3 4.6 3.1 1.5 0.2 a c a a\n",
- "4 5.0 3.6 1.4 0.2 a c a a\n",
- "5 5.4 3.9 1.7 0.4 b d a a\n",
- "6 4.6 3.4 1.4 0.3 a c a a\n",
- "7 5.0 3.4 1.5 0.2 a c a a\n",
- "8 4.4 2.9 1.4 0.2 a b a a\n",
- "9 4.9 3.1 1.5 0.1 a c a a\n",
- "10 5.4 3.7 1.5 0.2 b c a a\n",
- "11 4.8 3.4 1.6 0.2 a c a a\n",
- "12 4.8 3.0 1.4 0.1 a b a a\n",
- "13 4.3 3.0 1.1 0.1 a b a a\n",
- "14 5.8 4.0 1.2 0.2 b d a a\n",
- "15 5.7 4.4 1.5 0.4 b d a a\n",
- "16 5.4 3.9 1.3 0.4 b d a a\n",
- "17 5.1 3.5 1.4 0.3 b c a a\n",
- "18 5.7 3.8 1.7 0.3 b d a a\n",
- "19 5.1 3.8 1.5 0.3 b d a a\n",
- "20 5.4 3.4 1.7 0.2 b c a a\n",
- "21 5.1 3.7 1.5 0.4 b c a a\n",
- "22 4.6 3.6 1.0 0.2 a c a a\n",
- "23 5.1 3.3 1.7 0.5 b c a a\n",
- "24 4.8 3.4 1.9 0.2 a c a a\n",
- "25 5.0 3.0 1.6 0.2 a b a a\n",
- "26 5.0 3.4 1.6 0.4 a c a a\n",
- "27 5.2 3.5 1.5 0.2 b c a a\n",
- "28 5.2 3.4 1.4 0.2 b c a a\n",
- "29 4.7 3.2 1.6 0.2 a c a a\n",
- ".. ... ... ... ... ... ... ... ...\n",
- "120 6.9 3.2 5.7 2.3 d c d d\n",
- "121 5.6 2.8 4.9 2.0 b b c d\n",
- "122 7.7 2.8 6.7 2.0 d b d d\n",
- "123 6.3 2.7 4.9 1.8 c b c c\n",
- "124 6.7 3.3 5.7 2.1 c c d d\n",
- "125 7.2 3.2 6.0 1.8 d c d c\n",
- "126 6.2 2.8 4.8 1.8 c b c c\n",
- "127 6.1 3.0 4.9 1.8 c b c c\n",
- "128 6.4 2.8 5.6 2.1 c b d d\n",
- "129 7.2 3.0 5.8 1.6 d b d c\n",
- "130 7.4 2.8 6.1 1.9 d b d d\n",
- "131 7.9 3.8 6.4 2.0 d d d d\n",
- "132 6.4 2.8 5.6 2.2 c b d d\n",
- "133 6.3 2.8 5.1 1.5 c b c c\n",
- "134 6.1 2.6 5.6 1.4 c b d c\n",
- "135 7.7 3.0 6.1 2.3 d b d d\n",
- "136 6.3 3.4 5.6 2.4 c c d d\n",
- "137 6.4 3.1 5.5 1.8 c c d c\n",
- "138 6.0 3.0 4.8 1.8 c b c c\n",
- "139 6.9 3.1 5.4 2.1 d c d d\n",
- "140 6.7 3.1 5.6 2.4 c c d d\n",
- "141 6.9 3.1 5.1 2.3 d c c d\n",
- "142 5.8 2.7 5.1 1.9 b b c d\n",
- "143 6.8 3.2 5.9 2.3 c c d d\n",
- "144 6.7 3.3 5.7 2.5 c c d d\n",
- "145 6.7 3.0 5.2 2.3 c b c d\n",
- "146 6.3 2.5 5.0 1.9 c a c d\n",
- "147 6.5 3.0 5.2 2.0 c b c d\n",
- "148 6.2 3.4 5.4 2.3 c c d d\n",
- "149 5.9 3.0 5.1 1.8 c b c c\n",
- "\n",
- "[150 rows x 8 columns]"
- ]
- },
- "execution_count": 7,
- "metadata": {},
- "output_type": "execute_result"
- }
- ],
- "source": [
- "df['sl_labeled'] = toLabel(df, 'sl')\n",
- "df['sw_labeled'] = toLabel(df, 'sw')\n",
- "df['pl_labeled'] = toLabel(df, 'pl')\n",
- "df['pw_labeled'] = toLabel(df, 'pw')\n",
- "df"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": 8,
- "metadata": {},
- "outputs": [],
- "source": [
- "df.drop(['sl', 'sw', 'pl', 'pw'], axis = 1, inplace = True)"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": 9,
- "metadata": {},
- "outputs": [
- {
- "data": {
- "text/plain": [
- "{'a', 'b', 'c', 'd'}"
- ]
- },
- "execution_count": 9,
- "metadata": {},
- "output_type": "execute_result"
- }
- ],
- "source": [
- "set(df['sl_labeled'])"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": 12,
- "metadata": {},
- "outputs": [],
- "source": [
- "df[\"output\"] = iris.target"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": 13,
- "metadata": {},
- "outputs": [
- {
- "data": {
- "text/html": [
- "\n",
- "
\n",
- " \n",
- " \n",
- " | \n",
- " sl_labeled | \n",
- " sw_labeled | \n",
- " pl_labeled | \n",
- " pw_labeled | \n",
- " output | \n",
- "
\n",
- " \n",
- " \n",
- " \n",
- " | 0 | \n",
- " b | \n",
- " c | \n",
- " a | \n",
- " a | \n",
- " 0 | \n",
- "
\n",
- " \n",
- " | 1 | \n",
- " a | \n",
- " b | \n",
- " a | \n",
- " a | \n",
- " 0 | \n",
- "
\n",
- " \n",
- " | 2 | \n",
- " a | \n",
- " c | \n",
- " a | \n",
- " a | \n",
- " 0 | \n",
- "
\n",
- " \n",
- " | 3 | \n",
- " a | \n",
- " c | \n",
- " a | \n",
- " a | \n",
- " 0 | \n",
- "
\n",
- " \n",
- " | 4 | \n",
- " a | \n",
- " c | \n",
- " a | \n",
- " a | \n",
- " 0 | \n",
- "
\n",
- " \n",
- " | 5 | \n",
- " b | \n",
- " d | \n",
- " a | \n",
- " a | \n",
- " 0 | \n",
- "
\n",
- " \n",
- " | 6 | \n",
- " a | \n",
- " c | \n",
- " a | \n",
- " a | \n",
- " 0 | \n",
- "
\n",
- " \n",
- " | 7 | \n",
- " a | \n",
- " c | \n",
- " a | \n",
- " a | \n",
- " 0 | \n",
- "
\n",
- " \n",
- " | 8 | \n",
- " a | \n",
- " b | \n",
- " a | \n",
- " a | \n",
- " 0 | \n",
- "
\n",
- " \n",
- " | 9 | \n",
- " a | \n",
- " c | \n",
- " a | \n",
- " a | \n",
- " 0 | \n",
- "
\n",
- " \n",
- " | 10 | \n",
- " b | \n",
- " c | \n",
- " a | \n",
- " a | \n",
- " 0 | \n",
- "
\n",
- " \n",
- " | 11 | \n",
- " a | \n",
- " c | \n",
- " a | \n",
- " a | \n",
- " 0 | \n",
- "
\n",
- " \n",
- " | 12 | \n",
- " a | \n",
- " b | \n",
- " a | \n",
- " a | \n",
- " 0 | \n",
- "
\n",
- " \n",
- " | 13 | \n",
- " a | \n",
- " b | \n",
- " a | \n",
- " a | \n",
- " 0 | \n",
- "
\n",
- " \n",
- " | 14 | \n",
- " b | \n",
- " d | \n",
- " a | \n",
- " a | \n",
- " 0 | \n",
- "
\n",
- " \n",
- " | 15 | \n",
- " b | \n",
- " d | \n",
- " a | \n",
- " a | \n",
- " 0 | \n",
- "
\n",
- " \n",
- " | 16 | \n",
- " b | \n",
- " d | \n",
- " a | \n",
- " a | \n",
- " 0 | \n",
- "
\n",
- " \n",
- " | 17 | \n",
- " b | \n",
- " c | \n",
- " a | \n",
- " a | \n",
- " 0 | \n",
- "
\n",
- " \n",
- " | 18 | \n",
- " b | \n",
- " d | \n",
- " a | \n",
- " a | \n",
- " 0 | \n",
- "
\n",
- " \n",
- " | 19 | \n",
- " b | \n",
- " d | \n",
- " a | \n",
- " a | \n",
- " 0 | \n",
- "
\n",
- " \n",
- " | 20 | \n",
- " b | \n",
- " c | \n",
- " a | \n",
- " a | \n",
- " 0 | \n",
- "
\n",
- " \n",
- " | 21 | \n",
- " b | \n",
- " c | \n",
- " a | \n",
- " a | \n",
- " 0 | \n",
- "
\n",
- " \n",
- " | 22 | \n",
- " a | \n",
- " c | \n",
- " a | \n",
- " a | \n",
- " 0 | \n",
- "
\n",
- " \n",
- " | 23 | \n",
- " b | \n",
- " c | \n",
- " a | \n",
- " a | \n",
- " 0 | \n",
- "
\n",
- " \n",
- " | 24 | \n",
- " a | \n",
- " c | \n",
- " a | \n",
- " a | \n",
- " 0 | \n",
- "
\n",
- " \n",
- " | 25 | \n",
- " a | \n",
- " b | \n",
- " a | \n",
- " a | \n",
- " 0 | \n",
- "
\n",
- " \n",
- " | 26 | \n",
- " a | \n",
- " c | \n",
- " a | \n",
- " a | \n",
- " 0 | \n",
- "
\n",
- " \n",
- " | 27 | \n",
- " b | \n",
- " c | \n",
- " a | \n",
- " a | \n",
- " 0 | \n",
- "
\n",
- " \n",
- " | 28 | \n",
- " b | \n",
- " c | \n",
- " a | \n",
- " a | \n",
- " 0 | \n",
- "
\n",
- " \n",
- " | 29 | \n",
- " a | \n",
- " c | \n",
- " a | \n",
- " a | \n",
- " 0 | \n",
- "
\n",
- " \n",
- " | ... | \n",
- " ... | \n",
- " ... | \n",
- " ... | \n",
- " ... | \n",
- " ... | \n",
- "
\n",
- " \n",
- " | 120 | \n",
- " d | \n",
- " c | \n",
- " d | \n",
- " d | \n",
- " 2 | \n",
- "
\n",
- " \n",
- " | 121 | \n",
- " b | \n",
- " b | \n",
- " c | \n",
- " d | \n",
- " 2 | \n",
- "
\n",
- " \n",
- " | 122 | \n",
- " d | \n",
- " b | \n",
- " d | \n",
- " d | \n",
- " 2 | \n",
- "
\n",
- " \n",
- " | 123 | \n",
- " c | \n",
- " b | \n",
- " c | \n",
- " c | \n",
- " 2 | \n",
- "
\n",
- " \n",
- " | 124 | \n",
- " c | \n",
- " c | \n",
- " d | \n",
- " d | \n",
- " 2 | \n",
- "
\n",
- " \n",
- " | 125 | \n",
- " d | \n",
- " c | \n",
- " d | \n",
- " c | \n",
- " 2 | \n",
- "
\n",
- " \n",
- " | 126 | \n",
- " c | \n",
- " b | \n",
- " c | \n",
- " c | \n",
- " 2 | \n",
- "
\n",
- " \n",
- " | 127 | \n",
- " c | \n",
- " b | \n",
- " c | \n",
- " c | \n",
- " 2 | \n",
- "
\n",
- " \n",
- " | 128 | \n",
- " c | \n",
- " b | \n",
- " d | \n",
- " d | \n",
- " 2 | \n",
- "
\n",
- " \n",
- " | 129 | \n",
- " d | \n",
- " b | \n",
- " d | \n",
- " c | \n",
- " 2 | \n",
- "
\n",
- " \n",
- " | 130 | \n",
- " d | \n",
- " b | \n",
- " d | \n",
- " d | \n",
- " 2 | \n",
- "
\n",
- " \n",
- " | 131 | \n",
- " d | \n",
- " d | \n",
- " d | \n",
- " d | \n",
- " 2 | \n",
- "
\n",
- " \n",
- " | 132 | \n",
- " c | \n",
- " b | \n",
- " d | \n",
- " d | \n",
- " 2 | \n",
- "
\n",
- " \n",
- " | 133 | \n",
- " c | \n",
- " b | \n",
- " c | \n",
- " c | \n",
- " 2 | \n",
- "
\n",
- " \n",
- " | 134 | \n",
- " c | \n",
- " b | \n",
- " d | \n",
- " c | \n",
- " 2 | \n",
- "
\n",
- " \n",
- " | 135 | \n",
- " d | \n",
- " b | \n",
- " d | \n",
- " d | \n",
- " 2 | \n",
- "
\n",
- " \n",
- " | 136 | \n",
- " c | \n",
- " c | \n",
- " d | \n",
- " d | \n",
- " 2 | \n",
- "
\n",
- " \n",
- " | 137 | \n",
- " c | \n",
- " c | \n",
- " d | \n",
- " c | \n",
- " 2 | \n",
- "
\n",
- " \n",
- " | 138 | \n",
- " c | \n",
- " b | \n",
- " c | \n",
- " c | \n",
- " 2 | \n",
- "
\n",
- " \n",
- " | 139 | \n",
- " d | \n",
- " c | \n",
- " d | \n",
- " d | \n",
- " 2 | \n",
- "
\n",
- " \n",
- " | 140 | \n",
- " c | \n",
- " c | \n",
- " d | \n",
- " d | \n",
- " 2 | \n",
- "
\n",
- " \n",
- " | 141 | \n",
- " d | \n",
- " c | \n",
- " c | \n",
- " d | \n",
- " 2 | \n",
- "
\n",
- " \n",
- " | 142 | \n",
- " b | \n",
- " b | \n",
- " c | \n",
- " d | \n",
- " 2 | \n",
- "
\n",
- " \n",
- " | 143 | \n",
- " c | \n",
- " c | \n",
- " d | \n",
- " d | \n",
- " 2 | \n",
- "
\n",
- " \n",
- " | 144 | \n",
- " c | \n",
- " c | \n",
- " d | \n",
- " d | \n",
- " 2 | \n",
- "
\n",
- " \n",
- " | 145 | \n",
- " c | \n",
- " b | \n",
- " c | \n",
- " d | \n",
- " 2 | \n",
- "
\n",
- " \n",
- " | 146 | \n",
- " c | \n",
- " a | \n",
- " c | \n",
- " d | \n",
- " 2 | \n",
- "
\n",
- " \n",
- " | 147 | \n",
- " c | \n",
- " b | \n",
- " c | \n",
- " d | \n",
- " 2 | \n",
- "
\n",
- " \n",
- " | 148 | \n",
- " c | \n",
- " c | \n",
- " d | \n",
- " d | \n",
- " 2 | \n",
- "
\n",
- " \n",
- " | 149 | \n",
- " c | \n",
- " b | \n",
- " c | \n",
- " c | \n",
- " 2 | \n",
+ " 0 | \n",
"
\n",
" \n",
"
\n",
- "
150 rows × 5 columns
\n",
"
"
],
"text/plain": [
- " sl_labeled sw_labeled pl_labeled pw_labeled output\n",
- "0 b c a a 0\n",
- "1 a b a a 0\n",
- "2 a c a a 0\n",
- "3 a c a a 0\n",
- "4 a c a a 0\n",
- "5 b d a a 0\n",
- "6 a c a a 0\n",
- "7 a c a a 0\n",
- "8 a b a a 0\n",
- "9 a c a a 0\n",
- "10 b c a a 0\n",
- "11 a c a a 0\n",
- "12 a b a a 0\n",
- "13 a b a a 0\n",
- "14 b d a a 0\n",
- "15 b d a a 0\n",
- "16 b d a a 0\n",
- "17 b c a a 0\n",
- "18 b d a a 0\n",
- "19 b d a a 0\n",
- "20 b c a a 0\n",
- "21 b c a a 0\n",
- "22 a c a a 0\n",
- "23 b c a a 0\n",
- "24 a c a a 0\n",
- "25 a b a a 0\n",
- "26 a c a a 0\n",
- "27 b c a a 0\n",
- "28 b c a a 0\n",
- "29 a c a a 0\n",
- ".. ... ... ... ... ...\n",
- "120 d c d d 2\n",
- "121 b b c d 2\n",
- "122 d b d d 2\n",
- "123 c b c c 2\n",
- "124 c c d d 2\n",
- "125 d c d c 2\n",
- "126 c b c c 2\n",
- "127 c b c c 2\n",
- "128 c b d d 2\n",
- "129 d b d c 2\n",
- "130 d b d d 2\n",
- "131 d d d d 2\n",
- "132 c b d d 2\n",
- "133 c b c c 2\n",
- "134 c b d c 2\n",
- "135 d b d d 2\n",
- "136 c c d d 2\n",
- "137 c c d c 2\n",
- "138 c b c c 2\n",
- "139 d c d d 2\n",
- "140 c c d d 2\n",
- "141 d c c d 2\n",
- "142 b b c d 2\n",
- "143 c c d d 2\n",
- "144 c c d d 2\n",
- "145 c b c d 2\n",
- "146 c a c d 2\n",
- "147 c b c d 2\n",
- "148 c c d d 2\n",
- "149 c b c c 2\n",
- "\n",
- "[150 rows x 5 columns]"
+ " sl_labeled sw_labeled pl_labeled pw_labeled output\n",
+ "0 b c a a 0\n",
+ "1 a b a a 0\n",
+ "2 a c a a 0\n",
+ "3 a c a a 0\n",
+ "4 a c a a 0"
]
},
- "execution_count": 13,
+ "execution_count": 11,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
- "df"
+ "df.head()"
]
},
{
"cell_type": "code",
- "execution_count": 14,
- "metadata": {
- "collapsed": true
- },
+ "execution_count": 12,
+ "metadata": {},
"outputs": [],
"source": [
"def fit(data):\n",
@@ -1601,30 +377,30 @@
},
{
"cell_type": "code",
- "execution_count": 15,
+ "execution_count": 13,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
- "{0: {'pl_labeled': {'a': 50},\n",
- " 'pw_labeled': {'a': 50},\n",
+ "{0: {'total_count': 50,\n",
" 'sl_labeled': {'a': 28, 'b': 22},\n",
- " 'sw_labeled': {'a': 1, 'b': 7, 'c': 32, 'd': 10},\n",
- " 'total_count': 50},\n",
- " 1: {'pl_labeled': {'b': 7, 'c': 43},\n",
- " 'pw_labeled': {'b': 10, 'c': 40},\n",
- " 'sl_labeled': {'a': 3, 'b': 21, 'c': 24, 'd': 2},\n",
+ " 'sw_labeled': {'a': 1, 'b': 7, 'd': 10, 'c': 32},\n",
+ " 'pl_labeled': {'a': 50},\n",
+ " 'pw_labeled': {'a': 50}},\n",
+ " 1: {'total_count': 50,\n",
+ " 'sl_labeled': {'a': 3, 'b': 21, 'd': 2, 'c': 24},\n",
" 'sw_labeled': {'a': 13, 'b': 29, 'c': 8},\n",
- " 'total_count': 50},\n",
- " 2: {'pl_labeled': {'c': 20, 'd': 30},\n",
- " 'pw_labeled': {'c': 16, 'd': 34},\n",
- " 'sl_labeled': {'a': 1, 'b': 5, 'c': 29, 'd': 15},\n",
- " 'sw_labeled': {'a': 5, 'b': 28, 'c': 15, 'd': 2},\n",
- " 'total_count': 50}}"
+ " 'pl_labeled': {'b': 7, 'c': 43},\n",
+ " 'pw_labeled': {'b': 10, 'c': 40}},\n",
+ " 2: {'total_count': 50,\n",
+ " 'sl_labeled': {'a': 1, 'b': 5, 'd': 15, 'c': 29},\n",
+ " 'sw_labeled': {'a': 5, 'b': 28, 'd': 2, 'c': 15},\n",
+ " 'pl_labeled': {'d': 30, 'c': 20},\n",
+ " 'pw_labeled': {'d': 34, 'c': 16}}}"
]
},
- "execution_count": 15,
+ "execution_count": 13,
"metadata": {},
"output_type": "execute_result"
}
@@ -1632,12 +408,19 @@
"source": [
"fit(df)"
]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": null,
+ "metadata": {},
+ "outputs": [],
+ "source": []
}
],
"metadata": {
"anaconda-cloud": {},
"kernelspec": {
- "display_name": "Python [default]",
+ "display_name": "Python 3",
"language": "python",
"name": "python3"
},
@@ -1651,7 +434,7 @@
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
- "version": "3.6.5"
+ "version": "3.7.1"
}
},
"nbformat": 4,
diff --git a/project_euler/problem_13/num.txt b/project_euler/problem_13/num.txt
new file mode 100644
index 000000000000..43b568e812a8
--- /dev/null
+++ b/project_euler/problem_13/num.txt
@@ -0,0 +1,100 @@
+37107287533902102798797998220837590246510135740250
+46376937677490009712648124896970078050417018260538
+74324986199524741059474233309513058123726617309629
+91942213363574161572522430563301811072406154908250
+23067588207539346171171980310421047513778063246676
+89261670696623633820136378418383684178734361726757
+28112879812849979408065481931592621691275889832738
+44274228917432520321923589422876796487670272189318
+47451445736001306439091167216856844588711603153276
+70386486105843025439939619828917593665686757934951
+62176457141856560629502157223196586755079324193331
+64906352462741904929101432445813822663347944758178
+92575867718337217661963751590579239728245598838407
+58203565325359399008402633568948830189458628227828
+80181199384826282014278194139940567587151170094390
+35398664372827112653829987240784473053190104293586
+86515506006295864861532075273371959191420517255829
+71693888707715466499115593487603532921714970056938
+54370070576826684624621495650076471787294438377604
+53282654108756828443191190634694037855217779295145
+36123272525000296071075082563815656710885258350721
+45876576172410976447339110607218265236877223636045
+17423706905851860660448207621209813287860733969412
+81142660418086830619328460811191061556940512689692
+51934325451728388641918047049293215058642563049483
+62467221648435076201727918039944693004732956340691
+15732444386908125794514089057706229429197107928209
+55037687525678773091862540744969844508330393682126
+18336384825330154686196124348767681297534375946515
+80386287592878490201521685554828717201219257766954
+78182833757993103614740356856449095527097864797581
+16726320100436897842553539920931837441497806860984
+48403098129077791799088218795327364475675590848030
+87086987551392711854517078544161852424320693150332
+59959406895756536782107074926966537676326235447210
+69793950679652694742597709739166693763042633987085
+41052684708299085211399427365734116182760315001271
+65378607361501080857009149939512557028198746004375
+35829035317434717326932123578154982629742552737307
+94953759765105305946966067683156574377167401875275
+88902802571733229619176668713819931811048770190271
+25267680276078003013678680992525463401061632866526
+36270218540497705585629946580636237993140746255962
+24074486908231174977792365466257246923322810917141
+91430288197103288597806669760892938638285025333403
+34413065578016127815921815005561868836468420090470
+23053081172816430487623791969842487255036638784583
+11487696932154902810424020138335124462181441773470
+63783299490636259666498587618221225225512486764533
+67720186971698544312419572409913959008952310058822
+95548255300263520781532296796249481641953868218774
+76085327132285723110424803456124867697064507995236
+37774242535411291684276865538926205024910326572967
+23701913275725675285653248258265463092207058596522
+29798860272258331913126375147341994889534765745501
+18495701454879288984856827726077713721403798879715
+38298203783031473527721580348144513491373226651381
+34829543829199918180278916522431027392251122869539
+40957953066405232632538044100059654939159879593635
+29746152185502371307642255121183693803580388584903
+41698116222072977186158236678424689157993532961922
+62467957194401269043877107275048102390895523597457
+23189706772547915061505504953922979530901129967519
+86188088225875314529584099251203829009407770775672
+11306739708304724483816533873502340845647058077308
+82959174767140363198008187129011875491310547126581
+97623331044818386269515456334926366572897563400500
+42846280183517070527831839425882145521227251250327
+55121603546981200581762165212827652751691296897789
+32238195734329339946437501907836945765883352399886
+75506164965184775180738168837861091527357929701337
+62177842752192623401942399639168044983993173312731
+32924185707147349566916674687634660915035914677504
+99518671430235219628894890102423325116913619626622
+73267460800591547471830798392868535206946944540724
+76841822524674417161514036427982273348055556214818
+97142617910342598647204516893989422179826088076852
+87783646182799346313767754307809363333018982642090
+10848802521674670883215120185883543223812876952786
+71329612474782464538636993009049310363619763878039
+62184073572399794223406235393808339651327408011116
+66627891981488087797941876876144230030984490851411
+60661826293682836764744779239180335110989069790714
+85786944089552990653640447425576083659976645795096
+66024396409905389607120198219976047599490197230297
+64913982680032973156037120041377903785566085089252
+16730939319872750275468906903707539413042652315011
+94809377245048795150954100921645863754710598436791
+78639167021187492431995700641917969777599028300699
+15368713711936614952811305876380278410754449733078
+40789923115535562561142322423255033685442488917353
+44889911501440648020369068063960672322193204149535
+41503128880339536053299340368006977710650566631954
+81234880673210146739058568557934581403627822703280
+82616570773948327592232845941706525094512325230608
+22918802058777319719839450180888072429661980811197
+77158542502016545090413245809786882778948721859617
+72107838435069186155435662884062257473692284509516
+20849603980134001723930671666823555245252804609722
+53503534226472524250874054075591789781264330331690
diff --git a/project_euler/problem_13/sol2.py b/project_euler/problem_13/sol2.py
new file mode 100644
index 000000000000..c1416bcd6e7d
--- /dev/null
+++ b/project_euler/problem_13/sol2.py
@@ -0,0 +1,5 @@
+total = 0  # running total; named `total` so the builtin sum() is not shadowed
+with open("num.txt", "r") as f:  # one integer per line; path is relative to the CWD
+    for line in f:
+        total += int(line)  # int() ignores the trailing newline
+print(str(total)[:10])  # first ten digits of the grand total
diff --git a/project_euler/problem_16/sol2.py b/project_euler/problem_16/sol2.py
new file mode 100644
index 000000000000..cce3d2354bb1
--- /dev/null
+++ b/project_euler/problem_16/sol2.py
@@ -0,0 +1,6 @@
+from __future__ import print_function
+remaining, digit_total = 2**1000, 0  # Project Euler 16: sum the decimal digits of 2**1000
+while remaining:  # strip the least-significant digit until nothing is left
+    remaining, last_digit = divmod(remaining, 10)
+    digit_total += last_digit
+print(digit_total)