|
55 | 55 | },
|
56 | 56 | {
|
57 | 57 | "cell_type": "code",
|
58 |
| - "execution_count": null, |
| 58 | + "execution_count": 2, |
59 | 59 | "id": "e633540e",
|
60 | 60 | "metadata": {},
|
61 | 61 | "outputs": [],
|
|
72 | 72 | },
|
73 | 73 | {
|
74 | 74 | "cell_type": "code",
|
75 |
| - "execution_count": null, |
| 75 | + "execution_count": 3, |
76 | 76 | "id": "775b2b8f",
|
77 | 77 | "metadata": {},
|
78 | 78 | "outputs": [],
|
|
83 | 83 | },
|
84 | 84 | {
|
85 | 85 | "cell_type": "code",
|
86 |
| - "execution_count": null, |
| 86 | + "execution_count": 4, |
87 | 87 | "id": "50e97690",
|
88 | 88 | "metadata": {},
|
89 | 89 | "outputs": [],
|
|
104 | 104 | },
|
105 | 105 | {
|
106 | 106 | "cell_type": "code",
|
107 |
| - "execution_count": null, |
| 107 | + "execution_count": 5, |
108 | 108 | "id": "8ffae7d8",
|
109 | 109 | "metadata": {},
|
110 |
| - "outputs": [], |
| 110 | + "outputs": [ |
| 111 | + { |
| 112 | + "data": { |
| 113 | + "text/plain": [ |
| 114 | + "Gender Exited\n", |
| 115 | + "Female 0 20\n", |
| 116 | + " 1 80\n", |
| 117 | + "Male 0 3346\n", |
| 118 | + " 1 654\n", |
| 119 | + "Name: Exited, dtype: int64" |
| 120 | + ] |
| 121 | + }, |
| 122 | + "execution_count": 5, |
| 123 | + "metadata": {}, |
| 124 | + "output_type": "execute_result" |
| 125 | + } |
| 126 | + ], |
111 | 127 | "source": [
|
112 | 128 | "training_set.groupby([\"Gender\", \"Exited\"])[\"Exited\"].count()"
|
113 | 129 | ]
|
|
132 | 148 | },
|
133 | 149 | {
|
134 | 150 | "cell_type": "code",
|
135 |
| - "execution_count": null, |
| 151 | + "execution_count": 6, |
136 | 152 | "id": "b562a655",
|
137 | 153 | "metadata": {},
|
138 | 154 | "outputs": [],
|
|
142 | 158 | },
|
143 | 159 | {
|
144 | 160 | "cell_type": "code",
|
145 |
| - "execution_count": null, |
| 161 | + "execution_count": 7, |
146 | 162 | "id": "080f075b",
|
147 | 163 | "metadata": {},
|
148 |
| - "outputs": [], |
| 164 | + "outputs": [ |
| 165 | + { |
| 166 | + "data": { |
| 167 | + "text/html": [ |
| 168 | + "<div>\n", |
| 169 | + "<style scoped>\n", |
| 170 | + " .dataframe tbody tr th:only-of-type {\n", |
| 171 | + " vertical-align: middle;\n", |
| 172 | + " }\n", |
| 173 | + "\n", |
| 174 | + " .dataframe tbody tr th {\n", |
| 175 | + " vertical-align: top;\n", |
| 176 | + " }\n", |
| 177 | + "\n", |
| 178 | + " .dataframe thead th {\n", |
| 179 | + " text-align: right;\n", |
| 180 | + " }\n", |
| 181 | + "</style>\n", |
| 182 | + "<table border=\"1\" class=\"dataframe\">\n", |
| 183 | + " <thead>\n", |
| 184 | + " <tr style=\"text-align: right;\">\n", |
| 185 | + " <th></th>\n", |
| 186 | + " <th>RowNumber</th>\n", |
| 187 | + " <th>CustomerId</th>\n", |
| 188 | + " <th>Surname</th>\n", |
| 189 | + " <th>CreditScore</th>\n", |
| 190 | + " <th>Geography</th>\n", |
| 191 | + " <th>Gender</th>\n", |
| 192 | + " <th>Age</th>\n", |
| 193 | + " <th>Tenure</th>\n", |
| 194 | + " <th>Balance</th>\n", |
| 195 | + " <th>NumOfProducts</th>\n", |
| 196 | + " <th>HasCrCard</th>\n", |
| 197 | + " <th>IsActiveMember</th>\n", |
| 198 | + " <th>EstimatedSalary</th>\n", |
| 199 | + " <th>Exited</th>\n", |
| 200 | + " </tr>\n", |
| 201 | + " </thead>\n", |
| 202 | + " <tbody>\n", |
| 203 | + " <tr>\n", |
| 204 | + " <th>0</th>\n", |
| 205 | + " <td>8274</td>\n", |
| 206 | + " <td>15709643</td>\n", |
| 207 | + " <td>Gray</td>\n", |
| 208 | + " <td>675</td>\n", |
| 209 | + " <td>France</td>\n", |
| 210 | + " <td>Male</td>\n", |
| 211 | + " <td>32</td>\n", |
| 212 | + " <td>1</td>\n", |
| 213 | + " <td>0.00</td>\n", |
| 214 | + " <td>3</td>\n", |
| 215 | + " <td>1</td>\n", |
| 216 | + " <td>0</td>\n", |
| 217 | + " <td>85901.09</td>\n", |
| 218 | + " <td>0</td>\n", |
| 219 | + " </tr>\n", |
| 220 | + " <tr>\n", |
| 221 | + " <th>1</th>\n", |
| 222 | + " <td>8277</td>\n", |
| 223 | + " <td>15775131</td>\n", |
| 224 | + " <td>Bartlett</td>\n", |
| 225 | + " <td>580</td>\n", |
| 226 | + " <td>Spain</td>\n", |
| 227 | + " <td>Male</td>\n", |
| 228 | + " <td>32</td>\n", |
| 229 | + " <td>9</td>\n", |
| 230 | + " <td>142188.20</td>\n", |
| 231 | + " <td>2</td>\n", |
| 232 | + " <td>0</td>\n", |
| 233 | + " <td>1</td>\n", |
| 234 | + " <td>128028.60</td>\n", |
| 235 | + " <td>0</td>\n", |
| 236 | + " </tr>\n", |
| 237 | + " <tr>\n", |
| 238 | + " <th>2</th>\n", |
| 239 | + " <td>8281</td>\n", |
| 240 | + " <td>15745716</td>\n", |
| 241 | + " <td>McGregor</td>\n", |
| 242 | + " <td>706</td>\n", |
| 243 | + " <td>Spain</td>\n", |
| 244 | + " <td>Male</td>\n", |
| 245 | + " <td>53</td>\n", |
| 246 | + " <td>7</td>\n", |
| 247 | + " <td>0.00</td>\n", |
| 248 | + " <td>2</td>\n", |
| 249 | + " <td>0</td>\n", |
| 250 | + " <td>1</td>\n", |
| 251 | + " <td>117939.17</td>\n", |
| 252 | + " <td>0</td>\n", |
| 253 | + " </tr>\n", |
| 254 | + " <tr>\n", |
| 255 | + " <th>3</th>\n", |
| 256 | + " <td>8282</td>\n", |
| 257 | + " <td>15598485</td>\n", |
| 258 | + " <td>Pinto</td>\n", |
| 259 | + " <td>567</td>\n", |
| 260 | + " <td>Spain</td>\n", |
| 261 | + " <td>Male</td>\n", |
| 262 | + " <td>40</td>\n", |
| 263 | + " <td>8</td>\n", |
| 264 | + " <td>28649.64</td>\n", |
| 265 | + " <td>1</td>\n", |
| 266 | + " <td>1</td>\n", |
| 267 | + " <td>1</td>\n", |
| 268 | + " <td>95140.62</td>\n", |
| 269 | + " <td>0</td>\n", |
| 270 | + " </tr>\n", |
| 271 | + " <tr>\n", |
| 272 | + " <th>4</th>\n", |
| 273 | + " <td>8284</td>\n", |
| 274 | + " <td>15754569</td>\n", |
| 275 | + " <td>Pagnotto</td>\n", |
| 276 | + " <td>664</td>\n", |
| 277 | + " <td>France</td>\n", |
| 278 | + " <td>Male</td>\n", |
| 279 | + " <td>57</td>\n", |
| 280 | + " <td>1</td>\n", |
| 281 | + " <td>0.00</td>\n", |
| 282 | + " <td>2</td>\n", |
| 283 | + " <td>1</td>\n", |
| 284 | + " <td>1</td>\n", |
| 285 | + " <td>56562.57</td>\n", |
| 286 | + " <td>0</td>\n", |
| 287 | + " </tr>\n", |
| 288 | + " </tbody>\n", |
| 289 | + "</table>\n", |
| 290 | + "</div>" |
| 291 | + ], |
| 292 | + "text/plain": [ |
| 293 | + " RowNumber CustomerId Surname CreditScore Geography Gender Age Tenure \\\n", |
| 294 | + "0 8274 15709643 Gray 675 France Male 32 1 \n", |
| 295 | + "1 8277 15775131 Bartlett 580 Spain Male 32 9 \n", |
| 296 | + "2 8281 15745716 McGregor 706 Spain Male 53 7 \n", |
| 297 | + "3 8282 15598485 Pinto 567 Spain Male 40 8 \n", |
| 298 | + "4 8284 15754569 Pagnotto 664 France Male 57 1 \n", |
| 299 | + "\n", |
| 300 | + " Balance NumOfProducts HasCrCard IsActiveMember EstimatedSalary \\\n", |
| 301 | + "0 0.00 3 1 0 85901.09 \n", |
| 302 | + "1 142188.20 2 0 1 128028.60 \n", |
| 303 | + "2 0.00 2 0 1 117939.17 \n", |
| 304 | + "3 28649.64 1 1 1 95140.62 \n", |
| 305 | + "4 0.00 2 1 1 56562.57 \n", |
| 306 | + "\n", |
| 307 | + " Exited \n", |
| 308 | + "0 0 \n", |
| 309 | + "1 0 \n", |
| 310 | + "2 0 \n", |
| 311 | + "3 0 \n", |
| 312 | + "4 0 " |
| 313 | + ] |
| 314 | + }, |
| 315 | + "execution_count": 7, |
| 316 | + "metadata": {}, |
| 317 | + "output_type": "execute_result" |
| 318 | + } |
| 319 | + ], |
149 | 320 | "source": [
|
150 | 321 | "new_prod_data = pd.read_csv(NEW_PROD_DATA_URL)\n",
|
151 | 322 | "new_prod_data.head()"
|
|
161 | 332 | },
|
162 | 333 | {
|
163 | 334 | "cell_type": "code",
|
164 |
| - "execution_count": null, |
| 335 | + "execution_count": 8, |
165 | 336 | "id": "e17d8121",
|
166 | 337 | "metadata": {},
|
167 | 338 | "outputs": [],
|
|
171 | 342 | },
|
172 | 343 | {
|
173 | 344 | "cell_type": "code",
|
174 |
| - "execution_count": null, |
| 345 | + "execution_count": 9, |
175 | 346 | "id": "8cfdb549",
|
176 | 347 | "metadata": {},
|
177 | 348 | "outputs": [],
|
|
322 | 493 | " return model.predict_proba(encoded_df.to_numpy())"
|
323 | 494 | ]
|
324 | 495 | },
|
| 496 | + { |
| 497 | + "cell_type": "code", |
| 498 | + "execution_count": null, |
| 499 | + "id": "c7739e4e", |
| 500 | + "metadata": {}, |
| 501 | + "outputs": [], |
| 502 | + "source": [ |
| 503 | + "# installing the Unbox Python API\n", |
| 504 | + "!pip install unboxapi" |
| 505 | + ] |
| 506 | + }, |
325 | 507 | {
|
326 | 508 | "cell_type": "code",
|
327 | 509 | "execution_count": null,
|
|
0 commit comments