{"metadata":{"kernelspec":{"language":"python","display_name":"Python 3","name":"python3"},"language_info":{"name":"python","version":"3.7.9","mimetype":"text/x-python","codemirror_mode":{"name":"ipython","version":3},"pygments_lexer":"ipython3","nbconvert_exporter":"python","file_extension":".py"}},"nbformat_minor":4,"nbformat":4,"cells":[{"cell_type":"markdown","source":"## Decision Trees tutorial & improving hosting with skops 🌲\n\nIn this notebook I will walk you through decision trees and how to inspect them, and we will later improve model hosting using [skops](https://skops.readthedocs.io/en/stable/). First, we will load the dataset and split it into training and test sets. ","metadata":{}},{"cell_type":"code","source":"import pandas as pd\nfrom sklearn.datasets import load_breast_cancer\nfrom sklearn.model_selection import train_test_split","metadata":{"execution":{"iopub.status.busy":"2022-12-01T13:21:16.196274Z","iopub.execute_input":"2022-12-01T13:21:16.196592Z","iopub.status.idle":"2022-12-01T13:21:16.523656Z","shell.execute_reply.started":"2022-12-01T13:21:16.196567Z","shell.execute_reply":"2022-12-01T13:21:16.522085Z"},"trusted":true},"execution_count":3,"outputs":[]},{"cell_type":"code","source":"cancer = load_breast_cancer()\ndata = pd.DataFrame(cancer.data, columns=cancer.feature_names)\ndata.head()","metadata":{"execution":{"iopub.status.busy":"2022-12-01T13:21:16.668054Z","iopub.execute_input":"2022-12-01T13:21:16.668383Z","iopub.status.idle":"2022-12-01T13:21:16.719596Z","shell.execute_reply.started":"2022-12-01T13:21:16.668356Z","shell.execute_reply":"2022-12-01T13:21:16.717624Z"},"trusted":true},"execution_count":4,"outputs":[{"execution_count":4,"output_type":"execute_result","data":{"text/plain":" mean radius mean texture mean perimeter mean area mean smoothness \\\n0 17.99 10.38 122.80 1001.0 0.11840 \n1 20.57 17.77 132.90 1326.0 0.08474 \n2 19.69 21.25 130.00 1203.0 0.10960 \n3 11.42 20.38 77.58 386.1 0.14250 \n4 20.29 14.34 135.10 1297.0 0.10030 \n\n mean compactness mean concavity mean concave 
points mean symmetry \\\n0 0.27760 0.3001 0.14710 0.2419 \n1 0.07864 0.0869 0.07017 0.1812 \n2 0.15990 0.1974 0.12790 0.2069 \n3 0.28390 0.2414 0.10520 0.2597 \n4 0.13280 0.1980 0.10430 0.1809 \n\n mean fractal dimension ... worst radius worst texture worst perimeter \\\n0 0.07871 ... 25.38 17.33 184.60 \n1 0.05667 ... 24.99 23.41 158.80 \n2 0.05999 ... 23.57 25.53 152.50 \n3 0.09744 ... 14.91 26.50 98.87 \n4 0.05883 ... 22.54 16.67 152.20 \n\n worst area worst smoothness worst compactness worst concavity \\\n0 2019.0 0.1622 0.6656 0.7119 \n1 1956.0 0.1238 0.1866 0.2416 \n2 1709.0 0.1444 0.4245 0.4504 \n3 567.7 0.2098 0.8663 0.6869 \n4 1575.0 0.1374 0.2050 0.4000 \n\n worst concave points worst symmetry worst fractal dimension \n0 0.2654 0.4601 0.11890 \n1 0.1860 0.2750 0.08902 \n2 0.2430 0.3613 0.08758 \n3 0.2575 0.6638 0.17300 \n4 0.1625 0.2364 0.07678 \n\n[5 rows x 30 columns]","text/html":"
