{ "cells": [ { "cell_type": "markdown", "source": [ "## (1) Import libraries" ], "metadata": {} }, { "cell_type": "code", "execution_count": 1, "source": [ "# All imports live in this one cell: standard library first, then third-party\n", "from importlib.metadata import version\n", "\n", "import pandas as pd\n", "from pycaret.datasets import get_data\n", "\n", "import sweetviz as sv" ], "outputs": [], "metadata": {} }, { "cell_type": "code", "execution_count": 2, "source": [ "# Record version of key libraries (provenance for anyone re-running this notebook)\n", "print(f\"sweetviz=={version('sweetviz')}\")" ], "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "sweetviz==2.1.3\n" ] } ], "metadata": {} }, { "cell_type": "markdown", "source": [ "## (2) Get data" ], "metadata": {} }, { "cell_type": "code", "execution_count": 3, "source": [ "# Select a pre-packaged dataset for testing\n", "df = get_data('diabetes', verbose=True)" ], "outputs": [ { "output_type": "display_data", "data": { "text/plain": [ " Number of times pregnant \\\n", "0 6 \n", "1 1 \n", "2 8 \n", "3 1 \n", "4 0 \n", "\n", " Plasma glucose concentration a 2 hours in an oral glucose tolerance test \\\n", "0 148 \n", "1 85 \n", "2 183 \n", "3 89 \n", "4 137 \n", "\n", " Diastolic blood pressure (mm Hg) Triceps skin fold thickness (mm) \\\n", "0 72 35 \n", "1 66 29 \n", "2 64 0 \n", "3 66 23 \n", "4 40 35 \n", "\n", " 2-Hour serum insulin (mu U/ml) \\\n", "0 0 \n", "1 0 \n", "2 0 \n", "3 94 \n", "4 168 \n", "\n", " Body mass index (weight in kg/(height in m)^2) Diabetes pedigree function \\\n", "0 33.6 0.627 \n", "1 26.6 0.351 \n", "2 23.3 0.672 \n", "3 28.1 0.167 \n", "4 43.1 2.288 \n", "\n", " Age (years) Class variable \n", "0 50 1 \n", "1 31 0 \n", "2 32 1 \n", "3 21 0 \n", "4 33 1 " ], "text/html": [ "
\n", " | Number of times pregnant | \n", "Plasma glucose concentration a 2 hours in an oral glucose tolerance test | \n", "Diastolic blood pressure (mm Hg) | \n", "Triceps skin fold thickness (mm) | \n", "2-Hour serum insulin (mu U/ml) | \n", "Body mass index (weight in kg/(height in m)^2) | \n", "Diabetes pedigree function | \n", "Age (years) | \n", "Class variable | \n", "
---|---|---|---|---|---|---|---|---|---|
0 | \n", "6 | \n", "148 | \n", "72 | \n", "35 | \n", "0 | \n", "33.6 | \n", "0.627 | \n", "50 | \n", "1 | \n", "
1 | \n", "1 | \n", "85 | \n", "66 | \n", "29 | \n", "0 | \n", "26.6 | \n", "0.351 | \n", "31 | \n", "0 | \n", "
2 | \n", "8 | \n", "183 | \n", "64 | \n", "0 | \n", "0 | \n", "23.3 | \n", "0.672 | \n", "32 | \n", "1 | \n", "
3 | \n", "1 | \n", "89 | \n", "66 | \n", "23 | \n", "94 | \n", "28.1 | \n", "0.167 | \n", "21 | \n", "0 | \n", "
4 | \n", "0 | \n", "137 | \n", "40 | \n", "35 | \n", "168 | \n", "43.1 | \n", "2.288 | \n", "33 | \n", "1 | \n", "