{ "cells": [ { "cell_type": "markdown", "metadata": {}, "source": [ "# Lab 5 - Python Code" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "Authors: Valerie Dube, Erzo Garay, Juan Marcos Guerrero and Matias Villalba" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "## Replication and Data analysis" ] }, { "cell_type": "code", "execution_count": 45, "metadata": {}, "outputs": [], "source": [ "# Libraries\n", "import numpy as np\n", "import pandas as pd\n", "import seaborn as sns\n", "import matplotlib.pyplot as plt\n", "import statsmodels.api as sm\n", "import statsmodels.formula.api as smf\n", "import hdmpy as hdm\n", "\n", "from sklearn.base import BaseEstimator\n", "from sklearn.pipeline import make_pipeline\n", "from sklearn.preprocessing import StandardScaler\n", "from sklearn.model_selection import KFold, cross_val_predict\n", "from sklearn.linear_model import LassoCV, Lasso\n", "from sklearn.tree import DecisionTreeRegressor\n", "from sklearn.ensemble import GradientBoostingRegressor, RandomForestRegressor" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "### 1. Descriptives" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "#### 1.1. Descriptive table" ] }, { "cell_type": "code", "execution_count": 31, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", " | y | \n", "w | \n", "gender_female | \n", "gender_male | \n", "gender_transgender | \n", "ethnicgrp_asian | \n", "ethnicgrp_black | \n", "ethnicgrp_mixed_multiple | \n", "ethnicgrp_other | \n", "ethnicgrp_white | \n", "partners1 | \n", "postlaunch | \n", "msm | \n", "age | \n", "imd_decile | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "1 | \n", "1 | \n", "0 | \n", "1 | \n", "0 | \n", "0 | \n", "0 | \n", "1 | \n", "0 | \n", "0 | \n", "0 | \n", "1 | \n", "0 | \n", "27 | \n", "5 | \n", "
1 | \n", "0 | \n", "0 | \n", "0 | \n", "1 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "1 | \n", "0 | \n", "0 | \n", "0 | \n", "19 | \n", "6 | \n", "
2 | \n", "0 | \n", "1 | \n", "0 | \n", "1 | \n", "0 | \n", "0 | \n", "1 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "1 | \n", "0 | \n", "26 | \n", "4 | \n", "
3 | \n", "0 | \n", "0 | \n", "1 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "1 | \n", "1 | \n", "0 | \n", "0 | \n", "20 | \n", "2 | \n", "
4 | \n", "1 | \n", "1 | \n", "1 | \n", "0 | \n", "0 | \n", "1 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "1 | \n", "0 | \n", "24 | \n", "3 | \n", "