import contextlib
import os
import pickle

import matplotlib.pyplot as plt
import numpy as np
import optuna
import pandas as pd
import psycopg2 as pg
import xgboost as xgb
from sklearn.feature_selection import SequentialFeatureSelector
from sklearn.metrics import confusion_matrix, matthews_corrcoef, accuracy_score
from sklearn.model_selection import train_test_split

# Set to True to re-download the table from PostgreSQL and refresh the local
# pickle cache; leave False to work from the cached copy.
reload = False

# Local cache file: written when `reload` is True, read otherwise.
CACHE_PATH = 'data.pkl'


def norm(x):
    """Collapse the single-element sequence [''] to an empty list.

    Parameters
    ----------
    x : sequence
        Anything supporting len() and indexing (e.g. the result of str.split).

    Returns
    -------
    list or the original object
        [] when x has exactly one element and that element is the empty
        string; otherwise x itself, unchanged.
    """
    if len(x) == 1 and x[0] == '':
        return []
    return x


if reload:
    # Connection settings come from the environment so that no secret lives in
    # the notebook. The non-secret settings fall back to the values this
    # notebook has always used; the password has no fallback and must be
    # supplied through PGPASSWORD (KeyError if it is missing).
    # NOTE(review): the password was previously committed in this cell and
    # should be rotated.
    connection = pg.connect(
        dbname=os.environ.get('PGDATABASE', 'safeidx'),
        user=os.environ.get('PGUSER', 'fbk_mpba'),
        host=os.environ.get('PGHOST', '172.104.247.67'),
        port=os.environ.get('PGPORT', '5432'),
        password=os.environ['PGPASSWORD'],
    )
    # closing() guarantees the connection is released even if the query fails;
    # psycopg2's own `with connection:` only ends the transaction.
    with contextlib.closing(connection) as conn:
        df = pd.read_sql('select * from data_safeidx', con=conn)
    # Cache the freshly downloaded frame so later runs can skip the database.
    with open(CACHE_PATH, 'wb') as f:
        pickle.dump(df, f)
else:
    # pickle.load can execute arbitrary code embedded in the file: only load a
    # cache that was produced by the `reload` branch above.
    with open(CACHE_PATH, 'rb') as f:
        df = pickle.load(f)
    # Alternative CSV source, kept disabled (the only place norm() is used):
    #df = pd.read_csv('pid.csv').drop(columns='Unnamed: 0')
    #df.evacuation_vehicles = df.evacuation_vehicles.apply(lambda x:norm(x.replace(' ','').replace('[','').replace(']','').split(',')))
| \n", " | difficulty | \n", "cause | \n", "town | \n", "province | \n", "gender | \n", "equipment | \n", "helmet | \n", "destination | \n", "diagnosis | \n", "india | \n", "age | \n", "country | \n", "injury_side | \n", "injury_general_location | \n", "evacuation_vehicles | \n", "
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | \n", "novice | \n", "fall_alone | \n", "SIKLOS | \n", "\n", " | F | \n", "ski | \n", "None | \n", "hospital_emergency_room | \n", "distortion | \n", "None | \n", "32.0 | \n", "Ungheria | \n", "L | \n", "lower_limbs | \n", "[akja] | \n", "
| 1 | \n", "advanced | \n", "fall_alone | \n", "MALMO | \n", "\n", " | M | \n", "ski | \n", "None | \n", "hospital_emergency_room | \n", "bruise | \n", "None | \n", "32.0 | \n", "Svezia | \n", "R | \n", "skull_or_face | \n", "[akja] | \n", "
| 2 | \n", "advanced | \n", "fall_alone | \n", "CALDARO | \n", "BZ | \n", "F | \n", "ski | \n", "None | \n", "domicile | \n", "other | \n", "None | \n", "12.0 | \n", "Italia | \n", "R | \n", "None | \n", "[snowmobile] | \n", "
| 3 | \n", "advanced | \n", "collision_person | \n", "LINZ | \n", "\n", " | M | \n", "ski | \n", "None | \n", "hospital_emergency_room | \n", "bruise | \n", "None | \n", "58.0 | \n", "Austria | \n", "R | \n", "lower_limbs | \n", "[snowmobile] | \n", "
| 4 | \n", "advanced | \n", "collision_person | \n", "RUSAVA | \n", "\n", " | M | \n", "ski | \n", "None | \n", "other | \n", "bruise | \n", "None | \n", "25.0 | \n", "Repubblica Ceca | \n", "L | \n", "lower_limbs | \n", "[other] | \n", "