{ "cells": [ { "cell_type": "markdown", "metadata": {}, "source": [ "# Pandas" ] }, { "cell_type": "code", "execution_count": 1, "metadata": {}, "outputs": [], "source": [ "import pandas as pd" ] }, { "cell_type": "code", "execution_count": 2, "metadata": {}, "outputs": [], "source": [ "pd_df = pd.read_json('flights.json.gz', lines=True)" ] }, { "cell_type": "code", "execution_count": 3, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", " | AvgTicketPrice | \n", "Cancelled | \n", "Carrier | \n", "Dest | \n", "DestAirportID | \n", "DestCityName | \n", "DestCountry | \n", "DestLocation | \n", "DestRegion | \n", "DestWeather | \n", "... | \n", "FlightTimeMin | \n", "Origin | \n", "OriginAirportID | \n", "OriginCityName | \n", "OriginCountry | \n", "OriginLocation | \n", "OriginRegion | \n", "OriginWeather | \n", "dayOfWeek | \n", "timestamp | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "841.265642 | \n", "False | \n", "Kibana Airlines | \n", "Sydney Kingsford Smith International Airport | \n", "SYD | \n", "Sydney | \n", "AU | \n", "{'lat': '-33.94609833', 'lon': '151.177002'} | \n", "SE-BD | \n", "Rain | \n", "... | \n", "1030.770416 | \n", "Frankfurt am Main Airport | \n", "FRA | \n", "Frankfurt am Main | \n", "DE | \n", "{'lat': '50.033333', 'lon': '8.570556'} | \n", "DE-HE | \n", "Sunny | \n", "0 | \n", "2018-01-01 00:00:00 | \n", "
1 | \n", "882.982662 | \n", "False | \n", "Logstash Airways | \n", "Venice Marco Polo Airport | \n", "VE05 | \n", "Venice | \n", "IT | \n", "{'lat': '45.505299', 'lon': '12.3519'} | \n", "IT-34 | \n", "Sunny | \n", "... | \n", "464.389481 | \n", "Cape Town International Airport | \n", "CPT | \n", "Cape Town | \n", "ZA | \n", "{'lat': '-33.96480179', 'lon': '18.60169983'} | \n", "SE-BD | \n", "Clear | \n", "0 | \n", "2018-01-01 18:27:00 | \n", "
2 | \n", "190.636904 | \n", "False | \n", "Logstash Airways | \n", "Venice Marco Polo Airport | \n", "VE05 | \n", "Venice | \n", "IT | \n", "{'lat': '45.505299', 'lon': '12.3519'} | \n", "IT-34 | \n", "Cloudy | \n", "... | \n", "0.000000 | \n", "Venice Marco Polo Airport | \n", "VE05 | \n", "Venice | \n", "IT | \n", "{'lat': '45.505299', 'lon': '12.3519'} | \n", "IT-34 | \n", "Rain | \n", "0 | \n", "2018-01-01 17:11:14 | \n", "
3 | \n", "181.694216 | \n", "True | \n", "Kibana Airlines | \n", "Treviso-Sant'Angelo Airport | \n", "TV01 | \n", "Treviso | \n", "IT | \n", "{'lat': '45.648399', 'lon': '12.1944'} | \n", "IT-34 | \n", "Clear | \n", "... | \n", "222.749059 | \n", "Naples International Airport | \n", "NA01 | \n", "Naples | \n", "IT | \n", "{'lat': '40.886002', 'lon': '14.2908'} | \n", "IT-72 | \n", "Thunder & Lightning | \n", "0 | \n", "2018-01-01 10:33:28 | \n", "
4 | \n", "730.041778 | \n", "False | \n", "Kibana Airlines | \n", "Xi'an Xianyang International Airport | \n", "XIY | \n", "Xi'an | \n", "CN | \n", "{'lat': '34.447102', 'lon': '108.751999'} | \n", "SE-BD | \n", "Clear | \n", "... | \n", "785.779071 | \n", "Licenciado Benito Juarez International Airport | \n", "AICM | \n", "Mexico City | \n", "MX | \n", "{'lat': '19.4363', 'lon': '-99.072098'} | \n", "MX-DIF | \n", "Damaging Wind | \n", "0 | \n", "2018-01-01 05:13:00 | \n", "
5 rows × 27 columns
\n", "\n", " | AvgTicketPrice | \n", "DistanceKilometers | \n", "DistanceMiles | \n", "FlightDelayMin | \n", "FlightTimeHour | \n", "FlightTimeMin | \n", "dayOfWeek | \n", "
---|---|---|---|---|---|---|---|
count | \n", "13059.000000 | \n", "13059.000000 | \n", "13059.000000 | \n", "13059.000000 | \n", "13059.000000 | \n", "13059.000000 | \n", "13059.000000 | \n", "
mean | \n", "628.253689 | \n", "7092.142455 | \n", "4406.853013 | \n", "47.335171 | \n", "8.518797 | \n", "511.127842 | \n", "2.835975 | \n", "
std | \n", "266.396861 | \n", "4578.438497 | \n", "2844.909787 | \n", "96.746711 | \n", "5.579233 | \n", "334.753952 | \n", "1.939439 | \n", "
min | \n", "100.020528 | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "
25% | \n", "409.893816 | \n", "2459.705673 | \n", "1528.390247 | \n", "0.000000 | \n", "4.205553 | \n", "252.333192 | \n", "1.000000 | \n", "
50% | \n", "640.556668 | \n", "7610.330866 | \n", "4728.840363 | \n", "0.000000 | \n", "8.384086 | \n", "503.045170 | \n", "3.000000 | \n", "
75% | \n", "842.185470 | \n", "9736.637600 | \n", "6050.066114 | \n", "15.000000 | \n", "12.006934 | \n", "720.416036 | \n", "4.000000 | \n", "
max | \n", "1199.729053 | \n", "19881.482315 | \n", "12353.780369 | \n", "360.000000 | \n", "31.715034 | \n", "1902.902032 | \n", "6.000000 | \n", "
\n", " | AvgTicketPrice | \n", "Cancelled | \n", "Carrier | \n", "Dest | \n", "DestAirportID | \n", "DestCityName | \n", "DestCountry | \n", "DestLocation | \n", "DestRegion | \n", "DestWeather | \n", "... | \n", "FlightTimeMin | \n", "Origin | \n", "OriginAirportID | \n", "OriginCityName | \n", "OriginCountry | \n", "OriginLocation | \n", "OriginRegion | \n", "OriginWeather | \n", "dayOfWeek | \n", "timestamp | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "841.265642 | \n", "False | \n", "Kibana Airlines | \n", "Sydney Kingsford Smith International Airport | \n", "SYD | \n", "Sydney | \n", "AU | \n", "{'lat': '-33.94609833', 'lon': '151.177002'} | \n", "SE-BD | \n", "Rain | \n", "... | \n", "1030.770416 | \n", "Frankfurt am Main Airport | \n", "FRA | \n", "Frankfurt am Main | \n", "DE | \n", "{'lat': '50.033333', 'lon': '8.570556'} | \n", "DE-HE | \n", "Sunny | \n", "0 | \n", "2019-05-27T00:00:00 | \n", "
1 | \n", "882.982662 | \n", "False | \n", "Logstash Airways | \n", "Venice Marco Polo Airport | \n", "VE05 | \n", "Venice | \n", "IT | \n", "{'lat': '45.505299', 'lon': '12.3519'} | \n", "IT-34 | \n", "Sunny | \n", "... | \n", "464.389481 | \n", "Cape Town International Airport | \n", "CPT | \n", "Cape Town | \n", "ZA | \n", "{'lat': '-33.96480179', 'lon': '18.60169983'} | \n", "SE-BD | \n", "Clear | \n", "0 | \n", "2019-05-27T18:27:00 | \n", "
2 | \n", "190.636904 | \n", "False | \n", "Logstash Airways | \n", "Venice Marco Polo Airport | \n", "VE05 | \n", "Venice | \n", "IT | \n", "{'lat': '45.505299', 'lon': '12.3519'} | \n", "IT-34 | \n", "Cloudy | \n", "... | \n", "0.000000 | \n", "Venice Marco Polo Airport | \n", "VE05 | \n", "Venice | \n", "IT | \n", "{'lat': '45.505299', 'lon': '12.3519'} | \n", "IT-34 | \n", "Rain | \n", "0 | \n", "2019-05-27T17:11:14 | \n", "
3 | \n", "181.694216 | \n", "True | \n", "Kibana Airlines | \n", "Treviso-Sant'Angelo Airport | \n", "TV01 | \n", "Treviso | \n", "IT | \n", "{'lat': '45.648399', 'lon': '12.1944'} | \n", "IT-34 | \n", "Clear | \n", "... | \n", "222.749059 | \n", "Naples International Airport | \n", "NA01 | \n", "Naples | \n", "IT | \n", "{'lat': '40.886002', 'lon': '14.2908'} | \n", "IT-72 | \n", "Thunder & Lightning | \n", "0 | \n", "2019-05-27T10:33:28 | \n", "
4 | \n", "730.041778 | \n", "False | \n", "Kibana Airlines | \n", "Xi'an Xianyang International Airport | \n", "XIY | \n", "Xi'an | \n", "CN | \n", "{'lat': '34.447102', 'lon': '108.751999'} | \n", "SE-BD | \n", "Clear | \n", "... | \n", "785.779071 | \n", "Licenciado Benito Juarez International Airport | \n", "AICM | \n", "Mexico City | \n", "MX | \n", "{'lat': '19.4363', 'lon': '-99.072098'} | \n", "MX-DIF | \n", "Damaging Wind | \n", "0 | \n", "2019-05-27T05:13:00 | \n", "
5 rows × 27 columns
\n", "\n", " | AvgTicketPrice | \n", "DistanceKilometers | \n", "DistanceMiles | \n", "FlightDelayMin | \n", "FlightTimeMin | \n", "dayOfWeek | \n", "
---|---|---|---|---|---|---|
count | \n", "13059.000000 | \n", "13059.000000 | \n", "13059.000000 | \n", "13059.000000 | \n", "13059.000000 | \n", "13059.000000 | \n", "
mean | \n", "628.253689 | \n", "7092.142457 | \n", "4406.853010 | \n", "47.335171 | \n", "511.127842 | \n", "2.835975 | \n", "
std | \n", "266.386661 | \n", "4578.263193 | \n", "2844.800855 | \n", "96.743006 | \n", "334.741135 | \n", "1.939365 | \n", "
min | \n", "100.020531 | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "
25% | \n", "410.008918 | \n", "2470.545974 | \n", "1535.126118 | \n", "0.000000 | \n", "252.064162 | \n", "1.000000 | \n", "
50% | \n", "640.387285 | \n", "7612.072403 | \n", "4729.922470 | \n", "0.000000 | \n", "503.148975 | \n", "3.000000 | \n", "
75% | \n", "842.259390 | \n", "9735.660463 | \n", "6049.583389 | \n", "15.000000 | \n", "720.505705 | \n", "4.068000 | \n", "
max | \n", "1199.729004 | \n", "19881.482422 | \n", "12353.780273 | \n", "360.000000 | \n", "1902.901978 | \n", "6.000000 | \n", "