{ "cells": [
 { "cell_type": "code", "execution_count": 23, "metadata": {}, "outputs": [], "source": [
  "import os\n",
  "from pathlib import Path\n",
  "\n",
  "import numpy as np\n",
  "import pandas as pd\n",
  "import matplotlib.pyplot as plt" ] },
 { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [
  "# Notebook configuration.\n",
  "# DATA_DIR: folder that contains airports.dat. Set the AIRPORTS_DATA_DIR environment\n",
  "# variable to point somewhere else; the fallback is the path this notebook originally used.\n",
  "DATA_DIR = Path(os.environ.get(\"AIRPORTS_DATA_DIR\", r\"G:\\X-Lab\\LearningFiles\\DataSci\\data\"))\n",
  "# SEED: fixed seed so the random demo Series below is identical on every run.\n",
  "SEED = 42" ] },
 { "cell_type": "code", "execution_count": 2, "metadata": {}, "outputs": [], "source": [
  "# Seed NumPy's global generator first so s1 is reproducible after a kernel restart.\n",
  "np.random.seed(SEED)\n",
  "# Demo Series of 10 standard-normal draws.\n",
  "s1 = pd.Series(np.random.randn(10))" ] },
 { "cell_type": "code", "execution_count": 4, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "0 -1.114610\n", "1 -0.016532\n", "2 -0.483466\n", "3 -0.181992\n", "4 -0.850196\n", "5 -0.141419\n", "6 0.775546\n", "7 -0.442790\n", "8 0.457040\n", "9 0.376961\n", "dtype: float64" ] }, "execution_count": 4, "metadata": {}, "output_type": "execute_result" } ], "source": [ "s1" ] },
 { "cell_type": "code", "execution_count": 5, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "pandas.core.series.Series" ] }, "execution_count": 5, "metadata": {}, "output_type": "execute_result" } ], "source": [ "type(s1)" ] },
 { "cell_type": "code", "execution_count": 7, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "\n", "RangeIndex: 7698 entries, 0 to 7697\n", "Data columns (total 14 columns):\n", "0 7698 non-null int64\n", "1 7698 non-null object\n", "2 7649 non-null object\n", "3 7698 non-null object\n", "4 7698 non-null object\n", "5 7698 non-null object\n", "6 7698 non-null float64\n", "7 7698 non-null float64\n", "8 7698 non-null int64\n", "9 7698 non-null object\n", "10 7698 non-null object\n", "11 7698 non-null object\n", "12 7698 non-null object\n", "13 7698 non-null object\n", "dtypes: float64(2), int64(2), object(10)\n", "memory usage: 842.1+ KB\n" ] } ], "source": [
  "# Load the airports table from DATA_DIR. header=None makes pandas number the columns\n",
  "# 0-13 (see the info() listing); they are given real names in the next cell.\n",
  "# NOTE(review): several columns hold the literal text \\N (visible in the tail() preview),\n",
  "# presumably a null marker -- confirm, then consider na_values=[r\"\\N\"] here.\n",
  "airports = pd.read_csv(DATA_DIR / \"airports.dat\", header=None)\n",
  "airports.info()" ] },
 { "cell_type": "code", "execution_count": 12, "metadata": {}, "outputs": [], "source": [
  "# Name the 14 positional columns loaded above (re-running this cell is harmless).\n",
  "airports.columns = [\n",
  "    \"airport_id\", \"name\", \"city\", \"country\", \"IATA\", \"ICAO\", \"lat\", \"lon\",\n",
  "    \"altitude\", \"timezone\", \"DST\", \"Tz database timezone\", \"type\", \"source\",\n",
  "]" ] },
 { "cell_type": "code", "execution_count": 13, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
airport_idnamecitycountryIATAICAOlatlonaltitudetimezoneDSTTz database timezonetypesource
768814101Rustaq AirportAl Masna'ahOmanMNHOORQ23.64055657.487500349\\N\\N\\NairportOurAirports
768914102Laguindingan AirportCagayan de Oro CityPhilippinesCGYRPMY8.612203124.456496190\\N\\N\\NairportOurAirports
769014103Kostomuksha AirportKostomukshaRussia\\NULPM64.61799630.687000681\\N\\N\\NairportOurAirports
769114104Privolzhskiy Air BaseAstrakhanRussia\\NXRAP46.39600047.893000-66\\N\\N\\NairportOurAirports
769214105Kubinka Air BaseKubinkaRussia\\NUUMB55.61169536.650002614\\N\\N\\NairportOurAirports
769314106Rogachyovo Air BaseBelayaRussia\\NULDA71.61669952.478298272\\N\\N\\NairportOurAirports
769414107Ulan-Ude East AirportUlan UdeRussia\\NXIUW51.849998107.7379991670\\N\\N\\NairportOurAirports
769514108Krechevitsy Air BaseNovgorodRussia\\NULLK58.62500031.38500085\\N\\N\\NairportOurAirports
769614109Desierto de Atacama AirportCopiapoChileCPOSCAT-27.261200-70.779198670\\N\\N\\NairportOurAirports
769714110Melitopol Air BaseMelitopolUkraine\\NUKDM46.88000135.3050000\\N\\N\\NairportOurAirports
\n", "
" ], "text/plain": [ " airport_id name city \\\n", "7688 14101 Rustaq Airport Al Masna'ah \n", "7689 14102 Laguindingan Airport Cagayan de Oro City \n", "7690 14103 Kostomuksha Airport Kostomuksha \n", "7691 14104 Privolzhskiy Air Base Astrakhan \n", "7692 14105 Kubinka Air Base Kubinka \n", "7693 14106 Rogachyovo Air Base Belaya \n", "7694 14107 Ulan-Ude East Airport Ulan Ude \n", "7695 14108 Krechevitsy Air Base Novgorod \n", "7696 14109 Desierto de Atacama Airport Copiapo \n", "7697 14110 Melitopol Air Base Melitopol \n", "\n", " country IATA ICAO lat lon altitude timezone DST \\\n", "7688 Oman MNH OORQ 23.640556 57.487500 349 \\N \\N \n", "7689 Philippines CGY RPMY 8.612203 124.456496 190 \\N \\N \n", "7690 Russia \\N ULPM 64.617996 30.687000 681 \\N \\N \n", "7691 Russia \\N XRAP 46.396000 47.893000 -66 \\N \\N \n", "7692 Russia \\N UUMB 55.611695 36.650002 614 \\N \\N \n", "7693 Russia \\N ULDA 71.616699 52.478298 272 \\N \\N \n", "7694 Russia \\N XIUW 51.849998 107.737999 1670 \\N \\N \n", "7695 Russia \\N ULLK 58.625000 31.385000 85 \\N \\N \n", "7696 Chile CPO SCAT -27.261200 -70.779198 670 \\N \\N \n", "7697 Ukraine \\N UKDM 46.880001 35.305000 0 \\N \\N \n", "\n", " Tz database timezone type source \n", "7688 \\N airport OurAirports \n", "7689 \\N airport OurAirports \n", "7690 \\N airport OurAirports \n", "7691 \\N airport OurAirports \n", "7692 \\N airport OurAirports \n", "7693 \\N airport OurAirports \n", "7694 \\N airport OurAirports \n", "7695 \\N airport OurAirports \n", "7696 \\N airport OurAirports \n", "7697 \\N airport OurAirports " ] }, "execution_count": 13, "metadata": {}, "output_type": "execute_result" } ], "source": [ "airports.tail(10)" ] },
 { "cell_type": "code", "execution_count": 22, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "237" ] }, "execution_count": 22, "metadata": {}, "output_type": "execute_result" } ], "source": [
  "# Goal of this section: find which country has the most airports.\n",
  "# First step: count how many distinct countries appear in the data. nunique() skips\n",
  "# missing values; the country column has none (info() reports 7698 non-null).\n",
  "airports[\"country\"].nunique()" ] },
 { "cell_type": "code", "execution_count":
25, "metadata": {}, "outputs": [], "source": [
  "# Group the airports by country. Despite its name this is a GroupBy object, not a\n",
  "# number; the per-country counts are computed from it in the next cell.\n",
  "max_airports_num = airports.groupby(\"country\")" ] },
 { "cell_type": "code", "execution_count": 35, "metadata": {}, "outputs": [], "source": [
  "# Ten countries with the most airports (rows per country), largest first.\n",
  "# GroupBy.size() gives the per-group row count directly, without routing a NumPy\n",
  "# callable through agg().\n",
  "max_airports_countries = (\n",
  "    max_airports_num[\"airport_id\"]\n",
  "    .size()\n",
  "    .sort_values(ascending=False)\n",
  "    .head(10)\n",
  ")" ] },
 { "cell_type": "code", "execution_count": 36, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "pandas.core.series.Series" ] }, "execution_count": 36, "metadata": {}, "output_type": "execute_result" } ], "source": [ "type(max_airports_countries)" ] },
 { "cell_type": "code", "execution_count": 38, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "country\n", "United States 1512\n", "Canada 430\n", "Australia 334\n", "Brazil 264\n", "Russia 264\n", "Germany 249\n", "China 241\n", "France 217\n", "United Kingdom 167\n", "India 148\n", "Name: airport_id, dtype: int64" ] }, "execution_count": 38, "metadata": {}, "output_type": "execute_result" } ], "source": [ "max_airports_countries" ] },
 { "cell_type": "code", "execution_count": 58, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "Text(0.5, 1.0, 'Those countries owns most airports')" ] }, "execution_count": 58, "metadata": {}, "output_type": "execute_result" }, { "data": { "image/png": "\n", "text/plain": [ "
" ] }, "metadata": {}, "output_type": "display_data" } ], "source": [
  "%matplotlib inline\n",
  "# Matplotlib 3.6 renamed the bundled seaborn styles to \"seaborn-v0_8-*\" and 3.8 removed\n",
  "# the old names, so use whichever spelling this installation ships.\n",
  "style_name = \"seaborn-v0_8-dark\" if \"seaborn-v0_8-dark\" in plt.style.available else \"seaborn-dark\"\n",
  "plt.style.use(style_name)\n",
  "\n",
  "# Bar chart of the top-10 Series: its index supplies the country labels and its\n",
  "# values the bar heights.\n",
  "fig, ax = plt.subplots()\n",
  "ax.bar(max_airports_countries.index, max_airports_countries.values, facecolor=\"lightskyblue\")\n",
  "# Rotate the country names so they do not overlap.\n",
  "ax.tick_params(axis=\"x\", labelrotation=45)\n",
  "ax.set_xlabel(\"Country\")\n",
  "ax.set_ylabel(\"Airport Number\")\n",
  "ax.set_title(\"Those countries owns most airports\")" ] },
 { "cell_type": "code", "execution_count": 62, "metadata": {}, "outputs": [], "source": [
  "# Group the airports by country again, this time for the altitude ranking below.\n",
  "min_alt_agg = airports.groupby(\"country\")" ] },
 { "cell_type": "code", "execution_count": 65, "metadata": {}, "outputs": [], "source": [
  "# Ten countries with the lowest mean airport altitude, lowest first.\n",
  "# The built-in .mean() replaces agg(np.mean): newer pandas deprecates passing NumPy\n",
  "# callables to agg(), and the result is the same.\n",
  "min_alt_countries = (\n",
  "    min_alt_agg[\"altitude\"]\n",
  "    .mean()\n",
  "    .sort_values(ascending=True)\n",
  "    .head(10)\n",
  ")" ] },
 { "cell_type": "code", "execution_count": 66, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "country\n", "Kiribati 4.611111\n", "Cayman Islands 6.333333\n", "Johnston Atoll 7.000000\n", "Maldives 8.090909\n", "Tuvalu 9.000000\n", "British Indian Ocean Territory 9.000000\n", "Turks and Caicos Islands 9.333333\n", "Seychelles 9.500000\n", "Marshall Islands 9.875000\n", "Cocos (Keeling) Islands 10.000000\n", "Name: altitude, dtype: float64" ] }, "execution_count": 66, "metadata": {}, "output_type": "execute_result" } ], "source": [ "min_alt_countries" ] } ], "metadata": { "kernelspec": { "display_name": "Python 3", "language": "python", "name": "python3" }, "language_info": { "codemirror_mode": { "name": "ipython", "version": 3 }, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.7.4" } }, "nbformat": 4, "nbformat_minor": 2 }