From a8ce91f7901f9f91dab1fdaa09903208de466535 Mon Sep 17 00:00:00 2001
From: zhouwei713 <736552883@qq.com>
Date: Wed, 13 Nov 2019 15:07:23 +0800
Subject: [PATCH] add gdp regression code
---
.idea/workspace.xml | 20 +-
.../GDP_analyse-checkpoint.ipynb | 7133 +++++++++++++++++
.../Untitled-checkpoint.ipynb | 6 +
...PI_NY.GDP.MKTP.CD_DS2_zh_csv_v2_424460.zip | Bin 0 -> 115590 bytes
GDP_analyse/Country_data.csv | 267 +
GDP_analyse/GDP_analyse.ipynb | 7133 +++++++++++++++++
GDP_analyse/GDP_data.csv | 265 +
...PI_NY.GDP.MKTP.CD_DS2_zh_csv_v2_424460.csv | 2 +
GDP_analyse/Untitled.ipynb | 6 +
GDP_analyse/test.txt | 3 +
GDP_regression/Country_data.csv | 267 +
GDP_regression/GDP_data.csv | 265 +
GDP_regression/main.py | 120 +
football/yingchao/analyse.py | 6 +-
14 files changed, 15479 insertions(+), 14 deletions(-)
create mode 100644 GDP_analyse/.ipynb_checkpoints/GDP_analyse-checkpoint.ipynb
create mode 100644 GDP_analyse/.ipynb_checkpoints/Untitled-checkpoint.ipynb
create mode 100644 GDP_analyse/API_NY.GDP.MKTP.CD_DS2_zh_csv_v2_424460.zip
create mode 100644 GDP_analyse/Country_data.csv
create mode 100644 GDP_analyse/GDP_analyse.ipynb
create mode 100644 GDP_analyse/GDP_data.csv
create mode 100644 GDP_analyse/Metadata_Indicator_API_NY.GDP.MKTP.CD_DS2_zh_csv_v2_424460.csv
create mode 100644 GDP_analyse/Untitled.ipynb
create mode 100644 GDP_analyse/test.txt
create mode 100644 GDP_regression/Country_data.csv
create mode 100644 GDP_regression/GDP_data.csv
create mode 100644 GDP_regression/main.py
diff --git a/.idea/workspace.xml b/.idea/workspace.xml
index 6d59da9..48cc8db 100644
--- a/.idea/workspace.xml
+++ b/.idea/workspace.xml
@@ -3,10 +3,7 @@
-
-
-
-
+
@@ -73,19 +70,19 @@
-
+
-
-
-
-
+
-
+
+
+
+
@@ -275,7 +272,8 @@
-
+
+
diff --git a/GDP_analyse/.ipynb_checkpoints/GDP_analyse-checkpoint.ipynb b/GDP_analyse/.ipynb_checkpoints/GDP_analyse-checkpoint.ipynb
new file mode 100644
index 0000000..7b87c81
--- /dev/null
+++ b/GDP_analyse/.ipynb_checkpoints/GDP_analyse-checkpoint.ipynb
@@ -0,0 +1,7133 @@
+{
+ "cells": [
+ {
+ "cell_type": "code",
+ "execution_count": 1,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "import pandas as pd"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 2,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "from pyecharts import options as opts\n",
+ "from pyecharts.charts import Pie, Bar"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 3,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "gdp = pd.read_csv('GDP_data.csv')"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 4,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "country = pd.read_csv('Country_data.csv')"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 5,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "country_data = country.dropna(subset=['Income_Group'])"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 54,
+ "metadata": {
+ "collapsed": true
+ },
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "
\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " Country Name | \n",
+ " Country Code | \n",
+ " Region | \n",
+ " Income_Group | \n",
+ " Unnamed: 4 | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " 0 | \n",
+ " 阿鲁巴 | \n",
+ " ABW | \n",
+ " NaN | \n",
+ " 高收入国家 | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 1 | \n",
+ " 阿富汗 | \n",
+ " AFG | \n",
+ " 南亚 | \n",
+ " 低收入国家 | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 2 | \n",
+ " 安哥拉 | \n",
+ " AGO | \n",
+ " 撒哈拉以南非洲地区(不包括高收入) | \n",
+ " 中低等收入国家 | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 3 | \n",
+ " 阿尔巴尼亚 | \n",
+ " ALB | \n",
+ " 欧洲与中亚地区(不包括高收入) | \n",
+ " 中高等收入国家 | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 4 | \n",
+ " 安道尔共和国 | \n",
+ " AND | \n",
+ " NaN | \n",
+ " 高收入国家 | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ "
\n",
+ " \n",
+ " 259 | \n",
+ " 科索沃 | \n",
+ " XKX | \n",
+ " 欧洲与中亚地区(不包括高收入) | \n",
+ " 中高等收入国家 | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 260 | \n",
+ " 也门共和国 | \n",
+ " YEM | \n",
+ " 中东与北非地区(不包括高收入) | \n",
+ " 低收入国家 | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 261 | \n",
+ " 南非 | \n",
+ " ZAF | \n",
+ " 撒哈拉以南非洲地区(不包括高收入) | \n",
+ " 中高等收入国家 | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 262 | \n",
+ " 赞比亚 | \n",
+ " ZMB | \n",
+ " 撒哈拉以南非洲地区(不包括高收入) | \n",
+ " 中低等收入国家 | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 263 | \n",
+ " 津巴布韦 | \n",
+ " ZWE | \n",
+ " 撒哈拉以南非洲地区(不包括高收入) | \n",
+ " 中低等收入国家 | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
217 rows × 5 columns
\n",
+ "
"
+ ],
+ "text/plain": [
+ " Country Name Country Code Region Income_Group Unnamed: 4\n",
+ "0 阿鲁巴 ABW NaN 高收入国家 NaN\n",
+ "1 阿富汗 AFG 南亚 低收入国家 NaN\n",
+ "2 安哥拉 AGO 撒哈拉以南非洲地区(不包括高收入) 中低等收入国家 NaN\n",
+ "3 阿尔巴尼亚 ALB 欧洲与中亚地区(不包括高收入) 中高等收入国家 NaN\n",
+ "4 安道尔共和国 AND NaN 高收入国家 NaN\n",
+ ".. ... ... ... ... ...\n",
+ "259 科索沃 XKX 欧洲与中亚地区(不包括高收入) 中高等收入国家 NaN\n",
+ "260 也门共和国 YEM 中东与北非地区(不包括高收入) 低收入国家 NaN\n",
+ "261 南非 ZAF 撒哈拉以南非洲地区(不包括高收入) 中高等收入国家 NaN\n",
+ "262 赞比亚 ZMB 撒哈拉以南非洲地区(不包括高收入) 中低等收入国家 NaN\n",
+ "263 津巴布韦 ZWE 撒哈拉以南非洲地区(不包括高收入) 中低等收入国家 NaN\n",
+ "\n",
+ "[217 rows x 5 columns]"
+ ]
+ },
+ "execution_count": 54,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "country_data"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 73,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "rank_cuntry = country_data.groupby('Income_Group').size()"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 72,
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "[47, 60, 31, 79]"
+ ]
+ },
+ "execution_count": 72,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "country_data.groupby('Income_Group').size().values.tolist()"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 81,
+ "metadata": {
+ "scrolled": true
+ },
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ " \n",
+ "\n",
+ "\n",
+ "\n"
+ ],
+ "text/plain": [
+ ""
+ ]
+ },
+ "execution_count": 81,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "# 各个收入等级分布\n",
+ "pie = Pie()\n",
+ "pie.add(\"\", [list(z) for z in zip(rank_cuntry.index.tolist(), rank_cuntry.values.tolist())],\n",
+ " radius=[\"30%\", \"75%\"], center=[\"45%\", \"50%\"], rosetype=\"radius\",\n",
+ " )\n",
+ "pie.set_global_opts(title_opts=opts.TitleOpts(title=\"各个收入等级分布\"))\n",
+ "pie.set_series_opts(label_opts=opts.LabelOpts(formatter=\"{b}, {d}%\"))\n",
+ "pie.render_notebook()"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 89,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "high = country_data[country_data['Income_Group'] == '高收入国家']"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 94,
+ "metadata": {
+ "scrolled": true
+ },
+ "outputs": [],
+ "source": [
+ "# 高收入国家2018年的GDP\n",
+ "high_gdp = pd.merge(high, gdp, how='inner')\n",
+ "high_gdp['2018'] = high_gdp['2018'].apply(lambda x: x/1000000000000)\n",
+ "high_gdp_top10 = high_gdp[['Country Name', 'Country Code', '2018']].sort_values(by='2018', ascending=False)[:10]"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 101,
+ "metadata": {
+ "scrolled": true
+ },
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ " \n",
+ "\n",
+ "\n",
+ "\n"
+ ],
+ "text/plain": [
+ ""
+ ]
+ },
+ "execution_count": 101,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "bar = Bar()\n",
+ "bar.add_xaxis(high_gdp_top10['Country Name'].values.tolist())\n",
+ "bar.add_yaxis(\"\", high_gdp_top10['2018'].values.tolist())\n",
+ "bar.reversal_axis()\n",
+ "bar.set_series_opts(label_opts=opts.LabelOpts(position=\"right\"))\n",
+ "bar.set_global_opts(title_opts=opts.TitleOpts(title=\"高收入国家GDP Top10\", subtitle=\"\"),\n",
+ " xaxis_opts=opts.AxisOpts(\n",
+ " axislabel_opts=opts.LabelOpts(formatter=\"{value} /万亿\")\n",
+ " ),)\n",
+ "bar.render_notebook()"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 113,
+ "metadata": {
+ "scrolled": true
+ },
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ " \n",
+ "\n",
+ "\n",
+ "\n"
+ ],
+ "text/plain": [
+ ""
+ ]
+ },
+ "execution_count": 113,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "high_gdp_top20 = high_gdp[['Country Name', 'Country Code', '2018']].sort_values(by='2018', ascending=False)[:20]\n",
+ "\n",
+ "bar = Bar()\n",
+ "bar.add_xaxis(high_gdp_top20['Country Name'].values.tolist())\n",
+ "bar.add_yaxis(\"\", high_gdp_top20['2018'].values.tolist())\n",
+ "bar.reversal_axis()\n",
+ "bar.set_series_opts(label_opts=opts.LabelOpts(position=\"right\"))\n",
+ "bar.set_global_opts(title_opts=opts.TitleOpts(title=\"高收入国家GDP Top20\", subtitle=\"\"),\n",
+ " xaxis_opts=opts.AxisOpts(\n",
+ " axislabel_opts=opts.LabelOpts(formatter=\"{value} /万亿\")\n",
+ " ),)\n",
+ "bar.render_notebook()"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 119,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "# 中高等收入国家\n",
+ "mid_high = country_data[country_data['Income_Group'] == '中高等收入国家']\n",
+ "mid_high_gdp = pd.merge(mid_high, gdp, how='inner')\n",
+ "mid_high_gdp['2018'] = mid_high_gdp['2018'].apply(lambda x: x/1000000000000)\n",
+ "mid_high_gdp_top10 = mid_high_gdp[['Country Name', 'Country Code', '2018']].sort_values(by='2018', ascending=False)[:10]\n",
+ "mid_high_gdp_top20 = mid_high_gdp[['Country Name', 'Country Code', '2018']].sort_values(by='2018', ascending=False)[:20]"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 117,
+ "metadata": {
+ "scrolled": true
+ },
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ " \n",
+ "\n",
+ "\n",
+ "\n"
+ ],
+ "text/plain": [
+ ""
+ ]
+ },
+ "execution_count": 117,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "bar = Bar()\n",
+ "bar.add_xaxis(mid_high_gdp_top10['Country Name'].values.tolist())\n",
+ "bar.add_yaxis(\"\", mid_high_gdp_top10['2018'].values.tolist())\n",
+ "bar.reversal_axis()\n",
+ "bar.set_series_opts(label_opts=opts.LabelOpts(position=\"right\"))\n",
+ "bar.set_global_opts(title_opts=opts.TitleOpts(title=\"中高等收入国家GDP Top10\", subtitle=\"\"),\n",
+ " xaxis_opts=opts.AxisOpts(\n",
+ " axislabel_opts=opts.LabelOpts(formatter=\"{value} /万亿\")\n",
+ " ),)\n",
+ "bar.render_notebook()"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 120,
+ "metadata": {
+ "scrolled": true
+ },
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ " \n",
+ "\n",
+ "\n",
+ "\n"
+ ],
+ "text/plain": [
+ ""
+ ]
+ },
+ "execution_count": 120,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "bar = Bar()\n",
+ "bar.add_xaxis(mid_high_gdp_top20['Country Name'].values.tolist())\n",
+ "bar.add_yaxis(\"\", mid_high_gdp_top20['2018'].values.tolist())\n",
+ "bar.reversal_axis()\n",
+ "bar.set_series_opts(label_opts=opts.LabelOpts(position=\"right\"))\n",
+ "bar.set_global_opts(title_opts=opts.TitleOpts(title=\"中高等收入国家GDP Top20\", subtitle=\"\"),\n",
+ " xaxis_opts=opts.AxisOpts(\n",
+ " axislabel_opts=opts.LabelOpts(formatter=\"{value} /万亿\")\n",
+ " ),)\n",
+ "bar.render_notebook()"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 121,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "# 中低等收入国家\n",
+ "mid_low = country_data[country_data['Income_Group'] == '中低等收入国家']\n",
+ "mid_low_gdp = pd.merge(mid_low, gdp, how='inner')\n",
+ "mid_low_gdp['2018'] = mid_low_gdp['2018'].apply(lambda x: x/1000000000000)\n",
+ "mid_low_gdp_top10 = mid_low_gdp[['Country Name', 'Country Code', '2018']].sort_values(by='2018', ascending=False)[:10]\n",
+ "mid_low_gdp_top20 = mid_low_gdp[['Country Name', 'Country Code', '2018']].sort_values(by='2018', ascending=False)[:20]"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 122,
+ "metadata": {
+ "scrolled": true
+ },
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ " \n",
+ "\n",
+ "\n",
+ "\n"
+ ],
+ "text/plain": [
+ ""
+ ]
+ },
+ "execution_count": 122,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "bar = Bar()\n",
+ "bar.add_xaxis(mid_low_gdp_top10['Country Name'].values.tolist())\n",
+ "bar.add_yaxis(\"\", mid_low_gdp_top10['2018'].values.tolist())\n",
+ "bar.reversal_axis()\n",
+ "bar.set_series_opts(label_opts=opts.LabelOpts(position=\"right\"))\n",
+ "bar.set_global_opts(title_opts=opts.TitleOpts(title=\"中低等收入国家GDP Top10\", subtitle=\"\"),\n",
+ " xaxis_opts=opts.AxisOpts(\n",
+ " axislabel_opts=opts.LabelOpts(formatter=\"{value} /万亿\")\n",
+ " ),)\n",
+ "bar.render_notebook()"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 123,
+ "metadata": {
+ "scrolled": true
+ },
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ " \n",
+ "\n",
+ "\n",
+ "\n"
+ ],
+ "text/plain": [
+ ""
+ ]
+ },
+ "execution_count": 123,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "bar = Bar()\n",
+ "bar.add_xaxis(mid_low_gdp_top20['Country Name'].values.tolist())\n",
+ "bar.add_yaxis(\"\", mid_low_gdp_top20['2018'].values.tolist())\n",
+ "bar.reversal_axis()\n",
+ "bar.set_series_opts(label_opts=opts.LabelOpts(position=\"right\"))\n",
+ "bar.set_global_opts(title_opts=opts.TitleOpts(title=\"中低等收入国家GDP Top20\", subtitle=\"\"),\n",
+ " xaxis_opts=opts.AxisOpts(\n",
+ " axislabel_opts=opts.LabelOpts(formatter=\"{value} /万亿\")\n",
+ " ),)\n",
+ "bar.render_notebook()"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 126,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "# 低等收入国家\n",
+ "low = country_data[country_data['Income_Group'] == '低收入国家']\n",
+ "low_gdp = pd.merge(low, gdp, how='inner')\n",
+ "low_gdp['2018'] = low_gdp['2018'].apply(lambda x: x/1000000000000)\n",
+ "low_gdp_top10 = low_gdp[['Country Name', 'Country Code', '2018']].sort_values(by='2018', ascending=False)[:10]\n",
+ "low_gdp_top20 = low_gdp[['Country Name', 'Country Code', '2018']].sort_values(by='2018', ascending=False)[:20]"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 127,
+ "metadata": {
+ "scrolled": true
+ },
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ " \n",
+ "\n",
+ "\n",
+ "\n"
+ ],
+ "text/plain": [
+ ""
+ ]
+ },
+ "execution_count": 127,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "bar = Bar()\n",
+ "bar.add_xaxis(low_gdp_top10['Country Name'].values.tolist())\n",
+ "bar.add_yaxis(\"\", low_gdp_top10['2018'].values.tolist())\n",
+ "bar.reversal_axis()\n",
+ "bar.set_series_opts(label_opts=opts.LabelOpts(position=\"right\"))\n",
+ "bar.set_global_opts(title_opts=opts.TitleOpts(title=\"低等收入国家GDP Top10\", subtitle=\"\"),\n",
+ " xaxis_opts=opts.AxisOpts(\n",
+ " axislabel_opts=opts.LabelOpts(formatter=\"{value} /万亿\")\n",
+ " ),)\n",
+ "bar.render_notebook()"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 129,
+ "metadata": {
+ "scrolled": true
+ },
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ " \n",
+ "\n",
+ "\n",
+ "\n"
+ ],
+ "text/plain": [
+ ""
+ ]
+ },
+ "execution_count": 129,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "bar = Bar()\n",
+ "bar.add_xaxis(low_gdp_top20['Country Name'].values.tolist())\n",
+ "bar.add_yaxis(\"\", low_gdp_top20['2018'].values.tolist())\n",
+ "bar.reversal_axis()\n",
+ "bar.set_series_opts(label_opts=opts.LabelOpts(position=\"right\"))\n",
+ "bar.set_global_opts(title_opts=opts.TitleOpts(title=\"低等收入国家GDP Top20\", subtitle=\"\"),\n",
+ " xaxis_opts=opts.AxisOpts(\n",
+ " axislabel_opts=opts.LabelOpts(formatter=\"{value} /万亿\")\n",
+ " ),)\n",
+ "bar.render_notebook()"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 91,
+ "metadata": {
+ "scrolled": true
+ },
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " Country Name | \n",
+ " Country Code | \n",
+ " Region | \n",
+ " Income_Group | \n",
+ " Unnamed: 4 | \n",
+ " Indicator Name | \n",
+ " Indicator Code | \n",
+ " 1960 | \n",
+ " 1961 | \n",
+ " 1962 | \n",
+ " ... | \n",
+ " 2011 | \n",
+ " 2012 | \n",
+ " 2013 | \n",
+ " 2014 | \n",
+ " 2015 | \n",
+ " 2016 | \n",
+ " 2017 | \n",
+ " 2018 | \n",
+ " 2019 | \n",
+ " Unnamed: 64 | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " 0 | \n",
+ " 阿鲁巴 | \n",
+ " ABW | \n",
+ " NaN | \n",
+ " 高收入国家 | \n",
+ " NaN | \n",
+ " GDP(现价美元) | \n",
+ " NY.GDP.MKTP.CD | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " ... | \n",
+ " 2.549721e+09 | \n",
+ " 2.534637e+09 | \n",
+ " 2.581564e+09 | \n",
+ " 2.649721e+09 | \n",
+ " 2.691620e+09 | \n",
+ " 2.646927e+09 | \n",
+ " 2.700559e+09 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 1 | \n",
+ " 安道尔共和国 | \n",
+ " AND | \n",
+ " NaN | \n",
+ " 高收入国家 | \n",
+ " NaN | \n",
+ " GDP(现价美元) | \n",
+ " NY.GDP.MKTP.CD | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " ... | \n",
+ " 3.442063e+09 | \n",
+ " 3.164615e+09 | \n",
+ " 3.281585e+09 | \n",
+ " 3.350736e+09 | \n",
+ " 2.811489e+09 | \n",
+ " 2.877312e+09 | \n",
+ " 3.013387e+09 | \n",
+ " 3.236544e+09 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 2 | \n",
+ " 阿拉伯联合酋长国 | \n",
+ " ARE | \n",
+ " NaN | \n",
+ " 高收入国家 | \n",
+ " NaN | \n",
+ " GDP(现价美元) | \n",
+ " NY.GDP.MKTP.CD | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " ... | \n",
+ " 3.506660e+11 | \n",
+ " 3.745906e+11 | \n",
+ " 3.901076e+11 | \n",
+ " 4.031371e+11 | \n",
+ " 3.581351e+11 | \n",
+ " 3.570451e+11 | \n",
+ " 3.825751e+11 | \n",
+ " 4.141789e+11 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 3 | \n",
+ " 安提瓜和巴布达 | \n",
+ " ATG | \n",
+ " NaN | \n",
+ " 高收入国家 | \n",
+ " NaN | \n",
+ " GDP(现价美元) | \n",
+ " NY.GDP.MKTP.CD | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " ... | \n",
+ " 1.142043e+09 | \n",
+ " 1.211412e+09 | \n",
+ " 1.192920e+09 | \n",
+ " 1.275577e+09 | \n",
+ " 1.359195e+09 | \n",
+ " 1.464630e+09 | \n",
+ " 1.510085e+09 | \n",
+ " 1.623804e+09 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 4 | \n",
+ " 澳大利亚 | \n",
+ " AUS | \n",
+ " NaN | \n",
+ " 高收入国家 | \n",
+ " NaN | \n",
+ " GDP(现价美元) | \n",
+ " NY.GDP.MKTP.CD | \n",
+ " 1.857767e+10 | \n",
+ " 1.965394e+10 | \n",
+ " 1.989249e+10 | \n",
+ " ... | \n",
+ " 1.396650e+12 | \n",
+ " 1.546152e+12 | \n",
+ " 1.576184e+12 | \n",
+ " 1.467484e+12 | \n",
+ " 1.351520e+12 | \n",
+ " 1.210028e+12 | \n",
+ " 1.330803e+12 | \n",
+ " 1.432195e+12 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ "
\n",
+ " \n",
+ " 74 | \n",
+ " 特立尼达和多巴哥 | \n",
+ " TTO | \n",
+ " NaN | \n",
+ " 高收入国家 | \n",
+ " NaN | \n",
+ " GDP(现价美元) | \n",
+ " NY.GDP.MKTP.CD | \n",
+ " 5.356701e+08 | \n",
+ " 5.849612e+08 | \n",
+ " 6.193192e+08 | \n",
+ " ... | \n",
+ " 2.543301e+10 | \n",
+ " 2.576933e+10 | \n",
+ " 2.711026e+10 | \n",
+ " 2.747797e+10 | \n",
+ " 2.512152e+10 | \n",
+ " 2.174639e+10 | \n",
+ " 2.225046e+10 | \n",
+ " 2.341035e+10 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 75 | \n",
+ " 乌拉圭 | \n",
+ " URY | \n",
+ " NaN | \n",
+ " 高收入国家 | \n",
+ " NaN | \n",
+ " GDP(现价美元) | \n",
+ " NY.GDP.MKTP.CD | \n",
+ " 1.242289e+09 | \n",
+ " 1.547389e+09 | \n",
+ " 1.710004e+09 | \n",
+ " ... | \n",
+ " 4.796244e+10 | \n",
+ " 5.126439e+10 | \n",
+ " 5.753123e+10 | \n",
+ " 5.723601e+10 | \n",
+ " 5.327430e+10 | \n",
+ " 5.268761e+10 | \n",
+ " 5.648899e+10 | \n",
+ " 5.959689e+10 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 76 | \n",
+ " 美国 | \n",
+ " USA | \n",
+ " NaN | \n",
+ " 高收入国家 | \n",
+ " NaN | \n",
+ " GDP(现价美元) | \n",
+ " NY.GDP.MKTP.CD | \n",
+ " 5.433000e+11 | \n",
+ " 5.633000e+11 | \n",
+ " 6.051000e+11 | \n",
+ " ... | \n",
+ " 1.554258e+13 | \n",
+ " 1.619701e+13 | \n",
+ " 1.678485e+13 | \n",
+ " 1.752175e+13 | \n",
+ " 1.821930e+13 | \n",
+ " 1.870719e+13 | \n",
+ " 1.948539e+13 | \n",
+ " 2.049410e+13 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 77 | \n",
+ " 英屬維爾京群島 | \n",
+ " VGB | \n",
+ " NaN | \n",
+ " 高收入国家 | \n",
+ " NaN | \n",
+ " GDP(现价美元) | \n",
+ " NY.GDP.MKTP.CD | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " ... | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 78 | \n",
+ " 美属维京群岛 | \n",
+ " VIR | \n",
+ " NaN | \n",
+ " 高收入国家 | \n",
+ " NaN | \n",
+ " GDP(现价美元) | \n",
+ " NY.GDP.MKTP.CD | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " ... | \n",
+ " 4.239000e+09 | \n",
+ " 4.095000e+09 | \n",
+ " 3.762000e+09 | \n",
+ " 3.622000e+09 | \n",
+ " 3.748000e+09 | \n",
+ " 3.863000e+09 | \n",
+ " 3.855000e+09 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
79 rows × 68 columns
\n",
+ "
"
+ ],
+ "text/plain": [
+ " Country Name Country Code Region Income_Group Unnamed: 4 Indicator Name \\\n",
+ "0 阿鲁巴 ABW NaN 高收入国家 NaN GDP(现价美元) \n",
+ "1 安道尔共和国 AND NaN 高收入国家 NaN GDP(现价美元) \n",
+ "2 阿拉伯联合酋长国 ARE NaN 高收入国家 NaN GDP(现价美元) \n",
+ "3 安提瓜和巴布达 ATG NaN 高收入国家 NaN GDP(现价美元) \n",
+ "4 澳大利亚 AUS NaN 高收入国家 NaN GDP(现价美元) \n",
+ ".. ... ... ... ... ... ... \n",
+ "74 特立尼达和多巴哥 TTO NaN 高收入国家 NaN GDP(现价美元) \n",
+ "75 乌拉圭 URY NaN 高收入国家 NaN GDP(现价美元) \n",
+ "76 美国 USA NaN 高收入国家 NaN GDP(现价美元) \n",
+ "77 英屬維爾京群島 VGB NaN 高收入国家 NaN GDP(现价美元) \n",
+ "78 美属维京群岛 VIR NaN 高收入国家 NaN GDP(现价美元) \n",
+ "\n",
+ " Indicator Code 1960 1961 1962 ... \\\n",
+ "0 NY.GDP.MKTP.CD NaN NaN NaN ... \n",
+ "1 NY.GDP.MKTP.CD NaN NaN NaN ... \n",
+ "2 NY.GDP.MKTP.CD NaN NaN NaN ... \n",
+ "3 NY.GDP.MKTP.CD NaN NaN NaN ... \n",
+ "4 NY.GDP.MKTP.CD 1.857767e+10 1.965394e+10 1.989249e+10 ... \n",
+ ".. ... ... ... ... ... \n",
+ "74 NY.GDP.MKTP.CD 5.356701e+08 5.849612e+08 6.193192e+08 ... \n",
+ "75 NY.GDP.MKTP.CD 1.242289e+09 1.547389e+09 1.710004e+09 ... \n",
+ "76 NY.GDP.MKTP.CD 5.433000e+11 5.633000e+11 6.051000e+11 ... \n",
+ "77 NY.GDP.MKTP.CD NaN NaN NaN ... \n",
+ "78 NY.GDP.MKTP.CD NaN NaN NaN ... \n",
+ "\n",
+ " 2011 2012 2013 2014 2015 \\\n",
+ "0 2.549721e+09 2.534637e+09 2.581564e+09 2.649721e+09 2.691620e+09 \n",
+ "1 3.442063e+09 3.164615e+09 3.281585e+09 3.350736e+09 2.811489e+09 \n",
+ "2 3.506660e+11 3.745906e+11 3.901076e+11 4.031371e+11 3.581351e+11 \n",
+ "3 1.142043e+09 1.211412e+09 1.192920e+09 1.275577e+09 1.359195e+09 \n",
+ "4 1.396650e+12 1.546152e+12 1.576184e+12 1.467484e+12 1.351520e+12 \n",
+ ".. ... ... ... ... ... \n",
+ "74 2.543301e+10 2.576933e+10 2.711026e+10 2.747797e+10 2.512152e+10 \n",
+ "75 4.796244e+10 5.126439e+10 5.753123e+10 5.723601e+10 5.327430e+10 \n",
+ "76 1.554258e+13 1.619701e+13 1.678485e+13 1.752175e+13 1.821930e+13 \n",
+ "77 NaN NaN NaN NaN NaN \n",
+ "78 4.239000e+09 4.095000e+09 3.762000e+09 3.622000e+09 3.748000e+09 \n",
+ "\n",
+ " 2016 2017 2018 2019 Unnamed: 64 \n",
+ "0 2.646927e+09 2.700559e+09 NaN NaN NaN \n",
+ "1 2.877312e+09 3.013387e+09 3.236544e+09 NaN NaN \n",
+ "2 3.570451e+11 3.825751e+11 4.141789e+11 NaN NaN \n",
+ "3 1.464630e+09 1.510085e+09 1.623804e+09 NaN NaN \n",
+ "4 1.210028e+12 1.330803e+12 1.432195e+12 NaN NaN \n",
+ ".. ... ... ... ... ... \n",
+ "74 2.174639e+10 2.225046e+10 2.341035e+10 NaN NaN \n",
+ "75 5.268761e+10 5.648899e+10 5.959689e+10 NaN NaN \n",
+ "76 1.870719e+13 1.948539e+13 2.049410e+13 NaN NaN \n",
+ "77 NaN NaN NaN NaN NaN \n",
+ "78 3.863000e+09 3.855000e+09 NaN NaN NaN \n",
+ "\n",
+ "[79 rows x 68 columns]"
+ ]
+ },
+ "execution_count": 91,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "high_gdp"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 4,
+ "metadata": {
+ "scrolled": true
+ },
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " Country Name | \n",
+ " Country Code | \n",
+ " Indicator Name | \n",
+ " Indicator Code | \n",
+ " 1960 | \n",
+ " 1961 | \n",
+ " 1962 | \n",
+ " 1963 | \n",
+ " 1964 | \n",
+ " 1965 | \n",
+ " ... | \n",
+ " 2011 | \n",
+ " 2012 | \n",
+ " 2013 | \n",
+ " 2014 | \n",
+ " 2015 | \n",
+ " 2016 | \n",
+ " 2017 | \n",
+ " 2018 | \n",
+ " 2019 | \n",
+ " Unnamed: 64 | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " 0 | \n",
+ " 阿鲁巴 | \n",
+ " ABW | \n",
+ " GDP(现价美元) | \n",
+ " NY.GDP.MKTP.CD | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " ... | \n",
+ " 2.549721e+09 | \n",
+ " 2.534637e+09 | \n",
+ " 2.581564e+09 | \n",
+ " 2.649721e+09 | \n",
+ " 2.691620e+09 | \n",
+ " 2.646927e+09 | \n",
+ " 2.700559e+09 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 1 | \n",
+ " 阿富汗 | \n",
+ " AFG | \n",
+ " GDP(现价美元) | \n",
+ " NY.GDP.MKTP.CD | \n",
+ " 5.377778e+08 | \n",
+ " 5.488889e+08 | \n",
+ " 5.466667e+08 | \n",
+ " 7.511112e+08 | \n",
+ " 8.000000e+08 | \n",
+ " 1.006667e+09 | \n",
+ " ... | \n",
+ " 1.780428e+10 | \n",
+ " 2.000162e+10 | \n",
+ " 2.056105e+10 | \n",
+ " 2.048487e+10 | \n",
+ " 1.990711e+10 | \n",
+ " 1.936264e+10 | \n",
+ " 2.019176e+10 | \n",
+ " 1.936297e+10 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 2 | \n",
+ " 安哥拉 | \n",
+ " AGO | \n",
+ " GDP(现价美元) | \n",
+ " NY.GDP.MKTP.CD | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " ... | \n",
+ " 1.117897e+11 | \n",
+ " 1.280529e+11 | \n",
+ " 1.367099e+11 | \n",
+ " 1.457122e+11 | \n",
+ " 1.161936e+11 | \n",
+ " 1.011239e+11 | \n",
+ " 1.221238e+11 | \n",
+ " 1.057510e+11 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 3 | \n",
+ " 阿尔巴尼亚 | \n",
+ " ALB | \n",
+ " GDP(现价美元) | \n",
+ " NY.GDP.MKTP.CD | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " ... | \n",
+ " 1.289087e+10 | \n",
+ " 1.231978e+10 | \n",
+ " 1.277628e+10 | \n",
+ " 1.322825e+10 | \n",
+ " 1.138693e+10 | \n",
+ " 1.186135e+10 | \n",
+ " 1.302506e+10 | \n",
+ " 1.505888e+10 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 4 | \n",
+ " 安道尔共和国 | \n",
+ " AND | \n",
+ " GDP(现价美元) | \n",
+ " NY.GDP.MKTP.CD | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " ... | \n",
+ " 3.442063e+09 | \n",
+ " 3.164615e+09 | \n",
+ " 3.281585e+09 | \n",
+ " 3.350736e+09 | \n",
+ " 2.811489e+09 | \n",
+ " 2.877312e+09 | \n",
+ " 3.013387e+09 | \n",
+ " 3.236544e+09 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ "
\n",
+ " \n",
+ " 259 | \n",
+ " 科索沃 | \n",
+ " XKX | \n",
+ " GDP(现价美元) | \n",
+ " NY.GDP.MKTP.CD | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " ... | \n",
+ " 6.691827e+09 | \n",
+ " 6.499936e+09 | \n",
+ " 7.071960e+09 | \n",
+ " 7.386891e+09 | \n",
+ " 6.440612e+09 | \n",
+ " 6.714712e+09 | \n",
+ " 7.227765e+09 | \n",
+ " 7.900269e+09 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 260 | \n",
+ " 也门共和国 | \n",
+ " YEM | \n",
+ " GDP(现价美元) | \n",
+ " NY.GDP.MKTP.CD | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " ... | \n",
+ " 3.272642e+10 | \n",
+ " 3.540134e+10 | \n",
+ " 4.041523e+10 | \n",
+ " 4.322859e+10 | \n",
+ " 4.262833e+10 | \n",
+ " 3.096824e+10 | \n",
+ " 2.681870e+10 | \n",
+ " 2.691440e+10 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 261 | \n",
+ " 南非 | \n",
+ " ZAF | \n",
+ " GDP(现价美元) | \n",
+ " NY.GDP.MKTP.CD | \n",
+ " 7.575397e+09 | \n",
+ " 7.972997e+09 | \n",
+ " 8.497997e+09 | \n",
+ " 9.423396e+09 | \n",
+ " 1.037400e+10 | \n",
+ " 1.133440e+10 | \n",
+ " ... | \n",
+ " 4.164170e+11 | \n",
+ " 3.963294e+11 | \n",
+ " 3.666449e+11 | \n",
+ " 3.506376e+11 | \n",
+ " 3.174156e+11 | \n",
+ " 2.963409e+11 | \n",
+ " 3.492681e+11 | \n",
+ " 3.682882e+11 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 262 | \n",
+ " 赞比亚 | \n",
+ " ZMB | \n",
+ " GDP(现价美元) | \n",
+ " NY.GDP.MKTP.CD | \n",
+ " 7.130000e+08 | \n",
+ " 6.962857e+08 | \n",
+ " 6.931429e+08 | \n",
+ " 7.187143e+08 | \n",
+ " 8.394286e+08 | \n",
+ " 1.082857e+09 | \n",
+ " ... | \n",
+ " 2.346010e+10 | \n",
+ " 2.550337e+10 | \n",
+ " 2.804546e+10 | \n",
+ " 2.715063e+10 | \n",
+ " 2.115439e+10 | \n",
+ " 2.095475e+10 | \n",
+ " 2.586814e+10 | \n",
+ " 2.672007e+10 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 263 | \n",
+ " 津巴布韦 | \n",
+ " ZWE | \n",
+ " GDP(现价美元) | \n",
+ " NY.GDP.MKTP.CD | \n",
+ " 1.052990e+09 | \n",
+ " 1.096647e+09 | \n",
+ " 1.117602e+09 | \n",
+ " 1.159512e+09 | \n",
+ " 1.217138e+09 | \n",
+ " 1.311436e+09 | \n",
+ " ... | \n",
+ " 1.410192e+10 | \n",
+ " 1.711485e+10 | \n",
+ " 1.909102e+10 | \n",
+ " 1.949552e+10 | \n",
+ " 1.996312e+10 | \n",
+ " 2.054868e+10 | \n",
+ " 2.281301e+10 | \n",
+ " 3.100052e+10 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
264 rows × 65 columns
\n",
+ "
"
+ ],
+ "text/plain": [
+ " Country Name Country Code Indicator Name Indicator Code 1960 \\\n",
+ "0 阿鲁巴 ABW GDP(现价美元) NY.GDP.MKTP.CD NaN \n",
+ "1 阿富汗 AFG GDP(现价美元) NY.GDP.MKTP.CD 5.377778e+08 \n",
+ "2 安哥拉 AGO GDP(现价美元) NY.GDP.MKTP.CD NaN \n",
+ "3 阿尔巴尼亚 ALB GDP(现价美元) NY.GDP.MKTP.CD NaN \n",
+ "4 安道尔共和国 AND GDP(现价美元) NY.GDP.MKTP.CD NaN \n",
+ ".. ... ... ... ... ... \n",
+ "259 科索沃 XKX GDP(现价美元) NY.GDP.MKTP.CD NaN \n",
+ "260 也门共和国 YEM GDP(现价美元) NY.GDP.MKTP.CD NaN \n",
+ "261 南非 ZAF GDP(现价美元) NY.GDP.MKTP.CD 7.575397e+09 \n",
+ "262 赞比亚 ZMB GDP(现价美元) NY.GDP.MKTP.CD 7.130000e+08 \n",
+ "263 津巴布韦 ZWE GDP(现价美元) NY.GDP.MKTP.CD 1.052990e+09 \n",
+ "\n",
+ " 1961 1962 1963 1964 1965 \\\n",
+ "0 NaN NaN NaN NaN NaN \n",
+ "1 5.488889e+08 5.466667e+08 7.511112e+08 8.000000e+08 1.006667e+09 \n",
+ "2 NaN NaN NaN NaN NaN \n",
+ "3 NaN NaN NaN NaN NaN \n",
+ "4 NaN NaN NaN NaN NaN \n",
+ ".. ... ... ... ... ... \n",
+ "259 NaN NaN NaN NaN NaN \n",
+ "260 NaN NaN NaN NaN NaN \n",
+ "261 7.972997e+09 8.497997e+09 9.423396e+09 1.037400e+10 1.133440e+10 \n",
+ "262 6.962857e+08 6.931429e+08 7.187143e+08 8.394286e+08 1.082857e+09 \n",
+ "263 1.096647e+09 1.117602e+09 1.159512e+09 1.217138e+09 1.311436e+09 \n",
+ "\n",
+ " ... 2011 2012 2013 2014 \\\n",
+ "0 ... 2.549721e+09 2.534637e+09 2.581564e+09 2.649721e+09 \n",
+ "1 ... 1.780428e+10 2.000162e+10 2.056105e+10 2.048487e+10 \n",
+ "2 ... 1.117897e+11 1.280529e+11 1.367099e+11 1.457122e+11 \n",
+ "3 ... 1.289087e+10 1.231978e+10 1.277628e+10 1.322825e+10 \n",
+ "4 ... 3.442063e+09 3.164615e+09 3.281585e+09 3.350736e+09 \n",
+ ".. ... ... ... ... ... \n",
+ "259 ... 6.691827e+09 6.499936e+09 7.071960e+09 7.386891e+09 \n",
+ "260 ... 3.272642e+10 3.540134e+10 4.041523e+10 4.322859e+10 \n",
+ "261 ... 4.164170e+11 3.963294e+11 3.666449e+11 3.506376e+11 \n",
+ "262 ... 2.346010e+10 2.550337e+10 2.804546e+10 2.715063e+10 \n",
+ "263 ... 1.410192e+10 1.711485e+10 1.909102e+10 1.949552e+10 \n",
+ "\n",
+ " 2015 2016 2017 2018 2019 Unnamed: 64 \n",
+ "0 2.691620e+09 2.646927e+09 2.700559e+09 NaN NaN NaN \n",
+ "1 1.990711e+10 1.936264e+10 2.019176e+10 1.936297e+10 NaN NaN \n",
+ "2 1.161936e+11 1.011239e+11 1.221238e+11 1.057510e+11 NaN NaN \n",
+ "3 1.138693e+10 1.186135e+10 1.302506e+10 1.505888e+10 NaN NaN \n",
+ "4 2.811489e+09 2.877312e+09 3.013387e+09 3.236544e+09 NaN NaN \n",
+ ".. ... ... ... ... ... ... \n",
+ "259 6.440612e+09 6.714712e+09 7.227765e+09 7.900269e+09 NaN NaN \n",
+ "260 4.262833e+10 3.096824e+10 2.681870e+10 2.691440e+10 NaN NaN \n",
+ "261 3.174156e+11 2.963409e+11 3.492681e+11 3.682882e+11 NaN NaN \n",
+ "262 2.115439e+10 2.095475e+10 2.586814e+10 2.672007e+10 NaN NaN \n",
+ "263 1.996312e+10 2.054868e+10 2.281301e+10 3.100052e+10 NaN NaN \n",
+ "\n",
+ "[264 rows x 65 columns]"
+ ]
+ },
+ "execution_count": 4,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "gdp"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 10,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "country_gdp = pd.merge(country_data, gdp, how='inner')"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 57,
+ "metadata": {
+ "collapsed": true
+ },
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " Country Name | \n",
+ " Country Code | \n",
+ " Region | \n",
+ " Income_Group | \n",
+ " Unnamed: 4 | \n",
+ " Indicator Name | \n",
+ " Indicator Code | \n",
+ " 1960 | \n",
+ " 1961 | \n",
+ " 1962 | \n",
+ " ... | \n",
+ " 2011 | \n",
+ " 2012 | \n",
+ " 2013 | \n",
+ " 2014 | \n",
+ " 2015 | \n",
+ " 2016 | \n",
+ " 2017 | \n",
+ " 2018 | \n",
+ " 2019 | \n",
+ " Unnamed: 64 | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " 0 | \n",
+ " 阿鲁巴 | \n",
+ " ABW | \n",
+ " NaN | \n",
+ " 高收入国家 | \n",
+ " NaN | \n",
+ " GDP(现价美元) | \n",
+ " NY.GDP.MKTP.CD | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " ... | \n",
+ " 2.549721e+09 | \n",
+ " 2.534637e+09 | \n",
+ " 2.581564e+09 | \n",
+ " 2.649721e+09 | \n",
+ " 2.691620e+09 | \n",
+ " 2.646927e+09 | \n",
+ " 2.700559e+09 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 1 | \n",
+ " 阿富汗 | \n",
+ " AFG | \n",
+ " 南亚 | \n",
+ " 低收入国家 | \n",
+ " NaN | \n",
+ " GDP(现价美元) | \n",
+ " NY.GDP.MKTP.CD | \n",
+ " 5.377778e+08 | \n",
+ " 5.488889e+08 | \n",
+ " 5.466667e+08 | \n",
+ " ... | \n",
+ " 1.780428e+10 | \n",
+ " 2.000162e+10 | \n",
+ " 2.056105e+10 | \n",
+ " 2.048487e+10 | \n",
+ " 1.990711e+10 | \n",
+ " 1.936264e+10 | \n",
+ " 2.019176e+10 | \n",
+ " 1.936297e+10 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 2 | \n",
+ " 安哥拉 | \n",
+ " AGO | \n",
+ " 撒哈拉以南非洲地区(不包括高收入) | \n",
+ " 中低等收入国家 | \n",
+ " NaN | \n",
+ " GDP(现价美元) | \n",
+ " NY.GDP.MKTP.CD | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " ... | \n",
+ " 1.117897e+11 | \n",
+ " 1.280529e+11 | \n",
+ " 1.367099e+11 | \n",
+ " 1.457122e+11 | \n",
+ " 1.161936e+11 | \n",
+ " 1.011239e+11 | \n",
+ " 1.221238e+11 | \n",
+ " 1.057510e+11 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 3 | \n",
+ " 阿尔巴尼亚 | \n",
+ " ALB | \n",
+ " 欧洲与中亚地区(不包括高收入) | \n",
+ " 中高等收入国家 | \n",
+ " NaN | \n",
+ " GDP(现价美元) | \n",
+ " NY.GDP.MKTP.CD | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " ... | \n",
+ " 1.289087e+10 | \n",
+ " 1.231978e+10 | \n",
+ " 1.277628e+10 | \n",
+ " 1.322825e+10 | \n",
+ " 1.138693e+10 | \n",
+ " 1.186135e+10 | \n",
+ " 1.302506e+10 | \n",
+ " 1.505888e+10 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 4 | \n",
+ " 安道尔共和国 | \n",
+ " AND | \n",
+ " NaN | \n",
+ " 高收入国家 | \n",
+ " NaN | \n",
+ " GDP(现价美元) | \n",
+ " NY.GDP.MKTP.CD | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " ... | \n",
+ " 3.442063e+09 | \n",
+ " 3.164615e+09 | \n",
+ " 3.281585e+09 | \n",
+ " 3.350736e+09 | \n",
+ " 2.811489e+09 | \n",
+ " 2.877312e+09 | \n",
+ " 3.013387e+09 | \n",
+ " 3.236544e+09 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ "
\n",
+ " \n",
+ " 211 | \n",
+ " 科索沃 | \n",
+ " XKX | \n",
+ " 欧洲与中亚地区(不包括高收入) | \n",
+ " 中高等收入国家 | \n",
+ " NaN | \n",
+ " GDP(现价美元) | \n",
+ " NY.GDP.MKTP.CD | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " ... | \n",
+ " 6.691827e+09 | \n",
+ " 6.499936e+09 | \n",
+ " 7.071960e+09 | \n",
+ " 7.386891e+09 | \n",
+ " 6.440612e+09 | \n",
+ " 6.714712e+09 | \n",
+ " 7.227765e+09 | \n",
+ " 7.900269e+09 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 212 | \n",
+ " 也门共和国 | \n",
+ " YEM | \n",
+ " 中东与北非地区(不包括高收入) | \n",
+ " 低收入国家 | \n",
+ " NaN | \n",
+ " GDP(现价美元) | \n",
+ " NY.GDP.MKTP.CD | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " ... | \n",
+ " 3.272642e+10 | \n",
+ " 3.540134e+10 | \n",
+ " 4.041523e+10 | \n",
+ " 4.322859e+10 | \n",
+ " 4.262833e+10 | \n",
+ " 3.096824e+10 | \n",
+ " 2.681870e+10 | \n",
+ " 2.691440e+10 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 213 | \n",
+ " 南非 | \n",
+ " ZAF | \n",
+ " 撒哈拉以南非洲地区(不包括高收入) | \n",
+ " 中高等收入国家 | \n",
+ " NaN | \n",
+ " GDP(现价美元) | \n",
+ " NY.GDP.MKTP.CD | \n",
+ " 7.575397e+09 | \n",
+ " 7.972997e+09 | \n",
+ " 8.497997e+09 | \n",
+ " ... | \n",
+ " 4.164170e+11 | \n",
+ " 3.963294e+11 | \n",
+ " 3.666449e+11 | \n",
+ " 3.506376e+11 | \n",
+ " 3.174156e+11 | \n",
+ " 2.963409e+11 | \n",
+ " 3.492681e+11 | \n",
+ " 3.682882e+11 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 214 | \n",
+ " 赞比亚 | \n",
+ " ZMB | \n",
+ " 撒哈拉以南非洲地区(不包括高收入) | \n",
+ " 中低等收入国家 | \n",
+ " NaN | \n",
+ " GDP(现价美元) | \n",
+ " NY.GDP.MKTP.CD | \n",
+ " 7.130000e+08 | \n",
+ " 6.962857e+08 | \n",
+ " 6.931429e+08 | \n",
+ " ... | \n",
+ " 2.346010e+10 | \n",
+ " 2.550337e+10 | \n",
+ " 2.804546e+10 | \n",
+ " 2.715063e+10 | \n",
+ " 2.115439e+10 | \n",
+ " 2.095475e+10 | \n",
+ " 2.586814e+10 | \n",
+ " 2.672007e+10 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ " 215 | \n",
+ " 津巴布韦 | \n",
+ " ZWE | \n",
+ " 撒哈拉以南非洲地区(不包括高收入) | \n",
+ " 中低等收入国家 | \n",
+ " NaN | \n",
+ " GDP(现价美元) | \n",
+ " NY.GDP.MKTP.CD | \n",
+ " 1.052990e+09 | \n",
+ " 1.096647e+09 | \n",
+ " 1.117602e+09 | \n",
+ " ... | \n",
+ " 1.410192e+10 | \n",
+ " 1.711485e+10 | \n",
+ " 1.909102e+10 | \n",
+ " 1.949552e+10 | \n",
+ " 1.996312e+10 | \n",
+ " 2.054868e+10 | \n",
+ " 2.281301e+10 | \n",
+ " 3.100052e+10 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
216 rows × 68 columns
\n",
+ "
"
+ ],
+ "text/plain": [
+ " Country Name Country Code Region Income_Group Unnamed: 4 \\\n",
+ "0 阿鲁巴 ABW NaN 高收入国家 NaN \n",
+ "1 阿富汗 AFG 南亚 低收入国家 NaN \n",
+ "2 安哥拉 AGO 撒哈拉以南非洲地区(不包括高收入) 中低等收入国家 NaN \n",
+ "3 阿尔巴尼亚 ALB 欧洲与中亚地区(不包括高收入) 中高等收入国家 NaN \n",
+ "4 安道尔共和国 AND NaN 高收入国家 NaN \n",
+ ".. ... ... ... ... ... \n",
+ "211 科索沃 XKX 欧洲与中亚地区(不包括高收入) 中高等收入国家 NaN \n",
+ "212 也门共和国 YEM 中东与北非地区(不包括高收入) 低收入国家 NaN \n",
+ "213 南非 ZAF 撒哈拉以南非洲地区(不包括高收入) 中高等收入国家 NaN \n",
+ "214 赞比亚 ZMB 撒哈拉以南非洲地区(不包括高收入) 中低等收入国家 NaN \n",
+ "215 津巴布韦 ZWE 撒哈拉以南非洲地区(不包括高收入) 中低等收入国家 NaN \n",
+ "\n",
+ " Indicator Name Indicator Code 1960 1961 1962 \\\n",
+ "0 GDP(现价美元) NY.GDP.MKTP.CD NaN NaN NaN \n",
+ "1 GDP(现价美元) NY.GDP.MKTP.CD 5.377778e+08 5.488889e+08 5.466667e+08 \n",
+ "2 GDP(现价美元) NY.GDP.MKTP.CD NaN NaN NaN \n",
+ "3 GDP(现价美元) NY.GDP.MKTP.CD NaN NaN NaN \n",
+ "4 GDP(现价美元) NY.GDP.MKTP.CD NaN NaN NaN \n",
+ ".. ... ... ... ... ... \n",
+ "211 GDP(现价美元) NY.GDP.MKTP.CD NaN NaN NaN \n",
+ "212 GDP(现价美元) NY.GDP.MKTP.CD NaN NaN NaN \n",
+ "213 GDP(现价美元) NY.GDP.MKTP.CD 7.575397e+09 7.972997e+09 8.497997e+09 \n",
+ "214 GDP(现价美元) NY.GDP.MKTP.CD 7.130000e+08 6.962857e+08 6.931429e+08 \n",
+ "215 GDP(现价美元) NY.GDP.MKTP.CD 1.052990e+09 1.096647e+09 1.117602e+09 \n",
+ "\n",
+ " ... 2011 2012 2013 2014 \\\n",
+ "0 ... 2.549721e+09 2.534637e+09 2.581564e+09 2.649721e+09 \n",
+ "1 ... 1.780428e+10 2.000162e+10 2.056105e+10 2.048487e+10 \n",
+ "2 ... 1.117897e+11 1.280529e+11 1.367099e+11 1.457122e+11 \n",
+ "3 ... 1.289087e+10 1.231978e+10 1.277628e+10 1.322825e+10 \n",
+ "4 ... 3.442063e+09 3.164615e+09 3.281585e+09 3.350736e+09 \n",
+ ".. ... ... ... ... ... \n",
+ "211 ... 6.691827e+09 6.499936e+09 7.071960e+09 7.386891e+09 \n",
+ "212 ... 3.272642e+10 3.540134e+10 4.041523e+10 4.322859e+10 \n",
+ "213 ... 4.164170e+11 3.963294e+11 3.666449e+11 3.506376e+11 \n",
+ "214 ... 2.346010e+10 2.550337e+10 2.804546e+10 2.715063e+10 \n",
+ "215 ... 1.410192e+10 1.711485e+10 1.909102e+10 1.949552e+10 \n",
+ "\n",
+ " 2015 2016 2017 2018 2019 Unnamed: 64 \n",
+ "0 2.691620e+09 2.646927e+09 2.700559e+09 NaN NaN NaN \n",
+ "1 1.990711e+10 1.936264e+10 2.019176e+10 1.936297e+10 NaN NaN \n",
+ "2 1.161936e+11 1.011239e+11 1.221238e+11 1.057510e+11 NaN NaN \n",
+ "3 1.138693e+10 1.186135e+10 1.302506e+10 1.505888e+10 NaN NaN \n",
+ "4 2.811489e+09 2.877312e+09 3.013387e+09 3.236544e+09 NaN NaN \n",
+ ".. ... ... ... ... ... ... \n",
+ "211 6.440612e+09 6.714712e+09 7.227765e+09 7.900269e+09 NaN NaN \n",
+ "212 4.262833e+10 3.096824e+10 2.681870e+10 2.691440e+10 NaN NaN \n",
+ "213 3.174156e+11 2.963409e+11 3.492681e+11 3.682882e+11 NaN NaN \n",
+ "214 2.115439e+10 2.095475e+10 2.586814e+10 2.672007e+10 NaN NaN \n",
+ "215 1.996312e+10 2.054868e+10 2.281301e+10 3.100052e+10 NaN NaN \n",
+ "\n",
+ "[216 rows x 68 columns]"
+ ]
+ },
+ "execution_count": 57,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "country_gdp"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 58,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "# country_gdp['2018'] = country_gdp['2018'].apply(lambda x: x/1000000000000)"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 59,
+ "metadata": {
+ "scrolled": true
+ },
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " Country Name | \n",
+ " Country Code | \n",
+ " 2018 | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " 202 | \n",
+ " 美国 | \n",
+ " USA | \n",
+ " 20.494100 | \n",
+ "
\n",
+ " \n",
+ " 36 | \n",
+ " 中国 | \n",
+ " CHN | \n",
+ " 13.608152 | \n",
+ "
\n",
+ " \n",
+ " 97 | \n",
+ " 日本 | \n",
+ " JPN | \n",
+ " 4.970916 | \n",
+ "
\n",
+ " \n",
+ " 50 | \n",
+ " 德国 | \n",
+ " DEU | \n",
+ " 3.996759 | \n",
+ "
\n",
+ " \n",
+ " 68 | \n",
+ " 英国 | \n",
+ " GBR | \n",
+ " 2.825208 | \n",
+ "
\n",
+ " \n",
+ " 64 | \n",
+ " 法国 | \n",
+ " FRA | \n",
+ " 2.777535 | \n",
+ "
\n",
+ " \n",
+ " 89 | \n",
+ " 印度 | \n",
+ " IND | \n",
+ " 2.726323 | \n",
+ "
\n",
+ " \n",
+ " 94 | \n",
+ " 意大利 | \n",
+ " ITA | \n",
+ " 2.073902 | \n",
+ "
\n",
+ " \n",
+ " 26 | \n",
+ " 巴西 | \n",
+ " BRA | \n",
+ " 1.868626 | \n",
+ "
\n",
+ " \n",
+ " 32 | \n",
+ " 加拿大 | \n",
+ " CAN | \n",
+ " 1.712510 | \n",
+ "
\n",
+ " \n",
+ " 164 | \n",
+ " 俄罗斯联邦 | \n",
+ " RUS | \n",
+ " 1.657554 | \n",
+ "
\n",
+ " \n",
+ " 104 | \n",
+ " 大韩民国 | \n",
+ " KOR | \n",
+ " 1.619424 | \n",
+ "
\n",
+ " \n",
+ " 10 | \n",
+ " 澳大利亚 | \n",
+ " AUS | \n",
+ " 1.432195 | \n",
+ "
\n",
+ " \n",
+ " 59 | \n",
+ " 西班牙 | \n",
+ " ESP | \n",
+ " 1.426189 | \n",
+ "
\n",
+ " \n",
+ " 124 | \n",
+ " 墨西哥 | \n",
+ " MEX | \n",
+ " 1.223809 | \n",
+ "
\n",
+ " \n",
+ " 87 | \n",
+ " 印度尼西亚 | \n",
+ " IDN | \n",
+ " 1.042173 | \n",
+ "
\n",
+ " \n",
+ " 143 | \n",
+ " 荷兰 | \n",
+ " NLD | \n",
+ " 0.913658 | \n",
+ "
\n",
+ " \n",
+ " 166 | \n",
+ " 沙特阿拉伯 | \n",
+ " SAU | \n",
+ " 0.782483 | \n",
+ "
\n",
+ " \n",
+ " 196 | \n",
+ " 土耳其 | \n",
+ " TUR | \n",
+ " 0.766509 | \n",
+ "
\n",
+ " \n",
+ " 33 | \n",
+ " 瑞士 | \n",
+ " CHE | \n",
+ " 0.705501 | \n",
+ "
\n",
+ " \n",
+ " 155 | \n",
+ " 波兰 | \n",
+ " POL | \n",
+ " 0.585783 | \n",
+ "
\n",
+ " \n",
+ " 181 | \n",
+ " 瑞典 | \n",
+ " SWE | \n",
+ " 0.551032 | \n",
+ "
\n",
+ " \n",
+ " 14 | \n",
+ " 比利时 | \n",
+ " BEL | \n",
+ " 0.531767 | \n",
+ "
\n",
+ " \n",
+ " 6 | \n",
+ " 阿根廷 | \n",
+ " ARG | \n",
+ " 0.518475 | \n",
+ "
\n",
+ " \n",
+ " 189 | \n",
+ " 泰国 | \n",
+ " THA | \n",
+ " 0.504993 | \n",
+ "
\n",
+ " \n",
+ " 11 | \n",
+ " 奥地利 | \n",
+ " AUT | \n",
+ " 0.455737 | \n",
+ "
\n",
+ " \n",
+ " 144 | \n",
+ " 挪威 | \n",
+ " NOR | \n",
+ " 0.434751 | \n",
+ "
\n",
+ " \n",
+ " 5 | \n",
+ " 阿拉伯联合酋长国 | \n",
+ " ARE | \n",
+ " 0.414179 | \n",
+ "
\n",
+ " \n",
+ " 141 | \n",
+ " 尼日利亚 | \n",
+ " NGA | \n",
+ " 0.397270 | \n",
+ "
\n",
+ " \n",
+ " 90 | \n",
+ " 爱尔兰 | \n",
+ " IRL | \n",
+ " 0.382487 | \n",
+ "
\n",
+ " \n",
+ " 93 | \n",
+ " 以色列 | \n",
+ " ISR | \n",
+ " 0.369690 | \n",
+ "
\n",
+ " \n",
+ " 213 | \n",
+ " 南非 | \n",
+ " ZAF | \n",
+ " 0.368288 | \n",
+ "
\n",
+ " \n",
+ " 169 | \n",
+ " 新加坡 | \n",
+ " SGP | \n",
+ " 0.364157 | \n",
+ "
\n",
+ " \n",
+ " 82 | \n",
+ " 中国香港特别行政区 | \n",
+ " HKG | \n",
+ " 0.362993 | \n",
+ "
\n",
+ " \n",
+ " 137 | \n",
+ " 马来西亚 | \n",
+ " MYS | \n",
+ " 0.354348 | \n",
+ "
\n",
+ " \n",
+ " 53 | \n",
+ " 丹麦 | \n",
+ " DNK | \n",
+ " 0.352058 | \n",
+ "
\n",
+ " \n",
+ " 152 | \n",
+ " 菲律宾 | \n",
+ " PHL | \n",
+ " 0.330910 | \n",
+ "
\n",
+ " \n",
+ " 41 | \n",
+ " 哥伦比亚 | \n",
+ " COL | \n",
+ " 0.330228 | \n",
+ "
\n",
+ " \n",
+ " 149 | \n",
+ " 巴基斯坦 | \n",
+ " PAK | \n",
+ " 0.312570 | \n",
+ "
\n",
+ " \n",
+ " 35 | \n",
+ " 智利 | \n",
+ " CHL | \n",
+ " 0.298231 | \n",
+ "
\n",
+ " \n",
+ " 17 | \n",
+ " 孟加拉国 | \n",
+ " BGD | \n",
+ " 0.274025 | \n",
+ "
\n",
+ " \n",
+ " 62 | \n",
+ " 芬兰 | \n",
+ " FIN | \n",
+ " 0.273961 | \n",
+ "
\n",
+ " \n",
+ " 57 | \n",
+ " 阿拉伯埃及共和国 | \n",
+ " EGY | \n",
+ " 0.250895 | \n",
+ "
\n",
+ " \n",
+ " 49 | \n",
+ " 捷克共和国 | \n",
+ " CZE | \n",
+ " 0.245226 | \n",
+ "
\n",
+ " \n",
+ " 208 | \n",
+ " 越南 | \n",
+ " VNM | \n",
+ " 0.244948 | \n",
+ "
\n",
+ " \n",
+ " 163 | \n",
+ " 罗马尼亚 | \n",
+ " ROU | \n",
+ " 0.239553 | \n",
+ "
\n",
+ " \n",
+ " 158 | \n",
+ " 葡萄牙 | \n",
+ " PRT | \n",
+ " 0.237979 | \n",
+ "
\n",
+ " \n",
+ " 91 | \n",
+ " 伊拉克 | \n",
+ " IRQ | \n",
+ " 0.225914 | \n",
+ "
\n",
+ " \n",
+ " 151 | \n",
+ " 秘鲁 | \n",
+ " PER | \n",
+ " 0.222238 | \n",
+ "
\n",
+ " \n",
+ " 76 | \n",
+ " 希腊 | \n",
+ " GRC | \n",
+ " 0.218032 | \n",
+ "
\n",
+ " \n",
+ " 147 | \n",
+ " 新西兰 | \n",
+ " NZL | \n",
+ " 0.205025 | \n",
+ "
\n",
+ " \n",
+ " 162 | \n",
+ " 卡塔尔 | \n",
+ " QAT | \n",
+ " 0.192009 | \n",
+ "
\n",
+ " \n",
+ " 55 | \n",
+ " 阿尔及利亚 | \n",
+ " DZA | \n",
+ " 0.180689 | \n",
+ "
\n",
+ " \n",
+ " 98 | \n",
+ " 哈萨克斯坦 | \n",
+ " KAZ | \n",
+ " 0.170539 | \n",
+ "
\n",
+ " \n",
+ " 86 | \n",
+ " 匈牙利 | \n",
+ " HUN | \n",
+ " 0.155703 | \n",
+ "
\n",
+ " \n",
+ " 105 | \n",
+ " 科威特 | \n",
+ " KWT | \n",
+ " 0.141678 | \n",
+ "
\n",
+ " \n",
+ " 200 | \n",
+ " 乌克兰 | \n",
+ " UKR | \n",
+ " 0.130832 | \n",
+ "
\n",
+ " \n",
+ " 119 | \n",
+ " 摩洛哥 | \n",
+ " MAR | \n",
+ " 0.118495 | \n",
+ "
\n",
+ " \n",
+ " 56 | \n",
+ " 厄瓜多尔 | \n",
+ " ECU | \n",
+ " 0.108398 | \n",
+ "
\n",
+ " \n",
+ " 179 | \n",
+ " 斯洛伐克共和国 | \n",
+ " SVK | \n",
+ " 0.106472 | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
"
+ ],
+ "text/plain": [
+ " Country Name Country Code 2018\n",
+ "202 美国 USA 20.494100\n",
+ "36 中国 CHN 13.608152\n",
+ "97 日本 JPN 4.970916\n",
+ "50 德国 DEU 3.996759\n",
+ "68 英国 GBR 2.825208\n",
+ "64 法国 FRA 2.777535\n",
+ "89 印度 IND 2.726323\n",
+ "94 意大利 ITA 2.073902\n",
+ "26 巴西 BRA 1.868626\n",
+ "32 加拿大 CAN 1.712510\n",
+ "164 俄罗斯联邦 RUS 1.657554\n",
+ "104 大韩民国 KOR 1.619424\n",
+ "10 澳大利亚 AUS 1.432195\n",
+ "59 西班牙 ESP 1.426189\n",
+ "124 墨西哥 MEX 1.223809\n",
+ "87 印度尼西亚 IDN 1.042173\n",
+ "143 荷兰 NLD 0.913658\n",
+ "166 沙特阿拉伯 SAU 0.782483\n",
+ "196 土耳其 TUR 0.766509\n",
+ "33 瑞士 CHE 0.705501\n",
+ "155 波兰 POL 0.585783\n",
+ "181 瑞典 SWE 0.551032\n",
+ "14 比利时 BEL 0.531767\n",
+ "6 阿根廷 ARG 0.518475\n",
+ "189 泰国 THA 0.504993\n",
+ "11 奥地利 AUT 0.455737\n",
+ "144 挪威 NOR 0.434751\n",
+ "5 阿拉伯联合酋长国 ARE 0.414179\n",
+ "141 尼日利亚 NGA 0.397270\n",
+ "90 爱尔兰 IRL 0.382487\n",
+ "93 以色列 ISR 0.369690\n",
+ "213 南非 ZAF 0.368288\n",
+ "169 新加坡 SGP 0.364157\n",
+ "82 中国香港特别行政区 HKG 0.362993\n",
+ "137 马来西亚 MYS 0.354348\n",
+ "53 丹麦 DNK 0.352058\n",
+ "152 菲律宾 PHL 0.330910\n",
+ "41 哥伦比亚 COL 0.330228\n",
+ "149 巴基斯坦 PAK 0.312570\n",
+ "35 智利 CHL 0.298231\n",
+ "17 孟加拉国 BGD 0.274025\n",
+ "62 芬兰 FIN 0.273961\n",
+ "57 阿拉伯埃及共和国 EGY 0.250895\n",
+ "49 捷克共和国 CZE 0.245226\n",
+ "208 越南 VNM 0.244948\n",
+ "163 罗马尼亚 ROU 0.239553\n",
+ "158 葡萄牙 PRT 0.237979\n",
+ "91 伊拉克 IRQ 0.225914\n",
+ "151 秘鲁 PER 0.222238\n",
+ "76 希腊 GRC 0.218032\n",
+ "147 新西兰 NZL 0.205025\n",
+ "162 卡塔尔 QAT 0.192009\n",
+ "55 阿尔及利亚 DZA 0.180689\n",
+ "98 哈萨克斯坦 KAZ 0.170539\n",
+ "86 匈牙利 HUN 0.155703\n",
+ "105 科威特 KWT 0.141678\n",
+ "200 乌克兰 UKR 0.130832\n",
+ "119 摩洛哥 MAR 0.118495\n",
+ "56 厄瓜多尔 ECU 0.108398\n",
+ "179 斯洛伐克共和国 SVK 0.106472"
+ ]
+ },
+ "execution_count": 59,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "country_gdp[['Country Name', 'Country Code', '2018']].sort_values(by='2018', ascending=False)[:60]"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": null,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "#############################\n",
+ "# 历年GDP分析"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 11,
+ "metadata": {
+ "scrolled": true
+ },
+ "outputs": [],
+ "source": [
+ "df_china = country_gdp[country_gdp['Country Name']=='中国']"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 12,
+ "metadata": {},
+ "outputs": [
+ {
+ "name": "stderr",
+ "output_type": "stream",
+ "text": [
+ "c:\\users\\wei.zhou\\appdata\\local\\programs\\python\\python37-32\\lib\\site-packages\\ipykernel_launcher.py:2: SettingWithCopyWarning: \n",
+ "A value is trying to be set on a copy of a slice from a DataFrame.\n",
+ "Try using .loc[row_indexer,col_indexer] = value instead\n",
+ "\n",
+ "See the caveats in the documentation: http://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy\n",
+ " \n"
+ ]
+ }
+ ],
+ "source": [
+ "for i in range(1960, 2019):\n",
+ " df_china[str(i)] = df_china[str(i)].apply(lambda x: x/1000000000000)"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 13,
+ "metadata": {
+ "collapsed": true
+ },
+ "outputs": [
+ {
+ "name": "stderr",
+ "output_type": "stream",
+ "text": [
+ "c:\\users\\wei.zhou\\appdata\\local\\programs\\python\\python37-32\\lib\\site-packages\\ipykernel_launcher.py:3: SettingWithCopyWarning: \n",
+ "A value is trying to be set on a copy of a slice from a DataFrame.\n",
+ "Try using .loc[row_indexer,col_indexer] = value instead\n",
+ "\n",
+ "See the caveats in the documentation: http://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy\n",
+ " This is separate from the ipykernel package so we can avoid doing imports until\n"
+ ]
+ },
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " Country Name | \n",
+ " Country Code | \n",
+ " Region | \n",
+ " Income_Group | \n",
+ " Unnamed: 4 | \n",
+ " Indicator Name | \n",
+ " Indicator Code | \n",
+ " 1960 | \n",
+ " 1961 | \n",
+ " 1962 | \n",
+ " ... | \n",
+ " 2011 | \n",
+ " 2012 | \n",
+ " 2013 | \n",
+ " 2014 | \n",
+ " 2015 | \n",
+ " 2016 | \n",
+ " 2017 | \n",
+ " 2018 | \n",
+ " 2019 | \n",
+ " Unnamed: 64 | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " 202 | \n",
+ " 美国 | \n",
+ " USA | \n",
+ " NaN | \n",
+ " 高收入国家 | \n",
+ " NaN | \n",
+ " GDP(现价美元) | \n",
+ " NY.GDP.MKTP.CD | \n",
+ " 0.5433 | \n",
+ " 0.5633 | \n",
+ " 0.6051 | \n",
+ " ... | \n",
+ " 15.542581 | \n",
+ " 16.197007 | \n",
+ " 16.784849 | \n",
+ " 17.521747 | \n",
+ " 18.219298 | \n",
+ " 18.707188 | \n",
+ " 19.485394 | \n",
+ " 20.4941 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
1 rows × 68 columns
\n",
+ "
"
+ ],
+ "text/plain": [
+ " Country Name Country Code Region Income_Group Unnamed: 4 Indicator Name \\\n",
+ "202 美国 USA NaN 高收入国家 NaN GDP(现价美元) \n",
+ "\n",
+ " Indicator Code 1960 1961 1962 ... 2011 2012 \\\n",
+ "202 NY.GDP.MKTP.CD 0.5433 0.5633 0.6051 ... 15.542581 16.197007 \n",
+ "\n",
+ " 2013 2014 2015 2016 2017 2018 2019 \\\n",
+ "202 16.784849 17.521747 18.219298 18.707188 19.485394 20.4941 NaN \n",
+ "\n",
+ " Unnamed: 64 \n",
+ "202 NaN \n",
+ "\n",
+ "[1 rows x 68 columns]"
+ ]
+ },
+ "execution_count": 13,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "df_usa = country_gdp[country_gdp['Country Name']=='美国']\n",
+ "for i in range(1960, 2019):\n",
+ " df_usa[str(i)] = df_usa[str(i)].apply(lambda x: x/1000000000000)\n",
+ "df_usa"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 14,
+ "metadata": {
+ "collapsed": true
+ },
+ "outputs": [
+ {
+ "name": "stderr",
+ "output_type": "stream",
+ "text": [
+ "c:\\users\\wei.zhou\\appdata\\local\\programs\\python\\python37-32\\lib\\site-packages\\ipykernel_launcher.py:3: SettingWithCopyWarning: \n",
+ "A value is trying to be set on a copy of a slice from a DataFrame.\n",
+ "Try using .loc[row_indexer,col_indexer] = value instead\n",
+ "\n",
+ "See the caveats in the documentation: http://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy\n",
+ " This is separate from the ipykernel package so we can avoid doing imports until\n"
+ ]
+ },
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " Country Name | \n",
+ " Country Code | \n",
+ " Region | \n",
+ " Income_Group | \n",
+ " Unnamed: 4 | \n",
+ " Indicator Name | \n",
+ " Indicator Code | \n",
+ " 1960 | \n",
+ " 1961 | \n",
+ " 1962 | \n",
+ " ... | \n",
+ " 2011 | \n",
+ " 2012 | \n",
+ " 2013 | \n",
+ " 2014 | \n",
+ " 2015 | \n",
+ " 2016 | \n",
+ " 2017 | \n",
+ " 2018 | \n",
+ " 2019 | \n",
+ " Unnamed: 64 | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " 97 | \n",
+ " 日本 | \n",
+ " JPN | \n",
+ " NaN | \n",
+ " 高收入国家 | \n",
+ " NaN | \n",
+ " GDP(现价美元) | \n",
+ " NY.GDP.MKTP.CD | \n",
+ " 0.044307 | \n",
+ " 0.053509 | \n",
+ " 0.060723 | \n",
+ " ... | \n",
+ " 6.15746 | \n",
+ " 6.203213 | \n",
+ " 5.155717 | \n",
+ " 4.850414 | \n",
+ " 4.389476 | \n",
+ " 4.926667 | \n",
+ " 4.859951 | \n",
+ " 4.970916 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
1 rows × 68 columns
\n",
+ "
"
+ ],
+ "text/plain": [
+ " Country Name Country Code Region Income_Group Unnamed: 4 Indicator Name \\\n",
+ "97 日本 JPN NaN 高收入国家 NaN GDP(现价美元) \n",
+ "\n",
+ " Indicator Code 1960 1961 1962 ... 2011 2012 \\\n",
+ "97 NY.GDP.MKTP.CD 0.044307 0.053509 0.060723 ... 6.15746 6.203213 \n",
+ "\n",
+ " 2013 2014 2015 2016 2017 2018 2019 \\\n",
+ "97 5.155717 4.850414 4.389476 4.926667 4.859951 4.970916 NaN \n",
+ "\n",
+ " Unnamed: 64 \n",
+ "97 NaN \n",
+ "\n",
+ "[1 rows x 68 columns]"
+ ]
+ },
+ "execution_count": 14,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "df_jpn = country_gdp[country_gdp['Country Name']=='日本']\n",
+ "for i in range(1960, 2019):\n",
+ " df_jpn[str(i)] = df_jpn[str(i)].apply(lambda x: x/1000000000000)\n",
+ "df_jpn"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 15,
+ "metadata": {
+ "collapsed": true
+ },
+ "outputs": [
+ {
+ "name": "stderr",
+ "output_type": "stream",
+ "text": [
+ "c:\\users\\wei.zhou\\appdata\\local\\programs\\python\\python37-32\\lib\\site-packages\\ipykernel_launcher.py:3: SettingWithCopyWarning: \n",
+ "A value is trying to be set on a copy of a slice from a DataFrame.\n",
+ "Try using .loc[row_indexer,col_indexer] = value instead\n",
+ "\n",
+ "See the caveats in the documentation: http://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy\n",
+ " This is separate from the ipykernel package so we can avoid doing imports until\n"
+ ]
+ },
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " Country Name | \n",
+ " Country Code | \n",
+ " Region | \n",
+ " Income_Group | \n",
+ " Unnamed: 4 | \n",
+ " Indicator Name | \n",
+ " Indicator Code | \n",
+ " 1960 | \n",
+ " 1961 | \n",
+ " 1962 | \n",
+ " ... | \n",
+ " 2011 | \n",
+ " 2012 | \n",
+ " 2013 | \n",
+ " 2014 | \n",
+ " 2015 | \n",
+ " 2016 | \n",
+ " 2017 | \n",
+ " 2018 | \n",
+ " 2019 | \n",
+ " Unnamed: 64 | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " 50 | \n",
+ " 德国 | \n",
+ " DEU | \n",
+ " NaN | \n",
+ " 高收入国家 | \n",
+ " NaN | \n",
+ " GDP(现价美元) | \n",
+ " NY.GDP.MKTP.CD | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " NaN | \n",
+ " ... | \n",
+ " 3.757698 | \n",
+ " 3.543984 | \n",
+ " 3.752514 | \n",
+ " 3.898727 | \n",
+ " 3.381389 | \n",
+ " 3.495163 | \n",
+ " 3.693204 | \n",
+ " 3.996759 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
1 rows × 68 columns
\n",
+ "
"
+ ],
+ "text/plain": [
+ " Country Name Country Code Region Income_Group Unnamed: 4 Indicator Name \\\n",
+ "50 德国 DEU NaN 高收入国家 NaN GDP(现价美元) \n",
+ "\n",
+ " Indicator Code 1960 1961 1962 ... 2011 2012 2013 \\\n",
+ "50 NY.GDP.MKTP.CD NaN NaN NaN ... 3.757698 3.543984 3.752514 \n",
+ "\n",
+ " 2014 2015 2016 2017 2018 2019 Unnamed: 64 \n",
+ "50 3.898727 3.381389 3.495163 3.693204 3.996759 NaN NaN \n",
+ "\n",
+ "[1 rows x 68 columns]"
+ ]
+ },
+ "execution_count": 15,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "df_de = country_gdp[country_gdp['Country Name']=='德国']\n",
+ "for i in range(1960, 2019):\n",
+ " df_de[str(i)] = df_de[str(i)].apply(lambda x: x/1000000000000)\n",
+ "df_de"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 16,
+ "metadata": {
+ "collapsed": true
+ },
+ "outputs": [
+ {
+ "name": "stderr",
+ "output_type": "stream",
+ "text": [
+ "c:\\users\\wei.zhou\\appdata\\local\\programs\\python\\python37-32\\lib\\site-packages\\ipykernel_launcher.py:3: SettingWithCopyWarning: \n",
+ "A value is trying to be set on a copy of a slice from a DataFrame.\n",
+ "Try using .loc[row_indexer,col_indexer] = value instead\n",
+ "\n",
+ "See the caveats in the documentation: http://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy\n",
+ " This is separate from the ipykernel package so we can avoid doing imports until\n"
+ ]
+ },
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " Country Name | \n",
+ " Country Code | \n",
+ " Region | \n",
+ " Income_Group | \n",
+ " Unnamed: 4 | \n",
+ " Indicator Name | \n",
+ " Indicator Code | \n",
+ " 1960 | \n",
+ " 1961 | \n",
+ " 1962 | \n",
+ " ... | \n",
+ " 2011 | \n",
+ " 2012 | \n",
+ " 2013 | \n",
+ " 2014 | \n",
+ " 2015 | \n",
+ " 2016 | \n",
+ " 2017 | \n",
+ " 2018 | \n",
+ " 2019 | \n",
+ " Unnamed: 64 | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " 68 | \n",
+ " 英国 | \n",
+ " GBR | \n",
+ " NaN | \n",
+ " 高收入国家 | \n",
+ " NaN | \n",
+ " GDP(现价美元) | \n",
+ " NY.GDP.MKTP.CD | \n",
+ " 0.072328 | \n",
+ " 0.076694 | \n",
+ " 0.080602 | \n",
+ " ... | \n",
+ " 2.634896 | \n",
+ " 2.676605 | \n",
+ " 2.753565 | \n",
+ " 3.034729 | \n",
+ " 2.896421 | \n",
+ " 2.659239 | \n",
+ " 2.637866 | \n",
+ " 2.825208 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
1 rows × 68 columns
\n",
+ "
"
+ ],
+ "text/plain": [
+ " Country Name Country Code Region Income_Group Unnamed: 4 Indicator Name \\\n",
+ "68 英国 GBR NaN 高收入国家 NaN GDP(现价美元) \n",
+ "\n",
+ " Indicator Code 1960 1961 1962 ... 2011 2012 \\\n",
+ "68 NY.GDP.MKTP.CD 0.072328 0.076694 0.080602 ... 2.634896 2.676605 \n",
+ "\n",
+ " 2013 2014 2015 2016 2017 2018 2019 \\\n",
+ "68 2.753565 3.034729 2.896421 2.659239 2.637866 2.825208 NaN \n",
+ "\n",
+ " Unnamed: 64 \n",
+ "68 NaN \n",
+ "\n",
+ "[1 rows x 68 columns]"
+ ]
+ },
+ "execution_count": 16,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "df_uk = country_gdp[country_gdp['Country Name']=='英国']\n",
+ "for i in range(1960, 2019):\n",
+ " df_uk[str(i)] = df_uk[str(i)].apply(lambda x: x/1000000000000)\n",
+ "df_uk"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 17,
+ "metadata": {
+ "scrolled": true
+ },
+ "outputs": [],
+ "source": [
+ "year_str = [str(i) for i in range(1960, 2019)]\n",
+ "\n",
+ "china_gdp = df_china[year_str].values.tolist()[0]\n",
+ "usa_gdp = df_usa[year_str].values.tolist()[0]\n",
+ "jpn_gdp = df_jpn[year_str].values.tolist()[0]\n",
+ "de_gdp = df_de[year_str].values.tolist()[0]\n",
+ "uk_gdp = df_uk[year_str].values.tolist()[0]"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 154,
+ "metadata": {
+ "collapsed": true
+ },
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " Country Name | \n",
+ " Country Code | \n",
+ " Region | \n",
+ " Income_Group | \n",
+ " Unnamed: 4 | \n",
+ " Indicator Name | \n",
+ " Indicator Code | \n",
+ " 1960 | \n",
+ " 1961 | \n",
+ " 1962 | \n",
+ " ... | \n",
+ " 2011 | \n",
+ " 2012 | \n",
+ " 2013 | \n",
+ " 2014 | \n",
+ " 2015 | \n",
+ " 2016 | \n",
+ " 2017 | \n",
+ " 2018 | \n",
+ " 2019 | \n",
+ " Unnamed: 64 | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " 36 | \n",
+ " 中国 | \n",
+ " CHN | \n",
+ " 东亚与太平洋地区(不包括高收入) | \n",
+ " 中高等收入国家 | \n",
+ " NaN | \n",
+ " GDP(现价美元) | \n",
+ " NY.GDP.MKTP.CD | \n",
+ " 0.059716 | \n",
+ " 0.050057 | \n",
+ " 0.047209 | \n",
+ " ... | \n",
+ " 7.5515 | \n",
+ " 8.532231 | \n",
+ " 9.570406 | \n",
+ " 10.438529 | \n",
+ " 11.015542 | \n",
+ " 11.137946 | \n",
+ " 12.143491 | \n",
+ " 13.608152 | \n",
+ " NaN | \n",
+ " NaN | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
1 rows × 68 columns
\n",
+ "
"
+ ],
+ "text/plain": [
+ " Country Name Country Code Region Income_Group Unnamed: 4 \\\n",
+ "36 中国 CHN 东亚与太平洋地区(不包括高收入) 中高等收入国家 NaN \n",
+ "\n",
+ " Indicator Name Indicator Code 1960 1961 1962 ... 2011 \\\n",
+ "36 GDP(现价美元) NY.GDP.MKTP.CD 0.059716 0.050057 0.047209 ... 7.5515 \n",
+ "\n",
+ " 2012 2013 2014 2015 2016 2017 2018 \\\n",
+ "36 8.532231 9.570406 10.438529 11.015542 11.137946 12.143491 13.608152 \n",
+ "\n",
+ " 2019 Unnamed: 64 \n",
+ "36 NaN NaN \n",
+ "\n",
+ "[1 rows x 68 columns]"
+ ]
+ },
+ "execution_count": 154,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "df_china"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 18,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "from pyecharts.charts import Scatter\n",
+ "\n",
+ "def scatter_base(choose, values, country) -> Scatter:\n",
+ " c = (\n",
+ " Scatter()\n",
+ " .add_xaxis(choose)\n",
+ " .add_yaxis(\"%s历年GDP\" % country, values)\n",
+ " .set_global_opts(title_opts=opts.TitleOpts(title=\"\"),\n",
+ " # datazoom_opts=opts.DataZoomOpts(),\n",
+ " yaxis_opts=opts.AxisOpts(\n",
+ " axislabel_opts=opts.LabelOpts(formatter=\"{value} /万亿\")\n",
+ " )\n",
+ " )\n",
+ " .set_series_opts(label_opts=opts.LabelOpts(is_show=False))\n",
+ " )\n",
+ " return c"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 19,
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ " \n",
+ "\n",
+ "\n",
+ "\n"
+ ],
+ "text/plain": [
+ ""
+ ]
+ },
+ "execution_count": 19,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "scatter_base(year_str, china_gdp, '中国').render_notebook()"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 20,
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ " \n",
+ "\n",
+ "\n",
+ "\n"
+ ],
+ "text/plain": [
+ ""
+ ]
+ },
+ "execution_count": 20,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "scatter_base(year_str, usa_gdp, '美国').render_notebook()"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 21,
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ " \n",
+ "\n",
+ "\n",
+ "\n"
+ ],
+ "text/plain": [
+ ""
+ ]
+ },
+ "execution_count": 21,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "scatter_base(year_str, jpn_gdp, '日本').render_notebook()"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 22,
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ " \n",
+ "\n",
+ "\n",
+ "\n"
+ ],
+ "text/plain": [
+ ""
+ ]
+ },
+ "execution_count": 22,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "scatter_base(year_str, de_gdp, '德国').render_notebook()"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 23,
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ " \n",
+ "\n",
+ "\n",
+ "\n"
+ ],
+ "text/plain": [
+ ""
+ ]
+ },
+ "execution_count": 23,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "scatter_base(year_str, uk_gdp, '英国').render_notebook()"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 24,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "import sklearn.pipeline as pl\n",
+ "import sklearn.linear_model as lm\n",
+ "import sklearn.preprocessing as sp\n",
+ "import matplotlib.pyplot as mp\n",
+ "import numpy as np\n",
+ "import sklearn.metrics as sm"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 25,
+ "metadata": {
+ "collapsed": true
+ },
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "array([[1960],\n",
+ " [1961],\n",
+ " [1962],\n",
+ " [1963],\n",
+ " [1964],\n",
+ " [1965],\n",
+ " [1966],\n",
+ " [1967],\n",
+ " [1968],\n",
+ " [1969],\n",
+ " [1970],\n",
+ " [1971],\n",
+ " [1972],\n",
+ " [1973],\n",
+ " [1974],\n",
+ " [1975],\n",
+ " [1976],\n",
+ " [1977],\n",
+ " [1978],\n",
+ " [1979],\n",
+ " [1980],\n",
+ " [1981],\n",
+ " [1982],\n",
+ " [1983],\n",
+ " [1984],\n",
+ " [1985],\n",
+ " [1986],\n",
+ " [1987],\n",
+ " [1988],\n",
+ " [1989],\n",
+ " [1990],\n",
+ " [1991],\n",
+ " [1992],\n",
+ " [1993],\n",
+ " [1994],\n",
+ " [1995],\n",
+ " [1996],\n",
+ " [1997],\n",
+ " [1998],\n",
+ " [1999],\n",
+ " [2000],\n",
+ " [2001],\n",
+ " [2002],\n",
+ " [2003],\n",
+ " [2004],\n",
+ " [2005],\n",
+ " [2006],\n",
+ " [2007],\n",
+ " [2008],\n",
+ " [2009],\n",
+ " [2010],\n",
+ " [2011],\n",
+ " [2012],\n",
+ " [2013],\n",
+ " [2014],\n",
+ " [2015],\n",
+ " [2016],\n",
+ " [2017],\n",
+ " [2018]])"
+ ]
+ },
+ "execution_count": 25,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "year = [i for i in range(1960, 2019)]\n",
+ "X = np.array(year)\n",
+ "X = X.reshape(-1, 1)\n",
+ "X"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 26,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "y = usa_gdp"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 27,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "model = pl.make_pipeline(\n",
+ " sp.PolynomialFeatures(5), # polynomial feature expander (degree 5)\n",
+ " lm.LinearRegression() # linear regressor\n",
+ ")\n",
+ "# train the model\n",
+ "model.fit(X, y)\n",
+ "# compute the predicted values y\n",
+ "pred_y = model.predict(X)"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 244,
+ "metadata": {
+ "collapsed": true
+ },
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "array([ 0.67561513, 0.64550236, 0.63069893, 0.6310778 , 0.64651146,\n",
+ " 0.67687193, 0.7220308 , 0.78185916, 0.85622766, 0.94500648,\n",
+ " 1.04806535, 1.16527352, 1.29649978, 1.44161246, 1.60047942,\n",
+ " 1.77296806, 1.9589453 , 2.15827761, 2.37083099, 2.59647097,\n",
+ " 2.8350626 , 3.08647047, 3.35055872, 3.62719099, 3.91623047,\n",
+ " 4.21753986, 4.53098142, 4.8564169 , 5.19370761, 5.54271437,\n",
+ " 5.90329754, 6.27531699, 6.65863212, 7.05310188, 7.4585847 ,\n",
+ " 7.87493857, 8.302021 , 8.739689 , 9.18779914, 9.64620748,\n",
+ " 10.11476961, 10.59334065, 11.08177525, 11.57992755, 12.08765123,\n",
+ " 12.60479949, 13.13122504, 13.66678012, 14.21131649, 14.7646854 ,\n",
+ " 15.32673766, 15.89732355, 16.47629291, 17.06349506, 17.65877886,\n",
+ " 18.26199267, 18.87298437, 19.49160136, 20.11769053])"
+ ]
+ },
+ "execution_count": 244,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "pred_y"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 34,
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "array([-6.56811530e-01, -4.31663493e-01, -2.35026973e-01, -6.53989891e-02,\n",
+ " 7.87281703e-02, 1.98866952e-01, 2.96534541e-01, 3.73252871e-01,\n",
+ " 4.30548622e-01, 4.69953232e-01, 4.93002894e-01, 5.01238570e-01,\n",
+ " 4.96205988e-01, 4.79455654e-01, 4.52542849e-01, 4.17027639e-01,\n",
+ " 3.74474880e-01, 3.26454222e-01, 2.74540110e-01, 2.20311797e-01,\n",
+ " 1.65353340e-01, 1.11253613e-01, 5.96063043e-02, 1.20099274e-02,\n",
+ " -2.99321770e-02, -6.46118355e-02, -9.04160388e-02, -1.05726933e-01,\n",
+ " -1.08921820e-01, -9.83731464e-02, -7.24485036e-02, -2.95106209e-02,\n",
+ " 3.20826372e-02, 1.13978281e-01, 2.17828195e-01, 3.45289144e-01,\n",
+ " 4.98022782e-01, 6.77695650e-01, 8.85979189e-01, 1.12454974e+00,\n",
+ " 1.39508854e+00, 1.69928175e+00, 2.03882045e+00, 2.41540061e+00,\n",
+ " 2.83072316e+00, 3.28649394e+00, 3.78442374e+00, 4.32622827e+00,\n",
+ " 4.91362820e+00, 5.54834914e+00, 6.23212165e+00, 6.96668128e+00,\n",
+ " 7.75376850e+00, 8.59512877e+00, 9.49251254e+00, 1.04476752e+01,\n",
+ " 1.14623772e+01, 1.25383838e+01, 1.36774655e+01, 1.48813976e+01])"
+ ]
+ },
+ "execution_count": 34,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "p_year = [i for i in range(1960, 2020)]\n",
+ "p_X = np.array(p_year)\n",
+ "p_X = p_X.reshape(-1, 1)\n",
+ "p_pred_y = model.predict(p_X)\n",
+ "p_pred_y"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 245,
+ "metadata": {
+ "collapsed": true
+ },
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "[0.5433,\n",
+ " 0.5633,\n",
+ " 0.6051,\n",
+ " 0.6386,\n",
+ " 0.6858,\n",
+ " 0.7437,\n",
+ " 0.815,\n",
+ " 0.8617,\n",
+ " 0.9425,\n",
+ " 1.0199,\n",
+ " 1.073303,\n",
+ " 1.16485,\n",
+ " 1.27911,\n",
+ " 1.425376,\n",
+ " 1.545243,\n",
+ " 1.684904,\n",
+ " 1.873412,\n",
+ " 2.081826,\n",
+ " 2.351599,\n",
+ " 2.627334,\n",
+ " 2.857307,\n",
+ " 3.207042,\n",
+ " 3.343789,\n",
+ " 3.634038,\n",
+ " 4.037613,\n",
+ " 4.338979,\n",
+ " 4.579631,\n",
+ " 4.855215,\n",
+ " 5.236438,\n",
+ " 5.64158,\n",
+ " 5.963144,\n",
+ " 6.158129,\n",
+ " 6.520327,\n",
+ " 6.858559,\n",
+ " 7.287236,\n",
+ " 7.639749,\n",
+ " 8.073122,\n",
+ " 8.577554463,\n",
+ " 9.062818211,\n",
+ " 9.630664202,\n",
+ " 10.252345464,\n",
+ " 10.581821399,\n",
+ " 10.936419054,\n",
+ " 11.458243878,\n",
+ " 12.213729147,\n",
+ " 13.036640229,\n",
+ " 13.814611414,\n",
+ " 14.45185865,\n",
+ " 14.712844084,\n",
+ " 14.448933025,\n",
+ " 14.992052727,\n",
+ " 15.542581104,\n",
+ " 16.197007349,\n",
+ " 16.78484919,\n",
+ " 17.521746534,\n",
+ " 18.219297584,\n",
+ " 18.707188235,\n",
+ " 19.485393853,\n",
+ " 20.4941]"
+ ]
+ },
+ "execution_count": 245,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "y"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 31,
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "image/png": "\n",
+ "text/plain": [
+ "