import numpy as np
import pandas as pd
import statsmodels.api as sm
## Load the table
# Read the "Data" sheet of the workbook into a DataFrame.
df = pd.read_excel("./pwt1001.xlsx", sheet_name="Data")

# Keep only the rows whose country is Japan.
df_jp = df.loc[df["country"] == "Japan"]

# Narrow the frame down to the columns used in the analysis.
df_tab = df_jp[["year", "rgdpna", "emp", "avh", "rnna"]]

# Preview the first rows (rendered as the cell output in a notebook).
df_tab.head()
| | year | rgdpna | emp | avh | rnna |
---|---|---|---|---|---|
6090 | 1950 | 272826.00000 | 39.407654 | 2030.413757 | 790520.8125 |
6091 | 1951 | 297234.68750 | 40.384689 | 2012.990686 | 833484.4375 |
6092 | 1952 | 333982.59375 | 41.342064 | 1995.717124 | 865191.6875 |
6093 | 1953 | 356372.46875 | 42.261971 | 1978.591787 | 893951.9375 |
6094 | 1954 | 374102.46875 | 42.801991 | 2008.945400 | 929572.2500 |