import pandas as pd
import numpy as np
# Load the four worksheets of the shipping workbook, selected by position, with a
# single read_excel call so the file is opened once instead of once per sheet.
# When sheet_name is a list, read_excel returns a dict keyed by the requested
# sheet positions.
workbook_path = 'shipping1997.xlsx'
sheets = pd.read_excel(workbook_path, sheet_name=[0, 1, 2, 3])
shipping = sheets[0]
states = sheets[1]
commodities = sheets[2]
distances = sheets[3]

# Lookup table keyed by the 'State' column with the matching 'Abbreviation' value.
state_dict = dict(zip(states['State'], states['Abbreviation']))
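# Earlier attempts to add state columns to `shipping`, kept for reference:
#     for i in shipping['origin']:
#         ship_origin = shipping['origin'][i]
#         value_var = state_dict.get(ship_origin)
#         shipping['origin_state'][i] = value_var
#     shipping['origin_state'] = shipping['origin'].apply(state_dict)
#     shipping['dest_state'] = shipping['dest'].apply(state_dict)
# NOTE(review): presumably Series.map(state_dict) was intended instead of
# .apply(state_dict) -- confirm before re-enabling.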
# Convert the 'adjacent' column to booleans: True exactly where the value equals 1.
# One vectorized comparison assigned back to the column replaces the per-row
# chained assignment `distances['adjacent'][i] = ...`. That form writes through an
# intermediate Series, which raises SettingWithCopyWarning and is not guaranteed
# to update `distances` itself.
distances['adjacent'] = distances['adjacent'] == 1

# Join shipping rows to distance rows on the (origin, dest) column pair.
# merge() returns a new DataFrame and leaves `shipping` unchanged, so as a bare
# expression the result is only displayed (e.g. as the last line of a notebook
# cell). Bind it to a name if later code needs the merged table.
shipping.merge(distances, on=['origin', 'dest'])
/shared-libs/python3.7/py-core/lib/python3.7/site-packages/ipykernel_launcher.py:19: SettingWithCopyWarning:
A value is trying to be set on a copy of a slice from a DataFrame
See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
/shared-libs/python3.7/py/lib/python3.7/site-packages/pandas/core/indexing.py:1637: SettingWithCopyWarning:
A value is trying to be set on a copy of a slice from a DataFrame
See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
self._setitem_single_block(indexer, value, name)