import pandas as pd

# Script purpose: load WHO.csv, report how many rows have a value in the
# "Environment and public health workers density" column, and print those rows.

# Column whose non-null rows are selected; named once to avoid repeating the
# long label (and the risk of the two copies drifting apart).
DENSITY_COL = 'Environment and public health workers density (per 10 000 population)'

# Visual divider printed between the report sections.
SEPARATOR = "*" * 60

# Lift pandas' row-display limit so printing a DataFrame shows every row.
pd.set_option('display.max_rows', None)

# Build the original DataFrame with all rows/columns; the first CSV column
# becomes the index.
df = pd.read_csv('WHO.csv', delimiter=',', index_col=0)

# Display the DataFrame details.
# NOTE: DataFrame.info() writes its summary to stdout itself and returns None,
# so it must not be wrapped in print() (that would emit a stray "None" line).
print('Data Frame Info:')
df.info()

print(SEPARATOR)

# Save the number of rows in the original DataFrame.
# (Variable name keeps its historical spelling so any later code that
# references it continues to work.)
orginal_count = df.shape[0]

# Create a new DataFrame holding only the rows where the density column is
# non-null, restricted to the CountryID and density columns.
has_density = df[DENSITY_COL].notnull()
df2 = df.loc[has_density, ['CountryID', DENSITY_COL]]

# Display the new DataFrame details (info() prints directly, see note above).
df2.info()

print(SEPARATOR)

# Save the number of rows in the filtered DataFrame.
updated_count = df2.shape[0]

# Print the filtered DataFrame in full.
print(df2)

print(SEPARATOR)

print(f"The total number of Countries is {orginal_count}, there are {updated_count} Countries with data")
