This notebook will show you how to read Excel workbooks into Python, manipulate the data, and then save the modified data back out to an Excel sheet (or another data storage format).
To do this, we will use the Python library Pandas; more information about it can be found here. Pandas is one of the most widely used data analysis libraries in Python, extending the functionality of Numpy arrays while still keeping the familiar whole-array operations.
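As a quick illustration of that relationship, here is a minimal sketch (using made-up values rather than the workbook data used below) showing that a DataFrame behaves like a Numpy array with labels attached:
import numpy as np
import pandas as pd

# Build a small DataFrame from a Numpy array and give the columns names
arr = np.array([[1.0, 2.0], [3.0, 4.0]])
small = pd.DataFrame(arr, columns=['a', 'b'])

print(small * 10)         # element-wise arithmetic, just like a Numpy array
print(small['a'].mean())  # columns are labelled and keep array-style methods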
However, the syntax for querying Pandas DataFrames differs slightly from that used with Numpy arrays. First, we will look at how to import an Excel spreadsheet into Python, as seen below:
import pandas as pd
df = pd.read_excel('data/kgz_misc_popp.xlsx')
df
print(df)
This is one of the easiest ways to read Excel data into Python. As shown above, we have imported pandas using the standard import pandas as pd command, and then used the function .read_excel() to read in the Excel data. Beyond the path to the file, .read_excel() usually needs no further arguments, as it works out the structure of the spreadsheet (column names, rows and data types) for itself.
This function has created and filled something known as a Pandas DataFrame, which is essentially a two-dimensional labelled array: like a Numpy array, but with named columns and an index describing the rows. Next we will look at slicing parts of the data in the DataFrame to return a more useful subset.
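Before slicing, it can help to check the overall size and labels of the DataFrame (a quick sketch using the df loaded above):
# .shape gives (number of rows, number of columns) and .index holds the row labels
print(df.shape)
print(df.index)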
# Columns of the dataframe
print(df.columns)
# Printing a specific column
print(df['latitude'])
In the command above, we have selected just the column "latitude" from the df DataFrame. As you can see, the values themselves are printed, although for long columns such as this one the middle values are hidden. At the bottom of the printout, it also summarises the name of the column printed, its length and its datatype (dtype).
In the box below, try to select just the "nam" column from df:
print(df['nam'])
# enter your code
Another way to select data from a DataFrame is the .loc indexer, which is short for "locate" and selects data by label. It can be applied directly to the whole DataFrame or to a column we have already selected. For example, we could use the nam column we just selected to find the value at row label 3 as follows:
print(df['nam'].loc[3])
We can also find the values of all the columns for the row labelled 3:
print(df.loc[3])
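Keep in mind that .loc selects by label rather than by position. With the default integer index used here the two happen to coincide, but they can differ once rows are filtered or re-ordered; the position-based counterpart is .iloc:
# .loc[3] returns the row whose index label is 3,
# while .iloc[3] returns the fourth row, counting positions from 0
print(df.loc[3])
print(df.iloc[3])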
# Showing only the first 5 lines
df.head(5)
You can also select the rows and columns that you want!
df.loc[10:15, 'nam':'latitude']
In the example above, we have defined both the rows and the columns, in that order, to return a specific block of the DataFrame. It is also possible to select a whole row or column with the .loc method by replacing one of the two selections with ":", which means "return everything along this axis". For example, writing df.loc[:, 'latitude'] would return the same result as our first example, df['latitude'].
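A quick check (a small sketch using the Series equals() method) confirms the two selections are identical:
# Both expressions return the same Series of latitudes
print(df.loc[:, 'latitude'].equals(df['latitude']))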
We can do more than just simple slicing with pandas DataFrames, such as returning only the values that meet certain criteria. For example, say we wanted to find all rows in df where the 'nam' value is "MANAS". How can this be done? By passing a condition to .loc, we can select all rows that satisfy the criterion of having a nam equal to "MANAS".
df.loc[df['nam'] == 'MANAS']
This has returned all rows where the value "MANAS" is present in the nam column. Try doing a similar operation, this time searching for where the tile_id value is 1.
df.loc[df['tile_id'] == 1]
# enter your code
Be aware that 1 is a number! To check which type of object each column holds, use:
print(df.dtypes)
If you compare against the string '1' instead, no rows will match:
df.loc[df['tile_id'] == '1']
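To see what is going on behind this filtering, the comparison itself produces a boolean Series (a mask) that .loc then uses to keep only the rows marked True:
# The comparison produces one True/False value per row
mask = df['tile_id'] == 1
print(mask.head())

# Passing the mask to .loc keeps only the rows where it is True
print(df.loc[mask].head())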
Now try finding only nam, tile_id and longitude for settlements that have latitude < 40
df.loc[df['latitude']<40, ['nam','tile_id','longitude']]
# enter your code
In Pandas you can combine, remove, and apply mathematical functions to data, just like with Numpy arrays.
For instance, a single function call removes all rows containing NaN values: https://pandas.pydata.org/pandas-docs/stable/reference/api/pandas.DataFrame.dropna.html
import numpy as np
# Insert a missing value (NaN) into the 'nam' column at row label 4
df.loc[4,'nam'] = np.nan
df['nam'].loc[4]
# dropna() returns a new DataFrame with the rows containing NaN removed;
# it does not modify df itself unless you assign the result back
df.dropna()
df
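Since dropna() above did not change df, here is a small sketch of how you would keep the cleaned result, stored under a hypothetical name df_clean so the original df stays untouched for the rest of the notebook:
# Keep the cleaned copy under a new name; df itself is unchanged
df_clean = df.dropna()
print(len(df), len(df_clean))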
You can apply arithmetic to the values in a specific column. Note that the expression below returns a new Series; the DataFrame itself only changes if you assign the result back to a column:
df['tile_id']+100
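A minimal sketch of actually changing the column, done on a copy here so that the original df used in the rest of the notebook is left untouched:
# Work on a copy so the original tile_id values are preserved for later cells
df_copy = df.copy()
df_copy['tile_id'] = df_copy['tile_id'] + 100
df_copy['tile_id'].head()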
You can find max, min, mean, median for all columns.
For example:
print('Max \n', df.max())
print('----------------------------')
print('\nMin \n', df.min())
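The mean and median only make sense for numeric columns, so it helps to restrict the calculation to them (a quick sketch using the numeric_only option):
print('Mean \n', df.mean(numeric_only=True))
print('----------------------------')
print('\nMedian \n', df.median(numeric_only=True))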
It is possible to add new columns to df, using either new data or a combination of the data already in the DataFrame.
For example, let's add a new column of ids filled with random numbers.
print(f'Length of our dataframe: {len(df)} rows.')
df[['tile_id','end_id']].max()
print(f"Max of ids: \n{df[['tile_id','end_id']].max()} \n\nMin of ids: \n{df[['tile_id','end_id']].min()}")
# Random values drawn uniformly between the min and max of tile_id
random_ids = np.random.random(len(df))*(df['tile_id'].max()-df['tile_id'].min()) + df['tile_id'].min()
df['tile_id2'] = random_ids.round(1)
df
Now compute the average of the two ids using the data in tile_id and tile_id2. Write the results in another column called mean_tile_id.
# Solution 1: element-wise arithmetic on the two columns
df['mean_tile_id'] = (df['tile_id'] + df['tile_id2'])/2.0
df
# Solution 2: mean() with axis=1 averages across the columns, row by row
df['mean_tile_id'] = df.loc[:,['tile_id','tile_id2']].mean(axis=1)
df
# enter your code
You can save the entire DataFrame df in one line of code:
df.to_excel('data/new_sheet.xlsx')
Or save just a subset of df to file. For example, only latitude, longitude and tile_id:
# Select my subset of data
df_subset = df.loc[:,['latitude','longitude','tile_id']]
# Write to excel file
df_subset.to_excel('data/new_sheet.xlsx')
# Read from excel file
df1 = pd.read_excel('data/new_sheet.xlsx')
df1
print(df1.columns)
If you want to remove the Unnamed: 0 column, i.e. you do not want to save the index of df, then use the option index=False.
More info here: https://pandas.pydata.org/pandas-docs/stable/reference/api/pandas.DataFrame.to_excel.html
df.to_excel('data/new_sheet.xlsx', index=False)
df1 = pd.read_excel('data/new_sheet.xlsx')
df1
Write to a txt file:
# A context manager closes the file automatically, even if an error occurs
with open('data/new_sheet.txt', 'w') as file:
    file.write(df_subset.to_string())
Read from a txt file:
# delim_whitespace=True treats any run of whitespace as the separator
# (recent pandas versions deprecate it in favour of sep='\s+')
df1 = pd.read_table('data/new_sheet.txt', delim_whitespace=True)
df1
Write to a csv file:
df.to_csv('data/new_sheet.csv', index=False)
Read from a csv file:
df1 = pd.read_csv('data/new_sheet.csv')
df1
# Read back only a subset of the columns
df1 = pd.read_csv('data/new_sheet.csv', usecols=['latitude','longitude','tile_id'])
df1