| | |
| | """676_252_1434_72 |
| | |
| | Automatically generated by Colab. |
| | |
| | Original file is located at |
| | https://colab.research.google.com/drive/1FniZJX1OfI1PltPCXhpw50znN1aYMFcP |
| | """ |
| |
|
| | import numpy as np |
| | import pandas as pd |
| |
|
| | import os |
| | for dirname, _, filenames in os.walk('/content/world_bank_data_2025.csv'): |
| | for filename in filenames: |
| | print(os.path.join(dirname, filename)) |
| |
|
| | import pandas as pd |
| | import seaborn as sns |
| | import matplotlib.pyplot as plt |
| |
|
| | df = pd.read_csv('/content/world_bank_data_2025.csv') |
| | df.head() |
| |
|
| | print("Shape of dataset:", df.shape) |
| | print("COlumns:\n", df.columns.tolist()) |
| | print("\nMissing values:\n", df.isnull().sum()) |
| | df.dtypes |
| |
|
| | indicators = df.columns.difference(['country_name', 'country_id', 'year']) |
| | df_clean = df.dropna(subset=indicators, how='all') |
| |
|
| | top_countries = df_clean.groupby('country_name')['GDP (Current USD)'].mean().nlargest(10).index |
| | gdp_plot = df_clean[df_clean['country_name'].isin(top_countries)] |
| |
|
| | plt.figure(figsize=(12, 6)) |
| | sns.lineplot(data=gdp_plot, x='year', y='GDP (Current USD)', hue='country_name') |
| | plt.title('GDP Trends (Top 10 Countries by Avg GDP)') |
| | plt.ylabel('GDP in USD') |
| | plt.xticks(rotation=45) |
| | plt.grid(True) |
| | plt.tight_layout() |
| | plt.show() |
| |
|
| | numeric_df = df_clean.select_dtypes(include=['number']).drop(columns=['year']) |
| | plt.figure(figsize=(10, 8)) |
| | sns.heatmap(numeric_df.corr(), annot=True, cmap='coolwarm', fmt='.2f') |
| | plt.title('Correlation Between Economic Indicators') |
| | plt.show() |
| |
|
| | inflation_2020 = df_clean[df_clean['year'] == 2020] |
| | plt.figure(figsize=(12, 5)) |
| | sns.histplot(inflation_2020['Inflation (CPI %)'].dropna(), bins=30, kde=True, color='orange') |
| | plt.title('Inflation Rate Distribution - 2020') |
| | plt.xlabel('Inflation (CPI %)') |
| | plt.grid(True) |
| | plt.show() |