import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns

# Global plot styling. The matplotlib style sheet is applied first and the
# seaborn palette second; keep this order, since each call may touch the
# default colour cycle.
plt.style.use('seaborn-v0_8')
sns.set_palette("husl")
# IPython/Jupyter magics (not plain Python; they only work inside a notebook
# kernel): select the inline backend and request 'retina' figure output.
%matplotlib inline
%config InlineBackend.figure_format = 'retina'

# Read the raw export. skiprows=1 drops the first physical line of the file
# before parsing (NOTE(review): presumably a title line above the real header
# row -- confirm against the CSV).
source_csv = "datasets/ahb_2023.csv"
df = pd.read_csv(source_csv, skiprows=1)

# Report the size of the frame, then preview its first five rows. The preview
# must stay the last expression so the notebook renders it.
loaded_shape = df.shape
print("Dataset Shape:", loaded_shape)
print("\nFirst few rows:")
df.head(5)

Dataset Shape: (11, 9)

First few rows:

# Keep only the first seven rows of the raw frame as an independent frame with
# a fresh 0..6 index (NOTE(review): the remaining rows are presumably notes or
# footers -- confirm), then give the nine columns short, code-friendly names.
year_columns = ['2017', '2018', '2019', '2020', '2021', '2022']
df_clean = df.head(7).reset_index(drop=True)
df_clean.columns = ['sl_no', 'indicators', *year_columns, 'source']

print("Cleaned Data Shape:", df_clean.shape)
# Last expression of the cell: rendered as a table by the notebook.
df_clean

Cleaned Data Shape: (7, 9)

def extract_values(text):
    """Split a raw cell such as ``"345\\n [4.3]"`` into count and density text.

    The text before the first ``[`` is the count. The text between the first
    and the second ``[`` (with every ``]`` removed) is the density. Both
    pieces are whitespace-stripped strings; no numeric conversion happens
    here.

    Args:
        text: Raw cell value. Any non-missing value is converted with ``str``.

    Returns:
        A ``(count, density)`` tuple. Both items are ``np.nan`` when ``text``
        is missing; ``density`` alone is ``np.nan`` when the cell contains no
        ``[``.
    """
    if pd.isna(text):
        return np.nan, np.nan

    pieces = str(text).split('[')
    count = pieces[0].strip()
    # str.split always yields at least one piece; exactly one means no '['.
    if len(pieces) == 1:
        return count, np.nan
    return count, pieces[1].replace(']', '').strip()
# Columns whose cells hold combined "count [density]" text.
years = ['2017', '2018', '2019', '2020', '2021', '2022']

for year in years:
    count_col, density_col = f'{year}_count', f'{year}_density'
    # One (count, density) pair per row; column 0 is the count text and
    # column 1 the density text.
    parsed = pd.DataFrame(
        [extract_values(cell) for cell in df_clean[year]],
        index=df_clean.index,
    )
    # errors='coerce' turns anything that is not a number into NaN.
    df_clean[count_col] = pd.to_numeric(parsed[0], errors='coerce')
    df_clean[density_col] = pd.to_numeric(parsed[1], errors='coerce')

print("Transformed Data Columns:")
print(df_clean.columns.tolist())

# Preview: indicator name, then all count columns, then all density columns.
count_cols = [f'{year}_count' for year in years]
density_cols = [f'{year}_density' for year in years]
df_clean[['indicators', *count_cols, *density_cols]].head()

Transformed Data Columns:
['sl_no', 'indicators', '2017', '2018', '2019', '2020', '2021', '2022', 'source', '2017_count', '2017_density', '2018_count', '2018_density', '2019_count', '2019_density', '2020_count', '2020_density', '2021_count', '2021_density', '2022_count', '2022_density']

# Line chart: one line per row of df_clean, showing its density for each year.
plt.figure(figsize=(14, 8))

indicators = df_clean['indicators'].tolist()
colors = plt.cm.Set3(np.linspace(0, 1, len(indicators)))

# Read the density values positionally so the plot does not depend on the
# frame's index labels being exactly 0..n-1.
density_rows = df_clean[[f'{year}_density' for year in years]].to_numpy()
max_label_len = 30

for indicator, densities, color in zip(indicators, density_rows, colors):
    # Legend label: the indicator text before its first '(' with surrounding
    # whitespace removed. An ellipsis is added only when the name really was
    # cut, so short names are not shown as if they had been truncated.
    name = str(indicator).split('(')[0].strip()
    if len(name) > max_label_len:
        name = name[:max_label_len].rstrip() + '...'
    plt.plot(years, densities, marker='o', linewidth=2.5, markersize=6,
             label=name, color=color)

plt.title('Healthcare Workforce Density Trends (2017-2022)\nPer 10,000 Population', 
          fontsize=16, fontweight='bold', pad=20)
plt.xlabel('Year', fontsize=12)
plt.ylabel('Density (per 10,000 population)', fontsize=12)
# Legend is anchored outside the axes, to the right of the plot area.
plt.legend(bbox_to_anchor=(1.05, 1), loc='upper left', fontsize=9)
plt.grid(True, alpha=0.3)
plt.xticks(rotation=45)
plt.tight_layout()
plt.show()

# Horizontal bar chart of the 2022 density, one bar per row of df_clean.
plt.figure(figsize=(12, 8))

# Bar labels: indicator text before its first '(', trimmed to 25 characters.
short_labels = [name.split('(')[0].strip()[:25] for name in df_clean['indicators']]
densities_2022 = df_clean['2022_density'].tolist()
bar_colors = plt.cm.viridis(np.linspace(0, 1, len(short_labels)))

bars = plt.barh(short_labels, densities_2022, color=bar_colors)
plt.title('Healthcare Workforce Density in 2022\n(Per 10,000 Population)', 
          fontsize=16, fontweight='bold', pad=20)
plt.xlabel('Density (per 10,000 population)', fontsize=12)

# Write each bar's value just past its right-hand end, vertically centred.
for bar in bars:
    value = bar.get_width()
    y_centre = bar.get_y() + bar.get_height()/2
    plt.text(value + 0.1, y_centre, f'{value:.2f}',
             ha='left', va='center', fontweight='bold')

plt.tight_layout()
plt.show()

# Stacked area chart of the yearly counts, one layer per row of df_clean.
# NOTE(review): every row is stacked, including any indicator that is not a
# staff count (the preview output shows a health-facilities row) -- confirm
# that this is intended for a "Number of Healthcare Workers" axis.
plt.figure(figsize=(14, 8))

# Rows are indicators, columns are years.
count_columns = [f'{year}_count' for year in years]
workforce_data = df_clean[count_columns].to_numpy()

# Layer labels: indicator text before its first '(', trimmed to 20 characters.
short_labels = [name.split('(')[0].strip()[:20] for name in df_clean['indicators']]

plt.stackplot(years, workforce_data, labels=short_labels, alpha=0.8)
plt.title('Composition of Healthcare Workforce Over Time', fontsize=16, fontweight='bold', pad=20)
plt.xlabel('Year', fontsize=12)
plt.ylabel('Number of Healthcare Workers', fontsize=12)
# Legend is anchored outside the axes, to the right of the plot area.
plt.legend(bbox_to_anchor=(1.05, 1), loc='upper left', fontsize=9)
plt.grid(True, alpha=0.3)
plt.xticks(rotation=45)
plt.tight_layout()
plt.show()

# Heatmap of density values: one row per indicator, one column per year.
plt.figure(figsize=(12, 8))

density_columns = [f'{year}_density' for year in years]
density_matrix = df_clean[density_columns].to_numpy()

# Row labels: indicator text before its first '(', trimmed to 25 characters.
short_labels = [name.split('(')[0].strip()[:25] for name in df_clean['indicators']]

# Each cell is annotated with its value to two decimals.
heatmap_options = dict(
    xticklabels=years,
    yticklabels=short_labels,
    annot=True,
    fmt='.2f',
    cmap='YlOrRd',
    cbar_kws={'label': 'Density (per 10,000)'},
)
sns.heatmap(density_matrix, **heatmap_options)

plt.title('Healthcare Workforce Density Heatmap (2017-2022)', 
          fontsize=16, fontweight='bold', pad=20)
plt.xlabel('Year', fontsize=12)
plt.ylabel('Healthcare Workforce Category', fontsize=12)
plt.tight_layout()
plt.show()

# Horizontal bar chart of the relative change in density from 2017 to 2022.
plt.figure(figsize=(12, 8))

# Percentage change per row. When the 2017 density is not greater than zero
# (this also covers a missing value, because a comparison with NaN is False)
# the change is recorded as 0.
percentage_changes = [
    ((latest - baseline) / baseline) * 100 if baseline > 0 else 0
    for baseline, latest in zip(df_clean['2017_density'], df_clean['2022_density'])
]

# Bar labels: indicator text before its first '(', trimmed to 25 characters.
short_labels = [name.split('(')[0].strip()[:25] for name in df_clean['indicators']]
# Green for increases (and no change), red for decreases.
colors = ['green' if change >= 0 else 'red' for change in percentage_changes]

bars = plt.barh(short_labels, percentage_changes, color=colors, alpha=0.7)
plt.title('Percentage Change in Workforce Density (2022 vs 2017)', 
          fontsize=16, fontweight='bold', pad=20)
plt.xlabel('Percentage Change (%)', fontsize=12)
plt.axvline(x=0, color='black', linestyle='-', alpha=0.3)

# Value labels sit to the right of non-negative bars and to the left of
# negative ones.
for bar in bars:
    width = bar.get_width()
    grows = width >= 0
    x_text = width + (1 if grows else -5)
    y_text = bar.get_y() + bar.get_height()/2
    plt.text(x_text, y_text, f'{width:.1f}%',
             ha='left' if grows else 'right',
             va='center', fontweight='bold')

plt.tight_layout()
plt.show()

	sl.no	Indicators	2017	2018	2019	2020	2021	2022	Source
0	1.0	Number of Doctors and density (per 10,000 popu...	345\n [4.3]	337\n [4.6]	318\n [4.32]	336\n[4.62]	354\n[4.64]	354\n[4.64]	HRM, MoH
1	2.0	Number of Nurses and density (per 10,000 popul...	1264 [16.2]	1202 [16.5]	1364 [18.6]	1517\n[20.9]	1608\n[21.07]	1505\n[19.71]	HRM, MoH
2	3.0	Number of Pharmacists and density (per 10,000 ...	36\n [0.5]	44\n [0.6]	43 \n[0.6]	42\n[0.6]	46\n[0.6]	45\n[0.6]	HRM, MoH
3	4.0	Number HA,CO and BHW [density (per 10,000 popu...	636\n [8.1]	604 \n[8.3]	620 \n[8.4]	650\n[8.9]	683\n[8.95]	672\n[8.80]	HRM, MoH
4	5.0	Number of Drungtshos (Indigenous Physicians) a...	55\n [0.7]	53\n [0.7]	54 \n[0.7]	52\n[0.7]	59\n[0.77]	79\n[1.03]	HRM, MoH

	sl_no	indicators	2017	2018	2019	2020	2021	2022	source
0	1.0	Number of Doctors and density (per 10,000 popu...	345\n [4.3]	337\n [4.6]	318\n [4.32]	336\n[4.62]	354\n[4.64]	354\n[4.64]	HRM, MoH
1	2.0	Number of Nurses and density (per 10,000 popul...	1264 [16.2]	1202 [16.5]	1364 [18.6]	1517\n[20.9]	1608\n[21.07]	1505\n[19.71]	HRM, MoH
2	3.0	Number of Pharmacists and density (per 10,000 ...	36\n [0.5]	44\n [0.6]	43 \n[0.6]	42\n[0.6]	46\n[0.6]	45\n[0.6]	HRM, MoH
3	4.0	Number HA,CO and BHW [density (per 10,000 popu...	636\n [8.1]	604 \n[8.3]	620 \n[8.4]	650\n[8.9]	683\n[8.95]	672\n[8.80]	HRM, MoH
4	5.0	Number of Drungtshos (Indigenous Physicians) a...	55\n [0.7]	53\n [0.7]	54 \n[0.7]	52\n[0.7]	59\n[0.77]	79\n[1.03]	HRM, MoH
5	6.0	Number of sMenpas (Sowa Menpas) and density (p...	113 \n[1.4]	113 \n[1.5]	116 \n[1.6]	137\n[1.9]	146\n[1.9]	175\n[2.29]	HRM, MoH
6	7.0	Number and distribution of health facilities (...	276\n [3.6]	279 \n[3.8]	288\n [3.9]	289\n[4.0]	289\n[3.85]	291\n[3.81]	HMIS, MoH

	indicators	2017_count	2018_count	2019_count	2020_count	2021_count	2022_count	2017_density	2018_density	2019_density	2020_density	2021_density	2022_density
0	Number of Doctors and density (per 10,000 popu...	345	337	318	336	354	354	4.3	4.6	4.32	4.62	4.64	4.64
1	Number of Nurses and density (per 10,000 popul...	1264	1202	1364	1517	1608	1505	16.2	16.5	18.60	20.90	21.07	19.71
2	Number of Pharmacists and density (per 10,000 ...	36	44	43	42	46	45	0.5	0.6	0.60	0.60	0.60	0.60
3	Number HA,CO and BHW [density (per 10,000 popu...	636	604	620	650	683	672	8.1	8.3	8.40	8.90	8.95	8.80
4	Number of Drungtshos (Indigenous Physicians) a...	55	53	54	52	59	79	0.7	0.7	0.70	0.70	0.77	1.03

Findings from heat map (Key Findings & Trends)

Ratios (2022 data)

Code Explanation for me to understand

Why use these?