Health-Economic-Analysis-CEA-PSA/cost_effectiveness_analysis_PSA.py at main · bcm9/Health-Economic-Analysis-CEA-PSA · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
"""
Health Economic Analysis: Cost-Effectiveness Analysis (CEA) with Probabilistic Sensitivity Analysis (PSA)

Script compares two different interventions, calculating the total cost, health outcomes (in QALYs), and the incremental cost-effectiveness ratio (ICER).

1. Calculate the total cost of each intervention, including costs associated with treatment, outpatient visits, and tests.
2. Compute the cost-effectiveness in terms of cost per QALY for each intervention.
3. Discount future costs and QALYs to their present values using a standard discount rate, reflecting the time value of money and societal preferences for current consumption.
4. Compute the Incremental Cost-Effectiveness Ratio (ICER) to determine the cost per additional QALY gained when one intervention is used instead of the other.
5. Perform a PSA by running simulations with random sampling from specified distributions for costs and QALYs. This accounts for uncertainty in model parameters, providing a more robust analysis of cost-effectiveness.

"""
import pandas as pd
import numpy as np
import seaborn as sns
import matplotlib.pyplot as plt

######################################################################################################################################################
# Define key financial and health-related variables for interventions
######################################################################################################################################################
cost_intervention_A = 10000  # Base cost in GBP for standard intervention
cost_intervention_B = 15000  # Base cost in GBP for new intervention

qaly_intervention_A = 2 # Quality-Adjusted Life Years for A
qaly_intervention_B = 2.5  # Quality-Adjusted Life Years for B

# Hypothetical costs in GBP for additional health care utilisation
cost_per_outpatient_visit = 0
cost_per_test = 0

# Quantity of additional health care utilisation for each intervention
number_of_visits_A = 0
number_of_tests_A = 0
number_of_visits_B = 0
number_of_tests_B = 0

# Parameters for discounting future costs and QALYs to their present values
discount_rate = 0.035  # Discount rate according to NICE guidelines is 3.5%
years = 5             # Time horizon for the analysis

# Willingness to pay threshold
wtp = 20000  # £20,000 per QALY

# Distributions for PSA, mean, standard deviation set as 20% of mean
n_simulations=1000

# Proportional SDs for costs and QALYs based on typical variability
cost_sd = 0.05  # 5% of mean for costs
qaly_sd = 0.01  # 1% of mean for QALYs

cost_intervention_A_dist = np.random.normal(cost_intervention_A, cost_intervention_A * cost_sd, n_simulations)
cost_intervention_B_dist = np.random.normal(cost_intervention_B, cost_intervention_B * cost_sd, n_simulations)
qaly_intervention_A_dist = np.random.normal(qaly_intervention_A, qaly_intervention_A * qaly_sd, n_simulations)
qaly_intervention_B_dist = np.random.normal(qaly_intervention_B, qaly_intervention_B * qaly_sd, n_simulations)

# Plot distributions
# Create a 1x2 panel plot
fig, axes = plt.subplots(1, 2, figsize=(14, 6))
plt.rcParams['font.family'] = 'Calibri'
# Plot costs
fs=20
sns.histplot(cost_intervention_A_dist, kde=True, color="#ADD8E6", label="Intervention A", ax=axes[0],alpha=0.5)
sns.histplot(cost_intervention_B_dist, kde=True, color="#90EE90", label="Intervention B", ax=axes[0],alpha=0.5)
axes[0].set_title('Cost Distribution', fontsize=fs, fontweight='bold')
axes[0].set_xlabel('Cost (£)', fontsize=fs, fontweight='bold')
axes[0].set_ylabel('Frequency', fontsize=fs, fontweight='bold')
axes[0].tick_params(axis='both', which='major', labelsize=14)
axes[0].legend(frameon=False, framealpha=0.1)
axes[0].grid(True, linestyle='--', alpha=0.2)
# Plot QALYs
sns.histplot(qaly_intervention_A_dist, kde=True, color="#ADD8E6", label="Intervention A", ax=axes[1],alpha=0.5)
sns.histplot(qaly_intervention_B_dist, kde=True, color="#90EE90", label="Intervention B", ax=axes[1],alpha=0.5)
axes[1].set_title('QALY Distribution', fontsize=fs, fontweight='bold')
axes[1].set_xlabel('QALYs', fontsize=fs, fontweight='bold')
axes[1].set_ylabel('', fontsize=fs, fontweight='bold')
axes[1].tick_params(axis='both', which='major', labelsize=14)
axes[1].grid(True, linestyle='--', alpha=0.2)
plt.tight_layout()
# Save the figure
save_folder = 'C:/Users/bc22/OneDrive/Documents/code/HE_code/Cost effectiveness analysis/'
plt.savefig(save_folder + 'CE_PSA_kde.png', dpi=300, bbox_inches='tight')
plt.show()

######################################################################################################################################################
# Function definitions
######################################################################################################################################################
# Calculate the total cost of an intervention by summing base costs, and costs from outpatient visits and tests.
def total_cost(base_cost, visits, visit_cost, tests, test_cost):
    return base_cost + (visits * visit_cost) + (tests * test_cost)

# Discounting function
def discount_value(value, rate, years):
    return value / ((1 + rate) ** years)

# Calculate the cost per QALY
def calculate_cost_per_qaly(cost, qaly):
    if qaly == 0:
        return float('inf')  # Avoid division by zero; assume infinite cost effectiveness
    return cost / qaly

# Calculate ICER based on QALYs
# An ICER shows the extra costs divided by the extra benefit when comparing two treatments or interventions.
# It shows how much more you have to spend to gain an additional unit of health benefit (like one extra healthy year, QALY).
# This makes it easier to decide if the extra cost is worth the extra benefit.
def calculate_icer(cost1, cost2, qaly1, qaly2):
    """Calculates the Incremental Cost-Effectiveness Ratio (ICER) between two interventions."""
    delta_cost = abs(cost2 - cost1)
    delta_qaly = qaly2 - qaly1
    if delta_qaly == 0:
        return float('inf')  # Prevent division by zero
    return delta_cost / delta_qaly

######################################################################################################################################################
# Run PSA simulations
#####################################################################################################################################################
results = []
for i in range(n_simulations):
    # Draw random values from distributions
    cost_A = np.random.choice(cost_intervention_A_dist)
    cost_B = np.random.choice(cost_intervention_B_dist)
    qaly_A = np.random.choice(qaly_intervention_A_dist)
    qaly_B = np.random.choice(qaly_intervention_B_dist)

    # Calculate total costs
    total_cost_A = total_cost(cost_A, number_of_visits_A, cost_per_outpatient_visit, number_of_tests_A, cost_per_test)
    total_cost_B = total_cost(cost_B, number_of_visits_B, cost_per_outpatient_visit, number_of_tests_B, cost_per_test)

    # Apply discounting
    discounted_cost_A = discount_value(total_cost_A, discount_rate, years)
    discounted_cost_B = discount_value(total_cost_B, discount_rate, years)

    # Calculate cost per QALY
    cost_per_qaly_A = calculate_cost_per_qaly(discounted_cost_A, qaly_A)
    cost_per_qaly_B = calculate_cost_per_qaly(discounted_cost_B, qaly_B)

    # Calculate ICER
    icer = calculate_icer(discounted_cost_A, discounted_cost_B, qaly_A, qaly_B)

    # Results is list of output of simulations
    results.append((discounted_cost_A, discounted_cost_B, qaly_A, qaly_B, icer))

######################################################################################################################################################
# Convert results to a DataFrame
#####################################################################################################################################################
PSA_results = pd.DataFrame(results, columns=['Discounted Cost A', 'Discounted Cost B', 'QALY A', 'QALY B', 'ICER'])

######################################################################################################################################################
# Print summary statistics
#####################################################################################################################################################
print(PSA_results.describe())

######################################################################################################################################################
# Plot results with CEA plane
#####################################################################################################################################################
delta_cost = PSA_results['Discounted Cost B'] - PSA_results['Discounted Cost A']
delta_qaly = PSA_results['QALY B'] - PSA_results['QALY A']

# Calculate the mean ICER across all simulations. Can be volatile due to the influence of extreme values, especially when QALY differences are small.
mean_icer = PSA_results['ICER'].mean()
# Stable mean ICER provides a more stable and central estimate.
mean_icer_stable = delta_cost.mean() / delta_qaly.mean()

plt.figure(figsize=(7, 6))
plt.rcParams['font.family'] = 'Calibri'
plt.scatter(delta_qaly, delta_cost, color='#3498db', label='PSA results', zorder=5, s=50, alpha=0.7, edgecolors='k')
plt.axhline(0, color='black', linestyle='-')  # Horizontal zero line
plt.axvline(0, color='black', linestyle='-')  # Vertical zero line

# Plot WTP threshold
x_values = [min(-5, -max(delta_qaly) * 1.2), max(5, max(delta_qaly) * 1.2)]
y_values = [x * wtp for x in x_values]
plt.plot(x_values, y_values, color='#d62728', linestyle=':', label=f'WTP £{wtp:,.0f}/QALY')

# Formatting plot
plt.xlim(-abs(max(delta_qaly)) * 1.2, abs(max(delta_qaly)) * 1.2)
# plt.ylim(-abs(max(delta_cost)) * 1.2, abs(max(delta_cost)) * 1.2)
plt.ylim(-30000, 30000)
plt.xticks(fontsize=14)
plt.yticks(fontsize=14)
plt.xlabel(r'$\Delta$ QALYs', fontsize=fs, fontweight='bold')
plt.ylabel(r'$\Delta$ Cost (£)', fontsize=fs, fontweight='bold')
plt.title(f'Cost-Effectiveness Plane (Mean ICER: £{mean_icer_stable:,.0f}/QALY)', fontsize=fs-3, fontweight='bold')
plt.legend(loc='upper left', fontsize=12, frameon=False, framealpha=0.1)
plt.grid(True, linestyle='--', alpha=0.2)
# Save the figure
plt.savefig(save_folder + 'CE_plane_PSA.png', dpi=300, bbox_inches='tight')
plt.show()

#################################################################################################################################################################
# Summarise the results in a DataFrame
#################################################################################################################################################################
df_summary = pd.DataFrame({
    'Mean Discounted Cost': [PSA_results['Discounted Cost A'].mean(), PSA_results['Discounted Cost B'].mean()],
    'Mean QALYs': [PSA_results['QALY A'].mean(), PSA_results['QALY B'].mean()],
    'Mean Incremental Cost': [delta_cost.mean(), None],
    'Mean Incremental QALY': [delta_qaly.mean(), None],
    'Mean ICER': [mean_icer_stable, None]
}, index=['Intervention A', 'Intervention B'])

print(df_summary)

######################################################################################################################################################
# Calculate Jackknife 95% CI
#####################################################################################################################################################
# Define a function to calculate the mean ICER excluding each observation
def jackknife_mean(df, column):
    n = len(df)
    jackknife_means = []
    for i in range(n):
        # Exclude the ith observation and calculate the mean
        jackknife_sample = df.drop(index=i)
        jackknife_mean = jackknife_sample[column].mean()
        jackknife_means.append(jackknife_mean)
    return np.array(jackknife_means)

# Calculate the jackknife mean ICERs
jackknife_means = jackknife_mean(PSA_results, 'ICER')

# If ICER is negative, make jk means negative as such
if mean_icer_stable < 0:
    jackknife_means=-abs(jackknife_means)

# Calculate the jackknife estimate of variance
n = len(PSA_results)
jackknife_variance = (n - 1) / n * np.sum((jackknife_means - mean_icer_stable) ** 2)

# Calculate the standard error
jackknife_se = np.sqrt(jackknife_variance)

# Calculate the 95% CI
confidence_level = 0.95
z_score = 1.96  # For 95% confidence interval

lower_bound = mean_icer_stable - z_score * jackknife_se
upper_bound = mean_icer_stable + z_score * jackknife_se

print(f"95% Jackknife CI for the Mean ICER: (£{lower_bound:.2f}, £{upper_bound:.2f})")