A demonstration of how the outputs of Bayesian analysis can be used to simulate business processes while preserving inherent uncertainties.
One of the advantages of doing statistical analysis in a Bayesian framework is that its generative nature makes it a natural fit for business process simulation that incorporates all the uncertainties inherent in the statistical models we use to capture the patterns of interest.
Once the parameters of the models have been estimated, their corresponding posterior distributions can be easily sampled and used in combination with a range of input values to simulate the expected outcomes, including the associated uncertainty that needs to be taken into account when making decisions.
Imagine, for example, that as a CHRO you want to estimate the number of potential new employees brought in by employees who choose to participate in a new referral program. Fortunately, you have data from a three-month pilot of this program in which you offered participation to a small random sample of employees. Using a combination of simple Binomial and Poisson models, you can easily arrive at a reasonable estimate of the outcome of interest when you introduce the program to a larger portion of the company.
Let's implement this simple illustrative example with PyMC, a probabilistic programming library for Python that allows users to build Bayesian models with a simple Python API and fit them using Markov chain Monte Carlo (MCMC) methods.
First, let's load the data from the pilot program. The first table includes 150 employees who were randomly selected and offered participation in the pilot program. The second table then shows the 42 employees who chose to participate in the program and the number of potential new employees they brought in.
import pandas as pd

# table with all pilot nominees
nominees = pd.read_excel("./dataBayesSim.xlsx", sheet_name="nominees")

# table with all pilot participants
participants = pd.read_excel("./dataBayesSim.xlsx", sheet_name="participants")

# showing first few rows of the tables
nominees.head(5)
employeeID participation
0 e1 0
1 e2 0
2 e3 0
3 e4 0
4 e5 0
participants.head(5)
employeeID referrals
0 e7 2
1 e9 4
2 e10 2
3 e11 2
4 e25 1
To estimate the expected number of potential new employees after introducing the referral program to a larger part of the company, we want to model two things: the probability that nominees actually participate in the program, and the expected number of potential candidates that each participant brings in. To do this, we can fit Binomial and Poisson models to the data, respectively. As mentioned above, we will do this in a Bayesian framework, which will make it easier to deal with uncertainty later in our simulation. A side note: for the sake of brevity, I omit the usual sanity checks that should be performed before drawing any conclusions from fitted models, e.g., checking the convergence of the Markov chains or running posterior predictive checks of how well the fitted models predict the observed data.
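For reference, here is a plain sketch of the generative structure assumed by the two models and reused in the simulation further below (N is the number of employees offered participation in the pilot, and N_rollout denotes the size of the target population; the priors are the ones used in the code):

p ~ Beta(1, 1)
participated ~ Binomial(N, p)
lambda ~ Exponential(1/3)
referrals_i ~ Poisson(lambda), for each participant i
expected referrals after rollout ≈ N_rollout * p * lambda

The Beta(1, 1) prior is flat over the participation probability, while the Exponential(1/3) prior weakly concentrates around a mean of 3 referrals per participant.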
Let's start with the first model. From the summary below, we see that the estimated probability of participating in the program lies between 0.22 and 0.35 (94% HDI).
import pymc as pm

# estimating the participation rate
nominated = nominees.shape[0]
participated = nominees['participation'].sum()

# setting up the model
with pm.Model() as participationModel:

    # assigning a flat Beta prior for p
    p = pm.Beta("p", alpha=1, beta=1)

    # defining likelihood
    obs = pm.Binomial("obs", p=p, n=nominated, observed=participated)

    # running mcmc
    idata = pm.sample(3000, tune=500, chains=3, cores=1)

    # generating posterior predictive sample
    participationModelPosterior = pm.sample_posterior_predictive(idata, extend_inferencedata=True)
import arviz as az
# trace plot showing the evolution of parameter vector over the iterations of Markov chain(s)
#az.plot_trace(idata, kind="trace", divergences="bottom", show=True)
# posterior predictive check
#az.plot_ppc(participationModelPosterior, num_pp_samples=500, random_seed=7, alpha=0.3, textsize=14, kind='kde', show=True)
# tabular and visual summary of the posterior probability distribution of the p parameter value
az.summary(idata).round(2)
mean sd hdi_3% hdi_97% mcse_mean mcse_sd ess_bulk ess_tail r_hat
p 0.28 0.04 0.22 0.35 0.0 0.0 4338.0 6229.0 1.0
az.plot_posterior(idata, hdi_prob=.95, show=True)
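As a side note, if you want the credible interval as numbers rather than reading it off the summary table or the plot, ArviZ can compute the highest density interval directly from the posterior samples; here is a minimal example using the same 95% probability mass as the plot above:

# 95% highest density interval for the participation probability p
az.hdi(idata, hdi_prob=0.95)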
The second model then suggests that program participants brought in an average of 1.7 to 2.5 referrals.
# setting up the Poisson model
with pm.Model() as referralModel:

    # weakly informative exponential prior for lambda parameter with mean 3
    lambda_ = pm.Exponential('lambda', 1/3)
    # alternative flat prior for lambda parameter
    #lambda_ = pm.Uniform('lambda', lower=0, upper=25)

    # Poisson likelihood
    y_obs = pm.Poisson('y_obs', mu=lambda_, observed=participants['referrals'])

    # running mcmc
    trace = pm.sample(3000, tune=500, chains=3, cores=1)

    # generating posterior predictive sample
    referralModelPosterior = pm.sample_posterior_predictive(trace, extend_inferencedata=True)
# trace plot showing the evolution of parameter vector over the iterations of Markov chain(s)
#az.plot_trace(trace, kind="trace", divergences="bottom", show=True)
# posterior predictive check
#az.plot_ppc(referralModelPosterior, num_pp_samples=500, random_seed=7, alpha=0.3, textsize=14, kind='kde', show=True)
# tabular and visual summary of the posterior probability distribution of the lambda parameter value
az.summary(trace).round(2)
mean sd hdi_3% hdi_97% ... mcse_sd ess_bulk ess_tail r_hat
lambda 2.1 0.22 1.69 2.51 ... 0.0 3676.0 6056.0 1.0
[1 rows x 9 columns]
az.plot_posterior(trace, hdi_prob=.95, show=True)
We can now sample the posterior distributions of the parameters p and lambda, insert them into a dataframe, and for each row (i.e., each sampled combination of parameter values) calculate the expected number of referrals brought in by participating employees when the program is rolled out to the entire population of 1500 employees. As you can see below, using the IQR, our CHRO can expect recruiters to reach roughly 790 to 990 potential candidates once the new company-wide referral program is in place.
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns

sns.set_theme(style="white")

# sampling the parameters p and lambda from their posterior distributions
posterior = pd.DataFrame({
    'p': idata['posterior']['p'].values.flatten(),
    'lambda': trace['posterior']['lambda'].values.flatten()
})

# computing expected number of referrals with 1500 nominees
posterior['expectedReferrals'] = 1500*posterior['p']*posterior['lambda']

# computing summary statistics
m = posterior['expectedReferrals'].mean().round(1)
Q1 = np.percentile(posterior['expectedReferrals'], 25).round(1)
Q2 = np.percentile(posterior['expectedReferrals'], 50).round(1)
Q3 = np.percentile(posterior['expectedReferrals'], 75).round(1)

# visualizing results
sns.histplot(posterior['expectedReferrals'], bins=30, kde=True, color='#5b7db6').set(xlabel="Number of new referrals", ylabel="Count")
plt.gcf().suptitle('Expected referrals for program rollout to all 1500 employees', fontsize=13)
plt.gca().set_title(f'Mean={m}, Q1={Q1}, Median={Q2}, Q3={Q3}', fontsize=10)
plt.show()
And it doesn't have to end there. This estimate can be combined with other inputs, such as the cost of the new referral program or the cost of an alternative sourcing solution, to make a better-informed decision that takes the existing uncertainty into account.
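As a minimal sketch of what this could look like, the snippet below combines the simulated posterior of expected referrals with purely hypothetical cost figures (the per-candidate costs and the fixed rollout cost are illustrative placeholders, not values from the pilot) and asks how likely the program is to pay off compared to an alternative sourcing channel:

# hypothetical cost assumptions (illustrative placeholders, not estimated from the data)
referralCostPerCandidate = 300   # assumed cost of sourcing one candidate via the referral program
agencyCostPerCandidate = 800     # assumed cost of sourcing a comparable candidate externally
programFixedCost = 100000        # assumed one-off cost of the company-wide rollout

# propagating the posterior uncertainty of expected referrals into the cost comparison
posterior['expectedSavings'] = (
    posterior['expectedReferrals'] * (agencyCostPerCandidate - referralCostPerCandidate)
    - programFixedCost
)

# probability that the program pays off under these assumptions
probPositive = (posterior['expectedSavings'] > 0).mean().round(2)
print(f"P(program saves money) = {probPositive}")
print(posterior['expectedSavings'].describe().round(1))

Because the comparison is computed on every posterior draw, the resulting probability and the spread of the savings distribution carry the same parameter uncertainty as the referral estimate itself.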