Could you share some of the code that you’ve used to regularize the betas? I am interested in this approach.
This is the stan model:
functions {
vector seeiittd(real time,
vector state,
vector params,
real beta_left_t,
real beta_left,
real grad_beta,
real population) {
real nu = params[1];
real gamma = params[2];
real kappa = params[3];
real omega = params[4];
// Unpack state
real S = state[1];
real E1 = state[2];
real E2 = state[3];
real I1 = state[4];
real I2 = state[5];
real T1 = state[6];
real T2 = state[7];
real D = state[8];
real infection_rate;
real nuE1 = nu * E1;
real nuE2 = nu * E2;
real gammaI1 = gamma * I1;
real gammaI2 = gamma * I2;
real kappaT1 = kappa * T1;
real kappaT2 = kappa * T2;
real dS_dt;
real dE1_dt;
real dE2_dt;
real dI1_dt;
real dI2_dt;
real dT1_dt;
real dT2_dt;
real dD_dt;
real beta = grad_beta * (time - beta_left_t) + beta_left;
infection_rate = beta * (I1 + I2) * S / population;
dS_dt = -infection_rate;
dE1_dt = infection_rate - nuE1;
dE2_dt = nuE1 - nuE2;
dI1_dt = nuE2 - gammaI1;
dI2_dt = gammaI1 - gammaI2;
dT1_dt = gammaI2 * omega - kappaT1;
dT2_dt = kappaT1 - kappaT2;
dD_dt = kappaT2;
return [dS_dt, dE1_dt, dE2_dt, dI1_dt, dI2_dt, dT1_dt, dT2_dt, dD_dt]';
}
// https://github.com/spinkney/helpful_stan_functions/blob/main/functions/ode/odeint_rk4.stan
vector[] odeint_rk4(real t0, vector y0, real hh, int num_steps, int num_sub_steps,
vector params, vector beta_left_t, vector beta_right_t,
vector beta_left, vector grad_beta, real population
){
int d = num_elements(y0);
vector[d] y[num_steps+1];
vector[d] k1; vector[d] k2; vector[d] k3; vector[d] k4;
real t = t0;
int k = 1;
real h = hh/num_sub_steps;
y[1] = y0;
// Integrate at grid of time points
for(i in 1:num_steps){
y[i+1] = y[i];
for(j in 1:num_sub_steps){
if (t >= beta_right_t[k])
k += 1;
k1 = h * seeiittd(t , y[i+1] , params, beta_left_t[k], beta_left[k], grad_beta[k], population);
k2 = h * seeiittd(t + 0.5 * h, y[i+1] + 0.5 * k1, params, beta_left_t[k], beta_left[k], grad_beta[k], population);
k3 = h * seeiittd(t + 0.5 * h, y[i+1] + 0.5 * k2, params, beta_left_t[k], beta_left[k], grad_beta[k], population);
k4 = h * seeiittd(t + h , y[i+1] + k3 , params, beta_left_t[k], beta_left[k], grad_beta[k], population);
y[i+1] = y[i+1] + (k1 + 2.0 * k2 + 2.0 * k3 + k4) / 6.0;
t = t + h;
}
}
return(y);
}
}
data {
real initial_time;
int<lower=1> n_beta_pieces;
vector<lower=0>[n_beta_pieces] beta_left_t;
vector<lower=0>[n_beta_pieces] beta_right_t;
int<lower=1> T;
real times[T];
int<lower=1> n_disease_states;
real<lower=0> population;
int<lower=1> deaths_length;
int<lower=1> deaths_starts[deaths_length];
int<lower=1> deaths_stops[deaths_length];
int<lower=0> deaths[deaths_length];
int real_data_length;
real real_data[real_data_length];
int integer_data_length;
int integer_data[integer_data_length];
int<lower=0, upper=1> compute_likelihood;
int beta_linear_discontinuous;
int beta_linear_continuous;
int beta_constant_discontinuous;
real beta_regularization;
int num_sub_steps;
}
transformed data {
real mu_dL = 4.00;
real sigma_dL = 0.20;
real mu_dI = 3.06;
real sigma_dI = 0.21;
real mu_dT = 16.00;
real sigma_dT = 0.71;
int max_lag = 13;
real h = times[1] - initial_time;
int num_steps = T;
}
parameters {
real<lower=0, upper=1> initial_state_raw[2];
vector<lower=0>[n_beta_pieces] beta_left;
vector<lower=0>[beta_linear_discontinuous ? n_beta_pieces : 0] beta_right;
real<lower=0> dL;
real<lower=0> dI;
real<lower=0> dT;
real<lower=0, upper=1> omega;
real<lower=0> reciprocal_phi_deaths;
vector<lower=0>[beta_regularization < 0 ? 1 : 0] beta_reg;
}
transformed parameters {
vector<lower=0>[n_beta_pieces] dummy_beta_right;
real dummy_beta_reg = beta_regularization < 0 ? beta_reg[1] : beta_regularization;
vector[n_disease_states] initial_state;
vector[n_beta_pieces] grad_beta;
real nu;
real gamma;
real kappa;
real phi_deaths;
vector[n_disease_states] state_estimate[T+1];
vector[T+1] S;
vector[T+1] E1;
vector[T+1] E2;
vector[T+1] I1;
vector[T+1] I2;
vector[T+1] T1;
vector[T+1] T2;
vector[T+1] D;
vector[T] daily_infections;
vector[T] daily_deaths;
vector[T] effective_reproduction_number;
if(beta_linear_discontinuous){
dummy_beta_right = beta_right;
} else if(beta_linear_continuous){
if(n_beta_pieces > 1){
dummy_beta_right[:n_beta_pieces-1] = beta_left[2:];
}
dummy_beta_right[n_beta_pieces] = beta_left[n_beta_pieces];
} else if(beta_constant_discontinuous){
dummy_beta_right = beta_left;
} else{
reject("Select an ansatz!");
}
initial_state[1] = (population-5.0)*initial_state_raw[1] + 1.0;
initial_state[2] = (population-5.0)*(1.0-initial_state_raw[1])*initial_state_raw[2]/2.0 + 1.0;
initial_state[3] = (population-5.0)*(1.0-initial_state_raw[1])*initial_state_raw[2]/2.0 + 1.0;
initial_state[4] = (population-5.0)*(1.0-initial_state_raw[1])*(1.0-initial_state_raw[2])/2.0 + 1.0;
initial_state[5] = (population-5.0)*(1.0-initial_state_raw[1])*(1.0-initial_state_raw[2])/2.0 + 1.0;
initial_state[6] = 0.0;
initial_state[7] = 0.0;
initial_state[8] = 0.0;
grad_beta = (dummy_beta_right - beta_left) ./ (beta_right_t - beta_left_t);
nu = 2.0/dL;
gamma = 2.0/dI;
kappa = 2.0/dT;
phi_deaths = 1.0 / reciprocal_phi_deaths;
{
vector[4] params = [nu, gamma, kappa, omega]';
state_estimate = odeint_rk4(
initial_time, initial_state, h, num_steps, num_sub_steps,
params, beta_left_t, beta_right_t, beta_left, grad_beta, population
);
}
S = to_vector(state_estimate[, 1]);
E1 = to_vector(state_estimate[, 2]);
E2 = to_vector(state_estimate[, 3]);
I1 = to_vector(state_estimate[, 4]);
I2 = to_vector(state_estimate[, 5]);
T1 = to_vector(state_estimate[, 6]);
T2 = to_vector(state_estimate[, 7]);
D = to_vector(state_estimate[, 8]);
daily_infections = S[:T] - S[2:] + machine_precision();
daily_deaths = D[2:] - D[:T] + machine_precision();
{
vector[T+1] I = I1 + I2;
effective_reproduction_number= (daily_infections ./ I[:T])*dI;
}
}
model {
initial_state_raw[1] ~ beta(5.0, 0.5);
initial_state_raw[2] ~ beta(1.1, 1.1);
beta_left ~ normal(0, 0.5);
if(beta_regularization < 0){
dummy_beta_reg ~ lognormal(log(-beta_regularization), 1);
}
if(beta_regularization && n_beta_pieces > 1){
if (beta_linear_discontinuous){
//Not clear what is appropriate here
dummy_beta_right ~ normal(beta_left, dummy_beta_reg);
beta_left[2:] ~ normal(dummy_beta_right[:n_beta_pieces-1], dummy_beta_reg);
}else{
beta_left[2:] ~ normal(beta_left[:n_beta_pieces-1], dummy_beta_reg);
}
}
beta_right ~ normal(0, 0.5);
dL ~ normal(mu_dL, sigma_dL);
dI ~ normal(mu_dI, sigma_dI);
dT ~ normal(mu_dT, sigma_dT);
omega ~ beta(100, 9803);
reciprocal_phi_deaths ~ exponential(5);
if (compute_likelihood == 1) {
for (i in 1:deaths_length) {
target += neg_binomial_2_lpmf(deaths[i] |
sum(daily_deaths[deaths_starts[i]:deaths_stops[i]]), phi_deaths);
}
}
}
generated quantities {
vector[T-1] growth_rate = (log(daily_infections[2:]) - log(daily_infections[:T-1]))*100;
int pred_deaths[deaths_length];
for (i in 1:deaths_length) {
pred_deaths[i] = neg_binomial_2_rng(sum(daily_deaths[deaths_starts[i]:deaths_stops[i]]),
phi_deaths);
}
}
I think the interface is mostly the same as before. I did add some things:
int beta_linear_discontinuous;
int beta_linear_continuous;
int beta_constant_discontinuous;
real beta_regularization;
int num_sub_steps;
- Setting to one either of
beta_linear_discontinuous
,beta_linear_continuous
orbeta_constant_discontinuous
selects the corresponding ansatz forbeta
-
num_sub_steps
lets you perform intermediate rk4 steps. Set to one for the original behavior
For beta_regularization
: there are three behaviors:
-
beta_regularization=0
: no regularization -
beta_regularization>0
: do something likebeta_left[2:] ~ normal(beta_left[:n_beta_pieces-1], dummy_beta_reg);
-
beta_regularization<0
: in addition treat beta_regularization as a log-normally distributed parameter.
However, everything is in serious need of refactoring.
For fitting, specifying metric=‘dense_e’ appears to speed things up and I think inits should be samples from the prior with constant-in-time betas.
Edit: Note that not all combinations appear to work well. Some other reparametrization may be in order.
This is interesting! Thanks! I will try the model with several beta_regularization
values and also with:
beta_linear_discontinuous
beta_linear_continuous
beta_constant_discontinuous
The num_sub_steps
inside the rk4
could be interpreted as weeks in time t
to use the beta
s to integrate the ODE system right?
Yes, I agree that it needs a major refactoring.
Hm, no, it specifies how many rk4 timesteps are performed per day. hh
is 1 day, and the h
used by the intermediate steps is hh/num_sub_steps
.
Hm, okay everyone, forget every other model that has ever been mentioned in this thread. With the typical overreach I present to you the only SEIR model you’ll ever need. (I think) it allows any type of priors, regularization, ansatz or stochasticity for the infection rate, while converging perfectly and fast while probably being much more exact than any of the other models. Tagging the relevant people: @storopoli, @caesoma and @s.maskell and for good measure @bbbales2.
In less than two minutes we get > 4k N_eff for any of 485+ instead of 63 parameters.
So, while I don’t believe its applicable to many problems, here it fits perfectly. It’s essentially what @wds15 said:
The key idea is just that anything downstream of E1
is linear. Instead of parametrizing in terms of some inital condition and beta
s, we just parametrize in terms of new infections per day. Then, once per leapfrog iteration we can compute a fixed transition matrix using matrix_exp
and just iteratively (per day) compute a single matrix vector product.
For sake of simplicity I don’t pool the daily deaths in this model, but this and anything else is perfectly possible and should not impact convergence at all ™.
Enjoy:
data {
int no_days;
int population;
//observed new deaths per day
int new_deaths[no_days];
real beta_regularization;
real likelihood;
}
parameters {
/*
The elements of a simplex sum to one.
The first no_days entries represent daily new infections as a fraction
of the total population while the last entry represents the proportion that
remains susceptible at the end.
*/
simplex[no_days+1] unit_dS;
real<lower=0> dL;
real<lower=0> dI;
real<lower=0> dT;
real<lower=0, upper=1> omega;
real<lower=0> reciprocal_phi_deaths;
}
transformed parameters {
vector[no_days] daily_infections = population * unit_dS[:no_days];
vector[no_days] daily_deaths;
vector[no_days] beta;
if(likelihood){
vector[7] state = [
0, 0,
0, 0,
0, 0,
0
]';
matrix[7, 7] transition_matrix = matrix_exp([
//[E1 ,E2 ,I1 ,I2 ,T1 ,T2 ,D]
[-2/dL,0 ,0 ,0 ,0 ,0 ,0],//E1
[+2/dL,-2/dL,0 ,0 ,0 ,0 ,0],//E2
[0 ,+2/dL,-2/dI,0 ,0 ,0 ,0],//I1
[0 ,0 ,+2/dI,-2/dI ,0 ,0 ,0],//I2
[0 ,0 ,0 ,+2/dI*omega,-2/dT,0 ,0],//T1
[0 ,0 ,0 ,0 ,+2/dT,-2/dT,0],//T2
[0 ,0 ,0 ,0 ,0 ,+2/dT,0]//D
]);
real S = population;
real last_D;
for(i in 1:no_days){
last_D = state[7];
S -= daily_infections[i];
state[1] += daily_infections[i];
state = transition_matrix * state;
daily_deaths[i] = state[7] - last_D;
beta[i] = daily_infections[i] * population / (S*(state[3]+state[4]));
}
}
}
model {
//One possible regularization
if(beta_regularization){
unit_dS[2:no_days] ~ lognormal(log(unit_dS[:no_days-1]), beta_regularization);
}
//This imposes a very wide prior on the proportion of still susceptible people!
unit_dS[no_days+1] ~ uniform(0,1);
dL ~ normal(4., .2);
dI ~ normal(3.06, .21);
dT ~ normal(16, .71);
omega ~ beta(100, 9803);
reciprocal_phi_deaths ~ exponential(5);
if(likelihood){
new_deaths ~ neg_binomial_2(daily_deaths, 1/reciprocal_phi_deaths);
}
}
Small caveat: I don’t know how exact matrix_exp
is, but probably quite exact.
Edit: also, unit_S
is very inappropriately named, I did not know how simplex
works.
Edit2: updated the model.
Edit3: fixed an off-by one error in beta[i] = daily_infections[i] * population / (S*(state[3]+state[4]));
← this is correct.
@Funko_Unko this is great! You took the whole ODE solver out!
- We are missing the
generated quantities
block:generated quantities { vector[no_days-1] growth_rate = (log(daily_infections[2:]) - log(daily_infections[:no_days-1]))*100; int pred_deaths[no_days] = neg_binomial_2_rng(daily_deaths, 1/reciprocal_phi_deaths); }
- We are also missing
effective_reproduction_number
:transformed parameters { vector[no_days] daily_infections = population * unit_S[:no_days]; vector[no_days] daily_deaths; vector[no_days] effective_reproduction_number; { vector[7] state = [ 0, 0, 0, 0, 0, 0, 0 ]'; matrix[7, 7] transition_matrix = matrix_exp([ //[E1 ,E2 ,I1 ,I2 ,T1 ,T2 ,D] [-2/dL,0 ,0 ,0 ,0 ,0 ,0],//E1 [+2/dL,-2/dL,0 ,0 ,0 ,0 ,0],//E2 [0 ,+2/dL,-2/dI,0 ,0 ,0 ,0],//I1 [0 ,0 ,+2/dI,-2/dI ,0 ,0 ,0],//I2 [0 ,0 ,0 ,+2/dI*omega,-2/dT,0 ,0],//T1 [0 ,0 ,0 ,0 ,+2/dT,-2/dT,0],//T2 [0 ,0 ,0 ,0 ,0 ,+2/dT,0]//D ]); real last_D; for(i in 1:no_days){ last_D = state[7]; state[1] += daily_infections[i]; state = transition_matrix * state; daily_deaths[i] = state[7] - last_D; effective_reproduction_number[i] = daily_infections[i] / (state[3] + state[4]) * dI; }}
}
-
Can we use
target += neg_binomial_2_lpmf
? Does it speed things up?target += neg_binomial_2_lpmf(deaths | daily_deaths, 1 / reciprocal_phi_deaths);
-
deaths[no_deaths]
is a cumulative sum (cumsum
). Just to clear for the people watching this.
I am running now. @Funko_Unko does 1. and 2. are okay?
Thanks!
EDIT: I am calling this model deaths_matrix_exp.stan
:)
EDIT2: Damn it is fast!
All 4 chains finished successfully.
Mean chain execution time: 117.2 seconds.
Total execution time: 127.5 seconds.
EDIT3: I am doing something wrong with the deaths (???). The gray thing is the 90% range (q5
and q90
):
This is absolutely awesome. Wow. We’ll certainly take a look. Thank you for the insight.
Simon
PS @remoore, @alphillips: please take a look with some urgency. This could well be transformational.
@storopoli Hm, this is how a very unpolished fan plot that I have lying around looks like for me for varying beta_regularization
:
Let me rename a few things in the above model and introduce some comments to clarify things. I’ll edit the above post.
- Re 1: Looks good to me.
daily_infections
anddaily_deaths
should exactly mirror the quantities from the previous models. - Re 2: This also looks good to me, but you/the data will have to be the ultimate judge of this.
- Re 3: I don’t think this makes a difference, but I do not know the Stan internals.
- Re 4: The model expects the daily new deaths. I’ll rename the variable to make this in line with the provided data, which has a column
new_deaths
.
@s.maskell Thanks, I was/am pretty excited about this myself. BTW, from what I have seen from the Liverpool model, this parametrization should also be applicable there.
Some further thoughts for anyone that’s listening:
There are two main differences to the previous models,
- the change in how the ODE is (approximately) solved and
- the changed parametrization
and I’m not sure what has the greater impact.
An (nonexistent) efficient implementation of the custom rk4 solver (with one step per day) boils down to the addition of 4 size-8 vectors which are quickly computed. Contrast this with one 7x7 dense matrix-vector multiplication for the above model. Speedwise, I would not be surprised if the rk4 solver could actually be quicker/not much slower than the matrix_exp
method for a single iteration. I did very shallowly investigate the impact that the accuracy of the solver has on the inference (hence the sub_num_steps
variable) and found it to be essentially nonexistent, probably due to the sparse and delayed data.
However the previous models were generally much slower than this one, and that with far fewer variables. Before, we had 63 (or 2x63) parameters for beta and now we have 435+ parameters. The best model so far finished in roughly 8 minutes, but convergence was actually slightly finicky and depended on the choice of ansatz, regularization, prior and initialization. I did also try the previous models with one beta parameter per day, but this took even longer than 8 minutes and I’m quite impatient. On top, if you look at N_eff
of the previous models (both my model and UNINOVE), these were generally around or less than 1k, with the worst N_eff (usually lp__
) being only around 300. For this model, even the worst N_eff is usually above 2k, Rhat(lp__) is always in the order of 1.001 and E-BFMI is around 1.
So this all points towards the main benefit actually arising from the reparametrization, but I’m no expert. Can someone more experienced than I weigh in?
One further question:
Rt.live appears to have used a simple convolution model, and still appears to have been much slower:
Sampling 4 chains for 700 tune and 200 draw iterations (2_800 + 800 draws total) took 4340 seconds.
INFO:pymc3:Sampling 4 chains for 700 tune and 200 draw iterations (2_800 + 800 draws total) took 4340 seconds.
However, they used pymc3 and an extended model, so maybe this is the reason? I haven’t actually looked at (or rather understood) their model.
Edit with a small comment:
Actually, the matrix_exp
method should stay much quicker than even the most efficient rk4 method, because the small 7x7 matrix can probably stay in cache and the intermediate rk-steps depend on each other, probably leading to worsened pipelining. But who knows in this age of compilers/processors.
Further edit: @tvladeck is actually here, maybe he could weigh in? Relevant backlink to Translating random walk to gaussian process (and pymc3 model to stan)
I’ve ran the model using couple of beta_regularization
values. The predictions and 90% quantiles seems do behave better now. Here are some benchmarks using UNINOVE data (435 days) in a 2018 Mac Mini i5-8500B (6-core single thread per core):
-
beta_regularization = 0
All 4 chains finished successfully. Mean chain execution time: 55.6 seconds. Total execution time: 56.8 seconds.
-
beta_regularization = 0.01
All 4 chains finished successfully. Mean chain execution time: 820.2 seconds. Total execution time: 837.2 seconds. 1621 of 4000 (41.0%) transitions hit the maximum treedepth limit of 10 or 2^10-1 leapfrog steps. Trajectories that are prematurely terminated due to this limit will result in slow exploration. Increasing the max_treedepth limit can avoid this at the expense of more computation. If increasing max_treedepth does not remove warnings, try to reparameterize the model.
-
beta_regularization = 0.10
All 4 chains finished successfully. Mean chain execution time: 163.7 seconds. Total execution time: 165.6 seconds.
-
beta_regularization = 0.20
All 4 chains finished successfully. Mean chain execution time: 125.3 seconds.. Total execution time: 132.5 seconds.
-
beta_regularization = 0.30
All 4 chains finished successfully. Mean chain execution time: 107.7 seconds. Total execution time: 116.9 seconds.
-
beta_regularization = 0.30
All 4 chains finished successfully. Mean chain execution time: 107.7 seconds. Total execution time: 116.9 seconds.
-
beta_regularization = 0.5
All 4 chains finished successfully. Mean chain execution time: 104.7 seconds. Total execution time: 110.0 seconds.
Also here is the model in .stan
file with the generated quantities block and beta regularizations.
deaths_matrix_exp.stan (2.6 KB)
could you share the code that you’ve used to generate this image?
Ah, right, it looks like too small a beta_regularization
leads to beta being forced to be rather constant and the model compensating by cranking up (or down?) reciprocal_phi_deaths
. Observe that in my figure in the left column (beta_regularization=0.01
) and the lowest fanplot (daily_deaths
) the lines to not agree with each other.
Sure.
Edit:
Also, due to the periodicity of the reporting of deaths which has been masked by the pooling, reciprocal_phi_deaths
probably gets under/overestimated anyways. This could probably be fixed either by pooling again or by modeling this periodicity explicitly.
Yeah we might work instead of daily_deaths
with weekly_deaths
?
Hi all,
Firstly, I want to apologise for being late for the conversation.
I’ve spent quite a lot of time working on this model, and it’s great to get your collective thoughts on how it could be made more computationally efficient. There are an awful lot of excellent ideas in this thread, most of which I’m still trying to digest. I intend to mull these over and contact you about them at a later date.
My initial comments relate to @Funko_Unko’s
only SEIR model you’ll ever need
I think the idea is a brilliant way of drastically reducing the time it takes to fit the model. Still, I’m slightly concerned that this performance improvement comes at the expense of discarding potentially important epidemiological understanding that the original model structure captured. This reparameterisation breaks the link between the size of the infectious population and the rate of new infections, making the distinctions between the meanings of the exposed, infectious, and terminally ill compartments less clear. My concern is that by going further down this route, we’ll end up with a black-box model that assumes the time series of observations to be lagged version of the time series of daily infections without capturing assumptions about the epidemiological processes that drive the rate of infection.
I’m more than happy to change my view and would welcome others thoughts on this.
Could you initialise the parameters in common between the two models using values from the simplified / fast one?
@hhau, initialising the beta parameterisation of the model with the outputs of the infection rate parameterisation of the model is undoubtedly a good idea, but I’m not sure how much of a performance improvement you would get
Yes, you can. However, the initialization is not the only problem the original models have. To really save any time you’d also have to translate the metrics somehow, which should be possible in principle, but maybe somewhat tedious in practice. On top, even if you had a perfectly initialized metric, you might still get divergences or other issues.
Either this, this is reasonably straightforward. You could also introduce an additional vector parameter
real<lower=0, upper=1> reporting_probability[7];
which would quantify how probable the reporting at each weekday is. One preliminary model would yield this:
Edit: whoops, forgot the figure:
- Left: condition on weekly deaths only. No problems here.
- Right: Use some reporting probability. Quite a few divergences here. So it’s not 100% straightforward.
Yes, this is most certainly a possibility/danger. Really, the simplex model is just a glorified convolution model. However, you can still impose the same priors on an (approximated) beta, so I think you should be able to inject all the domain knowledge you have/need.
Not much. Very little work is put into finding the typical set (I think 50 warmup iterations), while almost all of the work has to be put into estimating the metric. The only efficient reinitialization requires that you somehow transfer the metrics from one fit to the other. Which is possible and will, if the geometry permits it, provide insane speedups.
I think you should be able to inject all the domain knowledge you have/need
It’s not immediately apparent to me how to incorporate the domain knowledge that a larger infectious population leads to a larger infection rate into the simplex model. Can you expand on how you would go about injecting this information?
So I think that you can in principle just add something like the following to your model block:
daily_infections ~ lognormal(log(factor*SI/population), sigma);
where factor
and sigma
would have to be determined somehow and SI=S*(I1+I2)
as before. But I’m not quite sure.
Just caught up with and absorbed all of the above - thanks for all the brilliant suggestions.
This sounds reasonable to me, (daily_infections
is just a constant multiple of unit_dS
so no Jacobian adjustment needed) but I think it conflicts with the regularisation in:
unit_dS[2:no_days] ~ lognormal(log(unit_dS[:no_days-1]), beta_regularization);
There’s probably a way of doing both at once but I’d have to think carefully about how to achieve that.