Notebook

In [70]:

# Packages that the notebook attaches quietly, in this order.
libraries <- c("dplyr", "magrittr", "tidyr", "ggplot2", "rstan", "readxl")
for (pkg in libraries) {
  library(pkg, character.only = TRUE, warn.conflicts = FALSE, quietly = TRUE)
}

# NOTE(review): require() only warns and returns FALSE when a package is
# missing, so the notebook keeps running without it.
require(zoo)
require(lubridate)

# Plot defaults.
base_sz <- 12 # base_size parameter
theme_set(theme_bw())

# Infix string concatenation: a %&% b is paste0(a, b).
`%&%` <- function(x, y) {
  paste0(x, y)
}

# Stan settings: use every detected core and enable rstan's auto_write option.
options(mc.cores = parallel::detectCores())
rstan_options(auto_write = TRUE)

# Report the versions in use.
packageVersion("rstan")
packageVersion("StanHeaders")
rstan::stan_version()

Loading required package: zoo

Warning message in library(package, lib.loc = lib.loc, character.only = TRUE, logical.return = TRUE, :
“there is no package called ‘zoo’”

[1] ‘2.19.3’

[1] ‘2.21.0.1’

'2.21.0'

In [71]:

# Read the supplementary table, keep the rows classified as "Certain", drop
# the columns that are not needed further on and parse the two onset dates
# (month/day/four-digit year).
df <- read.csv("../../data/supplemetary table.csv") %>%
  filter(SIClassification == "Certain") %>%
  select(-c(X, Source, SIClassification, DiagnosisCountry)) %>%
  mutate(
    InfectorOnset = as.Date(InfectorOnset, format = "%m/%d/%Y"),
    InfecteeOnset = as.Date(InfecteeOnset, format = "%m/%d/%Y")
  )
df

A data.frame: 18 × 6
InfectorOnset	InfecteeOnset	ER	EL	SL	SR
<date>	<date>	<int>	<int>	<int>	<int>
2020-01-17	2020-01-20	48	47	50	51
2020-01-22	2020-01-26	53	52	56	57
2020-01-24	2020-01-26	55	54	56	57
2020-01-24	2020-01-26	55	54	56	57
2020-01-26	2020-01-30	57	56	60	61
2020-01-26	2020-01-29	57	56	59	60
2020-01-26	2020-01-30	57	56	60	61
2020-01-26	2020-01-30	57	56	60	61
2020-01-21	2020-01-24	52	51	54	55
2020-01-21	2020-01-24	52	51	54	55
2020-01-20	2020-01-29	51	50	59	60
2020-02-01	2020-02-05	63	62	66	67
2019-12-20	2019-12-25	20	19	24	25
2019-12-20	2019-12-29	20	19	28	29
2019-12-27	2020-01-03	27	26	33	34
2019-12-12	2019-12-19	12	11	18	19
2019-12-21	2019-12-24	21	20	23	24
2020-01-04	2020-01-11	35	34	41	42

In [72]:

# Cutoff date of the data set and the date that counts as day 0.
CUTOFF_TIME <- as.Date("2020-02-12")
t0 <- as.Date("2019-12-01")

# tstar is first stored as the cutoff date and then turned into the number of
# days between t0 and the cutoff.
df["tstar"] <- CUTOFF_TIME
df <- df %>%
  mutate(
    # distance between the interval midpoints; evaluated before the bounds
    # are adjusted on the next two lines
    dist = (SR + SL) / 2 - (ER + EL) / 2,
    # SL may not lie below EL, ER may not lie above SR
    SL = pmax(SL, EL),
    ER = pmin(ER, SR),
    tstar = as.numeric(tstar - t0)
  )

df

A data.frame: 18 × 8
InfectorOnset	InfecteeOnset	ER	EL	SL	SR	tstar	dist
<date>	<date>	<int>	<int>	<int>	<int>	<dbl>	<dbl>
2020-01-17	2020-01-20	48	47	50	51	73	3
2020-01-22	2020-01-26	53	52	56	57	73	4
2020-01-24	2020-01-26	55	54	56	57	73	2
2020-01-24	2020-01-26	55	54	56	57	73	2
2020-01-26	2020-01-30	57	56	60	61	73	4
2020-01-26	2020-01-29	57	56	59	60	73	3
2020-01-26	2020-01-30	57	56	60	61	73	4
2020-01-26	2020-01-30	57	56	60	61	73	4
2020-01-21	2020-01-24	52	51	54	55	73	3
2020-01-21	2020-01-24	52	51	54	55	73	3
2020-01-20	2020-01-29	51	50	59	60	73	9
2020-02-01	2020-02-05	63	62	66	67	73	4
2019-12-20	2019-12-25	20	19	24	25	73	5
2019-12-20	2019-12-29	20	19	28	29	73	9
2019-12-27	2020-01-03	27	26	33	34	73	7
2019-12-12	2019-12-19	12	11	18	19	73	7
2019-12-21	2019-12-24	21	20	23	24	73	3
2020-01-04	2020-01-11	35	34	41	42	73	7

In [73]:

# Empirical mean of the midpoint distances.
mean(df[["dist"]])

4.61111111111111

In [74]:

# Empirical standard deviation of the midpoint distances.
sd(df[["dist"]])

2.226548077152

In [75]:

# Write the processed data frame as a comma-separated file without row names
# or quoting.
data_drname <- "../../data"
flname <- "data.csv"
# file.path() supplies the directory separator; plain concatenation of the two
# parts produced "../../datadata.csv" instead of "../../data/data.csv".
write.table(df, file.path(data_drname, flname), row.names = FALSE, sep = ",", quote = FALSE)

Stan simulations

In [76]:

# Root directory for all Stan runs of this notebook. It is wiped and recreated
# every time this cell runs.
# NOTE: the model cells strip the first 12 characters of paths below this
# directory (substring(standirname, 13)), so the "../../../../" prefix must
# keep its length.
stanmaindir <- "../../../../Hokkaido_Backup/Wuhan_Serial_interval_2020/certain"
unlink(stanmaindir, recursive = TRUE)
# recursive = TRUE also creates missing parent directories instead of failing.
dir.create(stanmaindir, recursive = TRUE)

No truncation

Lognormal distribution

In [77]:

## Lognormal model without truncation.
## Data, initial values, the Stan program and a launcher script are written to
## a fresh sub-directory of stanmaindir, and the launcher is then executed.
standirname <- paste0(stanmaindir, "/lognormal-no_truncation")
unlink(standirname, recursive = TRUE)
dir.create(standirname)

# Data for Stan. stan_rdump() is given object names, so the R variables carry
# the names declared in the Stan data block.
N <- nrow(df)
E_L <- df$EL
E_R <- df$ER
S_L <- df$SL
S_R <- df$SR
stan_rdump(c("E_L", "E_R", "S_L", "S_R", "N"), file = paste0(standirname, "/Data.R"))

# Initial values: the raw latent positions start mid-interval, the
# distribution parameters at the log of the empirical mean and sd of df$dist.
e_raw <- rep(0.5, N)
s_raw <- rep(0.5, N)
logmean_SI <- log(mean(df$dist))
logsd_SI <- log(sd(df$dist))
stan_rdump(c("e_raw", "s_raw", "logmean_SI", "logsd_SI"), file = paste0(standirname, "/Init.R"))

# Stan program. s and e are latent times inside [S_L, S_R] and [E_L, E_R]
# (e is additionally capped at s). s - e receives a lognormal density whose
# mean and sd are exp(logmean_SI) and exp(logsd_SI).
cat(
"data {
    int<lower = 0> N; // number of records
    vector<lower = 0>[N] E_L;
    vector<lower = 0>[N] E_R;
    vector<lower = 0>[N] S_L;
    vector<lower = 0>[N] S_R;
}

parameters {
    real logmean_SI;
    real logsd_SI;

    vector<lower = 0, upper = 1>[N] s_raw;
    vector<lower = 0, upper = 1>[N] e_raw;
}

transformed parameters {
    real<lower = 0> param2 = sqrt(log((exp(2*(logsd_SI-logmean_SI))+1.0)));
    real param1 = logmean_SI - param2^2/2.0;

    vector<lower = min(S_L), upper = max(S_R)>[N] s;
    vector<lower = min(E_L), upper = max(E_R)>[N] e;

    s = S_L + (S_R - S_L) .* s_raw;
    for (k in 1:N) 
        if (E_R[k] > s[k]) 
            e[k] = E_L[k] + (s[k] - E_L[k]) * e_raw[k];
        else
            e[k] = E_L[k] + (E_R[k] - E_L[k]) * e_raw[k];
}

model {
    logmean_SI ~ std_normal();
    logsd_SI ~ std_normal();

    e_raw ~ normal(0.5, 1.0);
    s_raw ~ normal(0.5, 1.0);

    target += lognormal_lpdf(s - e | param1, param2);
}

generated quantities {
    real<lower = 0> mean_SI = exp(param1 + square(param2) / 2);
    real<lower = 0> sd_SI = sqrt((exp(square(param2)) - 1) * exp(2*param1 + square(param2)));

    vector[N] log_likelihood;
    for (k in 1:N) 
        log_likelihood[k] = lognormal_lpdf(s[k] - e[k] | param1, param2);
}",
  file = paste0(standirname, "/fit.stan"), sep = "", fill = TRUE
)

# CmdStan location, and the model directory as addressed from inside it.
# Assumes standirname starts with the 12-character prefix "../../../../",
# which is swapped for "../Dropbox/".
standistribdir <- "../../../../../CmdStan-2.22.1"
stanscriptdir <- paste0("../Dropbox/", substring(standirname, 13))

# Launcher script: builds the model with CmdStan's make and starts 10 chains
# (seeds 2..11) in the background. The script does not wait for the chains, so
# its final echo is printed as soon as they have been launched.
cat(
  paste0(
"#!/bin/bash
cwd=$(pwd)
cd ", standistribdir, "
make -j6 ", stanscriptdir, "/fit
cd ", stanscriptdir, "
mkdir -p diagnostics
for i in {1..10}
do
    echo Running ${i}
    SEEDNUMBER=$((1+$i))
    ./fit \\
        method=sample num_samples=10000 num_warmup=20000 save_warmup=0 \\
            adapt delta=0.98 \\
            algorithm=hmc \\
                engine=nuts \\
        random seed=${SEEDNUMBER} \\
        id=$i \\
        data file=Data.R \\
        init=Init.R \\
        output file=trace-$i.csv \\
            diagnostic_file=diagnostics/diagnostics-$i.csv > diagnostics/output-$i.txt &
done
echo Finished sampling haha!
"
  ),
  file = paste0(standirname, "/fit.sh"), sep = "", fill = TRUE
)

# Run the launcher and show what it printed.
system(paste0("bash ", standirname, "/fit.sh"), intern = TRUE)

'mpicxx -fvisibility-inlines-hidden -std=c++17 -fmessage-length=0 -march=nocona -mtune=haswell -ftree-vectorize -fPIC -fstack-protector-strong -fno-plt -O2 -ffunction-sections -pipe -isystem /home/aakhmetz/anaconda3/include -std=c++1y -D_REENTRANT -Wno-sign-compare -Wno-delete-non-virtual-dtor -I stan/lib/stan_math/lib/tbb_2019_U8/include -O3 -I src -I stan/src -I lib/rapidjson_1.1.0/ -I stan/lib/stan_math/ -I stan/lib/stan_math/lib/eigen_3.3.3 -I stan/lib/stan_math/lib/boost_1.72.0 -I stan/lib/stan_math/lib/sundials_4.1.0/include -DNDEBUG -D_FORTIFY_SOURCE=2 -O2 -isystem /home/aakhmetz/anaconda3/include -DBOOST_DISABLE_ASSERTS -DSTAN_MPI -c -MT src/cmdstan/main.o -MM -E -MG -MP -MF src/cmdstan/main.d src/cmdstan/main.cpp'
''
'--- Translating Stan model to C++ code ---'
'bin/stanc --o=../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/lognormal-no_truncation/fit.hpp ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/lognormal-no_truncation/fit.stan'
'mpicxx -fvisibility-inlines-hidden -std=c++17 -fmessage-length=0 -march=nocona -mtune=haswell -ftree-vectorize -fPIC -fstack-protector-strong -fno-plt -O2 -ffunction-sections -pipe -isystem /home/aakhmetz/anaconda3/include -std=c++1y -D_REENTRANT -Wno-sign-compare -Wno-delete-non-virtual-dtor -I stan/lib/stan_math/lib/tbb_2019_U8/include -O3 -I src -I stan/src -I lib/rapidjson_1.1.0/ -I stan/lib/stan_math/ -I stan/lib/stan_math/lib/eigen_3.3.3 -I stan/lib/stan_math/lib/boost_1.72.0 -I stan/lib/stan_math/lib/sundials_4.1.0/include -DNDEBUG -D_FORTIFY_SOURCE=2 -O2 -isystem /home/aakhmetz/anaconda3/include -DBOOST_DISABLE_ASSERTS -DSTAN_MPI -c -MT ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/lognormal-no_truncation/fit.o -MT ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/lognormal-no_truncation/fit -include ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/lognormal-no_truncation/fit.hpp -include src/cmdstan/main.cpp -MM -E -MG -MP -MF ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/lognormal-no_truncation/fit.d ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/lognormal-no_truncation/fit.hpp'
''
'--- Compiling, linking C++ code ---'
'mpicxx -fvisibility-inlines-hidden -std=c++17 -fmessage-length=0 -march=nocona -mtune=haswell -ftree-vectorize -fPIC -fstack-protector-strong -fno-plt -O2 -ffunction-sections -pipe -isystem /home/aakhmetz/anaconda3/include -std=c++1y -D_REENTRANT -Wno-sign-compare -Wno-delete-non-virtual-dtor -I stan/lib/stan_math/lib/tbb_2019_U8/include -O3 -I src -I stan/src -I lib/rapidjson_1.1.0/ -I stan/lib/stan_math/ -I stan/lib/stan_math/lib/eigen_3.3.3 -I stan/lib/stan_math/lib/boost_1.72.0 -I stan/lib/stan_math/lib/sundials_4.1.0/include -DNDEBUG -D_FORTIFY_SOURCE=2 -O2 -isystem /home/aakhmetz/anaconda3/include -DBOOST_DISABLE_ASSERTS -DSTAN_MPI -c -x c++ -o ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/lognormal-no_truncation/fit.o ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/lognormal-no_truncation/fit.hpp'
'mpicxx -fvisibility-inlines-hidden -std=c++17 -fmessage-length=0 -march=nocona -mtune=haswell -ftree-vectorize -fPIC -fstack-protector-strong -fno-plt -O2 -ffunction-sections -pipe -isystem /home/aakhmetz/anaconda3/include -std=c++1y -D_REENTRANT -Wno-sign-compare -Wno-delete-non-virtual-dtor -I stan/lib/stan_math/lib/tbb_2019_U8/include -O3 -I src -I stan/src -I lib/rapidjson_1.1.0/ -I stan/lib/stan_math/ -I stan/lib/stan_math/lib/eigen_3.3.3 -I stan/lib/stan_math/lib/boost_1.72.0 -I stan/lib/stan_math/lib/sundials_4.1.0/include -DNDEBUG -D_FORTIFY_SOURCE=2 -O2 -isystem /home/aakhmetz/anaconda3/include -DBOOST_DISABLE_ASSERTS -DSTAN_MPI -Wl,-O2 -Wl,--sort-common -Wl,--as-needed -Wl,-z,relro -Wl,-z,now -Wl,--disable-new-dtags -Wl,--gc-sections -Wl,-rpath,/home/aakhmetz/anaconda3/lib -Wl,-rpath-link,/home/aakhmetz/anaconda3/lib -L/home/aakhmetz/anaconda3/lib -Wl,-L,"/home/aakhmetz/CmdStan-2.22.1/stan/lib/stan_math/lib/boost_1.72.0/stage/lib" -Wl,-rpath,"/home/aakhmetz/CmdStan-2.22.1/stan/lib/stan_math/lib/boost_1.72.0/stage/lib" -Wl,-L,"/home/aakhmetz/CmdStan-2.22.1/stan/lib/stan_math/lib/tbb" -Wl,-rpath,"/home/aakhmetz/CmdStan-2.22.1/stan/lib/stan_math/lib/tbb" ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/lognormal-no_truncation/fit.o src/cmdstan/main.o stan/lib/stan_math/lib/sundials_4.1.0/lib/libsundials_nvecserial.a stan/lib/stan_math/lib/sundials_4.1.0/lib/libsundials_cvodes.a stan/lib/stan_math/lib/sundials_4.1.0/lib/libsundials_idas.a stan/lib/stan_math/lib/sundials_4.1.0/lib/libsundials_kinsol.a stan/lib/stan_math/lib/boost_1.72.0/stage/lib/libboost_serialization.so stan/lib/stan_math/lib/boost_1.72.0/stage/lib/libboost_mpi.so stan/lib/stan_math/stan/math/prim/functor/mpi_cluster_inst.o stan/lib/stan_math/lib/tbb/libtbb.so.2 -o ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/lognormal-no_truncation/fit'
'Running 1'
'Running 2'
'Running 3'
'Running 4'
'Running 5'
'Running 6'
'Running 7'
'Running 8'
'Running 9'
'Running 10'
'Finished sampling haha!'

Gamma distribution

In [79]:

## Gamma model without truncation.
## main dir for Stan simulations
standirname <- stanmaindir %&% "/gamma-no_truncation"
unlink(standirname, recursive = TRUE)
dir.create(standirname)

# Dumping data (stan_rdump() is given object names, so the R variables carry
# the names declared in the Stan data block)
N <- nrow(df)
E_L <- df$EL
E_R <- df$ER
S_L <- df$SL
S_R <- df$SR
stan_rdump(c("E_L", "E_R", "S_L", "S_R", "N"), file = standirname %&% "/Data.R")

# Dumping initial conditions.
# The sampled parameters of the model below are mean_SI and sd_SI; param1 and
# param2 are transformed parameters computed from them. Initial values are
# therefore supplied for mean_SI / sd_SI (empirical mean and sd of df$dist);
# values dumped under the names param1 / param2 do not initialise any
# parameter of this model.
e_raw <- rep(0.2, N)
s_raw <- rep(0.8, N)
mean_SI <- mean(df$dist)
sd_SI <- sd(df$dist)
stan_rdump(c("e_raw", "s_raw", "mean_SI", "sd_SI"), file = standirname %&% "/Init.R")

# Stan program. s and e are latent times inside [S_L, S_R] and [E_L, E_R]
# (e is additionally capped at s). s - e receives a gamma density with
# param1 = (mean_SI / sd_SI)^2 and param2 = mean_SI / sd_SI^2.
"data {
    int<lower = 0> N; // number of records
    vector<lower = 0>[N] E_L;
    vector<lower = 0>[N] E_R;
    vector<lower = 0>[N] S_L;
    vector<lower = 0>[N] S_R;
}

parameters {
    real<lower=0> mean_SI;
    real<lower=0> sd_SI;

    vector<lower = 0, upper = 1>[N] e_raw;
    vector<lower = 0, upper = 1>[N] s_raw;
}

transformed parameters {
    real<lower = 0> param1 = square(mean_SI/sd_SI);
    real<lower = 0> param2 = mean_SI/square(sd_SI);

    vector<lower = min(S_L), upper = max(S_R)>[N] s;
    vector<lower = min(E_L), upper = max(E_R)>[N] e;

    s = S_L + (S_R - S_L) .* s_raw;
    for (k in 1:N) 
        if (E_R[k] > s[k]) 
            e[k] = E_L[k] + (s[k] - E_L[k]) * e_raw[k];
        else
            e[k] = E_L[k] + (E_R[k] - E_L[k]) * e_raw[k];
}

model {
    mean_SI ~ normal(5.0, 10.0);
    sd_SI ~ cauchy(0, 5.0);

    e_raw ~ normal(0.5, 1.0);
    s_raw ~ normal(0.5, 1.0);

    target += gamma_lpdf(s - e | param1, param2);
}

generated quantities {
    vector[N] log_likelihood;
    for (k in 1:N) 
        log_likelihood[k] = gamma_lpdf(s[k] - e[k] | param1, param2);
}" %>% cat(file = standirname %&% "/fit.stan", sep = "", fill = TRUE)

# CmdStan location, and the model directory as addressed from inside it.
# Assumes standirname starts with the 12-character prefix "../../../../",
# which is swapped for "../Dropbox/".
standistribdir <- "../../../../../CmdStan-2.22.1"
stanscriptdir <- "../Dropbox/" %&% substring(standirname, 13)
## bash file
# Builds the model with CmdStan's make and starts 10 chains (seeds 2..11) in
# the background. The script does not wait for the chains, so its final echo
# is printed as soon as they have been launched.
"#!/bin/bash
cwd=$(pwd)
cd "%&%standistribdir%&%"
make -j6 "%&%stanscriptdir%&%"/fit
cd "%&%stanscriptdir%&%"
mkdir -p diagnostics
for i in {1..10}
do
    echo Running ${i}
    SEEDNUMBER=$((1+$i))
    ./fit \\
        method=sample num_samples=10000 num_warmup=20000 save_warmup=0 \\
            adapt delta=0.98 \\
            algorithm=hmc \\
                engine=nuts \\
        random seed=${SEEDNUMBER} \\
        id=$i \\
        data file=Data.R \\
        init=Init.R \\
        output file=trace-$i.csv \\
            refresh=1000 \\
            diagnostic_file=diagnostics/diagnostics-$i.csv > diagnostics/output-$i.txt &
done
echo Finished sampling haha!
" %>% cat(file = standirname %&% "/fit.sh", sep = "", fill = TRUE)

## running the bash script
system("bash " %&% standirname %&% "/fit.sh", intern = TRUE)

''
'--- Translating Stan model to C++ code ---'
'bin/stanc --o=../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/gamma-no_truncation/fit.hpp ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/gamma-no_truncation/fit.stan'
'mpicxx -fvisibility-inlines-hidden -std=c++17 -fmessage-length=0 -march=nocona -mtune=haswell -ftree-vectorize -fPIC -fstack-protector-strong -fno-plt -O2 -ffunction-sections -pipe -isystem /home/aakhmetz/anaconda3/include -std=c++1y -D_REENTRANT -Wno-sign-compare -Wno-delete-non-virtual-dtor -I stan/lib/stan_math/lib/tbb_2019_U8/include -O3 -I src -I stan/src -I lib/rapidjson_1.1.0/ -I stan/lib/stan_math/ -I stan/lib/stan_math/lib/eigen_3.3.3 -I stan/lib/stan_math/lib/boost_1.72.0 -I stan/lib/stan_math/lib/sundials_4.1.0/include -DNDEBUG -D_FORTIFY_SOURCE=2 -O2 -isystem /home/aakhmetz/anaconda3/include -DBOOST_DISABLE_ASSERTS -DSTAN_MPI -c -MT ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/gamma-no_truncation/fit.o -MT ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/gamma-no_truncation/fit -include ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/gamma-no_truncation/fit.hpp -include src/cmdstan/main.cpp -MM -E -MG -MP -MF ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/gamma-no_truncation/fit.d ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/gamma-no_truncation/fit.hpp'
''
'--- Compiling, linking C++ code ---'
'mpicxx -fvisibility-inlines-hidden -std=c++17 -fmessage-length=0 -march=nocona -mtune=haswell -ftree-vectorize -fPIC -fstack-protector-strong -fno-plt -O2 -ffunction-sections -pipe -isystem /home/aakhmetz/anaconda3/include -std=c++1y -D_REENTRANT -Wno-sign-compare -Wno-delete-non-virtual-dtor -I stan/lib/stan_math/lib/tbb_2019_U8/include -O3 -I src -I stan/src -I lib/rapidjson_1.1.0/ -I stan/lib/stan_math/ -I stan/lib/stan_math/lib/eigen_3.3.3 -I stan/lib/stan_math/lib/boost_1.72.0 -I stan/lib/stan_math/lib/sundials_4.1.0/include -DNDEBUG -D_FORTIFY_SOURCE=2 -O2 -isystem /home/aakhmetz/anaconda3/include -DBOOST_DISABLE_ASSERTS -DSTAN_MPI -c -x c++ -o ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/gamma-no_truncation/fit.o ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/gamma-no_truncation/fit.hpp'
'mpicxx -fvisibility-inlines-hidden -std=c++17 -fmessage-length=0 -march=nocona -mtune=haswell -ftree-vectorize -fPIC -fstack-protector-strong -fno-plt -O2 -ffunction-sections -pipe -isystem /home/aakhmetz/anaconda3/include -std=c++1y -D_REENTRANT -Wno-sign-compare -Wno-delete-non-virtual-dtor -I stan/lib/stan_math/lib/tbb_2019_U8/include -O3 -I src -I stan/src -I lib/rapidjson_1.1.0/ -I stan/lib/stan_math/ -I stan/lib/stan_math/lib/eigen_3.3.3 -I stan/lib/stan_math/lib/boost_1.72.0 -I stan/lib/stan_math/lib/sundials_4.1.0/include -DNDEBUG -D_FORTIFY_SOURCE=2 -O2 -isystem /home/aakhmetz/anaconda3/include -DBOOST_DISABLE_ASSERTS -DSTAN_MPI -Wl,-O2 -Wl,--sort-common -Wl,--as-needed -Wl,-z,relro -Wl,-z,now -Wl,--disable-new-dtags -Wl,--gc-sections -Wl,-rpath,/home/aakhmetz/anaconda3/lib -Wl,-rpath-link,/home/aakhmetz/anaconda3/lib -L/home/aakhmetz/anaconda3/lib -Wl,-L,"/home/aakhmetz/CmdStan-2.22.1/stan/lib/stan_math/lib/boost_1.72.0/stage/lib" -Wl,-rpath,"/home/aakhmetz/CmdStan-2.22.1/stan/lib/stan_math/lib/boost_1.72.0/stage/lib" -Wl,-L,"/home/aakhmetz/CmdStan-2.22.1/stan/lib/stan_math/lib/tbb" -Wl,-rpath,"/home/aakhmetz/CmdStan-2.22.1/stan/lib/stan_math/lib/tbb" ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/gamma-no_truncation/fit.o src/cmdstan/main.o stan/lib/stan_math/lib/sundials_4.1.0/lib/libsundials_nvecserial.a stan/lib/stan_math/lib/sundials_4.1.0/lib/libsundials_cvodes.a stan/lib/stan_math/lib/sundials_4.1.0/lib/libsundials_idas.a stan/lib/stan_math/lib/sundials_4.1.0/lib/libsundials_kinsol.a stan/lib/stan_math/lib/boost_1.72.0/stage/lib/libboost_serialization.so stan/lib/stan_math/lib/boost_1.72.0/stage/lib/libboost_mpi.so stan/lib/stan_math/stan/math/prim/functor/mpi_cluster_inst.o stan/lib/stan_math/lib/tbb/libtbb.so.2 -o ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/gamma-no_truncation/fit'
'Running 1'
'Running 2'
'Running 3'
'Running 4'
'Running 5'
'Running 6'
'Running 7'
'Running 8'
'Running 9'
'Running 10'
'Finished sampling haha!'

Weibull distribution

In [80]:

## Weibull model without truncation.
## main dir for Stan simulations
standirname <- stanmaindir %&% "/weibull-no_truncation"
unlink(standirname, recursive = TRUE)
dir.create(standirname)

# Dumping data (stan_rdump() is given object names, so the R variables carry
# the names declared in the Stan data block)
N <- nrow(df)
E_L <- df$EL
E_R <- df$ER
S_L <- df$SL
S_R <- df$SR
stan_rdump(c("E_L", "E_R", "S_L", "S_R", "N"), file = standirname %&% "/Data.R")

# Dumping initial conditions.
# The model below samples mean_SI (on the natural scale) and param1, so the
# initial value for the mean is dumped under the name mean_SI; a value dumped
# as logmean_SI matches no parameter of this model.
e_raw <- rep(0.2, N)
s_raw <- rep(0.8, N)
mean_SI <- mean(df$dist)
param1 <- 1.75
stan_rdump(c("e_raw", "s_raw", "mean_SI", "param1"), file = standirname %&% "/Init.R")

# Stan program. s and e are latent times inside [S_L, S_R] and [E_L, E_R]
# (e is additionally capped at s). s - e receives a Weibull density with
# param1 as first argument and param2 = mean_SI / tgamma(1 + 1 / param1) as
# second argument.
"data {
    int<lower = 0> N; // number of records
    vector<lower = 0>[N] E_L;
    vector<lower = 0>[N] E_R;
    vector<lower = 0>[N] S_L;
    vector<lower = 0>[N] S_R;
}

parameters {
    real<lower = 0> mean_SI;
    real<lower = 0> param1;

    vector<lower = 0, upper = 1>[N] e_raw;
    vector<lower = 0, upper = 1>[N] s_raw;
}

transformed parameters {
    real<lower = 0> param2 = mean_SI/tgamma(1.0+1.0/param1);

    vector<lower = min(S_L), upper = max(S_R)>[N] s;
    vector<lower = min(E_L), upper = max(E_R)>[N] e;

    s = S_L + (S_R - S_L) .* s_raw;
    for (k in 1:N) 
        if (E_R[k] > s[k]) 
            e[k] = E_L[k] + (s[k] - E_L[k]) * e_raw[k];
        else
            e[k] = E_L[k] + (E_R[k] - E_L[k]) * e_raw[k];
}

model {
    mean_SI ~ normal(5.0, 10.0);
    param1 ~ exponential(0.0001);

    e_raw ~ normal(0.5, 1.0);
    s_raw ~ normal(0.5, 1.0);

    target += weibull_lpdf(s - e | param1, param2);
}

generated quantities {
    real sd_SI = param2*sqrt(tgamma(1.0+2.0/param1) - square(tgamma(1.0+1.0/param1)));

    vector[N] log_likelihood;
    for (k in 1:N) 
        log_likelihood[k] = weibull_lpdf(s[k] - e[k] | param1, param2);
}" %>% cat(file = standirname %&% "/fit.stan", sep = "", fill = TRUE)

# CmdStan location, and the model directory as addressed from inside it.
# Assumes standirname starts with the 12-character prefix "../../../../",
# which is swapped for "../Dropbox/".
standistribdir <- "../../../../../CmdStan-2.22.1"
stanscriptdir <- "../Dropbox/" %&% substring(standirname, 13)
## bash file
# Builds the model with CmdStan's make and starts 10 chains (seeds 2..11) in
# the background. The script does not wait for the chains, so its final echo
# is printed as soon as they have been launched.
"#!/bin/bash
cwd=$(pwd)
cd "%&%standistribdir%&%"
make -j6 "%&%stanscriptdir%&%"/fit
cd "%&%stanscriptdir%&%"
mkdir -p diagnostics
for i in {1..10}
do
    echo Running ${i}
    SEEDNUMBER=$((1+$i))
    ./fit \\
        method=sample num_samples=10000 num_warmup=10000 save_warmup=0 \\
            adapt delta=0.98 \\
            algorithm=hmc \\
                engine=nuts \\
        random seed=${SEEDNUMBER} \\
        id=$i \\
        data file=Data.R \\
        init=Init.R \\
        output file=trace-$i.csv \\
            diagnostic_file=diagnostics/diagnostics-$i.csv > diagnostics/output-$i.txt &
done
echo Finished sampling haha!
" %>% cat(file = standirname %&% "/fit.sh", sep = "", fill = TRUE)

## running the bash script
system("bash " %&% standirname %&% "/fit.sh", intern = TRUE)

''
'--- Translating Stan model to C++ code ---'
'bin/stanc --o=../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/weibull-no_truncation/fit.hpp ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/weibull-no_truncation/fit.stan'
'mpicxx -fvisibility-inlines-hidden -std=c++17 -fmessage-length=0 -march=nocona -mtune=haswell -ftree-vectorize -fPIC -fstack-protector-strong -fno-plt -O2 -ffunction-sections -pipe -isystem /home/aakhmetz/anaconda3/include -std=c++1y -D_REENTRANT -Wno-sign-compare -Wno-delete-non-virtual-dtor -I stan/lib/stan_math/lib/tbb_2019_U8/include -O3 -I src -I stan/src -I lib/rapidjson_1.1.0/ -I stan/lib/stan_math/ -I stan/lib/stan_math/lib/eigen_3.3.3 -I stan/lib/stan_math/lib/boost_1.72.0 -I stan/lib/stan_math/lib/sundials_4.1.0/include -DNDEBUG -D_FORTIFY_SOURCE=2 -O2 -isystem /home/aakhmetz/anaconda3/include -DBOOST_DISABLE_ASSERTS -DSTAN_MPI -c -MT ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/weibull-no_truncation/fit.o -MT ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/weibull-no_truncation/fit -include ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/weibull-no_truncation/fit.hpp -include src/cmdstan/main.cpp -MM -E -MG -MP -MF ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/weibull-no_truncation/fit.d ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/weibull-no_truncation/fit.hpp'
''
'--- Compiling, linking C++ code ---'
'mpicxx -fvisibility-inlines-hidden -std=c++17 -fmessage-length=0 -march=nocona -mtune=haswell -ftree-vectorize -fPIC -fstack-protector-strong -fno-plt -O2 -ffunction-sections -pipe -isystem /home/aakhmetz/anaconda3/include -std=c++1y -D_REENTRANT -Wno-sign-compare -Wno-delete-non-virtual-dtor -I stan/lib/stan_math/lib/tbb_2019_U8/include -O3 -I src -I stan/src -I lib/rapidjson_1.1.0/ -I stan/lib/stan_math/ -I stan/lib/stan_math/lib/eigen_3.3.3 -I stan/lib/stan_math/lib/boost_1.72.0 -I stan/lib/stan_math/lib/sundials_4.1.0/include -DNDEBUG -D_FORTIFY_SOURCE=2 -O2 -isystem /home/aakhmetz/anaconda3/include -DBOOST_DISABLE_ASSERTS -DSTAN_MPI -c -x c++ -o ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/weibull-no_truncation/fit.o ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/weibull-no_truncation/fit.hpp'
'mpicxx -fvisibility-inlines-hidden -std=c++17 -fmessage-length=0 -march=nocona -mtune=haswell -ftree-vectorize -fPIC -fstack-protector-strong -fno-plt -O2 -ffunction-sections -pipe -isystem /home/aakhmetz/anaconda3/include -std=c++1y -D_REENTRANT -Wno-sign-compare -Wno-delete-non-virtual-dtor -I stan/lib/stan_math/lib/tbb_2019_U8/include -O3 -I src -I stan/src -I lib/rapidjson_1.1.0/ -I stan/lib/stan_math/ -I stan/lib/stan_math/lib/eigen_3.3.3 -I stan/lib/stan_math/lib/boost_1.72.0 -I stan/lib/stan_math/lib/sundials_4.1.0/include -DNDEBUG -D_FORTIFY_SOURCE=2 -O2 -isystem /home/aakhmetz/anaconda3/include -DBOOST_DISABLE_ASSERTS -DSTAN_MPI -Wl,-O2 -Wl,--sort-common -Wl,--as-needed -Wl,-z,relro -Wl,-z,now -Wl,--disable-new-dtags -Wl,--gc-sections -Wl,-rpath,/home/aakhmetz/anaconda3/lib -Wl,-rpath-link,/home/aakhmetz/anaconda3/lib -L/home/aakhmetz/anaconda3/lib -Wl,-L,"/home/aakhmetz/CmdStan-2.22.1/stan/lib/stan_math/lib/boost_1.72.0/stage/lib" -Wl,-rpath,"/home/aakhmetz/CmdStan-2.22.1/stan/lib/stan_math/lib/boost_1.72.0/stage/lib" -Wl,-L,"/home/aakhmetz/CmdStan-2.22.1/stan/lib/stan_math/lib/tbb" -Wl,-rpath,"/home/aakhmetz/CmdStan-2.22.1/stan/lib/stan_math/lib/tbb" ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/weibull-no_truncation/fit.o src/cmdstan/main.o stan/lib/stan_math/lib/sundials_4.1.0/lib/libsundials_nvecserial.a stan/lib/stan_math/lib/sundials_4.1.0/lib/libsundials_cvodes.a stan/lib/stan_math/lib/sundials_4.1.0/lib/libsundials_idas.a stan/lib/stan_math/lib/sundials_4.1.0/lib/libsundials_kinsol.a stan/lib/stan_math/lib/boost_1.72.0/stage/lib/libboost_serialization.so stan/lib/stan_math/lib/boost_1.72.0/stage/lib/libboost_mpi.so stan/lib/stan_math/stan/math/prim/functor/mpi_cluster_inst.o stan/lib/stan_math/lib/tbb/libtbb.so.2 -o ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/weibull-no_truncation/fit'
'Running 1'
'Running 2'
'Running 3'
'Running 4'
'Running 5'
'Running 6'
'Running 7'
'Running 8'
'Running 9'
'Running 10'
'Finished sampling haha!'

With truncation

Lognormal distribution

In [67]:

## Lognormal model with truncation.
## Data, initial values, the Stan program and a launcher script are written to
## a fresh sub-directory of stanmaindir, and the launcher is then executed.
standirname <- paste0(stanmaindir, "/lognormal-truncated")
unlink(standirname, recursive = TRUE)
dir.create(standirname)

# Data for Stan. stan_rdump() is given object names, so the R variables carry
# the names declared in the Stan data block.
N <- nrow(df)
E_L <- df$EL
E_R <- df$ER
S_L <- df$SL
S_R <- df$SR
# r is the exponential rate that appears in the ODE integrand below
# (presumably the epidemic growth rate -- TODO confirm).
r <- 0.14
# The truncation time is read from the first row of df only.
upper_bound <- df$tstar[1]
stan_rdump(
  c("E_L", "E_R", "S_L", "S_R", "N", "r", "upper_bound"),
  file = paste0(standirname, "/Data.R")
)

# Initial values for the raw latent positions and the distribution parameters
# (log of the empirical mean and sd of df$dist).
e_raw <- rep(0.2, N)
s_raw <- rep(0.8, N)
logmean_SI <- log(mean(df$dist))
logsd_SI <- log(sd(df$dist))
stan_rdump(c("e_raw", "s_raw", "logmean_SI", "logsd_SI"), file = paste0(standirname, "/Init.R"))

# Stan program. Same latent-time construction as the untruncated lognormal
# model; in addition each record's log density is reduced by log(Z[k]), where
# Z is obtained by integrating fstar_ode over t from 0.001 to 1.
cat(
"functions {
    real[] fstar_ode(real t, real[] z, real[] theta, data real[] x_r, int[] x_i) {
        int N = x_i[1]; // number of records

        real e[N] = theta[1:N];
        real param1 = theta[N+1];
        real param2 = theta[N+2];

        real upper_bound = x_r[1];
        real r = x_r[2];

        real dzdt[N];
        real tstar[N];

        for (k in 1:N) {
            tstar[k] = upper_bound - e[k];
            dzdt[k] = exp(lognormal_lcdf(tstar[k]*(1.0-t) | param1, param2)) * r * tstar[k] * exp(-r*tstar[k]*t) / (1.0 - exp(-r*tstar[k]*t));
        }

        return dzdt;
    }
}

data {
    int<lower = 0> N; // number of records
    vector<lower = 0>[N] E_L;
    vector<lower = 0>[N] E_R;
    vector<lower = 0>[N] S_L;
    vector<lower = 0>[N] S_R;
    real<lower = 0> upper_bound;
    real<lower = 0> r;
}

transformed data {
    int X_i[1] = {N};

    real X_r[2] = {upper_bound, r};
}

parameters {
    real logmean_SI;
    real logsd_SI;

    vector<lower = 0, upper = 1>[N] e_raw;
    vector<lower = 0, upper = 1>[N] s_raw;
}

transformed parameters {
    real<lower = 0> param2 = sqrt(log((exp(2*(logsd_SI-logmean_SI))+1.0)));
    real param1 = logmean_SI - square(param2)/2.0;

    vector<lower = min(E_L), upper = max(E_R)>[N] e;
    vector<lower = min(S_L), upper = max(S_R)>[N] s;

    vector[N] Z; 
    
    {
        real theta[N+2];
        real Z0[N];
        
        s = S_L + (S_R - S_L) .* s_raw;
        for (k in 1:N) 
            if (E_R[k] > s[k]) 
                e[k] = E_L[k] + (s[k] - E_L[k]) * e_raw[k];
            else
                e[k] = E_L[k] + (E_R[k] - E_L[k]) * e_raw[k];

        for (k in 1:N) {
            Z0[k] = 0.0;
            theta[k] = e[k];
        }
        theta[N+1] = param1;
        theta[N+2] = param2;

        Z = to_vector(to_array_1d(integrate_ode_rk45(fstar_ode, Z0, 0.001, {1.0}, theta, X_r, X_i, 1e-5, 1e-3, 5e2)));
    }
}

model {
    logmean_SI ~ std_normal();
    logsd_SI ~ std_normal();

    e_raw ~ normal(0.5, 1.0);
    s_raw ~ normal(0.5, 1.0);

    target += lognormal_lpdf(s - e | param1, param2) - log(Z);
}

generated quantities {
    real<lower = 0> mean_SI = exp(param1 + square(param2)/2);
    real<lower = 0> sd_SI = sqrt((exp(square(param2))-1)*exp(2*param1+square(param2)));

    vector[N] log_likelihood;
    for (k in 1:N)
        log_likelihood[k] = lognormal_lpdf(s[k] - e[k] | param1, param2) - log(Z[k]);
}",
  file = paste0(standirname, "/fit.stan"), sep = "", fill = TRUE
)

# CmdStan location, and the model directory as addressed from inside it.
# Assumes standirname starts with the 12-character prefix "../../../../",
# which is swapped for "../Dropbox/".
standistribdir <- "../../../../../CmdStan-2.22.1"
stanscriptdir <- paste0("../Dropbox/", substring(standirname, 13))

# Launcher script: builds the model with CmdStan's make and starts 10 chains
# (seeds 2..11) in the background. The script does not wait for the chains, so
# its final echo is printed as soon as they have been launched.
cat(
  paste0(
"#!/bin/bash
cwd=$(pwd)
cd ", standistribdir, "
make -j6 ", stanscriptdir, "/fit
cd ", stanscriptdir, "
mkdir -p diagnostics
for i in {1..10}
do
    echo Running ${i}
    SEEDNUMBER=$((1+$i))
    ./fit \\
        method=sample num_samples=10000 num_warmup=10000 save_warmup=0 \\
            adapt delta=0.98 \\
            algorithm=hmc \\
                engine=nuts \\
        random seed=${SEEDNUMBER} \\
        id=$i \\
        data file=Data.R \\
        init=Init.R \\
        output file=trace-$i.csv \\
            diagnostic_file=diagnostics/diagnostics-$i.csv > diagnostics/output-$i.txt &
done
echo Finished sampling haha!
"
  ),
  file = paste0(standirname, "/fit.sh"), sep = "", fill = TRUE
)

# Run the launcher and show what it printed.
system(paste0("bash ", standirname, "/fit.sh"), intern = TRUE)

''
'--- Translating Stan model to C++ code ---'
'bin/stanc --o=../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/lognormal-truncated/fit.hpp ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/lognormal-truncated/fit.stan'
'mpicxx -fvisibility-inlines-hidden -std=c++17 -fmessage-length=0 -march=nocona -mtune=haswell -ftree-vectorize -fPIC -fstack-protector-strong -fno-plt -O2 -ffunction-sections -pipe -isystem /home/aakhmetz/anaconda3/include -std=c++1y -D_REENTRANT -Wno-sign-compare -Wno-delete-non-virtual-dtor -I stan/lib/stan_math/lib/tbb_2019_U8/include -O3 -I src -I stan/src -I lib/rapidjson_1.1.0/ -I stan/lib/stan_math/ -I stan/lib/stan_math/lib/eigen_3.3.3 -I stan/lib/stan_math/lib/boost_1.72.0 -I stan/lib/stan_math/lib/sundials_5.2.0/include -DNDEBUG -D_FORTIFY_SOURCE=2 -O2 -isystem /home/aakhmetz/anaconda3/include -DBOOST_DISABLE_ASSERTS -DSTAN_MPI -c -MT ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/lognormal-truncated/fit.o -MT ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/lognormal-truncated/fit -include ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/lognormal-truncated/fit.hpp -include src/cmdstan/main.cpp -MM -E -MG -MP -MF ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/lognormal-truncated/fit.d ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/lognormal-truncated/fit.hpp'
''
'--- Compiling, linking C++ code ---'
'mpicxx -fvisibility-inlines-hidden -std=c++17 -fmessage-length=0 -march=nocona -mtune=haswell -ftree-vectorize -fPIC -fstack-protector-strong -fno-plt -O2 -ffunction-sections -pipe -isystem /home/aakhmetz/anaconda3/include -std=c++1y -D_REENTRANT -Wno-sign-compare -Wno-delete-non-virtual-dtor -I stan/lib/stan_math/lib/tbb_2019_U8/include -O3 -I src -I stan/src -I lib/rapidjson_1.1.0/ -I stan/lib/stan_math/ -I stan/lib/stan_math/lib/eigen_3.3.3 -I stan/lib/stan_math/lib/boost_1.72.0 -I stan/lib/stan_math/lib/sundials_5.2.0/include -DNDEBUG -D_FORTIFY_SOURCE=2 -O2 -isystem /home/aakhmetz/anaconda3/include -DBOOST_DISABLE_ASSERTS -DSTAN_MPI -c -x c++ -o ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/lognormal-truncated/fit.o ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/lognormal-truncated/fit.hpp'
'mpicxx -fvisibility-inlines-hidden -std=c++17 -fmessage-length=0 -march=nocona -mtune=haswell -ftree-vectorize -fPIC -fstack-protector-strong -fno-plt -O2 -ffunction-sections -pipe -isystem /home/aakhmetz/anaconda3/include -std=c++1y -D_REENTRANT -Wno-sign-compare -Wno-delete-non-virtual-dtor -I stan/lib/stan_math/lib/tbb_2019_U8/include -O3 -I src -I stan/src -I lib/rapidjson_1.1.0/ -I stan/lib/stan_math/ -I stan/lib/stan_math/lib/eigen_3.3.3 -I stan/lib/stan_math/lib/boost_1.72.0 -I stan/lib/stan_math/lib/sundials_5.2.0/include -DNDEBUG -D_FORTIFY_SOURCE=2 -O2 -isystem /home/aakhmetz/anaconda3/include -DBOOST_DISABLE_ASSERTS -DSTAN_MPI -Wl,-O2 -Wl,--sort-common -Wl,--as-needed -Wl,-z,relro -Wl,-z,now -Wl,--disable-new-dtags -Wl,--gc-sections -Wl,-rpath,/home/aakhmetz/anaconda3/lib -Wl,-rpath-link,/home/aakhmetz/anaconda3/lib -L/home/aakhmetz/anaconda3/lib -Wl,-L,"/home/aakhmetz/CmdStan/stan/lib/stan_math/lib/boost_1.72.0/stage/lib" -Wl,-rpath,"/home/aakhmetz/CmdStan/stan/lib/stan_math/lib/boost_1.72.0/stage/lib" -Wl,-L,"/home/aakhmetz/CmdStan/stan/lib/stan_math/lib/tbb" -Wl,-rpath,"/home/aakhmetz/CmdStan/stan/lib/stan_math/lib/tbb" ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/lognormal-truncated/fit.o src/cmdstan/main.o stan/lib/stan_math/lib/sundials_5.2.0/lib/libsundials_nvecserial.a stan/lib/stan_math/lib/sundials_5.2.0/lib/libsundials_cvodes.a stan/lib/stan_math/lib/sundials_5.2.0/lib/libsundials_idas.a stan/lib/stan_math/lib/sundials_5.2.0/lib/libsundials_kinsol.a stan/lib/stan_math/lib/boost_1.72.0/stage/lib/libboost_serialization.so stan/lib/stan_math/lib/boost_1.72.0/stage/lib/libboost_mpi.so stan/lib/stan_math/stan/math/prim/functor/mpi_cluster_inst.o stan/lib/stan_math/lib/tbb/libtbb.so.2 -o ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/lognormal-truncated/fit'
'Running 1'
'Running 2'
'Running 3'
'Running 4'
'Running 5'
'Running 6'
'Running 7'
'Running 8'
'Running 9'
'Running 10'
'Finished sampling haha!'

Gamma distribution

In [68]:

## main dir for Stan simulations
# The directory is wiped and recreated so that trace/diagnostic files left by
# an earlier run cannot be mistaken for output of this one.
standirname = stanmaindir%&%"/gamma-truncated"
unlink(standirname, recursive=TRUE)
# recursive=TRUE: also create missing parent directories instead of failing
dir.create(standirname, recursive=TRUE)

# Dumping data
# stan_rdump() takes the *names* of R objects, so the variables below must be
# named exactly like the entries of the `data` block in the Stan program.
N = nrow(df)
E_L = df$EL
E_R = df$ER
S_L = df$SL
S_R = df$SR
# NOTE(review): r enters the Stan model only through exp(-r * ...) terms;
# presumably an exponential growth rate per day -- confirm against the paper.
r = 0.14
# tstar is the same number in every row (cutoff date minus t0, in days),
# so the first element is used as the scalar truncation time.
upper_bound = df$tstar[1]
stan_rdump(c('E_L', 'E_R', 'S_L', 'S_R', 'N', 'r', 'upper_bound'), file=standirname%&%"/Data.R")

# Dumping initial conditions
# Names must match the `parameters` block of the Stan program.
# e_raw / s_raw are the [0, 1] interpolation weights for the onset times;
# mean_SI / sd_SI start at the empirical moments of the midpoint differences.
e_raw = rep(.4, N)
s_raw = rep(.6, N)
mean_SI = mean(df$dist)
sd_SI = sd(df$dist)
stan_rdump(c('e_raw', 's_raw', 'mean_SI', 'sd_SI'), file=standirname%&%"/Init.R")

# Stan program
# The string below is written as-is to <standirname>/fit.stan.
#
# Model outline (gamma-distributed serial interval, right-truncated):
#   * data: per-record bounds E_L..E_R (infector onset) and S_L..S_R (infectee
#     onset), the constant r and the truncation time upper_bound.
#   * parameters: mean_SI and sd_SI, plus e_raw / s_raw in [0, 1] which place
#     the onset times inside their bounds:
#       s = S_L + (S_R - S_L) * s_raw
#       e = E_L + (min(E_R, s) - E_L) * e_raw   (so that e never exceeds s)
#   * param1 = (mean_SI / sd_SI)^2 and param2 = mean_SI / sd_SI^2 are the two
#     arguments passed to gamma_lpdf / gamma_lcdf.
#   * fstar_ode is the right-hand side of an ODE in t whose k-th component is
#       gamma_cdf(tstar[k] * (1 - t)) * r * tstar[k] * exp(-r * tstar[k] * t)
#         / (1 - exp(-r * tstar[k] * t)),   with tstar[k] = upper_bound - e[k].
#     It is integrated with integrate_ode_rk45 from t = 0.001 to t = 1.0
#     starting at 0; the result Z[k] is the per-record normalising term and
#     log(Z[k]) is subtracted from the gamma log density.
#     NOTE(review): the lower limit is 0.001 rather than 0, presumably because
#     the denominator 1 - exp(-r * tstar * t) vanishes at t = 0 -- confirm.
#   * generated quantities: the per-record log_likelihood.
"functions {
    real[] fstar_ode(real t, real[] z, real[] theta, data real[] x_r, int[] x_i) {
        int N = x_i[1]; // number of records

        real e[N] = theta[1:N];
        real param1 = theta[N+1];
        real param2 = theta[N+2];

        real upper_bound = x_r[1];
        real r = x_r[2];

        real dzdt[N];
        real tstar[N];

        for (k in 1:N) {
            tstar[k] = upper_bound - e[k];
            dzdt[k] = exp(gamma_lcdf(tstar[k]*(1.0-t) | param1, param2)) * r * tstar[k] * exp(-r*tstar[k]*t) / (1.0 - exp(-r*tstar[k]*t));
        }

        return dzdt;
    }
}

data {
    int<lower = 0> N; // number of records
    vector<lower = 0>[N] E_L;
    vector<lower = 0>[N] E_R;
    vector<lower = 0>[N] S_L;
    vector<lower = 0>[N] S_R;
    real<lower = 0> r;
    real<lower = 0> upper_bound;
}

transformed data {
    int X_i[1] = {N};

    real X_r[2] = {upper_bound, r};
}

parameters {
    real<lower = 0> mean_SI;
    real<lower = 0> sd_SI;

    vector<lower = 0, upper = 1>[N] s_raw;
    vector<lower = 0, upper = 1>[N] e_raw;
}

transformed parameters {
    real<lower = 0> param1 = square(mean_SI/sd_SI);
    real<lower = 0> param2 = mean_SI/square(sd_SI);

    vector<lower = min(S_L), upper = max(S_R)>[N] s;
    vector<lower = min(E_L), upper = max(E_R)>[N] e;

    vector[N] Z; 
    
    {
        real theta[N+2];
        real Z0[N];
        
        s = S_L + (S_R - S_L) .* s_raw;
        for (k in 1:N) 
            if (E_R[k] > s[k]) 
                e[k] = E_L[k] + (s[k] - E_L[k]) * e_raw[k];
            else
                e[k] = E_L[k] + (E_R[k] - E_L[k]) * e_raw[k];

        for (k in 1:N) {
            Z0[k] = 0.0;
            theta[k] = e[k];
        }
        theta[N+1] = param1;
        theta[N+2] = param2;

        Z = to_vector(to_array_1d(integrate_ode_rk45(fstar_ode, Z0, 0.001, {1.0}, theta, X_r, X_i)));
    }
}

model {
    mean_SI ~ normal(5.0, 10.0);
    sd_SI ~ cauchy(0, 5.0);

    e_raw ~ normal(0.5, 1.0);
    s_raw ~ normal(0.5, 1.0);

    target += gamma_lpdf(s - e | param1, param2) - log(Z);
}

generated quantities {
    vector[N] log_likelihood;
    for (k in 1:N) 
        log_likelihood[k] = gamma_lpdf(s[k] - e[k] | param1, param2) - log(Z[k]);
}" %>% cat(file=standirname %&% "/fit.stan", sep="", fill=TRUE)

# Location of the CmdStan checkout; the generated script `cd`s into it, so the
# path is resolved against the working directory R launches bash from.
standistribdir = "../../../../../CmdStan"
# Model directory as seen from inside the CmdStan checkout.
# NOTE(review): substring(standirname, 13) drops the first 12 characters of
# standirname, so the offset is tied to the current value of stanmaindir --
# confirm whenever stanmaindir changes.
stanscriptdir = "../Dropbox/" %&% substring(standirname,13)
## bash file
# The script builds the model with CmdStan's makefile, then starts 10 chains
# in the background (seeds 2..11), each writing trace-<i>.csv plus its
# diagnostics and console output under diagnostics/.
# `wait` blocks until every background chain has exited; without it the script
# (and therefore system() below) returned right after launching the chains,
# and "Finished sampling" was printed while they were still running.
"#!/bin/bash
cwd=$(pwd)
cd "%&%standistribdir%&%"
make -j6 "%&%stanscriptdir%&%"/fit
cd "%&%stanscriptdir%&%"
mkdir -p diagnostics
for i in {1..10}
do
    echo Running ${i}
    SEEDNUMBER=$((1+$i))
    ./fit \\
        method=sample num_samples=10000 num_warmup=10000 save_warmup=0 \\
            adapt delta=0.98 \\
            algorithm=hmc \\
                engine=nuts \\
        random seed=${SEEDNUMBER} \\
        id=$i \\
        data file=Data.R \\
        init=Init.R \\
        output file=trace-$i.csv \\
            diagnostic_file=diagnostics/diagnostics-$i.csv > diagnostics/output-$i.txt &
done
wait
echo Finished sampling haha!
" %>% cat(file=standirname%&%"/fit.sh", sep="", fill=TRUE)

## running the bash script
# intern = TRUE returns the script's stdout (make log and progress lines) as a
# character vector; the call now returns only after all chains have finished.
system("bash "%&%standirname%&%"/fit.sh", intern = TRUE)

''
'--- Translating Stan model to C++ code ---'
'bin/stanc --o=../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/gamma-truncated/fit.hpp ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/gamma-truncated/fit.stan'
'mpicxx -fvisibility-inlines-hidden -std=c++17 -fmessage-length=0 -march=nocona -mtune=haswell -ftree-vectorize -fPIC -fstack-protector-strong -fno-plt -O2 -ffunction-sections -pipe -isystem /home/aakhmetz/anaconda3/include -std=c++1y -D_REENTRANT -Wno-sign-compare -Wno-delete-non-virtual-dtor -I stan/lib/stan_math/lib/tbb_2019_U8/include -O3 -I src -I stan/src -I lib/rapidjson_1.1.0/ -I stan/lib/stan_math/ -I stan/lib/stan_math/lib/eigen_3.3.3 -I stan/lib/stan_math/lib/boost_1.72.0 -I stan/lib/stan_math/lib/sundials_5.2.0/include -DNDEBUG -D_FORTIFY_SOURCE=2 -O2 -isystem /home/aakhmetz/anaconda3/include -DBOOST_DISABLE_ASSERTS -DSTAN_MPI -c -MT ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/gamma-truncated/fit.o -MT ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/gamma-truncated/fit -include ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/gamma-truncated/fit.hpp -include src/cmdstan/main.cpp -MM -E -MG -MP -MF ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/gamma-truncated/fit.d ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/gamma-truncated/fit.hpp'
''
'--- Compiling, linking C++ code ---'
'mpicxx -fvisibility-inlines-hidden -std=c++17 -fmessage-length=0 -march=nocona -mtune=haswell -ftree-vectorize -fPIC -fstack-protector-strong -fno-plt -O2 -ffunction-sections -pipe -isystem /home/aakhmetz/anaconda3/include -std=c++1y -D_REENTRANT -Wno-sign-compare -Wno-delete-non-virtual-dtor -I stan/lib/stan_math/lib/tbb_2019_U8/include -O3 -I src -I stan/src -I lib/rapidjson_1.1.0/ -I stan/lib/stan_math/ -I stan/lib/stan_math/lib/eigen_3.3.3 -I stan/lib/stan_math/lib/boost_1.72.0 -I stan/lib/stan_math/lib/sundials_5.2.0/include -DNDEBUG -D_FORTIFY_SOURCE=2 -O2 -isystem /home/aakhmetz/anaconda3/include -DBOOST_DISABLE_ASSERTS -DSTAN_MPI -c -x c++ -o ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/gamma-truncated/fit.o ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/gamma-truncated/fit.hpp'
'mpicxx -fvisibility-inlines-hidden -std=c++17 -fmessage-length=0 -march=nocona -mtune=haswell -ftree-vectorize -fPIC -fstack-protector-strong -fno-plt -O2 -ffunction-sections -pipe -isystem /home/aakhmetz/anaconda3/include -std=c++1y -D_REENTRANT -Wno-sign-compare -Wno-delete-non-virtual-dtor -I stan/lib/stan_math/lib/tbb_2019_U8/include -O3 -I src -I stan/src -I lib/rapidjson_1.1.0/ -I stan/lib/stan_math/ -I stan/lib/stan_math/lib/eigen_3.3.3 -I stan/lib/stan_math/lib/boost_1.72.0 -I stan/lib/stan_math/lib/sundials_5.2.0/include -DNDEBUG -D_FORTIFY_SOURCE=2 -O2 -isystem /home/aakhmetz/anaconda3/include -DBOOST_DISABLE_ASSERTS -DSTAN_MPI -Wl,-O2 -Wl,--sort-common -Wl,--as-needed -Wl,-z,relro -Wl,-z,now -Wl,--disable-new-dtags -Wl,--gc-sections -Wl,-rpath,/home/aakhmetz/anaconda3/lib -Wl,-rpath-link,/home/aakhmetz/anaconda3/lib -L/home/aakhmetz/anaconda3/lib -Wl,-L,"/home/aakhmetz/CmdStan/stan/lib/stan_math/lib/boost_1.72.0/stage/lib" -Wl,-rpath,"/home/aakhmetz/CmdStan/stan/lib/stan_math/lib/boost_1.72.0/stage/lib" -Wl,-L,"/home/aakhmetz/CmdStan/stan/lib/stan_math/lib/tbb" -Wl,-rpath,"/home/aakhmetz/CmdStan/stan/lib/stan_math/lib/tbb" ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/gamma-truncated/fit.o src/cmdstan/main.o stan/lib/stan_math/lib/sundials_5.2.0/lib/libsundials_nvecserial.a stan/lib/stan_math/lib/sundials_5.2.0/lib/libsundials_cvodes.a stan/lib/stan_math/lib/sundials_5.2.0/lib/libsundials_idas.a stan/lib/stan_math/lib/sundials_5.2.0/lib/libsundials_kinsol.a stan/lib/stan_math/lib/boost_1.72.0/stage/lib/libboost_serialization.so stan/lib/stan_math/lib/boost_1.72.0/stage/lib/libboost_mpi.so stan/lib/stan_math/stan/math/prim/functor/mpi_cluster_inst.o stan/lib/stan_math/lib/tbb/libtbb.so.2 -o ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/gamma-truncated/fit'
'Running 1'
'Running 2'
'Running 3'
'Running 4'
'Running 5'
'Running 6'
'Running 7'
'Running 8'
'Running 9'
'Running 10'
'Finished sampling haha!'

Weibull distribution

In [86]:

## main dir for Stan simulations
# The directory is wiped and recreated so that trace/diagnostic files left by
# an earlier run cannot be mistaken for output of this one.
standirname = stanmaindir%&%"/weibull-truncated-2.23.0"
unlink(standirname, recursive=TRUE)
# recursive=TRUE: also create missing parent directories instead of failing
dir.create(standirname, recursive=TRUE)

# Dumping data
# stan_rdump() takes the *names* of R objects, so the variables below must be
# named exactly like the entries of the `data` block in the Stan program.
N = nrow(df)
E_L = df$EL
E_R = df$ER
S_L = df$SL
S_R = df$SR
# NOTE(review): r enters the Stan model only through exp(-r * ...) terms;
# presumably an exponential growth rate per day -- confirm against the paper.
r = 0.14
# tstar is the same number in every row (cutoff date minus t0, in days),
# so the first element is used as the scalar truncation time.
upper_bound = df$tstar[1]
stan_rdump(c('E_L', 'E_R', 'S_L', 'S_R', 'N', 'r', 'upper_bound'), file=standirname%&%"/Data.R")

# Dumping initial conditions
# Names must match the `parameters` block of the Stan program, which declares
# mean_SI, param1, e_raw and s_raw. The previous version dumped `logmean_SI`,
# which matches no parameter of this model, so mean_SI was never initialised
# from this file.
e_raw = rep(.2, N)
s_raw = rep(.8, N)
mean_SI = mean(df$dist)
param1 = 1.75
stan_rdump(c('e_raw', 's_raw', 'mean_SI', 'param1'), file=standirname%&%"/Init.R")

# Stan program
# The string below is written as-is to <standirname>/fit.stan.
#
# Model outline (Weibull-distributed serial interval, right-truncated):
#   * data: per-record bounds E_L..E_R (infector onset) and S_L..S_R (infectee
#     onset), the constant r and the truncation time upper_bound.
#   * parameters: mean_SI and param1 (first argument of weibull_lpdf), plus
#     e_raw / s_raw in [0, 1] which place the onset times inside their bounds:
#       s = S_L + (S_R - S_L) * s_raw
#       e = E_L + (min(E_R, s) - E_L) * e_raw   (so that e never exceeds s)
#   * param2 = mean_SI / tgamma(1 + 1/param1) is the second argument of
#     weibull_lpdf, chosen so that the distribution's mean equals mean_SI.
#   * fstar_ode is the right-hand side of an ODE in t whose k-th component is
#       (1 - exp(-((1 - t) * tstar[k] / param2)^param1))
#         * r * tstar[k] * exp(-r * tstar[k] * t)
#         / (1 - exp(-r * tstar[k] * t)),   with tstar[k] = upper_bound - e[k].
#     It is integrated with integrate_ode_rk45 from t = 0.01 to t = 1.0
#     starting at 0, with the extra arguments 1e-5, 1e-3, 5e2 passed as
#     solver controls; the result Z[k] is the per-record normalising term and
#     log(Z[k]) is subtracted from the Weibull log density.
#     NOTE(review): the lower limit is 0.01 rather than 0, presumably because
#     the denominator 1 - exp(-r * tstar * t) vanishes at t = 0 -- confirm.
#   * generated quantities: sd_SI derived from param1/param2, and the
#     per-record log_likelihood.
#   NOTE(review): the local `vector[N] s_;` in transformed parameters is
#   declared but never used.
"functions {
    real[] fstar_ode(real t, real[] z, real[] theta, data real[] x_r, int[] x_i) {
        int N = x_i[1]; // number of records

        real e[N] = theta[1:N];
        real param1 = theta[N+1];
        real param2 = theta[N+2];

        real upper_bound = x_r[1];
        real r = x_r[2];

        real dzdt[N];
        real tstar[N];

        for (k in 1:N) {
            tstar[k] = upper_bound - e[k];
            dzdt[k] = - expm1(-((1.0-t)*tstar[k]/param2)^param1) * r * tstar[k] * exp(-r*tstar[k]*t) / (1.0 - exp(-r*tstar[k]*t));
        }

        return dzdt;
    }
}

data {
    int<lower = 0> N; // number of records
    vector<lower = 0>[N] E_L;
    vector<lower = 0>[N] E_R;
    vector<lower = 0>[N] S_L;
    vector<lower = 0>[N] S_R;
    real<lower = 0> r;
    real<lower = 0> upper_bound;
}

transformed data {
    int X_i[1] = {N};

    real X_r[2] = {upper_bound, r};
}

parameters {
    real<lower = 0> mean_SI;
    real<lower = 0> param1;

    vector<lower = 0, upper = 1>[N] e_raw;
    vector<lower = 0, upper = 1>[N] s_raw;
}

transformed parameters {
    real<lower = 0> param2 = mean_SI/tgamma(1.0+1.0/param1);

    vector<lower = min(S_L), upper = max(S_R)>[N] s;
    vector<lower = min(E_L), upper = max(E_R)>[N] e;

    real Z[N]; 
    
    {
        vector[N] s_;
        real theta[N+2];
        real Z0[N];
        
        s = S_L + (S_R - S_L) .* s_raw;
        for (k in 1:N) 
            if (E_R[k] > s[k]) 
                e[k] = E_L[k] + (s[k] - E_L[k]) * e_raw[k];
            else
                e[k] = E_L[k] + (E_R[k] - E_L[k]) * e_raw[k];

        for (k in 1:N) {
            Z0[k] = 0.0;
            theta[k] = e[k];
        }
        theta[N+1] = param1;
        theta[N+2] = param2;

        Z = to_array_1d(integrate_ode_rk45(fstar_ode, Z0, 0.01, {1.0}, theta, X_r, X_i, 1e-5, 1e-3, 5e2));
    }
}

model {
    mean_SI ~ normal(5.0, 10.0);
    param1 ~ exponential(0.0001);

    e_raw ~ normal(0.5, 1.0);
    s_raw ~ normal(0.5, 1.0);

    for (k in 1:N) 
        target += weibull_lpdf(s[k] - e[k] | param1, param2) - log(Z[k]);
}

generated quantities {
    real sd_SI = param2*sqrt(tgamma(1.0+2.0/param1)-(tgamma(1.0+1.0/param1))^2);

    vector[N] log_likelihood;
    for (k in 1:N) 
        log_likelihood[k] = weibull_lpdf(s[k] - e[k] | param1, param2) - log(Z[k]);
}" %>% cat(file=standirname %&% "/fit.stan", sep="", fill=TRUE)

# Location of the CmdStan checkout; the generated script `cd`s into it, so the
# path is resolved against the working directory R launches bash from.
# NOTE(review): the trailing "#-2.22.1" looks like a version suffix that can be
# appended to the directory name -- confirm which CmdStan build is intended.
standistribdir = "../../../../../CmdStan" #-2.22.1
# Model directory as seen from inside the CmdStan checkout.
# NOTE(review): substring(standirname, 13) drops the first 12 characters of
# standirname, so the offset is tied to the current value of stanmaindir --
# confirm whenever stanmaindir changes.
stanscriptdir = "../Dropbox/" %&% substring(standirname,13)
## bash file
# The script builds the model with CmdStan's makefile, then starts 10 chains
# in the background (seeds 2..11), each writing trace-<i>.csv plus its
# diagnostics and console output under diagnostics/.
# `wait` blocks until every background chain has exited; without it the script
# (and therefore system() below) returned right after launching the chains,
# and "Finished sampling" was printed while they were still running.
"#!/bin/bash
cwd=$(pwd)
cd "%&%standistribdir%&%"
make -j6 "%&%stanscriptdir%&%"/fit
cd "%&%stanscriptdir%&%"
mkdir -p diagnostics
for i in {1..10}
do
    echo Running ${i}
    SEEDNUMBER=$((1+$i))
    ./fit \\
        method=sample num_samples=10000 num_warmup=10000 save_warmup=0 \\
            adapt delta=0.98 \\
            algorithm=hmc \\
                engine=nuts \\
        random seed=${SEEDNUMBER} \\
        id=$i \\
        data file=Data.R \\
        init=Init.R \\
        output file=trace-$i.csv \\
            diagnostic_file=diagnostics/diagnostics-$i.csv > diagnostics/output-$i.txt &
done
wait
echo Finished sampling haha!
" %>% cat(file=standirname%&%"/fit.sh", sep="", fill=TRUE)

## running the bash script
# intern = TRUE returns the script's stdout (make log and progress lines) as a
# character vector; the call now returns only after all chains have finished.
system("bash "%&%standirname%&%"/fit.sh", intern = TRUE)

''
'--- Translating Stan model to C++ code ---'
'bin/stanc --o=../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/weibull-truncated-2.23.0/fit.hpp ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/weibull-truncated-2.23.0/fit.stan'
'mpicxx -fvisibility-inlines-hidden -std=c++17 -fmessage-length=0 -march=nocona -mtune=haswell -ftree-vectorize -fPIC -fstack-protector-strong -fno-plt -O2 -ffunction-sections -pipe -isystem /home/aakhmetz/anaconda3/include -std=c++1y -D_REENTRANT -Wno-sign-compare -Wno-delete-non-virtual-dtor -I stan/lib/stan_math/lib/tbb_2019_U8/include -O3 -I src -I stan/src -I lib/rapidjson_1.1.0/ -I stan/lib/stan_math/ -I stan/lib/stan_math/lib/eigen_3.3.3 -I stan/lib/stan_math/lib/boost_1.72.0 -I stan/lib/stan_math/lib/sundials_5.2.0/include -DNDEBUG -D_FORTIFY_SOURCE=2 -O2 -isystem /home/aakhmetz/anaconda3/include -DBOOST_DISABLE_ASSERTS -DSTAN_MPI -c -MT ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/weibull-truncated-2.23.0/fit.o -MT ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/weibull-truncated-2.23.0/fit -include ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/weibull-truncated-2.23.0/fit.hpp -include src/cmdstan/main.cpp -MM -E -MG -MP -MF ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/weibull-truncated-2.23.0/fit.d ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/weibull-truncated-2.23.0/fit.hpp'
''
'--- Compiling, linking C++ code ---'
'mpicxx -fvisibility-inlines-hidden -std=c++17 -fmessage-length=0 -march=nocona -mtune=haswell -ftree-vectorize -fPIC -fstack-protector-strong -fno-plt -O2 -ffunction-sections -pipe -isystem /home/aakhmetz/anaconda3/include -std=c++1y -D_REENTRANT -Wno-sign-compare -Wno-delete-non-virtual-dtor -I stan/lib/stan_math/lib/tbb_2019_U8/include -O3 -I src -I stan/src -I lib/rapidjson_1.1.0/ -I stan/lib/stan_math/ -I stan/lib/stan_math/lib/eigen_3.3.3 -I stan/lib/stan_math/lib/boost_1.72.0 -I stan/lib/stan_math/lib/sundials_5.2.0/include -DNDEBUG -D_FORTIFY_SOURCE=2 -O2 -isystem /home/aakhmetz/anaconda3/include -DBOOST_DISABLE_ASSERTS -DSTAN_MPI -c -x c++ -o ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/weibull-truncated-2.23.0/fit.o ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/weibull-truncated-2.23.0/fit.hpp'
'mpicxx -fvisibility-inlines-hidden -std=c++17 -fmessage-length=0 -march=nocona -mtune=haswell -ftree-vectorize -fPIC -fstack-protector-strong -fno-plt -O2 -ffunction-sections -pipe -isystem /home/aakhmetz/anaconda3/include -std=c++1y -D_REENTRANT -Wno-sign-compare -Wno-delete-non-virtual-dtor -I stan/lib/stan_math/lib/tbb_2019_U8/include -O3 -I src -I stan/src -I lib/rapidjson_1.1.0/ -I stan/lib/stan_math/ -I stan/lib/stan_math/lib/eigen_3.3.3 -I stan/lib/stan_math/lib/boost_1.72.0 -I stan/lib/stan_math/lib/sundials_5.2.0/include -DNDEBUG -D_FORTIFY_SOURCE=2 -O2 -isystem /home/aakhmetz/anaconda3/include -DBOOST_DISABLE_ASSERTS -DSTAN_MPI -Wl,-O2 -Wl,--sort-common -Wl,--as-needed -Wl,-z,relro -Wl,-z,now -Wl,--disable-new-dtags -Wl,--gc-sections -Wl,-rpath,/home/aakhmetz/anaconda3/lib -Wl,-rpath-link,/home/aakhmetz/anaconda3/lib -L/home/aakhmetz/anaconda3/lib -Wl,-L,"/home/aakhmetz/CmdStan/stan/lib/stan_math/lib/boost_1.72.0/stage/lib" -Wl,-rpath,"/home/aakhmetz/CmdStan/stan/lib/stan_math/lib/boost_1.72.0/stage/lib" -Wl,-L,"/home/aakhmetz/CmdStan/stan/lib/stan_math/lib/tbb" -Wl,-rpath,"/home/aakhmetz/CmdStan/stan/lib/stan_math/lib/tbb" ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/weibull-truncated-2.23.0/fit.o src/cmdstan/main.o stan/lib/stan_math/lib/sundials_5.2.0/lib/libsundials_nvecserial.a stan/lib/stan_math/lib/sundials_5.2.0/lib/libsundials_cvodes.a stan/lib/stan_math/lib/sundials_5.2.0/lib/libsundials_idas.a stan/lib/stan_math/lib/sundials_5.2.0/lib/libsundials_kinsol.a stan/lib/stan_math/lib/boost_1.72.0/stage/lib/libboost_serialization.so stan/lib/stan_math/lib/boost_1.72.0/stage/lib/libboost_mpi.so stan/lib/stan_math/stan/math/prim/functor/mpi_cluster_inst.o stan/lib/stan_math/lib/tbb/libtbb.so.2 -o ../Dropbox/Hokkaido_Backup/Wuhan_Serial_interval_2020/certain/weibull-truncated-2.23.0/fit'
'Running 1'
'Running 2'
'Running 3'
'Running 4'
'Running 5'
'Running 6'
'Running 7'
'Running 8'
'Running 9'
'Running 10'
'Finished sampling haha!'

In [ ]: