stan-dev
diff --git a/‎2018/Contributed-Talks/11_bales/Slides.pdf
2.93 MB b/‎2018/Contributed-Talks/11_bales/Slides.pdf
2.93 MB
diff --git a/‎2018/Contributed-Talks/17_crespo/RmarkdownFaustoCrespo.Rmd
+1,318 b/‎2018/Contributed-Talks/17_crespo/RmarkdownFaustoCrespo.Rmd
+1,318
diff --git a/‎2018/Contributed-Talks/17_crespo/sismos.csv
+855 b/‎2018/Contributed-Talks/17_crespo/sismos.csv
+855
diff --git a/‎2018/Invited-Talks/RabeHesketh_Furr/RH&Furr_StanCon2018_Part2.html
+277 b/‎2018/Invited-Talks/RabeHesketh_Furr/RH&Furr_StanCon2018_Part2.html
+277
diff --git a/‎2018/Invited-Talks/RabeHesketh_Furr/RabeHesketh&Furr_StanCon2018_4pp.pdf
113 KB b/‎2018/Invited-Talks/RabeHesketh_Furr/RabeHesketh&Furr_StanCon2018_4pp.pdf
113 KB
diff --git a/‎2018/Invited-Talks/RabeHesketh_Furr/RabeHesketh&Furr_StanCon2018_Slides.pdf
249 KB b/‎2018/Invited-Talks/RabeHesketh_Furr/RabeHesketh&Furr_StanCon2018_Slides.pdf
249 KB
diff --git a/‎2018/Invited-Talks/RabeHesketh_Furr/example_irt_analysis.R
+156 b/‎2018/Invited-Talks/RabeHesketh_Furr/example_irt_analysis.R
+156
diff --git a/‎2018/Invited-Talks/RabeHesketh_Furr/rasch_edstan_modified.stan
+71 b/‎2018/Invited-Talks/RabeHesketh_Furr/rasch_edstan_modified.stan
+71
diff --git a/‎2018/Invited-Talks/Weiss.pdf
6.83 MB b/‎2018/Invited-Talks/Weiss.pdf
6.83 MB
@@ -0,0 +1,156 @@
+# Set up -----------------------------------------------------------------------
+
+library(rstan)       # stan(), extract()
+library(edstan)      # irt_data() and the aggression data used below
+library(loo)         # waic(), loo()
+library(reshape2)    # NOTE(review): not referenced in the code visible here
+library(doParallel)  # registerDoParallel(); makeCluster() comes via parallel
+options(mc.cores = 5)   # number of cores made available to rstan
+options(loo.cores = 5)  # number of cores made available to loo
+
+
+# Functions --------------------------------------------------------------------
+
+# Posterior means of all model parameters, returned as a named list with the
+# same layout as rstan::extract() so that it can be indexed like a single draw.
+# stan_fit: A fitted Stan model
+better_posterior_means <- function(stan_fit) {
+  # Collapse the leading (iteration) dimension of one parameter's draws.
+  # One-dimensional draws become a plain scalar mean; anything else keeps a
+  # leading dimension of length one in front of the parameter's own dimensions.
+  average_over_draws <- function(par_draws) {
+    shape <- dim(par_draws)
+    if (length(shape) == 1) {
+      return(mean(par_draws))
+    }
+    kept_margins <- 2:length(shape)
+    array(apply(par_draws, kept_margins, mean), dim = c(1, shape[-1]))
+  }
+  lapply(extract(stan_fit, stan_fit@model_pars), average_over_draws)
+}
+
+
+# Function to obtain marginal log-likelihoods with parallel processing.
+# The residual named by resid_name is integrated out of each cluster's
+# likelihood by adaptive Gauss-Hermite quadrature. Iterations are distributed
+# with foreach's %dopar%, so register a parallel backend before calling.
+# stan_fit: Fitted Stan model
+# data_list: Data list used in fitting model
+# MFUN: Function to calculate marginal likelihood for cluster at a node
+#   location. This is application specific. It is called as
+#   MFUN(node, r = , iter = , data_list = , draws = ) and must return a single
+#   numeric log-likelihood value.
+# resid_name: Name of residual in Stan program to integrate out
+# sd_name: Name of SD for residual in Stan program
+# n_nodes: Number of adaptive quadrature nodes to use
+# best_only: Whether to evaluate marginal likelihood only at posterior means
+# Returns: if best_only, a vector with one marginal log-likelihood per cluster
+#   evaluated at the posterior means; otherwise a list with ll (an
+#   iterations x clusters matrix) and best_ll (the vector just described).
+mll_parallel <- function(stan_fit, data_list, MFUN, resid_name, sd_name, n_nodes,
+                         best_only = FALSE) {
+
+  library(foreach)
+  library(statmod)       # For gauss.quad.prob()
+  library(matrixStats)   # For logSumExp()
+
+  draws <- extract(stan_fit, stan_fit@model_pars)
+  n_iter <- if (best_only) 0 else nrow(draws$lp__)
+  post_means <- better_posterior_means(stan_fit)
+
+  # Posterior mean and SD of each cluster's residual. These centre and scale
+  # the quadrature nodes for that cluster (the "adaptive" part).
+  resid <- apply(draws[[resid_name]], 2, mean)
+  stddev <- apply(draws[[resid_name]], 2, sd)
+  n_clusters <- ncol(draws[[resid_name]])
+
+  # Get standard quadrature points
+  std_quad <- gauss.quad.prob(n_nodes, "normal", mu = 0, sigma = 1)
+  std_log_weights <- log(std_quad$weights)
+
+  # Extra iteration is to evaluate marginal log-likelihood at parameter means.
+  ll <- foreach(i = seq_len(n_iter + 1), .combine = rbind,
+                .packages = "matrixStats") %dopar% {
+
+    # Iterations 1..n_iter use the i-th posterior draw; the final iteration
+    # uses the posterior means, which are laid out like a single draw.
+    at_means <- i > n_iter
+    draws_i <- if (at_means) post_means else draws
+    iter_i <- if (at_means) 1 else i
+
+    # SD of the residual distribution; it does not depend on the cluster.
+    sd_i <- draws_i[[sd_name]][iter_i]
+
+    ll_j <- matrix(NA_real_, nrow = 1, ncol = n_clusters)
+
+    for (j in seq_len(n_clusters)) {
+
+      # Shift and scale the standard nodes, then correct the weights for the
+      # change of variables and add the log density of the residual.
+      adapt_nodes <- resid[j] + stddev[j] * std_quad$nodes
+      log_weights <- log(sqrt(2*pi)) + log(stddev[j]) + std_quad$nodes^2/2 +
+        dnorm(adapt_nodes, sd = sd_i, log = TRUE) + std_log_weights
+
+      # vapply() enforces that MFUN returns one number per node.
+      loglik_by_node <- vapply(adapt_nodes, FUN = MFUN, FUN.VALUE = numeric(1),
+                               r = j, iter = iter_i, data_list = data_list,
+                               draws = draws_i)
+      ll_j[1, j] <- logSumExp(loglik_by_node + log_weights)
+
+    }
+
+    ll_j
+
+  }
+
+  # The last row always holds the evaluation at the posterior means.
+  best_ll <- ll[nrow(ll), ]
+  if (best_only) {
+    return(best_ll)
+  }
+
+  # drop = FALSE keeps ll a matrix even with a single draw or a single cluster.
+  list(ll = ll[-nrow(ll), , drop = FALSE], best_ll = best_ll)
+
+}
+
+
+# Log-likelihood of one cluster's responses at a single adaptive quadrature
+# node, for the IRT example. Other applications would supply their own
+# function with the same arguments to mll_parallel().
+# node: node location
+# r: index for cluster
+# iter: mcmc iteration
+# data_list: data used to fit Stan model
+# draws: mcmc draws from fitted Stan model
+f_marginal <- function(node, r, iter, data_list, draws) {
+  # Observations that belong to cluster r
+  in_cluster <- data_list$jj == r
+  item_params <- draws$delta[iter, data_list$ii[in_cluster]]
+  # The node stands in for the cluster's residual
+  linear_pred <- draws$theta_fix[iter, r] + node - item_params
+  prob <- boot::inv.logit(linear_pred)
+  sum(dbinom(data_list$y[in_cluster], 1, prob, log = TRUE))
+}
+
+
+# Deviance information criterion from marginal log-likelihoods.
+# ll_obj: Object returned by mll_parallel()
+# Returns a named vector: elpd_dic, p_dic, dic, best_lpd and mean_lpd.
+dic <- function(ll_obj) {
+  # Total log-likelihood for each row of ll, and its average over rows
+  lpd_by_iter <- rowSums(ll_obj$ll)
+  mean_lpd <- mean(lpd_by_iter)
+  # Total log-likelihood at the posterior means
+  best_lpd <- sum(ll_obj$best_ll)
+  # Effective number of parameters
+  p_dic <- 2 * (best_lpd - mean_lpd)
+  elpd_dic <- best_lpd - p_dic
+  c(elpd_dic = elpd_dic, p_dic = p_dic, dic = -2 * elpd_dic,
+    best_lpd = best_lpd, mean_lpd = mean_lpd)
+}
+
+
+# Example analysis -------------------------------------------------------------
+
+# Build the data list for the Stan program from the aggression data
+dl <- irt_data(
+  y = aggression$dich,
+  jj = aggression$person,
+  ii = aggression$item,
+  covariates = aggression,
+  formula = ~ 1 + male + anger
+)
+
+# Fit the model with 5 chains of 500 iterations each
+fit <- stan(file = "rasch_edstan_modified.stan", data = dl, chains = 5,
+            iter = 500)
+
+# Marginal log-likelihoods: integrate out "zeta" (whose SD is "sigma") with
+# 11 quadrature nodes, spreading the work over a 5-worker cluster
+cl <- makeCluster(5)
+registerDoParallel(cl)
+ll_marg <- mll_parallel(stan_fit = fit, data_list = dl, MFUN = f_marginal,
+                        resid_name = "zeta", sd_name = "sigma", n_nodes = 11)
+stopCluster(cl)
+
+# Marginal information criteria
+dic(ll_marg)
+waic(ll_marg$ll)
+loo(ll_marg$ll)
+
+
@@ -0,0 +1,71 @@
+functions {
+  // Centering and scaling values for the columns of a covariate matrix.
+  //   W: covariate matrix with one row per unit and one column per covariate.
+  // Returns a 2 x cols(W) matrix: row 1 is the value to subtract from each
+  // column, row 2 the value to divide by. Column 1 is left unadjusted
+  // (centre 0, scale 1). Every other column is centred at its mean and scaled
+  // by its range if it takes only two values, or by twice its SD otherwise.
+  matrix obtain_adjustments(matrix W) {
+    real min_w;
+    real max_w;
+    int minmax_count;
+    matrix[2, cols(W)] adj;
+    adj[1, 1] = 0;
+    adj[2, 1] = 1;
+    if(cols(W) > 1) {
+      for(k in 2:cols(W)) {                       // remaining columns
+        min_w = min(W[1:rows(W), k]);
+        max_w = max(W[1:rows(W), k]);
+        // Count the entries equal to the column minimum or maximum. The
+        // parentheses are required: + binds tighter than == and ||, so
+        // without them the running count is overwritten with 0 or 1.
+        minmax_count = 0;
+        for(j in 1:rows(W))
+          minmax_count = minmax_count + (W[j,k] == min_w || W[j,k] == max_w);
+        adj[1, k] = mean(W[1:rows(W), k]);
+        if(minmax_count == rows(W)) {       // if column takes only 2 values
+          adj[2, k] = (max_w - min_w);
+        } else {                            // if column takes > 2 values
+          adj[2, k] = sd(W[1:rows(W), k]) * 2;
+        }
+      }
+    }
+    return adj;
+  }
+}
+data {                          // values supplied by the caller
+  int<lower=1> I;               // # questions
+  int<lower=1> J;               // # persons
+  int<lower=1> N;               // # observations
+  int<lower=1, upper=I> ii[N];  // question index for observation n
+  int<lower=1, upper=J> jj[N];  // person index for observation n
+  int<lower=0, upper=1> y[N];   // correctness for observation n (0 or 1)
+  int<lower=1> K;               // # person covariates (columns of W)
+  matrix[J,K] W;                // person covariate matrix, one row per person
+}
+transformed data {
+  matrix[2,K] adj;     // row 1: centering value, row 2: scaling value, per covariate
+  matrix[J,K] W_adj;   // covariates after centering and scaling
+  adj = obtain_adjustments(W);
+  // Adjust one whole column at a time
+  for (k in 1:K)
+    W_adj[1:J, k] = (W[1:J, k] - adj[1, k]) / adj[2, k];
+}
+parameters {
+  vector[I-1] delta_free;   // first I-1 elements of delta; the last is derived
+  vector[J] theta;          // one parameter per person
+  real<lower=0> sigma;      // SD of theta around W_adj*lambda_adj
+  vector[K] lambda_adj;     // coefficients on the adjusted covariates W_adj
+}
+transformed parameters {
+  vector[I] delta;
+  // The final element is fixed so that the elements of delta sum to zero;
+  // the rest are the free parameters.
+  delta[I] = -sum(delta_free);
+  delta[1:(I - 1)] = delta_free;
+}
+model {
+  target += normal_lpdf(delta | 0, 3);          // normal(0, 3) prior on every element of delta
+  theta ~ normal(W_adj*lambda_adj, sigma);      // regression of theta on the adjusted covariates
+  lambda_adj ~ student_t(3, 0, 1);              // prior on the adjusted-scale coefficients
+  sigma ~ exponential(.1);                      // prior on the SD of theta
+  y ~ bernoulli_logit(theta[jj] - delta[ii]);   // logit of P(y = 1) is theta[person] - delta[question]
+}
+generated quantities {
+  vector[K] lambda;      // coefficients for the unadjusted covariates W
+  vector[J] theta_fix;   // part of theta predicted from the covariates
+  vector[J] zeta;        // remainder of theta after removing theta_fix
+  theta_fix = W_adj * lambda_adj;
+  zeta = theta - theta_fix;
+  // Undo the scaling for every coefficient after the first
+  lambda[2:K] = lambda_adj[2:K] ./ adj[2, 2:K]';
+  // First coefficient: difference between the first row's prediction on the
+  // adjusted scale and the contribution of its remaining unadjusted covariates
+  // (presumably W[, 1] is a constant 1 -- confirm against the caller)
+  lambda[1] = W_adj[1] * lambda_adj - W[1, 2:K] * lambda[2:K];
+}