├── DESCRIPTION
├── NAMESPACE
├── R
    ├── boot2lme.R
    ├── svy2lme.R
    ├── svy2relmat.R
    └── svylmeNG.R
├── README.md
├── THANKS
├── data
    ├── milk_subset.rda
    ├── nzmaths.rda
    └── pisa.rda
├── inst
    ├── COPYRIGHTS
    └── scripts
    │   ├── README
    │   ├── milk-sampling.R
    │   ├── pairwise-milk.R
    │   ├── pisa-analysis.R
    │   ├── svy2lmesim2.R
    │   ├── twins-pairwise.R
    │   └── twins-sampling.R
└── man
    ├── boot2lme.Rd
    ├── milk_subset.Rd
    ├── nzmaths.Rd
    ├── pisa.Rd
    ├── svy2lme.Rd
    └── svy2relmer.Rd


/DESCRIPTION:
--------------------------------------------------------------------------------
 1 | Package: svylme
 2 | Title: Linear Mixed Models for Complex Survey Data
 3 | Version: 1.5-2
 4 | Authors@R: person("Thomas", "Lumley", email = "t.lumley@auckland.ac.nz",
 5 |   role = c("aut", "cre"))
 6 | Description: Linear mixed models for complex survey data, by pairwise composite likelihood, as described in Lumley & Huang (2023) <arXiv:2311.13048>. Supports nested and crossed random effects, and correlated random effects as in genetic models.  Allows for multistage sampling and for other designs where pairwise sampling probabilities are specified or can be calculated. 
 7 | Imports: minqa, Matrix, lme4, methods, utils, stats
 8 | Depends: survey, R (>= 3.5.0)
 9 | License: GPL-3
10 | Maintainer: Thomas Lumley <t.lumley@auckland.ac.nz>
11 | 
12 | 


--------------------------------------------------------------------------------
/NAMESPACE:
--------------------------------------------------------------------------------
 1 | import(Matrix)
 2 | import(methods)
 3 | import(minqa)
 4 | import(survey)
 5 | import(lme4)
 6 | importFrom(utils,setTxtProgressBar)
 7 | importFrom(utils,txtProgressBar)
 8 | importFrom("stats", "ave", "model.frame", "pnorm", "weights")
 9 | importFrom("stats", "printCoefmat")
10 | importFrom("stats", "vcov")
11 | export(svy2lme,svy2relmer)
12 | export(boot2lme)
13 | 
14 | S3method(print,svy2lme)
15 | S3method(print, boot2lme)
16 | 
17 | S3method(coef,svy2lme)
18 | 
19 | S3method(vcov,svy2lme)
20 | S3method(vcov,boot2lme)
21 | 
22 | 
23 | 


--------------------------------------------------------------------------------
/R/boot2lme.R:
--------------------------------------------------------------------------------
  1 | 
  2 | boot2lme<-function(model, rdesign, verbose=FALSE){
  3 | 
  4 |     if(is.null(model$devfun)) stop("model must be fitted with return.devfun=TRUE")
  5 |     
  6 |     naa<-environment(model$devfun)$naa
  7 |     if (!is.null(naa)){
  8 |         if (length(environment(model$devfun)$y)+length(naa) == NROW(rdesign))
  9 |             rdesign<-rdesign[-naa,,drop=FALSE]
 10 |         if(verbose) warning(paste(length(naa),"observations dropped because of missing values"))
 11 |         }
 12 |     if (length(environment(model$devfun)$y) != NROW(rdesign)){
 13 |         stop("number of rows of design does not match model")
 14 |     }
 15 | 
 16 |     basewts<-weights(rdesign, "sampling")
 17 |     replicates<-weights(rdesign, "analysis")
 18 |     scale<-rdesign$scale
 19 |     rscales<-rdesign$rscales
 20 | 
 21 |      
 22 |     nrep<-ncol(replicates)
 23 |     pwt0<-if (model$method=="nested") get("pwts",environment(model$devfun)) else get("pwt",environment(model$devfun))
 24 |     if (is.null(rscales)) rscales<-rep(1,nrep)
 25 | 
 26 |     ii<-get("ii", environment(model$devfun))
 27 |     jj<-get("jj", environment(model$devfun))  
 28 |     repwt<-(replicates/basewts)[ii,]
 29 |     repwtj<-(replicates/basewts)[jj,]
 30 |     if ((model$method=="nested") && (any(abs((repwt-repwtj)/(1+repwt+repwtj))>1e-5)))
 31 |         warning("replicate weights vary within cluster")
 32 |     else {
 33 |         repwt<-repwt*repwtj
 34 |     }
 35 |     
 36 |     theta0<-model$opt$par
 37 |     thetastar<-matrix(nrow=nrep,ncol=length(theta0))
 38 |     betastar<-matrix(nrow=nrep,ncol=length(model$beta))
 39 |     s2star<-numeric(nrep)
 40 | 
 41 |     D<-get("L",environment(model$devfun))
 42 |     Dstar<-array(0,c(nrep,NROW(D),NCOL(D)))
 43 |     
 44 |     if (verbose) pb<-txtProgressBar(min = 0, max = nrep, style = 3)
 45 | 
 46 |     for(i in 1:nrep){
 47 |         if (verbose) setTxtProgressBar(pb, i)
 48 |         if (model$method=="nested"){
 49 |         thetastar[i,]<-bobyqa(theta0, model$devfun,
 50 |                               lower = model$lower,
 51 |                               upper = rep(Inf, length(theta0)), pwt=repwt[,i]*pwt0)$par
 52 |         } else { ## need to pass in univariate weights as well, for all.pairs. 
 53 |             thetastar[i,]<-bobyqa(theta0, model$devfun,
 54 |                               lower = model$lower,
 55 |                               upper = rep(Inf, length(theta0)),
 56 |                               pwt_new=repwt[,i]*pwt0,
 57 |                               pw_uni_new=weights(rdesign,"analysis")[,i],
 58 |                               subtract_margins=model$subtract.margins)$par
 59 |          }
 60 |         betastar[i,]<-get("beta",environment(model$devfun))
 61 |         s2star[i]<-get("s2",environment(model$devfun))
 62 |         Dstar[i,,]<-get("L",environment(model$devfun))
 63 |     }
 64 | 
 65 |     if(verbose) close(pb)
 66 |     
 67 |     rval<-list(theta=thetastar, beta=betastar, s2=s2star, D=Dstar,scale=scale, rscales=rscales, formula=model$formula)
 68 | 
 69 |     class(rval)<-"boot2lme"
 70 |     rval   
 71 | }
 72 | 
 73 | print.boot2lme<-function(x,...){
 74 |     cat("boot2lme:",length(x$s2),"replicates from", deparse(x$formula))
 75 |     invisible(x)
 76 | }
 77 | 
 78 | vcov.boot2lme<-function(object, parameter=c("beta","theta","s2","relSD","SD","relVar","fullVar"),...){
 79 |     parameter<-match.arg(parameter)
 80 | 
 81 |     nthetas<-NCOL(object$theta)
 82 | 
 83 |     if (nthetas==1){
 84 |            V<-switch(parameter,
 85 |                       beta=svrVar(object$beta, object$scale,object$rscales),
 86 |                       theta=svrVar(object$theta, object$scale,object$rscales),
 87 |                       s2=svrVar(object$s2, object$scale, object$rscales),
 88 |                       relSD=svrVar(sqrt((apply(object$D,1, diag))), object$scale, object$rscales), ##FIXME: dimension decay when there's just one random effect
 89 |                       SD=svrVar(sqrt((apply(object$D,1, diag))*object$s2), object$scale, object$rscales),
 90 |                       relVar=svrVar((apply(object$D,1,c)), object$scale, object$rscales),
 91 |                       fullVar=svrVar((apply(object$D,1,c))*object$s2, object$scale, object$rscales)
 92 |                       )
 93 | 
 94 |         } else {
 95 |             V<-switch(parameter,
 96 |                       beta=svrVar(object$beta, object$scale,object$rscales),
 97 |                       theta=svrVar(object$theta, object$scale,object$rscales),
 98 |                       s2=svrVar(object$s2, object$scale, object$rscales),
 99 |                       relSD=svrVar(sqrt(t(apply(object$D,1, diag))), object$scale, object$rscales), ##FIXME: dimension decay when there's just one random effect
100 |                       SD=svrVar(sqrt(t(apply(object$D,1, diag))*object$s2), object$scale, object$rscales),
101 |                       relVar=svrVar(t(apply(object$D,1,c)), object$scale, object$rscales),
102 |                       fullVar=svrVar(t(apply(object$D,1,c))*object$s2, object$scale, object$rscales)
103 |                       )
104 |     }
105 | 
106 |     as.matrix(V)
107 | 
108 |     }
109 | 


--------------------------------------------------------------------------------
/R/svy2lme.R:
--------------------------------------------------------------------------------
  1 | ## like all.equal only specialised to matrices and returns logical
  2 | is_close<-function(a,b, tolerance=1e-5){
  3 |     all(abs((as.matrix(a)-as.matrix(b))/(as.matrix(a)+as.matrix(b)))<tolerance)
  4 | }
  5 | 
  6 | 
  7 | ## safe devision
  8 | "%//%"<-function(e1,e2) ifelse(e1==0,0, e1/e2)
  9 | 
 10 | 
 11 | 
 12 | ## For nested sampling: assumes PSUs are not correlated and so a
 13 | ## pair can't have observations from two PSUs
 14 | ## $first are marginal PSU weights
 15 | ## $cond are conditional pairwise weights given that the PSU is selected
 16 | ## $all are the full pairwise weights
 17 | ## first and cond are needed for the sandwich estimator, not for the
 18 | ##   pairwise likelihood itself
 19 | pi_from_design<-function(design, ii,jj){
 20 | 
 21 |     if (design$pps && !is.null(design$dcheck)){
 22 |         ## We have pairwise probabilities already. Or, at least, covariances
 23 |         Deltacheck<-design$dcheck[ii,jj]
 24 |         indep<-design$prob[ii]*design$prob[jj]
 25 |         pi_ij<-(Deltacheck+1)*indep
 26 | 
 27 |         last<-ncol(design$allprob)
 28 |         n<-design$fpc$sampsize
 29 |         N<-design$fpc$popsize
 30 | 
 31 |         ## But sandwich standard errors would require fourth-order probabilities
 32 |         return(list(full=pi_ij,
 33 |                     first=NULL,
 34 |                     cond=NULL))
 35 |         }
 36 |     
 37 |     if (NCOL(design$allprob)==1){
 38 |         ## No multistage weights
 39 |         if (NCOL(design$cluster)>1)
 40 |             stop("you need weights/probabilities for each stage of sampling")
 41 |         
 42 |         if (NCOL(design$cluster)==1 && !any(duplicated(design$cluster))){
 43 |             ## ok, element sampling
 44 |             if(is.null(design$fpc$popsize)) #with replacement
 45 |                 return(list(full=design$prob[ii]*design$prob[jj],
 46 |                        first=design$prob[ii],
 47 |                        cond=rep(1,length(ii))))
 48 |             else if(is_close(as.vector(design$allprob),
 49 |                               as.vector(design$fpc$sampsize/design$fpc$popsize),tolerance=1e-4)){
 50 |                 # srs, possibly stratified
 51 |                 n<-design$fpc$sampsize
 52 |                 N<-design$fpc$popsize
 53 |                 return(list(full= n[ii]*(n[jj]-1)%//%( N[ii]*(N[jj]-1)),
 54 |                             first=n[ii]/N[ii],
 55 |                             cond=rep(1,length(ii))))
 56 |             } else {
 57 |                 ## Hajek high entropy: based on Brewer p153, equation 9.14
 58 |                 pi<-design$allprob
 59 |                 denom<-ave(1-pi, design$strata,FUN=sum)
 60 |                 samestrata<-(design$strata[ii]==design$strata[jj])
 61 |                 return(list(full=pi[ii]*pi[jj]*(1- ifelse(samestrata, (1-pi[ii])*(1-pi[jj])/denom, 0)),
 62 |                             first=pi[ii],
 63 |                             cond=rep(1,length(ii))))
 64 |             }
 65 |         } else if (all(by(design$prob, design$cluster[,1], function(x) length(unique(x)))==1)) {
 66 |             ## possibly ok, sampling of whole clusters
 67 |             warning("assuming no subsampling within clusters because multi-stage weights were not given")
 68 |              if(is.null(design$fpc$popsize)) #with replacement
 69 |                  return(list(full=design$prob[ii],
 70 |                              first=design$prob[ii],
 71 |                              cond=rep(1, length(ii))))
 72 |             else if(is_close(as.vector(design$allprob[[1]]),
 73 |                               as.vector(design$fpc$sampsize/design$fpc$popsize),tolerance=1e-4)){
 74 |                 # srs, possibly stratified
 75 |                 n<-design$fpc$sampsize
 76 |                 N<-design$fpc$popsize
 77 |                 return(list(full= (n[ii]/N[ii]),
 78 |                             first=n[ii]/N[ii],
 79 |                             cond=rep(1,length(ii))))
 80 |             } else {
 81 |                 ## Hajek high entropy: based on Brewer p153, equation 9.14
 82 |                 pi<-design$allprob
 83 |                 denom<-ave(1-pi, design$strata,FUN=sum)
 84 |                 samestrata<-(design$strata[ii,1]==design$strata[jj,1])
 85 |                 return(list(full=pi[ii,1],
 86 |                             first=pi[ii,1],
 87 |                             cond=rep(1,length(ii))))
 88 |             }
 89 |         } else {
 90 |             ## not ok
 91 |             stop("you need weights/probabilities for each stage of sampling")
 92 |         }       
 93 |     }
 94 | 
 95 |     ## If we're here, we have multistage weights
 96 |     if (ncol(design$allprob)!=ncol(design$cluster)){
 97 |         ## ? can't happen
 98 |         stop("number of stages of sampling does not match number of stages of weights")
 99 |     }
100 | 
101 |     if(is.null(design$fpc$popsize)){ #with replacement
102 |         last<-ncol(design$allprob)
103 |         return(list(full=design$prob[ii]*design$allprob[jj,last],
104 |                     first=apply(design$allprob[ii,-last, drop=FALSE], 1, prod),
105 |                     cond=design$allprob[ii,last]*design$allprob[jj,last]))
106 |     }
107 |     if(all.equal(as.matrix(design$allprob), as.matrix(design$fpc$sampsize/design$fpc$popsize),tolerance=1e-4)){
108 |         ## multistage stratified random sampling
109 |         last<-ncol(design$allprob)
110 |         n<-design$fpc$sampsize
111 |         N<-design$fpc$popsize
112 |         samestrata<-(design$strata[ii, ]==design$strata[jj, ])
113 |         pstages <-(n[ii,]/N[ii,])*(samestrata*((n[jj,]-1)%//%(N[jj,]-1)) + (1-samestrata)*(n[jj,]/N[jj,]))  ##FIXME divide by  zero when N==1
114 |         return(list(full=apply((n[ii,]/N[ii,])[,-last,drop=FALSE],1,prod)*pstages[,last],
115 |                     first=apply((n[ii,]/N[ii,])[,-last,drop=FALSE],1,prod),
116 |                     cond=pstages[,last]))
117 |     }
118 | 
119 |     ## Hajek high entropy: Brewer p153
120 |     first<-cpwt<-rep_len(1,length(ii))
121 |     for (i in 1:ncol(design$allprob)){
122 |         pi<-design$allprob[,i]
123 |         denom<-ave(1-pi, design$strata[,i],FUN=sum)
124 |         samestrata<-(design$strata[ii,i]==design$strata[jj,i])
125 |         if (i==ncol(design$allprob))
126 |             cpwt<-cpwt*pi[ii]*pi[jj]*(1- ifelse(samestrata, (1-pi[ii])*(1-pi[jj])/denom, 0))
127 |         else
128 |             first<-first*pi[ii]
129 |     }
130 |     return(list(full=first*cpwt, first= first, cond=cpwt))
131 | 
132 | }
133 | 
## Enumerate every pair of observations (first < second) that share a value
## of the grouping vector gp.
##
##   gp      grouping vector, one entry per observation
##   TOOBIG  with fewer observations than this the pairs are read off a dense
##           n x n comparison matrix; otherwise they are built group by group
##
## Returns a two-column object holding the first and second member of each
## pair: the index matrix from which(arr.ind=TRUE) on the dense path, a data
## frame with columns i and j otherwise.
getpairs<-function(gp, TOOBIG=1000){
    nobs<-length(gp)

    if (nobs < TOOBIG){
        same<-outer(gp,gp,"==")
        return(which(same & upper.tri(same),arr.ind=TRUE))
    }

    ## second member: each observation repeated once per member of its group
    groupsize<-ave(1:nobs, gp, FUN=length)
    second<-rep(1:nobs,groupsize)
    ## first member: within each group's slots, the members of that group,
    ## recycled by the assignment across the repeats
    first<-numeric(length(second))
    for (g in unique(gp)){
        members<-which(gp==g)
        first[which(gp[second]==g)]<-members
        }
    keep<-first<second
    data.frame(i=first[keep],j=second[keep])
    }
151 | 
## Fit a linear mixed model with nested random effects by weighted pairwise
## composite likelihood.
##
## Arguments:
##   formula        lme4-style model formula, passed to lme4::lmer()
##   design         survey design; model.frame(design) supplies the data and
##                  pi_from_design() turns it into pairwise probabilities
##   sterr          compute the variance matrix of the fixed effects?
##   return.devfun  also return the profile deviance function and the lower
##                  bounds for theta (boot2lme() needs them)
##
## Value: list of class "svy2lme" with components opt (the bobyqa() result),
##   s2, beta, Vbeta, formula, znames, L and method="nested"; plus devfun and
##   lower when return.devfun=TRUE.
##
## Note: devfun() updates beta, s2 and L in this function's frame with `<<-`;
## boot2lme() reads them (and ii, jj, pwts, y, naa) back from
## environment(devfun), so these local names are part of the interface.
svy2lme_nested<-function(formula,design,sterr=TRUE, return.devfun=FALSE){

    data<-model.frame(design)

    ## Use unweighted model to get starting values and set up variables
    m0<-lme4::lmer(formula,data,REML=FALSE)

    ## remove missing from design
    if (!is.null(naa<-attr(m0@frame,"na.action"))){
        design<-design[-naa,]
    }


    ## Extract variables
    y<-m0@resp$y
    X<-m0@pp$X

    ## cluster indicator (only the first grouping factor is used)
    g<-m0@flist[[1]]
    if (sterr){
        ll<-NCOL(design$cluster)
        gpsu<-g[!duplicated(design$cluster[,ll-1])]
        if(any(duplicated(gpsu))){
            stop("model clusters must be nested in design clusters")
        }
    }

    ## number of clusters
    n1<-length(unique(g))
    ## number of random effects
    qis<-sapply(m0@cnms,length)
    q<-sum(qis)
    n<-NROW(X)

    ## Z in lme4::lmer has separate columns for each cluster; restructure it
    Z<-matrix(nrow=n, ncol=sum(qis))
    pos<-0
    npos<-0
    for(qi in qis){
        Z[,pos+(1:qi)]<-as.matrix(crossprod(m0@pp$Zt[npos+(1:(n1*qi)),,drop=FALSE], outer(1:(n1*qi),1:qi,function(i,j) ((i-j) %% qi)==0)*1))
        pos<-pos+qi
        npos<-npos+qi*n1
    }

    ##Z<-crossprod(m0@pp$Zt, (outer(1:(n1*q),1:q,function(i,j) ((i-j) %% q)==0)*1))


    ## all pairs within same cluster
    ## Conceptually:
    ## ij<-subset(expand.grid(i=1:n,j=1:n), (g[i] == g[j]) & (i<j))
    ## but needs to work when n^2 is too big to construct
    ij<-getpairs(g)

    ## columns of indices for first and second observation in a pair
    ii<-ij[,1]
    jj<-ij[,2]
    npairs<-nrow(ij)

    ## number of fixed effects
    p<-NCOL(X)

    ## starting values from the unweighted model
    s2<-m0@devcomp$cmp["sigmaML"]^2
    theta<-theta0<- m0@theta
    beta<-beta0<-lme4::fixef(m0)

    ## second-order weights: reciprocals of the pairwise probabilities
    allpwts<-pi_from_design(design,ii,jj)
    pwts<-1/allpwts$full
    pwt2<-1/allpwts$cond
    p1<-allpwts$first

    ## if (is.null(N2)){
    ##     ## using probabilities
    ##     pwt2 <- (1/p2[ii])*(1/p2[jj])
    ##     pwts<- (1/p1[ii])*pwt2  ## with replacement at stage 2
    ## } else {
    ##     ## using cluster size
    ##     n2<-ave(as.numeric(g), g, FUN=length)
    ##     pwt2<-N2[ii]*(N2[jj]-1)/(n2[ii]*(n2[ii]-1))
    ##     pwts<-(1/p1[ii])*pwt2  ## SRS without replacement at stage 2
    ## }

    ## variance matrix of random effects
    qi<-sapply(m0@cnms,length)
    L<-as.matrix(Matrix::bdiag(lapply(qi,function(i) matrix(1,i,i))))
    ###(need indicator for where thetas go in the matrix)
    ThInd<-which((L==1) & lower.tri(L,diag=TRUE))

    ## profile pairwise deviance
    devfun<-function(theta,pwt){
        ## variance parameters: Cholesky square root of variance matrix
        Th<-matrix(0,q,q)
        Th[ThInd]<-theta
        L[]<<-tcrossprod(Th)

        ## v11 is a vector of (1,1) entries of the matrix var(Y)
        ## for each pair, similarly for the others
        v11<-(rowSums(Z[ii,,drop=FALSE]*( Z[ii,,drop=FALSE]%*%L))+1)
        v12<-rowSums(Z[ii,,drop=FALSE]*(Z[jj,,drop=FALSE]%*%L))
        v22<-(rowSums(Z[jj,,drop=FALSE]*(Z[jj,,drop=FALSE]%*%L))+1)
        ## explicit 2x2 determinants
        det<-v11*v22-v12*v12
        ## explicit 2x2 inverses
        inv11<- v22/det
        inv22<- v11/det
        inv12<- -v12/det

        ## X matrices for first and second element of each pair
        Xii<-X[ii,,drop=FALSE]
        Xjj<-X[jj,,drop=FALSE]

        ## X^TWX
        xtwx<- crossprod(Xii,pwt*inv11*Xii)+
            crossprod(Xjj,pwt*inv22*Xjj)+
            crossprod(Xii,pwt*inv12*Xjj)+
            crossprod(Xjj,pwt*inv12*Xii)

        ## X^TWY
        xtwy<-crossprod(Xii,pwt*inv11*y[ii])+
            crossprod(Xjj,pwt*inv22*y[jj])+
            crossprod(Xii,pwt*inv12*y[jj])+
            crossprod(Xjj,pwt*inv12*y[ii])

        ## betahat at the given variance parameter values
        beta<<-solve(xtwx,xtwy)
        Xbeta<-X%*%beta

        ## two residuals per pair
        r<-y-Xbeta
        r1<-r[ii]
        r2<-r[jj]

        ## -2 times Gaussian log profile pairwise likelihood
        qf<-crossprod(r1,pwt*inv11*r1)+
            crossprod(r2,pwt*inv22*r2)+
            crossprod(r1,pwt*inv12*r2)+
            crossprod(r2,pwt*inv12*r1)

        Nhat<-sum(pwt)*2
        s2<<-qf/Nhat

        ##sum(log(det)*pwt) + qf
        sum(log(det)*pwt) + Nhat*log(qf*2*pi/Nhat)

    }

    ## Standard errors of regression parameters
    Vbeta<-function(theta,pwt){
        ## setup exactly as in devfun
        Th<-matrix(0,q,q)
        Th[ThInd]<-theta
        L<<-tcrossprod(Th)

        v11<-(rowSums(Z[ii,,drop=FALSE]*( Z[ii,,drop=FALSE]%*%L))+1)
        v12<-rowSums(Z[ii,,drop=FALSE]*(Z[jj,,drop=FALSE]%*%L))
        v22<-(rowSums(Z[jj,,drop=FALSE]*(Z[jj,,drop=FALSE]%*%L))+1)
        det<-v11*v22-v12*v12
        inv11<- v22/det
        inv22<- v11/det
        inv12<- -v12/det

        Xii<-X[ii,,drop=FALSE]
        Xjj<-X[jj,,drop=FALSE]

        xtwx<- crossprod(Xii,pwt*inv11*Xii)+
            crossprod(Xjj,pwt*inv22*Xjj)+
            crossprod(Xii,pwt*inv12*Xjj)+
            crossprod(Xjj,pwt*inv12*Xii)

        Xbeta<-X%*%beta
        r<-y-Xbeta
        r1<-r[ii]
        r2<-r[jj]

        ## score for betas (weighted by the conditional pairwise weights;
        ## the PSU-level weight 1/p1g is applied after summing over clusters)
        xwr<-Xii*pwt2*(inv11*r1)+
            Xjj*pwt2*(inv22*r2)+
            Xii*pwt2*(inv12*r2)+
            Xjj*pwt2*(inv12*r1)

        ## There could be multiple clusters in the same PSU
        ## Sum the cluster influence functions over PSU, then crossprod

        ## cluster weights
        p1g<-p1[!duplicated(g[ii])]

        ## NOTE(review): design is used unconditionally earlier in this
        ## function, so the is.null() branch looks unreachable -- confirm
        if (is.null(design)){
            ## sandwich estimator
            J<-crossprod((1/p1g)*rowsum(xwr,g[ii],reorder=FALSE)*sqrt(n1/(n1-1)))
            G<-solve(xtwx)
            G%*%J%*%G
        } else {
            inffun<-(1/p1g)*rowsum(xwr,g[ii],reorder=FALSE)%*%solve(xtwx)
            PSUg<-design$cluster[,1][ii[!duplicated(g[ii])]]

            inffunS<-rowsum(inffun, PSUg,reorder=FALSE)
            stratPSU<-design$strata[,1][ii[!duplicated(design$cluster[,1][ii])]] ##FIXME to allow single-PSU strata?

            ## centre the PSU totals within stratum and rescale by ni/(ni-1)
            ## (no rescaling for a stratum with a single PSU)
            one<-rep(1,NROW(inffunS))
            ni<-ave(one,stratPSU,FUN=NROW)
            centering<-apply(inffunS,2,function(x) ave(x, stratPSU, FUN=mean))
            centered<- inffunS-centering
            crossprod(centered*sqrt(ni/ifelse(ni==1,1,(ni-1))))
        }
    }


    ## Powell's derivative-free quadratic optimiser
    fit<-bobyqa(theta0, devfun,
                lower = m0@lower,
                upper = rep(Inf, length(theta)), pwt=pwts)

    ## variance of betas, if wanted; the placeholder has one row/column per
    ## fixed effect (p), matching the dimensions of a real Vbeta
    Vbeta<-if (sterr) Vbeta(fit$par,pwts) else matrix(NA_real_,p,p)

    ## return all the things
    rval<-list(opt=fit,
               s2=s2,
               beta=beta,
               Vbeta=Vbeta,
               formula=formula,
               znames=do.call(c,m0@cnms),
               L=L, method="nested")

    ## for resampling
    if(return.devfun) {
        rval$devfun<-devfun
        rval$lower<-m0@lower
        }

    class(rval)<-"svy2lme"
    rval
}
385 |         
386 | 
387 |  
## Print method for "svy2lme" fits.
##
## Shows the call (or, when no call is stored, the formula), the standard
## deviations of the random effects and of the residual, and a table of
## fixed effects with standard errors, t statistics and two-sided normal
## p-values. Returns x invisibly.
##
##   x       a "svy2lme" object
##   digits  number of digits used for rounding and for the coefficient table
print.svy2lme<-function(x,digits=max(3L, getOption("digits") - 3L),...){
    cat("Linear mixed model fitted by pairwise pseudolikelihood\n")
    if(!is.null(x$call)){
        cat("Call: ")
        cat(paste(deparse(x$call),collapse="\n"))
    }else{
            cat("Formula: ")
            cat(paste(deparse(x$formula),collapse="\n"))
    }
    cat("\nRandom effects:\n")
    ## x$L is relative to the residual variance, so scale by the residual SD
    s<-sqrt(as.vector(x$s2))
    stdev<- matrix(s*sqrt(diag(x$L)),ncol=1)
    ## use the full component name rather than relying on `$` partial matching
    if (!is.null(names(x$znames))){
        vcnames<-paste(names(x$znames), x$znames, sep=":")
    } else {
        vcnames<-x$znames
    }
    rownames(stdev)<-vcnames
    colnames(stdev)<-"Std.Dev."
    print(round(stdev,digits))
    cat("Residual:\t",round(s,digits))
    cat("\n Fixed effects:\n")
    se<-sqrt(diag(x$Vbeta))
    coefs<- cbind(beta=x$beta,SE=se,t=x$beta/se)
    coefs<-cbind(coefs,p=2*pnorm(-abs(coefs[,3])))
    colnames(coefs)<-c("beta","SE","t","p")
    printCoefmat(coefs,digits=digits,P.values=TRUE,has.Pvalue=TRUE, signif.stars=FALSE)
    cat("\n")
    invisible(x)
    }
418 | 
419 | 
## Coefficients of a "svy2lme" fit.
##
##   object  a "svy2lme" object
##   random  FALSE (default): return the fixed effects as a plain vector;
##           TRUE: return list(s2, varb), where varb is object$L scaled by s2
##           and labelled with the random-effect names
coef.svy2lme<-function(object,...,random=FALSE){
    if (!random)
        return(drop(object$beta))

    resid_var<-drop(object$s2)
    relvar<-object$L
    dimnames(relvar)<-list(object$znames,object$znames)
    list(s2=resid_var, varb=relvar*resid_var)
}
429 | 
## Variance-covariance matrix of the fixed effects of a "svy2lme" fit:
## the stored Vbeta component, coerced to a base matrix.
vcov.svy2lme<-function(object,...){
    V<-object$Vbeta
    as.matrix(V)
}
433 | 


--------------------------------------------------------------------------------
/R/svy2relmat.R:
--------------------------------------------------------------------------------
  1 | svy2relmer<-function(formula, design, sterr=TRUE, return.devfun=FALSE,
  2 |                      relmat=NULL,all.pairs=FALSE, subtract.margins=FALSE){
  3 | 
  4 |     data<-model.frame(design)
  5 | 
  6 |     formula_copy <-formula
  7 |     formula$relmat<-NULL
  8 | 
  9 |     ## Use unweighted model to get starting values and set up variables
 10 |     m0<-relmatLmer_naive(formula,data,relmat=relmat)
 11 |     ## now have to worry about ordering
 12 | 
 13 |     ## remove missing from design
 14 |     if (!is.null(naa<-attr(m0@frame,"na.action"))){
 15 |         design<-design[-naa,]
 16 |     }
 17 | 
 18 | 
 19 |     ## Extract varables
 20 |     y<-m0@resp$y
 21 |     X<-m0@pp$X
 22 | 
 23 |     ## cluster indicators
 24 |     gs<-m0@flist
 25 |     
 26 |     ## number of clusters 
 27 |     n1s<-sapply(gs, function(gi) length(unique(gi)))
 28 |     
 29 |     ## number of random effects
 30 |     qis<-sapply(m0@cnms,length)
 31 |     q<-sum(qis)
 32 |     n<-NROW(X)
 33 |     
 34 |     Z<-t(m0@pp$Zt)
 35 |     
 36 |     ## need PSUs as well as clusters now
 37 |     psu<-design$cluster[[1]]
 38 |     
 39 |    if (all.pairs && !subtract.margins){
 40 |         ## unavoidably going to be big
 41 |        ij<-expand.grid(i=1:n,j=1:n)
 42 |        ij<-ij[ij$i!=ij$j,]  ## this would be clearer using subset(), but CRAN
 43 |     } else{
 44 |         ## all pairs within same cluster
 45 |         ## needs to be all correlated (in the model) pairs
 46 |         Lambda<- lme4::getME(m0, "Lambda")
 47 |         Zt<-lme4::getME(m0,"Zt")
 48 |         Xi<-tcrossprod(crossprod(Zt, Lambda)) + Diagonal(n)
 49 |         ij<-expand.grid(i=1:n,j=1:n)
 50 |         ij<-ij[ij$i!=ij$j,]  ## this would be clearer using subset(), but CRAN
 51 |         ij<-ij[Xi[as.matrix(ij)]!=0,]
 52 |     }
 53 |     
 54 |     ## columns of indices for first and second observation in a pair
 55 |     ii<-ij[,1]
 56 |     jj<-ij[,2]
 57 |     npairs<-nrow(ij)
 58 |     
 59 |     p<-NCOL(X)
 60 |     
 61 |     ## starting values from the unweighted model
 62 |     s2<-m0@devcomp$cmp["sigmaML"]^2
 63 |     theta<-theta0<- m0@theta
 64 |     beta<-beta0<-lme4::fixef(m0)
 65 | 
 66 |     ## second-order weights
 67 |     allpwts<-all_pi_from_design(design,ii,jj)
 68 |     pwt<-1/allpwts$full
 69 |     
 70 |     ## variance matrix of random effects
 71 |     qi<-sapply(m0@cnms,length)
 72 |     L<-as.matrix(Matrix::bdiag(lapply(qi,function(i) matrix(1,i,i))))  
 73 |     ###(need indicator for where thetas go in the matrix)
 74 |     ThInd<-which((L==1) & lower.tri(L,diag=TRUE))
 75 |     Lambda<- lme4::getME(m0, "Lambda")
 76 |     Zt<-lme4::getME(m0,"Zt")
 77 |     
 78 | 
 79 |     ## profile pairwise deviance
 80 |     ##
 81 |     ## having this be a copy of the one in svy2lmeNG looks bad
 82 |     ## but it's to allow reference to big objects by lexical scope
 83 |     devfun<-function(theta,  pwt_new=NULL, pw_uni_new=NULL, subtract_margins=FALSE){
 84 |        if (!is.null(pwt_new)) pwt<-pwt_new  ##resampling
 85 |        if (!is.null(pw_uni_new)){
 86 |             pw_uni<-pw_uni_new  ##resampling
 87 |        } else {
 88 |             pw_uni<-weights(design)
 89 |        }
 90 |        
 91 |        ## variance parameters: Cholesky square root of variance matrix
 92 |         Lind<-lme4::getME(m0, "Lind")
 93 |         Lambda@x<- theta[Lind]
 94 |         ## Full (sparse) vcov(Y)
 95 |         Xi<-tcrossprod(crossprod(Zt, Lambda)) + Diagonal(n)
 96 |         D<-diag(Xi)
 97 |         
 98 |         ## v11 is a vector of (1,1) entries of the matrix var(Y)
 99 |         ## for each pair, similarly for the others
100 |         v11<-D[ii]
101 |         v22<-D[jj]
102 |         v12<-Xi[cbind(ii,jj)]
103 | 
104 | 
105 |         ## assign to enclosing environment for resampling
106 |         Th<-matrix(0,q,q)
107 |         Th[ThInd]<-theta
108 |         L<-tcrossprod(Th)
109 | 
110 | 
111 |         ## explicit 2x2 determinants
112 |         det<-v11*v22-v12*v12
113 |         ## explicit 2x2 inverses
114 |         inv11<- v22/det
115 |         inv22<- v11/det
116 |         inv12<- -v12/det
117 | 
118 |         ## X matrices for first and second element of each pair
119 |         Xii<-X[ii,,drop=FALSE]
120 |         Xjj<-X[jj,,drop=FALSE]
121 | 
122 |         ## X^TWX
123 |         xtwx<- crossprod(Xii,pwt*inv11*Xii)+
124 |             crossprod(Xjj,pwt*inv22*Xjj)+
125 |             crossprod(Xii,pwt*inv12*Xjj)+
126 |             crossprod(Xjj,pwt*inv12*Xii)
127 | 
128 |         ## X^WY
129 |         xtwy<-crossprod(Xii,pwt*inv11*y[ii])+
130 |             crossprod(Xjj,pwt*inv22*y[jj])+
131 |             crossprod(Xii,pwt*inv12*y[jj])+
132 |             crossprod(Xjj,pwt*inv12*y[ii])
133 | 
134 |         ## all pairs by subtraction
135 |         ## nb: some observations may not be in *any* correlated pairs
136 |         if (subtract_margins){
137 |             v_margin <- D
138 |             xtwx_margin<-crossprod(X,pw_uni*X/v_margin)
139 |             xtwy_margin<-crossprod(X,pw_uni*y/v_margin)
140 |             xtwx_ind<- crossprod(Xii,pwt*Xii/v11) + crossprod(Xjj,pwt*Xjj/v22)
141 |             xtwy_ind<-crossprod(Xii,pwt*y[ii]/v11) + crossprod(Xjj,pwt*y[jj]/v22)     
142 |             N<-sum(pw_uni)  ## population number of observations
143 |             xtwx<-xtwx-xtwx_ind+2*(N-1)*xtwx_margin
144 |             xtwy<-xtwy-xtwy_ind+2*(N-1)*xtwy_margin
145 |         }
146 | 
147 |         ## betahat at the given variance parameter values
148 |         beta<<-solve(xtwx,xtwy)
149 |         Xbeta<-X%*%beta
150 | 
151 |         ## two residuals per pair
152 |         r<-y-Xbeta
153 |         r1<-r[ii]
154 |         r2<-r[jj]
155 | 
156 |         Nhat<-sum(pwt) ## population number of correlated pairs 
157 | 
158 |         ## -2 times Gaussian log profile pairwise likelihood
159 |         qf<-crossprod(r1,pwt*inv11*r1)+
160 |             crossprod(r2,pwt*inv22*r2)+
161 |             crossprod(r1,pwt*inv12*r2)+
162 |             crossprod(r2,pwt*inv12*r1)
163 | 
164 |         logdet<-sum(log(det)*pwt)
165 |         
166 |         ## all pairs by subtraction
167 |         if (subtract_margins){
168 |             qf_margin<-crossprod(r,pw_uni*r/v_margin)
169 |             qf_ind<-crossprod(r1,pwt*r1/v11)+crossprod(r2,pwt*r2/v22)
170 |             qf<-qf-qf_ind+2*(N-1)*qf_margin
171 |             
172 |             logdet_margin<-sum(log(v_margin)*pw_uni)
173 |             logdet_ind<-sum(log(v11*v22)*pwt)
174 |             logdet<- logdet-logdet_ind+2*(N-1)*logdet_margin
175 | 
176 |             Nhat<-N*(N-1)  ## population number of pairs
177 |         } 
178 |         s2<<-qf/(2*Nhat)
179 |         
180 |         logdet +2*Nhat*log(qf*2*pi/Nhat)
181 |         
182 |     }
183 | 
184 |    
185 |     ## Standard errors of regression parameters
186 |     ##
187 |     ## If beta = (X^TWX)^{-1}(XTWY)
188 |     ## the middle of the sandwich is the sum over design-correlated pairs
189 |     ## of X^TW(Y-mu)^T(Y-mu)WX
190 |     ##
191 |     ## off-diag W is just off-diag Xi[ij]^{-1}/pi_{ij}, ie, inv12/pi_ij
192 |     ## diag W is sum of diag Xi[ij]^{-1}/pi_{ij} for all pairs with i in them
193 |     ## ie, sum_j(inv11/pi_ij) but being careful about indices
194 |     ##
195 |     ## The nested version was simpler because pairs were always in the same PSU
196 |     
197 |     Vbeta<-function(theta, subtract_margins=FALSE){
198 |         ## Sandwich variance of the fixed-effect estimates at variance
199 |         ## parameters theta: (X^TWX)^{-1} V (X^TWX)^{-1}, where V is the
200 |         ## design-based vcov() of the svytotal() of the rows of
201 |         ## (X * W r) %//% weights(design).
202 |         ## (%//% is defined elsewhere in the package -- presumably a guarded
203 |         ## division; confirm.)
204 |         ##
205 |         ## theta: variance parameters, placed in Lambda via Lind
206 |         ## subtract_margins: if TRUE, add the marginal contribution of the
207 |         ##     pairs not listed in (ii,jj) to the diagonal of W
208 |         ## Returns a matrix with dimnames taken from colnames(X).
209 |         ##
210 |         ## m0, Lambda, Zt, n, ii, jj, X, y, beta, pwt and design come from
211 |         ## the enclosing function; beta is whatever devfun last assigned.
212 | 
213 |         ## setup as in devfun: fill the Cholesky factor, build vcov(Y)
214 |         Lind<-lme4::getME(m0, "Lind")
215 |         Lambda@x<- theta[Lind]
216 |         ## Full (sparse) vcov(Y)
217 |         Xi<-tcrossprod(crossprod(Zt, Lambda)) + Diagonal(n)
218 |         D<-diag(Xi)
219 | 
220 |         ## per-pair entries of the 2x2 variance matrices and their inverses
221 |         v11<-D[ii]
222 |         v22<-D[jj]
223 |         v12<-Xi[cbind(ii,jj)]
224 |         det<-v11*v22-v12*v12
225 |         inv11<- v22/det
226 |         inv12<- -v12/det
227 | 
228 |         ## residuals at the current beta
229 |         r<-y-X%*%beta
230 | 
231 |         ## try making W explicitly
232 |         W<-Matrix(0, n,n)
233 |         W[cbind(ii,jj)]<-inv12*pwt
234 |         idx<-which(seq_len(n) %in% ii)
235 |         W[cbind(idx,idx)]<-rowsum(inv11*pwt,ii,reorder=TRUE)
236 |         if (subtract_margins){
237 |             ## all pairs by subtraction
238 |             ## nb: some observations may not be in *any* correlated pairs
239 |             pw_uni<-weights(design)
240 |             n_uncorr<-rep(n-1,n)
241 |             n_uncorr[idx]<-n_uncorr[idx]-rowsum(rep(1,length(jj)),ii,reorder=TRUE)
242 |             W[cbind(seq_len(n),seq_len(n))]<-W[cbind(seq_len(n),seq_len(n))]+pw_uni*(1/D)*n_uncorr
243 |         }
244 |         xtwx<-crossprod(X, W%*%X)
245 |         ## drop() turns the n x 1 product into a plain vector so that it is
246 |         ## recycled down every column of X, as in svy2lme's Vbeta; an n x 1
247 |         ## Matrix is not elementwise-conformable with an n x p matrix
248 |         xwr<-X*drop(W%*%r)
249 |         xtwxinv<-solve(xtwx)
250 |         V<-xtwxinv%*%vcov(svytotal(as.matrix(xwr)%//%weights(design), design))%*%xtwxinv
251 |         dimnames(V)<-list(colnames(X),colnames(X))
252 |         return(V)
253 | 
254 |     }
252 |     if (any(zero<-(theta0==m0@lower))){
253 |         theta0[zero]<-0.5  ## relative variance, so 0.5 should be safe, but should see what lmer does
254 |     }
255 |      
256 |     ## Powell's derivative-free quadratic optimiser
257 |     fit<-minqa::bobyqa(theta0, devfun,
258 |                 lower = m0@lower,
259 |                 upper = rep(Inf, length(theta)), 
260 |                 subtract_margins=all.pairs && subtract.margins)
261 | 
262 |     ## variance of betas, if wanted
263 |     Vbeta<-if (sterr) Vbeta(fit$par,subtract_margins=all.pairs && subtract.margins) else matrix(NA,q,q)
264 | 
265 |     ## variance components
266 |     Th<-matrix(0,q,q)
267 |     Th[ThInd]<-fit$par
268 |     L<-tcrossprod(Th)
269 | 
270 |     ## names: get the relmat names into the output if possible
271 |     znames<-do.call(c,m0@cnms)
272 |     if (any(names(znames) %in% names(sys.call()$relmat))){
273 |         tn<-names(znames)[names(znames) %in% names(sys.call()$relmat)]
274 |         for(tni in tn){
275 |             names(znames)[names(znames) %in% tni]<-deparse(sys.call()$relmat[[tni]])
276 |         }
277 |     }
278 |     
279 |     ## return all the things
280 |     rval<-list(opt=fit,
281 |                s2=s2,
282 |                beta=beta,
283 |                Vbeta=Vbeta,
284 |                formula=formula,
285 |                znames=znames,
286 |                L=L,call=sys.call(),
287 |                all.pairs=all.pairs,
288 |                subtract.margins=subtract.margins,
289 |                method="general")
290 |     
291 |     ## for resampling
292 |     if(return.devfun) {
293 |         rval$devfun<-devfun
294 |         rval$lower<-m0@lower
295 |         }
296 |     
297 |     class(rval)<-c("svy2lme","svy2relmer")
298 |     rval
299 | 
300 | 
301 | }
302 | 
303 | 
304 | ## From lme4qtl (github.com/variani/lme4qtl), GPL3
305 | ## Fit an lme4 mixed model after transforming the random-effect design
306 | ## matrices by the Cholesky factors of the relationship matrices in relmat.
307 | ##
308 | ## formula, data: passed to lme4::lFormula
309 | ## start:         starting values, passed to mkLmerDevfun and optimizeLmer
310 | ## relmat:        named list of relationship matrices with dimnames; names
311 | ##                are matched against the grouping factors of the model
312 | ##
313 | ## Returns the object built by lme4::mkMerMod, with the Cholesky factors
314 | ## stored in @optinfo$relfac$relfac (NULL there when relmat is NULL).
315 | ## Warns if relmat is NULL or has unused terms.  Stops if relmat is not a
316 | ## fully named list, if attr(flist, "assign") has duplicates, or if a matrix
317 | ## has no rownames or does not cover the levels of its factor.
318 | relmatLmer_naive <- function(formula, data = NULL, start = NULL, relmat = NULL) {
319 |     ## lme4 formula
320 |     control <- lme4::lmerControl(check.nobs.vs.rankZ = "ignore",
321 |                                  check.nobs.vs.nlev = "ignore",
322 |                                  check.nobs.vs.nRE = "ignore")
323 | 
324 |     ## lme4 data setup
325 |     lmod <- lme4::lFormula(formula, data, control = control)
326 | 
327 |     ## defined before branching: it is stored in the result below even when
328 |     ## relmat is NULL, which used to fail with "object 'relfac' not found"
329 |     relfac <- relmat
330 | 
331 |     if (is.null(relmat)) {
332 |         warning("No relmat terms found")
333 |     } else {
334 |         ##-------------------------------
335 |         ## start of relmatLmer-specific code
336 |         ##-------------------------------
337 |         if (!is.list(relmat)) stop("relmat must be a list")
338 |         if (length(names(relmat)) != length(relmat)) stop("relmat terms must have names")
339 | 
340 |         relnms <- names(relmat)
341 |         flist <- lmod$reTrms[["flist"]]   ## list of factors
342 |         fnmns <- names(flist)
343 | 
344 |         ind <- relnms %in% fnmns
345 |         if (!all(ind)) warning("some relmat terms are not used")
346 | 
347 |         if (any(ind)) {
348 |             asgn <- attr(flist, "assign")
349 |             if (anyDuplicated(asgn) > 0) stop("a relmat term can have only one random-effect term")
350 | 
351 |             ## only the grouping factors that have a relationship matrix
352 |             for (i in which(fnmns %in% relnms)) {
353 |                 fn <- fnmns[i]
354 |                 zn.unique <- levels(as.factor(lmod$fr[, fn]))
355 | 
356 |                 rn <- rownames(relmat[[fn]])
357 |                 if (is.null(rn)) stop("relmat matrices must have dimnames")
358 |                 if (!all(zn.unique %in% rn)) stop("relmat dimnames do not match factor levels")
359 | 
360 |                 ## compute a relative factor R: K = R'R
361 |                 ## See lme4qtl:::relfac
362 |                 K <- Matrix::Matrix(relmat[[fn]][zn.unique, zn.unique], sparse = TRUE)
363 |                 R <- Matrix::chol(K)
364 |                 relfac[[fn]] <- R
365 | 
366 |                 ## t(Z*) = (R x I) t(Z), with I of size the number of
367 |                 ## random-effect columns for this term
368 |                 nre <- length(lmod$reTrms$cnms[[i]])
369 |                 lmod$reTrms$Ztlist[[i]] <- kronecker(R, diag(1, nre)) %*% lmod$reTrms$Ztlist[[i]]
370 |             }
371 |         }
372 |         lmod$reTrms[["Zt"]] <- do.call(rbind, lmod$reTrms$Ztlist)
373 |     }
374 | 
375 |     ## formula is dropped before the remaining components are passed on as
376 |     ## arguments to mkLmerDevfun
377 |     lmod$formula <- NULL
378 | 
379 |     devfun <- do.call(mkLmerDevfun, c(lmod, list(start = start)))
380 | 
381 |     opt <- optimizeLmer(devfun, start = start)
382 | 
383 |     rval <- lme4::mkMerMod(environment(devfun), opt, lmod$reTrms, fr = lmod$fr)
384 |     rval@optinfo$relfac <- list(relfac = relfac)
385 |     rval
386 | }
382 | 


--------------------------------------------------------------------------------
/R/svylmeNG.R:
--------------------------------------------------------------------------------
  1 | 
  2 | 
  3 | ## Index pairs (i,j), i != j, of observations that share a level of at least
  4 | ## one grouping factor.
  5 | ##
  6 | ## gps:    list (or data frame) of grouping factors, each of length n
  7 | ## TOOBIG: for n >= TOOBIG the n x n indicator matrix is never formed
  8 | ##
  9 | ## Returns a two-column integer matrix (columns "row" and "col") holding each
 10 | ## pair in both orders, sorted by second index and then by first index.
 11 | getallpairs<-function(gps, TOOBIG=1000){
 12 |     ## gps[[1]], not gps[1]: the latter is a list of length one, which sent
 13 |     ## every call down the dense branch regardless of sample size
 14 |     n<-length(gps[[1]])
 15 |     if (n < TOOBIG){
 16 |         ijall<-Reduce("|", lapply(gps, function(gp) outer(gp,gp,"==")), FALSE)
 17 |         diag(ijall)<-FALSE
 18 |         return(which(ijall, arr.ind=TRUE))
 19 |     }
 20 | 
 21 |     ## Large n: enumerate ordered pairs one group at a time, so the cost is
 22 |     ## the sum of squared group sizes rather than n^2
 23 |     pairs_within<-function(gp){
 24 |         members<-split(seq_len(n), gp, drop=TRUE)
 25 |         first<-lapply(members, function(m) rep(m, times=length(m)))
 26 |         second<-lapply(members, function(m) rep(m, each=length(m)))
 27 |         cbind(row=unlist(first, use.names=FALSE),
 28 |               col=unlist(second, use.names=FALSE))
 29 |     }
 30 |     ij<-do.call(rbind, unname(lapply(gps, pairs_within)))
 31 |     ## drop self-pairs and pairs found through more than one factor
 32 |     ij<-unique(ij[ij[,1]!=ij[,2], , drop=FALSE])
 33 |     ## same ordering as which(arr.ind=TRUE) gives in the dense branch
 34 |     ij[order(ij[,2], ij[,1]), , drop=FALSE]
 35 | }
 28 | 
 29 | 
 30 | ## Fit a linear mixed model to complex survey data by maximising a weighted
 31 | ## pairwise composite likelihood.
 32 | ##
 33 | ## formula:          model formula, as for lme4::lmer
 34 | ## design:           survey design object; model.frame(design) supplies the data
 35 | ## sterr:            if TRUE, compute the sandwich variance of the fixed effects
 36 | ## return.devfun:    if TRUE, also return the profile deviance function and
 37 | ##                   the lower bounds on theta (for resampling)
 38 | ## method:           "general" is fitted here, "nested" is handed to
 39 | ##                   svy2lme_nested()
 40 | ## all.pairs:        if TRUE, use all pairs of observations rather than only
 41 | ##                   the pairs returned by getallpairs()
 42 | ## subtract.margins: with all.pairs=TRUE, build the all-pairs sums from the
 43 | ##                   getallpairs() pairs plus a marginal correction instead
 44 | ##                   of enumerating every pair
 45 | ##
 46 | ## Returns a list of class "svy2lme" with components opt, s2, beta, Vbeta,
 47 | ## formula, znames, L, all.pairs, subtract.margins and method, plus devfun and
 48 | ## lower when return.devfun=TRUE.  Vbeta is filled with NA when sterr=FALSE.
 49 | svy2lme<-function(formula, design, sterr=TRUE, return.devfun=FALSE, method=c("general","nested"), all.pairs=FALSE, subtract.margins=FALSE){
 50 | 
 51 |     method<-match.arg(method)
 52 |     if(method=="nested"){
 53 |         if(all.pairs) stop("all.pairs=TRUE not allowed for method='nested'")
 54 |         return(svy2lme_nested(formula,design, sterr=sterr, return.devfun=return.devfun))
 55 |     }
 56 |     data<-model.frame(design)
 57 |     
 58 |     ## Use unweighted model to get starting values and set up variables
 59 |     m0<-lme4::lmer(formula,data,REML=FALSE)
 60 |     
 61 |     ## remove missing from design
 62 |     if (!is.null(naa<-attr(m0@frame,"na.action"))){
 63 |         design<-design[-naa,]
 64 |     }
 65 | 
 66 |     ## NB: devfun below is a closure over this frame and is handed back when
 67 |     ## return.devfun=TRUE, so locals are left in place even where nothing in
 68 |     ## this function reads them.
 69 |     ## NOTE(review): confirm which of them the resampling code relies on.
 70 | 
 71 |     ## Extract variables
 72 |     y<-m0@resp$y
 73 |     X<-m0@pp$X
 74 | 
 75 |     ## cluster indicators
 76 |     gs<-m0@flist
 77 |     
 78 |     ## number of clusters 
 79 |     n1s<-vapply(gs, function(gi) length(unique(gi)), integer(1))
 80 |     
 81 |     ## number of random effects
 82 |     qis<-vapply(m0@cnms, length, integer(1))
 83 |     q<-sum(qis)
 84 |     n<-NROW(X)
 85 |     ## number of fixed effects
 86 |     p<-NCOL(X)
 87 |     
 88 |     Z<-t(m0@pp$Zt)
 89 |     
 90 |     ## need PSUs as well as clusters now
 91 |     psu<-design$cluster[[1]]
 92 |     
 93 |     if (all.pairs && !subtract.margins){
 94 |         ## unavoidably going to be big
 95 |         ij<-expand.grid(i=seq_len(n),j=seq_len(n))
 96 |         ij<-ij[ij$i!=ij$j,]  ## this would be clearer using subset(), but CRAN
 97 |     } else{
 98 |         ## pairs sharing a level of some grouping factor, in both orders
 99 |         ## Conceptually, the union over grouping factors g of
100 |         ## ij<-subset(expand.grid(i=1:n,j=1:n), (g[i] == g[j]) & (i!=j))
101 |         ## but needs to work when n^2 is too big to construct
102 |         ij<-getallpairs(gs)
103 |     }
104 |     ## columns of indices for first and second observation in a pair
105 |     ii<-ij[,1]
106 |     jj<-ij[,2]
107 |     
108 |     npairs<-nrow(ij)
109 |     
110 |     ## starting values from the unweighted model
111 |     s2<-m0@devcomp$cmp["sigmaML"]^2
112 |     theta<-theta0<- m0@theta
113 |     beta<-beta0<-lme4::fixef(m0)
114 | 
115 |     ## second-order weights: reciprocals of the pairwise sampling probabilities
116 |     allpwts<-all_pi_from_design(design,ii,jj)
117 |     pwt<-1/allpwts$full
118 |   
119 |     ## variance matrix of random effects
120 |     qi<-vapply(m0@cnms, length, integer(1))
121 |     L<-as.matrix(Matrix::bdiag(lapply(qi,function(i) matrix(1,i,i)))) 
122 |     ###(need indicator for where thetas go in the matrix)
123 |     ThInd<-which((L==1) & lower.tri(L,diag=TRUE))
124 |     Lambda<- lme4::getME(m0, "Lambda")
125 |     Zt<-lme4::getME(m0,"Zt")
126 |     
127 |     ## profile pairwise deviance
128 |     ## a whole heap of stuff is being passed by lexical scope
129 |     ##
130 |     ## theta: variance parameters
131 |     ## pwt_new, pw_uni_new: replacement pairwise / observation weights (resampling)
132 |     ## subtract_margins: use the marginal correction to cover all pairs
133 |     ## Side effects: assigns L, beta and s2 in the enclosing frame.
134 |     ## Returns logdet + Nhat*log(qf*2*pi/Nhat).
135 |     devfun<-function(theta, pwt_new=NULL, pw_uni_new=NULL, subtract_margins=FALSE){
136 |         if (!is.null(pwt_new)) pwt<-pwt_new  ##resampling
137 |         if (!is.null(pw_uni_new)){
138 |             pw_uni<-pw_uni_new  ##resampling
139 |         } else {
140 |             pw_uni<-weights(design)
141 |         }
142 |         
143 |         ## variance parameters: Cholesky square root of variance matrix
144 |         Lind<-lme4::getME(m0, "Lind")
145 |         Lambda@x<- theta[Lind]
146 |         ## Full (sparse) vcov(Y)
147 |         Xi<-tcrossprod(crossprod(Zt, Lambda)) + Diagonal(n)
148 |         D<-diag(Xi)
149 | 
150 |         ## assign to enclosing env for resampling
151 |         Th<-matrix(0,q,q)
152 |         Th[ThInd]<-theta
153 |         L<<-tcrossprod(Th)
154 | 
155 |         
156 |         ## v11 is a vector of (1,1) entries of the matrix var(Y)
157 |         ## for each pair, similarly for the others
158 |         v11<-D[ii]
159 |         v22<-D[jj]
160 |         v12<-Xi[cbind(ii,jj)]
161 |         
162 | 
163 |         ## explicit 2x2 determinants
164 |         det<-v11*v22-v12*v12
165 |         ## explicit 2x2 inverses
166 |         inv11<- v22/det
167 |         inv22<- v11/det
168 |         inv12<- -v12/det
169 | 
170 |         ## X matrices for first and second element of each pair
171 |         Xii<-X[ii,,drop=FALSE]
172 |         Xjj<-X[jj,,drop=FALSE]
173 | 
174 |         ## X^TWX
175 |         xtwx<- crossprod(Xii,pwt*inv11*Xii)+
176 |             crossprod(Xjj,pwt*inv22*Xjj)+
177 |             crossprod(Xii,pwt*inv12*Xjj)+
178 |             crossprod(Xjj,pwt*inv12*Xii)
179 | 
180 |         ## X^TWY
181 |         xtwy<-crossprod(Xii,pwt*inv11*y[ii])+
182 |             crossprod(Xjj,pwt*inv22*y[jj])+
183 |             crossprod(Xii,pwt*inv12*y[jj])+
184 |             crossprod(Xjj,pwt*inv12*y[ii])
185 | 
186 |         ## all pairs by subtraction
187 |         ## nb: some observations may not be in *any* correlated pairs
188 |         if (subtract_margins){
189 |             v_margin <- D
190 |             xtwx_margin<-crossprod(X,pw_uni*X/v_margin)
191 |             xtwy_margin<-crossprod(X,pw_uni*y/v_margin)
192 |             xtwx_ind<- crossprod(Xii,pwt*Xii/v11) + crossprod(Xjj,pwt*Xjj/v22)
193 |             xtwy_ind<-crossprod(Xii,pwt*y[ii]/v11) + crossprod(Xjj,pwt*y[jj]/v22)     
194 |             N<-sum(pw_uni)  ## population number of observations
195 |             xtwx<-xtwx-xtwx_ind+2*(N-1)*xtwx_margin
196 |             xtwy<-xtwy-xtwy_ind+2*(N-1)*xtwy_margin
197 |         }
198 | 
199 |         ## betahat at the given variance parameter values
200 |         beta<<-solve(xtwx,xtwy)
201 |         Xbeta<-X%*%beta
202 | 
203 |         ## two residuals per pair
204 |         r<-y-Xbeta
205 |         r1<-r[ii]
206 |         r2<-r[jj]
207 | 
208 |         Nhat<-sum(pwt)*2 ## population number of *correlated* pairs 
209 | 
210 |         ## -2 times Gaussian log profile pairwise likelihood
211 |         qf<-crossprod(r1,pwt*inv11*r1)+
212 |             crossprod(r2,pwt*inv22*r2)+
213 |             crossprod(r1,pwt*inv12*r2)+
214 |             crossprod(r2,pwt*inv12*r1)
215 | 
216 |         logdet<-sum(log(det)*pwt)
217 |         
218 |         ## all pairs by subtraction
219 |         ## NOTE(review): the margin enters X^TWX and X^TWY above with weight
220 |         ## 2*(N-1) but enters qf and logdet here with weight (N-1); confirm
221 |         ## that the two scalings are meant to differ.
222 |         if (subtract_margins){
223 |             qf_margin<-crossprod(r,pw_uni*r/v_margin)
224 |             qf_ind<-crossprod(r1,pwt*r1/v11)+crossprod(r2,pwt*r2/v22)
225 |             qf<-qf-qf_ind+(N-1)*qf_margin
226 |             
227 |             logdet_margin<-sum(log(v_margin)*pw_uni)
228 |             logdet_ind<-sum(log(v11*v22)*pwt)
229 |             logdet<- logdet-logdet_ind+(N-1)*logdet_margin
230 | 
231 |             Nhat<-N*(N-1)  ## population number of pairs
232 |         } 
233 |         s2<<-qf/Nhat
234 |         
235 |         logdet + Nhat*log(qf*2*pi/Nhat)
236 |         
237 |     }
238 | 
239 |     ## Standard errors of regression parameters
240 |     ##
241 |     ## If beta = (X^TWX)^{-1}(XTWY)
242 |     ## the middle of the sandwich is the sum over design-correlated pairs
243 |     ## of X^TW(Y-mu)^T(Y-mu)WX
244 |     ##
245 |     ## off-diag W is just off-diag Xi[ij]^{-1}/pi_{ij}, ie, inv12/pi_ij
246 |     ## diag W is sum of diag Xi[ij]^{-1}/pi_{ij} for all pairs with i in them
247 |     ## ie, sum_j(inv11/pi_ij) but being careful about indices
248 |     ##
249 |     ## The nested version was simpler because pairs were always in the same PSU
250 |     ##
251 |     ## theta: variance parameters; subtract_margins: as in devfun.
252 |     ## Uses the beta last assigned by devfun.  Returns a p x p matrix with
253 |     ## dimnames from colnames(X).
254 |     Vbeta<-function(theta, subtract_margins=FALSE){
255 |         ## setup exactly as in devfun
256 |         ## variance parameters: Cholesky square root of variance matrix
257 |         Lind<-lme4::getME(m0, "Lind")
258 |         Lambda@x<- theta[Lind]
259 |         ## Full (sparse) vcov(Y)
260 |         Xi<-tcrossprod(crossprod(Zt, Lambda)) + Diagonal(n)
261 |         D<-diag(Xi)
262 |         
263 |         ## v11 is a vector of (1,1) entries of the matrix var(Y)
264 |         ## for each pair, similarly for the others
265 |         v11<-D[ii]
266 |         v22<-D[jj]
267 |         v12<-Xi[cbind(ii,jj)]
268 |         
269 |         det<-v11*v22-v12*v12
270 |         inv11<- v22/det
271 |         inv12<- -v12/det
272 | 
273 |         ## residuals at the current beta
274 |         r<-y-X%*%beta
275 | 
276 |         ## try making W explicitly
277 |         W<-Matrix(0, n,n)
278 |         W[cbind(ii,jj)]<-inv12*pwt
279 |         idx<-which(seq_len(n) %in% ii)
280 |         W[cbind(idx,idx)]<-rowsum(inv11*pwt,ii,reorder=TRUE)
281 |         if (subtract_margins){
282 |             pw_uni<-weights(design)
283 |             n_uncorr<-rep(n-1,n)
284 |             n_uncorr[idx]<-n_uncorr[idx]-rowsum(rep(1,length(jj)),ii,reorder=TRUE)
285 |             W[cbind(seq_len(n),seq_len(n))]<-W[cbind(seq_len(n),seq_len(n))]+pw_uni*(1/D)*n_uncorr
286 |         }
287 |         xtwx<-crossprod(X, W%*%X)
288 |         xwr<-X*drop(W%*%r)
289 |         xtwxinv<-solve(xtwx)
290 |         V<-xtwxinv%*%vcov(svytotal(as.matrix(xwr)%//%weights(design), design))%*%xtwxinv
291 |         dimnames(V)<-list(colnames(X),colnames(X))
292 |         return(V)
293 |     }
294 |     
295 |     if (any(zero<-(theta0==m0@lower))){
296 |         theta0[zero]<-0.5  ## relative variance, so 0.5 should be safe, but should see what lmer does
297 |     }
298 |     
299 |     ## Powell's derivative-free quadratic optimiser
300 |     fit<-minqa::bobyqa(theta0, devfun,
301 |                 lower = m0@lower,
302 |                 upper = rep(Inf, length(theta)), 
303 |                 subtract_margins=all.pairs && subtract.margins)
304 | 
305 |     ## variance of betas, if wanted; otherwise an NA matrix of the same
306 |     ## p x p shape (it used to be q x q, the random-effect dimension)
307 |     Vb<-if (sterr) {
308 |             Vbeta(fit$par,subtract_margins=all.pairs && subtract.margins)
309 |         } else {
310 |             matrix(NA_real_,p,p,dimnames=list(colnames(X),colnames(X)))
311 |         }
312 | 
313 |     ## variance components
314 |     Th<-matrix(0,q,q)
315 |     Th[ThInd]<-fit$par
316 |     L<-tcrossprod(Th)
317 |     ## return all the things
318 |     ## (s2 and beta are the values devfun assigned on its last evaluation)
319 |     rval<-list(opt=fit,
320 |                s2=s2,
321 |                beta=beta,
322 |                Vbeta=Vb,
323 |                formula=formula,
324 |                znames=do.call(c,m0@cnms),
325 |                L=L, all.pairs=all.pairs,
326 |                subtract.margins=subtract.margins, method="general")
327 |     
328 |     ## for resampling
329 |     if(return.devfun) {
330 |         rval$devfun<-devfun
331 |         rval$lower<-m0@lower
332 |         }
333 |     
334 |     class(rval)<-"svy2lme"
335 |     rval
336 | }
308 | 
309 | 
310 | ## pairwise probabilities: does *not* assume nesting
311 | ##
312 | ## we only use $full, not the other components.
313 | ##
314 | all_pi_from_design<-function(design, ii,jj){
315 |     ## Pairwise sampling probabilities for the observation pairs
316 |     ## (ii[k], jj[k]).
317 |     ##
318 |     ## design: survey design object; the fields pps, dcheck, prob, allprob,
319 |     ##         cluster, strata and fpc are read
320 |     ## ii, jj: index vectors of equal length giving the two members of each pair
321 |     ##
322 |     ## Returns a list with components full (pairwise probability), first and
323 |     ## cond; first and cond are NULL when the design supplies pairwise
324 |     ## information itself.  Stops when stage-specific probabilities are
325 |     ## needed but were not given.
326 | 
327 |     if (isTRUE(design$pps) && !is.null(design$dcheck)){
328 |         ## We have pairwise probabilities already. Or, at least, covariances
329 |         Deltacheck<-design$dcheck[[1]]$dcheck[cbind(ii,jj)]
330 |         indep<-design$prob[ii]*design$prob[jj]
331 |         return(list(full=(Deltacheck+1)*indep,
332 |                     first=NULL,
333 |                     cond=NULL))
334 |     }
335 |     
336 |     if (NCOL(design$allprob)==1){
337 |         ## No multistage weights
338 |         if (NCOL(design$cluster)>1)
339 |             stop("you need weights/probabilities for each stage of sampling")
340 |         
341 |         if (NCOL(design$cluster)==1 && !any(duplicated(design$cluster))){
342 |             ## ok, element sampling, can't be same PSU
343 |             if(is.null(design$fpc$popsize)) #with replacement
344 |                 return(list(full=design$prob[ii]*design$prob[jj],
345 |                             first=design$prob[ii],
346 |                             cond=rep(1,length(ii))))
347 |             else if(is_close(as.vector(design$allprob),
348 |                              as.vector(design$fpc$sampsize/design$fpc$popsize),tolerance=1e-4)){
349 |                 ## srs, possibly stratified
350 |                 n<-design$fpc$sampsize
351 |                 N<-design$fpc$popsize
352 |                 ## without-replacement formula only within a stratum;
353 |                 ## different strata are sampled independently
354 |                 samestrata<-(design$strata[ii,1]==design$strata[jj,1])
355 |                 return(list(full= ifelse(samestrata,
356 |                                          n[ii]*(n[jj]-1)%//%( N[ii]*(N[jj]-1)),
357 |                                          (n[ii]/N[ii])*(n[jj]/N[jj])),
358 |                             first=n[ii]/N[ii],
359 |                             cond=rep(1,length(ii))))
360 |             } else {
361 |                 ## Hajek high entropy: based on Brewer p153, equation 9.14
362 |                 ## columns are pulled out as vectors: [ii] on a data frame
363 |                 ## would select columns, not observations
364 |                 pi<-design$allprob[,1]
365 |                 stratum<-design$strata[,1]
366 |                 denom<-ave(1-pi, stratum,FUN=sum)
367 |                 samestrata<-(stratum[ii]==stratum[jj])
368 |                 return(list(full=pi[ii]*pi[jj]*(1- ifelse(samestrata, (1-pi[ii])*(1-pi[jj])/denom[ii], 0)),
369 |                             first=pi[ii],
370 |                             cond=rep(1,length(ii))))
371 |             }
372 |         } else if (all(by(design$prob, design$cluster[,1], function(x) length(unique(x)))==1)) {
373 |             ## possibly ok, sampling of whole PSUs
374 |             warning("assuming no subsampling within PSUs because multi-stage weights were not given")
375 |             
376 |             samePSU<-design$cluster[ii,1]==design$cluster[jj,1]
377 | 
378 |             if(is.null(design$fpc$popsize)){ #with replacement
379 |                  return(list(full=ifelse(samePSU, design$prob[ii], design$prob[ii]*design$prob[jj]),
380 |                              first=design$prob[ii],
381 |                              cond=rep(1, length(ii))))
382 |             } else if(is_close(as.vector(design$allprob[[1]]),
383 |                               as.vector(design$fpc$sampsize/design$fpc$popsize),tolerance=1e-4)){
384 |                 # srs, possibly stratified
385 |                 n<-design$fpc$sampsize
386 |                 N<-design$fpc$popsize
387 |                 return(list(full= ifelse(samePSU, (n[ii]/N[ii]),(n[ii]/N[ii])*(n[jj]/N[jj])),
388 |                             first=n[ii]/N[ii],
389 |                             cond=rep(1,length(ii))))
390 |             } else {
391 |                 ## Hajek high entropy: based on Brewer p153, equation 9.14
392 |                 ## NOTE(review): denom sums 1-pi over observations, so a PSU
393 |                 ## contributes once per sampled element; confirm against the
394 |                 ## reference whether the sum should run over PSUs instead.
395 |                 pi<-design$allprob[,1]
396 |                 stratum<-design$strata[,1]
397 |                 denom<-ave(1-pi, stratum,FUN=sum)
398 |                 samestrata<-(stratum[ii]==stratum[jj])
399 |                 return(list(full=ifelse(samePSU, pi[ii], pi[ii]*pi[jj]*(1- ifelse(samestrata, (1-pi[ii])*(1-pi[jj])/denom[ii], 0))),
400 |                             first=pi[ii],
401 |                             cond=rep(1,length(ii))))
402 |             }
403 |         } else {
404 |             ## not ok
405 |             stop("you need weights/probabilities for each stage of sampling")
406 |         }       
407 |     }
408 | 
409 |     ## If we're here, we have multistage weights
410 |     if (ncol(design$allprob)!=ncol(design$cluster)){
411 |         ## ? can't happen
412 |         stop("number of stages of sampling does not match number of stages of weights")
413 |     }
414 |     samePSU<-design$cluster[ii,1]==design$cluster[jj,1]
415 |     last<-ncol(design$allprob)
416 | 
417 |     if(is.null(design$fpc$popsize)){ #with replacement
418 |         return(list(full=ifelse(samePSU, design$prob[ii]*design$allprob[jj,last],design$prob[ii]*design$prob[jj]),
419 |                     first=apply(design$allprob[ii,-last, drop=FALSE], 1, prod),
420 |                     cond=design$allprob[ii,last]*design$allprob[jj,last]))
421 |     }
422 |     ## all.equal() returns a character vector, not FALSE, when the values
423 |     ## differ, so it must be wrapped in isTRUE(); only the values are
424 |     ## compared, since the two objects need not carry the same dimnames
425 |     if(isTRUE(all.equal(as.matrix(design$allprob), as.matrix(design$fpc$sampsize/design$fpc$popsize),
426 |                         tolerance=1e-4, check.attributes=FALSE))){
427 |         ## multistage stratified random sampling
428 |         n<-design$fpc$sampsize
429 |         N<-design$fpc$popsize
430 |         samestrata<-(design$strata[ii, ]==design$strata[jj, ])
431 |         pstages <-(n[ii,]/N[ii,])*(samestrata*((n[jj,]-1)%//%(N[jj,]-1)) + (1-samestrata)*(n[jj,]/N[jj,]))  ##FIXME divide by  zero when N==1
432 |         return(list(full=ifelse(samePSU, apply((n[ii,]/N[ii,])[,-last,drop=FALSE],1,prod)*pstages[,last],design$prob[ii]*design$prob[jj]),
433 |                     first=apply((n[ii,]/N[ii,])[,-last,drop=FALSE],1,prod),
434 |                     cond=pstages[,last]))
435 |     }
436 | 
437 |     ## Hajek high entropy: Brewer p153
438 |     first<-cpwt<-rep_len(1,length(ii))
439 |     for (i in seq_len(last)){
440 |         pi<-design$allprob[,i]
441 |         denom<-ave(1-pi, design$strata[,i],FUN=sum)
442 |         samestrata<-(design$strata[ii,i]==design$strata[jj,i])
443 |         if (i==last)
444 |             ## denom is per observation, so take the value for each pair
445 |             cpwt<-cpwt*pi[ii]*pi[jj]*(1- ifelse(samestrata, (1-pi[ii])*(1-pi[jj])/denom[ii], 0))
446 |         else
447 |             first<-first*pi[ii]
448 |     }
449 |     return(list(full=ifelse(samePSU, first*cpwt,design$prob[ii]*design$prob[jj]), first= first, cond=cpwt))
450 | 
451 | }
431 | 


--------------------------------------------------------------------------------
/README.md:
--------------------------------------------------------------------------------
 1 | # svylme
 2 | Mixed models for complex surveys
 3 | 
 4 | This package fits linear mixed models to data from complex surveys, by maximising a weighted pairwise likelihood
 5 | 
 6 | ```
 7 | remotes::install_github("tslumley/svylme")
 8 | ```
 9 | 
10 | ## Advantages
11 | 
12 | It works (gives consistent estimates of the regression coefficients and variance components) for **any** linear mixed model and **any** design, without any restrictions on the sampling units
13 | and model clusters being related. For example, you could sample on home address but fit a model clustering on school.
14 | 
15 | The implementation allows for correlated random effects such as you get in quantitative genetics.
16 | 
17 | ## Disadvantages
18 | 
19 | Linear models only
20 | 
21 | Some loss of efficiency compared to just fitting a design-based linear model (if you don't care about the variance components)
22 | 
23 | There isn't (yet) an analog of the BLUPs of random effects, eg for small-area estimation
24 | 
25 | If your sampling units and model clusters are the same, and your design isn't too strongly informative, you can likely get more precise estimates of the variance components with
26 | stagewise pseudolikelihood as implemented in Stata or Mplus. 
27 | 


--------------------------------------------------------------------------------
/THANKS:
--------------------------------------------------------------------------------
1 | This code is based on research supported by the Marsden Fund Council 
2 | from Government funding, managed by Royal Society Te Apārangi
3 | 


--------------------------------------------------------------------------------
/data/milk_subset.rda:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/tslumley/svylme/426d6edd43c341e238e9a2e00079ea71a7501a2c/data/milk_subset.rda


--------------------------------------------------------------------------------
/data/nzmaths.rda:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/tslumley/svylme/426d6edd43c341e238e9a2e00079ea71a7501a2c/data/nzmaths.rda


--------------------------------------------------------------------------------
/data/pisa.rda:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/tslumley/svylme/426d6edd43c341e238e9a2e00079ea71a7501a2c/data/pisa.rda


--------------------------------------------------------------------------------
/inst/COPYRIGHTS:
--------------------------------------------------------------------------------
1 | The file R/svy2relmat.R contains code modified from the lme4qtl package.
2 | This is copyright Andrey Ziyatdinov, but is in turn based in part on
3 | the lme4 package, https://github.com/lme4/lme4. All these are GPL-3
4 | 


--------------------------------------------------------------------------------
/inst/scripts/README:
--------------------------------------------------------------------------------
1 | Examples
2 | 
3 | pairwise-milk:  milk yields, from pedigreemm. Large gene/environment example with varying group sizes
4 | milk-sampling: subsampling from the milk data
5 | twins-pairwise: bmi of twins, from mets.  Large data set of mostly pairs.
6 | twins-sampling: subsampling from the twins data
7 | svy2lmesim2: simulated data where PSU partially overlaps with model cluster
8 | 
9 | 


--------------------------------------------------------------------------------
/inst/scripts/milk-sampling.R:
--------------------------------------------------------------------------------
  1 | ## Milk data from pedigreemm: full-data pedigree fit and relationship matrix
  2 | library(pedigreemm)
  3 | 
  4 | data(milk)
  5 | 
  6 | ## animal id as character; yield rescaled by its standard deviation
  7 | milk$id <- as.character(milk$id)
  8 | milk$sdMilk <- milk$milk / sd(milk$milk)
  9 | 
 10 | system.time(
 11 |     m0 <- pedigreemm(sdMilk ~ lact + log(dim) + (1 | id) + (1 | herd),
 12 |                      data = milk, pedigree = list(id = pedCowsR), REML = FALSE)
 13 | )
 14 | 
 15 | ## relationship matrix from the pedigree, cut down to animals in the data
 16 | A_gen <- getA(pedCowsR)
 17 | ind <- rownames(A_gen) %in% milk$id
 18 | A_gen <- A_gen[ind, ind]
 19 | 
 20 | 
 21 | library(lme4qtl)
 22 | library(svylme)
 23 | library(sampling)
 21 | 
 22 | ## Simulate n response vectors from a fitted model at variance parameters theta.
 23 | ##
 24 | ## theta: values for the nonzero entries of Lambda (mapped through Lind)
 25 | ## model: fitted lme4-type model supplying Lambda, Zt, Lind, X, beta, sigmaML
 26 | ## n:     number of simulated response vectors
 27 | ##
 28 | ## Returns a matrix-like object with one simulated response per column.
 29 | simMilk<-function(theta,model, n){
 30 |     Lambda<-getME(model, "Lambda")
 31 |     Zt<-getME(model,"Zt")
 32 |     Lind<-getME(model, "Lind")
 33 |     Lambda@x<-theta[Lind]
 34 |     ## NOTE(review): the component is called sigmaML and svy2lme squares it
 35 |     ## to obtain s2, whereas here it is used unsquared and then passed
 36 |     ## through sqrt(); confirm which scale is intended.  Left unchanged so
 37 |     ## that the simulated data do not change.
 38 |     s2<-model@devcomp$cmp["sigmaML"]
 39 |     m<-nrow(Zt)
 40 |     ## standard-normal spherical random effects, one column per replicate
 41 |     u<-matrix(rnorm(m*n,0,1),ncol=n)
 42 |     U<-crossprod(Zt,Lambda)%*%u*sqrt(s2)
 43 |     ## sd= spelled out (was s=, relying on partial argument matching)
 44 |     Y<-drop(getME(model,"X")%*%model@beta)+U+matrix(rnorm(nrow(U)*n,0,sd=sqrt(s2)),ncol=n)
 45 |     Y
 46 | }
 34 | 
 35 | 
 36 | ## the seed is the arithmetic expression 2023-6-29, i.e. 1988
 37 | set.seed(2023 - 6 - 29)
 38 | sim_milk <- simMilk(m0@optinfo$val, m0, 2)
 39 | ## keep the first simulated response
 40 | milk$simMilk <- sim_milk[, 1]
 41 | 
 42 | ## herd totals of milk; p is proportional to the total and sums to 10
 43 | herds <- aggregate(milk$milk, list(milk$herd), sum)
 44 | herds$p <- herds[, 2] * 10 / sum(herds[, 2])
 42 | 
 43 | ## Coefficient vector from a svy2relmer fit: coef(model) followed by elements
 44 | ## 2, 5 and 1 of the unlisted coef(model, random=TRUE).
 45 | cfsvy <- function(model) {
 46 |     fixed <- coef(model)
 47 |     random <- unlist(coef(model, random = TRUE))
 48 |     c(fixed, random[c(2, 5, 1)])
 49 | }
 44 | 
 45 | ## Coefficient vector from an lme4-type fit: fixed effects, the first two
 46 | ## elements of VarCorr(model) unlisted, and the squared "sc" attribute.
 47 | cflmer <- function(model) {
 48 |     vc <- VarCorr(model)
 49 |     variances <- as.vector(unlist(vc[1:2]))
 50 |     c(fixef(model), variances, attr(vc, "sc")^2)
 51 | }
 49 | 
 50 | ## matrix from UPtillepi2 for the herd probabilities, labelled by herd on
 51 | ## both margins so it can be indexed by herd name
 52 | Pi2 <- UPtillepi2(herds$p)
 53 | dimnames(Pi2) <- rep(list(herds[, 1]), 2)
 52 | 
 53 | 
 54 | 
 55 | ## One simulation replicate.  Draws herds with UPtille, builds a survey design
 56 | ## on the animals in the drawn herds, and fits three models to the observed
 57 | ## (sdMilk) and then to the simulated (simMilk) response: relmatLmer,
 58 | ## svy2relmer on correlated pairs, and svy2relmer on all pairs with
 59 | ## subtracted margins.  Returns the six coefficient vectors from
 60 | ## cflmer/cfsvy concatenated in that order.
 61 | ## Reads herds, milk, Pi2 and A_gen from the calling workspace.
 62 | one.sim<-function(){
 63 |     picked<-as.logical(UPtille(herds$p))
 64 |     submilk<-subset(milk, herd %in% herds[picked,1])
 65 |     submilk$herd<-as.character(submilk$herd)
 66 | 
 67 |     ## herd probability looked up by herd name for every sampled animal
 68 |     submilk$p<-setNames(herds$p[picked], herds[picked,1])[submilk$herd]
 69 | 
 70 |     ## herd-level matrix expanded to one row/column per sampled animal
 71 |     PI2_sub<-Pi2[picked,picked][submilk$herd,submilk$herd]
 72 | 
 73 |     sub_milk_des<-svydesign(id=~herd,data=submilk, prob=~p,pps=ppsmat(PI2_sub))
 74 | 
 75 |     ## observed response
 76 |     m1a<-relmatLmer(sdMilk~lact+log(dim)+(1|id)+(1|herd),
 77 |                     data=submilk, relmat=list(id=A_gen),REML=FALSE)
 78 |     m2a<-svy2relmer(sdMilk~lact+log(dim)+(1|id)+(1|herd),
 79 |                     design=sub_milk_des, relmat=list(id=A_gen),return.devfun=TRUE)
 80 |     m3a<-svy2relmer(sdMilk~lact+log(dim)+(1|id)+(1|herd),
 81 |                     design=sub_milk_des, relmat=list(id=A_gen),
 82 |                     all.pairs=TRUE, subtract.margins=TRUE)
 83 | 
 84 |     ## simulated response
 85 |     m1b<-relmatLmer(simMilk~lact+log(dim)+(1|id)+(1|herd),
 86 |                     data=submilk, relmat=list(id=A_gen),REML=FALSE)
 87 |     m2b<-svy2relmer(simMilk~lact+log(dim)+(1|id)+(1|herd),
 88 |                     design=sub_milk_des, relmat=list(id=A_gen),return.devfun=TRUE)
 89 |     m3b<-svy2relmer(simMilk~lact+log(dim)+(1|id)+(1|herd),
 90 |                     design=sub_milk_des, relmat=list(id=A_gen),
 91 |                     all.pairs=TRUE, subtract.margins=TRUE)
 92 | 
 93 |     rval<-c(cflmer(m1a), cfsvy(m2a), cfsvy(m3a),
 94 |             cflmer(m1b), cfsvy(m2b), cfsvy(m3b))
 95 | }
 90 | 
 91 | results<-replicate(1000, tryCatch(one.sim(), error=function(e) rep(NA,36))) ## a failed replicate becomes 36 NAs (presumably 6 fits x 6 parameters -- confirm)
 92 | save(results,file="~/milk-sampling.rda") ## written to the user's home directory
 93 | 
 94 | 
 95 | milk_des<-svydesign(id=~1 ,data=milk) ## the whole data set as the design; no weights or probabilities are supplied
 96 | ## full-data fits of the observed outcome
 97 | true1a<-m0
 98 | true1b<-svy2relmer(sdMilk~lact+log(dim)+(1|id)+(1|herd),design=milk_des, relmat=list(id=A_gen))
 99 | trub1c<-svy2relmer(sdMilk~lact+log(dim)+(1|id)+(1|herd),design=milk_des, relmat=list(id=A_gen),all.pairs=TRUE, subtract.margins=TRUE) ## NOTE(review): the name looks like a typo for true1c
100 | 
101 | ## full-data fits of the simulated outcome
102 | true2a<-pedigreemm(simMilk~lact+log(dim)+(1|id)+(1|herd),data=milk, pedigree=list(id=pedCowsR), REML=FALSE)
103 | true2b<-svy2relmer(simMilk~lact+log(dim)+(1|id)+(1|herd),design=milk_des, relmat=list(id=A_gen))
104 | trub2c<-svy2relmer(simMilk~lact+log(dim)+(1|id)+(1|herd),design=milk_des, relmat=list(id=A_gen),all.pairs=TRUE, subtract.margins=TRUE) ## NOTE(review): the name looks like a typo for true2c
105 |   
106 | 


--------------------------------------------------------------------------------
/inst/scripts/pairwise-milk.R:
--------------------------------------------------------------------------------
 1 | library(pedigreemm)
 2 | 
 3 | data(milk)
 4 | 
 5 | milk <- within(milk, {
 6 |   id <- as.character(id)  ## ids as character strings
 7 |   sdMilk <- milk / sd(milk)  ## yield divided by its overall standard deviation
 8 | })
 9 | system.time(  ## reference ML fit using the pedigree directly
10 | m0<-pedigreemm(sdMilk~lact+log(dim)+(1|id)+(1|herd),data=milk, pedigree=list(id=pedCowsR), REML=FALSE)
11 | )
12 | ## relationship matrix from the pedigree, restricted to animals that appear in milk$id
13 | A_gen <- getA(pedCowsR)
14 | ind <- rownames(A_gen) %in% milk$id
15 | A_gen <- A_gen[ind, ind]
16 | 
17 | 
18 | library(lme4qtl)
19 | system.time(  ## same model through an explicit relationship matrix; REML is not switched off here, unlike m0
20 | m1<-relmatLmer(sdMilk~lact+log(dim)+(1|id)+(1|herd),data=milk, relmat=list(id=A_gen))
21 | )
22 | 
23 | 
24 | ## pairwise-likelihood fits, treating the whole data set as the design
25 | library(svylme)
26 | milk_des<-svydesign(id=~1,data=milk)
27 | system.time(  ## default: correlated pairs only
28 | m2<-svy2relmer(sdMilk~lact+log(dim)+(1|id)+(1|herd),design=milk_des, relmat=list(id=A_gen))
29 | )
30 | 
31 | system.time(  ## all pairs, computed by subtraction from the marginal likelihood
32 | m3<-svy2relmer(sdMilk~lact+log(dim)+(1|id)+(1|herd),design=milk_des, relmat=list(id=A_gen),all.pairs=TRUE, subtract.margins=TRUE)
33 | )
34 | 
35 | 
36 | simMilk<-function(theta,model, n){ ## n simulated response vectors (one per column) from a fitted mixed model; theta fills the covariance factor
37 |     Lambda<- getME(model, "Lambda") ## template for the relative covariance factor, refilled below
38 |     Zt<-getME(model,"Zt")
39 |     Lind<-getME(model, "Lind")
40 |     Lambda@x<- theta[Lind] ## plug the supplied theta into the factor's stored entries
41 |     s2<-model@devcomp$cmp["sigmaML"] ## NOTE(review): sigmaML appears to be the residual SD (what sigma() reports for ML fits), not the variance, so sqrt(s2) below may be unintended -- confirm; left as is so seeded results still reproduce
42 |     m<-nrow(Zt)
43 |     u<-matrix(rnorm(m*n,0,1),ncol=n) ## independent standard normal draws, one column per simulated data set
44 |     U<-crossprod(Zt,Lambda)%*%u*sqrt(s2) ## t(Zt) %*% Lambda %*% u, scaled by sqrt(s2)
45 |     Y<-drop(getME(model,"X")%*%model@beta)+U+matrix(rnorm(nrow(U)*n,0,sd=sqrt(s2)),ncol=n) ## fixed part + random part + noise; sd= spelled out rather than the partial match s=
46 |     Y
47 | }
48 | 
49 | 
50 | set.seed(2023-6-7) ## the argument is arithmetic (2023-6-7 = 2010), not a date
51 | sim_milk<-simMilk(m0@optinfo$val, m0,2) ## two simulated outcome columns from the fitted m0
52 | milk$simMilk<-sim_milk[,1] ## only the first column is used
53 | sim_milk_des<-svydesign(id=~1,data=milk) ## design rebuilt so that it contains the new simMilk column
54 | ## refit the three estimators to the simulated outcome
55 | m1a<-relmatLmer(simMilk~lact+log(dim)+(1|id)+(1|herd),data=milk, relmat=list(id=A_gen),REML=FALSE)
56 | m2a<-svy2relmer(simMilk~lact+log(dim)+(1|id)+(1|herd),design=sim_milk_des, relmat=list(id=A_gen),return.devfun=TRUE)
57 | m3a<-svy2relmer(simMilk~lact+log(dim)+(1|id)+(1|herd),design=sim_milk_des, relmat=list(id=A_gen),all.pairs=TRUE, subtract.margins=TRUE)
58 | 
59 | 
60 | 
61 | ## print all fits for side-by-side comparison
62 | m0
63 | m1
64 | m2
65 | m3
66 | 
67 | m1a
68 | m2a
69 | m3a


--------------------------------------------------------------------------------
/inst/scripts/pisa-analysis.R:
--------------------------------------------------------------------------------
 1 | library(svylme) ## provides nzmaths, svy2lme() and boot2lme(), and attaches survey for svydesign()
 2 | data(nzmaths)
 3 | 
 4 | nzmaths$cSTRATUM<- nzmaths$STRATUM
 5 | nzmaths$cSTRATUM[nzmaths$cSTRATUM=="NZL0102"]<-"NZL0202" ## merge stratum NZL0102 into NZL0202 (presumably to avoid a stratum with a single PSU -- confirm)
 6 | 
 7 | ## two-stage design: schools, then students within schools, with a weight for each stage
 8 | des<-svydesign(id=~SCHOOLID+STIDSTD, strata=~cSTRATUM, nest=TRUE,
 9 | 	weights=~W_FSCHWT+condwt, data=nzmaths)
10 | 
11 | des<-update(des, centPCGIRLS=PCGIRLS-0.5) ## proportion of girls centred at one half
12 | jkdes<-as.svrepdesign(des) ## replicate-weight version of the design, passed to boot2lme() below
13 | ## correlated-pairs fit (m1) and all-pairs fit (m2); the deviance function is kept for boot2lme()
14 | m1<-svy2lme(PV1MATH~ (1+ ST04Q01 |SCHOOLID)+ST04Q01*(centPCGIRLS+SMRATIO)+MATHEFF+OPENPS, design=des, return.devfun=TRUE)
15 | m2<-svy2lme(PV1MATH~ (1+ ST04Q01 |SCHOOLID)+ST04Q01*(centPCGIRLS+SMRATIO)+MATHEFF+OPENPS, design=des, return.devfun=TRUE,all.pairs=TRUE, subtract.margins=TRUE)
16 | ## replicate-weight variance estimates for both fits
17 | m1var<-boot2lme(m1,jkdes,verbose=TRUE)
18 | m2var<-boot2lme(m2,jkdes,verbose=TRUE)
19 | 


--------------------------------------------------------------------------------
/inst/scripts/svy2lmesim2.R:
--------------------------------------------------------------------------------
  1 | library(lme4)
  2 | library(svylme)
  3 | 
  4 | 
  5 | library(parallel)
  6 | RNGkind("L'Ecuyer-CMRG") ## generator with separate streams for parallel workers (used with mc.set.seed=TRUE below)
  7 | mcreplicate<-function(n, expr,...){ ## parallel analogue of replicate(): evaluate expr n times and simplify the results
  8 |     l<-mclapply(integer(n), eval.parent(substitute(function(...) expr)), mc.cores=6,mc.set.seed = TRUE, mc.preschedule=TRUE) ## expr is wrapped, unevaluated, in a function created in the caller's frame; six worker processes are hard-coded
  9 |     simplify2array(l, higher = TRUE) ## equal-length results become the columns of a matrix
 10 |     }
 11 | 
 12 | 
 13 | set.seed(2023-6-20) ## the argument is arithmetic (2023-6-20 = 1997), not a date
 14 | ## N2 x N1 grid population; each longitude value is one PSU
 15 | N1=400 
 16 | N2=400 
 17 | latitude<-1:N2
 18 | longitude<-1:N1
 19 | population<-expand.grid(lat=latitude,long=longitude)
 20 | population$PSU<-population$long
 21 | overlap=ceiling(N2*1/2) ## global default; f() takes its own overlap argument
 22 | 
 23 | 
 24 | cflmer<-function(model){ ## fixed effects, flattened VarCorr components, squared residual scale, standard errors, two zeros
 25 |     vc<-VarCorr(model); resid_var<-attr(vc,"sc")^2
 26 |     c(fixef(model), as.vector(unlist(vc[1:2])), resid_var, SE(model), c(0,0))
 27 |     }
 28 | cfsvy<-function(model){ ## fixed effects, diagonal of varb, s2, standard errors, two zeros
 29 |     vc<-coef(model, random=TRUE); beta<-coef(model)
 30 |     c(beta, diag(vc$varb),vc$s2,SE(model),c(0,0))
 31 |     }
 32 | 
 33 | cfglm<-function(model){ pad<-c(0,0); c(coef(model),pad, SE(model), pad) } ## coefficients and standard errors, each followed by two zeros (presumably to line up with cflmer/cfsvy -- confirm)
 34 | 
 35 | model_cluster<-function(population, overlap){
 36 |    ## Add a cluster id column to the population.
 37 |    ## Rows with lat<=overlap take their longitude as the id; the rest are
 38 |    ## shifted by lat-overlap and wrapped modulo the global N1.
 39 |    inside<-population$lat<=overlap
 40 |    shifted<-((population$long+population$lat-overlap) %% N1)+1
 41 |    
 42 |    population$cluster<-ifelse(inside, population$long, shifted)
 43 |    population
 44 | }
 45 | 
 46 | 
 47 | f<-function(overlap,REPS=1000){ ## build one population for this overlap, then draw REPS two-stage samples from it
 48 |     ## population covariates and outcome; the literal 400 matches the globals N1 and N2
 49 |     population<-model_cluster(population,overlap)
 50 |     population$x<- population$long %% 40
 51 |     population$z<-rnorm(400*400)
 52 |     population$u<-sort(rnorm(400))[population$cluster] ## cluster effects are sorted, so they increase with the cluster id
 53 |     population$y<- with(population, x+z + u+rnorm(400*400))    
 54 |     ## ten sampling strata, each made of 40 consecutive longitudes
 55 |     population$strata<-(population$long-1) %/% 40
 56 |     population$uid<-1:nrow(population)
 57 |     ## reference values from fitting lmer to the whole population
 58 |     true<-cflmer(lmer(y~x+z+(1|cluster), population))
 59 |     
 60 |     rr<-mcreplicate(REPS, {
 61 |         ## stage 1: stratified sample of PSUs, 68 in total
 62 |         stratsize<- c(20,5,4,3,2,2,3,4,5,20)
 63 |         names(stratsize)<-unique(population$strata)
 64 |         sstrat<-stratsample(population$strata[!duplicated(population$PSU)], stratsize)
 65 |         
 66 |         stage1psu<- population$PSU[!duplicated(population$PSU)][sstrat]
 67 |         stage1<- subset(population, PSU %in% stage1psu)
 68 |         
 69 |         ## stage 2: 20 units from the first and last sampled PSU, 8 from each of the other 66
 70 |         stratsize2<-rep(c(20,8,20),c(1,66,1))
 71 |         names(stratsize2)<-unique(stage1$PSU)
 72 |         stage2<-stage1[stratsample(stage1$PSU, stratsize2),]
 73 |         
 74 |         ## fpc1: 40 PSUs per stratum; fpc2: 400 units per PSU
 75 |         stage2$fpc1<-400/10
 76 |         stage2$fpc2<-400
 77 |         des<-svydesign(id=~PSU+uid, fpc=~fpc1+fpc2, strata=~strata,data=stage2)
 78 |         pair<-svy2lme(y~x+z+(1|cluster), design=des,return.devfun=TRUE)
 79 |         jkdes<-as.svrepdesign(des)
 80 |         jkvar<-boot2lme(pair,jkdes)
 81 |         ## pairwise fit, lmer on the sample, svyglm, then replicate-weight SEs after five leading zeros
 82 |         c(
 83 |             cfsvy(pair),
 84 |             ##cflmer(lmer(y~x+z+(1|cluster), population)),
 85 |             cflmer(lmer(y~x+z+(1|cluster), stage2)),
 86 |             cfglm(svyglm(y~x+z+(1|cluster), design=des)), ## NOTE(review): svyglm() has no random-effects syntax, so (1|cluster) is not a random intercept here -- confirm this term is intended
 87 |             rep(0,5),SE(jkvar,"beta"), SE(jkvar,"fullVar"), sqrt(vcov(jkvar,"s2"))
 88 |         )
 89 |     })
 90 |     ## summaries across replicates, reshaped to four rows (presumably one per stacked piece above -- confirm)
 91 |     list(
 92 |         overlap=overlap/N2,
 93 |         true=true,
 94 |         median=matrix(apply(rr, 1, median),byrow=TRUE,nrow=4),
 95 |         mad=matrix(apply(rr, 1, mad),byrow=TRUE,nrow=4)
 96 |     )
 97 | }
 98 | 
 99 | 
100 | ##results<- lapply(c(0.1,0.25,0.5,0.75,0.9,1)*N2, f)
101 | 
102 | 
103 | results_0.25<-replicate(100, f(N2*1/4)) ## 100 freshly generated populations, each sampled with the default REPS
104 | results_0.75<-replicate(100, f(N2*3/4))
105 | save(results_0.25,results_0.75, file="~/svy2lmesim-crossed1.rda") ## written to the user's home directory
106 | 
107 | 
108 | ## summaries
109 | ## > round(rowMeans(sapply(results_0.75["median",],function(x) x[1,])),3)
110 | ## [1] -0.121  1.006  1.000  0.993  0.965  0.247  0.010  0.078
111 | ## > round(rowMeans(sapply(results_0.75["mad",],function(x) x[1,])),3)
112 | ## [1] 0.278 0.013 0.092 0.189 0.126 0.072 0.003 0.021
113 | 


--------------------------------------------------------------------------------
/inst/scripts/twins-pairwise.R:
--------------------------------------------------------------------------------
 1 | data("twinbmi",package="mets")
 2 | library(svylme)
 3 | library(Matrix)
 4 | I_twin<-with(twinbmi, Matrix(outer(1:nrow(twinbmi),1:nrow(twinbmi),function(i,j) (id[i]==id[j]) & (i!=j)))) ## TRUE for two different rows sharing an id
 5 | I_mz<-with(twinbmi, Matrix(outer(1:nrow(twinbmi),1:nrow(twinbmi),function(i,j) (id[i]==id[j]) & (zyg[i]=="MZ") & (i!=j)))) ## the same, restricted to zyg=="MZ"
 6 | ## correlation matrices with unit diagonal; co-twin entries are 1 (env), 1/2 or 1 if MZ (add), 1/4 or 1 if MZ (dom)
 7 | n<-nrow(I_twin)
 8 | Phi_env<-I_twin+Diagonal(n)
 9 | Phi_add<-I_twin/2+I_mz/2+Diagonal(n)
10 | Phi_dom<-I_twin/4+I_mz*3/4+Diagonal(n)
11 | ## rows and columns are labelled by id, so rows sharing an id share a label
12 | dimnames(Phi_env)<-list(twinbmi$id,twinbmi$id)
13 | dimnames(Phi_add)<-list(twinbmi$id,twinbmi$id)
14 | dimnames(Phi_dom)<-list(twinbmi$id,twinbmi$id)
15 | 
16 | ## copies of id so that each relmat term below has its own grouping-variable name
17 | twinbmi$id2<-twinbmi$id
18 | twinbmi$id3<-twinbmi$id
19 | ## design clustered on id; no weights or probabilities are supplied
20 | des<-svydesign(id=~id,data=twinbmi)
21 | 
22 | ## environment
23 | svy2lme(bmi ~ age+gender+(1|id), design=des)
24 | svy2relmer(bmi ~ age+gender+(1|id), design=des,relmat=list(id=Phi_env))
25 | lme4::lmer(bmi ~ age+gender+(1|id),data=twinbmi)
26 | lme4qtl::relmatLmer(bmi ~ age+gender+(1|id),data=twinbmi,relmat=list(id=Phi_env))
27 | svy2lme(bmi ~ age+gender+(1|id), design=des,all.pairs=TRUE,subtract.margins=TRUE)
28 | 
29 | ## environment plus additive genetic
30 | svy2relmer(bmi ~ age+gender+(1|id)+(1|id2), design=des,relmat=list(id=Phi_env,id2=Phi_add))
31 | lme4qtl::relmatLmer(bmi ~ age+gender+(1|id)+(1|id2), data=twinbmi,relmat=list(id=Phi_env,id2=Phi_add))
32 | 
33 | 
34 | ## environment plus additive and dominant genetic
35 | svy2relmer(bmi ~ age+gender+(1|id)+(1|id2)+(1|id3), design=des,relmat=list(id=Phi_env,id2=Phi_add,id3=Phi_dom))
36 | lme4qtl::relmatLmer(bmi ~ age+gender+(1|id)+(1|id2)+(1|id3), data=twinbmi,relmat=list(id=Phi_env,id2=Phi_add,id3=Phi_dom))
37 | 


--------------------------------------------------------------------------------
/inst/scripts/twins-sampling.R:
--------------------------------------------------------------------------------
 1 | data("twinbmi",package="mets")
 2 | library(svylme)
 3 | library(lme4)
 4 | library(Matrix)
 5 | I_twin<-with(twinbmi, Matrix(outer(1:nrow(twinbmi),1:nrow(twinbmi),function(i,j) (id[i]==id[j]) & (i!=j)))) ## TRUE for two different rows sharing an id
 6 | I_mz<-with(twinbmi, Matrix(outer(1:nrow(twinbmi),1:nrow(twinbmi),function(i,j) (id[i]==id[j]) & (zyg[i]=="MZ") & (i!=j)))) ## the same, restricted to zyg=="MZ"
 7 | ## correlation matrices with unit diagonal; co-twin entries are 1 (env), 1/2 or 1 if MZ (add), 1/4 or 1 if MZ (dom)
 8 | n<-nrow(I_twin)
 9 | Phi_env<-I_twin+Diagonal(n)
10 | Phi_add<-I_twin/2+I_mz/2+Diagonal(n)
11 | Phi_dom<-I_twin/4+I_mz*3/4+Diagonal(n)
12 | ## rows and columns are labelled by id, so rows sharing an id share a label
13 | dimnames(Phi_env)<-list(twinbmi$id,twinbmi$id)
14 | dimnames(Phi_add)<-list(twinbmi$id,twinbmi$id)
15 | dimnames(Phi_dom)<-list(twinbmi$id,twinbmi$id)
16 | 
17 | ## copies of id so that each relmat term has its own grouping-variable name
18 | twinbmi$id2<-twinbmi$id
19 | twinbmi$id3<-twinbmi$id
20 | 
21 | ## sampling
22 | 
23 | ## whole twins
24 | ## absolute BMI difference within each id (0 when an id has a single record)
25 | twinbmi$dbmi<-with(twinbmi, ave(bmi,id, FUN=function(v) if (length(v)>1) abs(diff(v)) else 0))
26 | ## one entry per distinct id
27 | dup<-duplicated(twinbmi$id)
28 | uid<-twinbmi$id[!dup]
29 | udbmi<-twinbmi$dbmi[!dup]
30 | twinbmi$strata<-cut(twinbmi$dbmi, quantile(udbmi,(1:5)/5), include.lowest=TRUE) ## NOTE(review): the breaks start at the 20% quantile, so values below it get NA and only four strata are formed -- confirm this is intended
31 | nsample<-c(50,50,150,400)
32 | names(nsample)<-levels(twinbmi$strata)
33 | 
34 | results<-replicate(1000,{tryCatch({
35 | ## stratified sample of ids; every record belonging to a sampled id is kept
36 | insample<- twinbmi$id %in% uid[stratsample(twinbmi$strata[!dup], nsample)]
37 | twinbmi$fpc<-1383 ## the same fpc value for every row
38 | des<-svydesign(id=~id,data=twinbmi[insample,], strata=~strata, fpc=~fpc)
39 | 
40 | 
41 | 
42 | ## environment
43 | a<-svy2lme(bmi ~ age+gender+(1|id), design=des)
44 | b<-lme4::lmer(bmi ~ age+gender+(1|id),data=twinbmi[insample,])
45 | ##svy2lme(bmi ~ age+gender+(1|id), design=des,all.pairs=TRUE,subtract.margins=TRUE)
46 | 
47 | ## environment plus additive genetic
48 | d<-svy2relmer(bmi ~ age+gender+(1|id)+(1|id2), design=des,relmat=list(id=Phi_env,id2=Phi_add))
49 | e<-lme4qtl::relmatLmer(bmi ~ age+gender+(1|id)+(1|id2), data=twinbmi[insample,],relmat=list(id=Phi_env,id2=Phi_add))
50 | ## fixed effects followed by variance components on the square-root scale
51 | r1<-list(a=c(coef(a),sqrt(unlist(coef(a, random=TRUE))[2:1])),
52 |      b=c(fixef(b),c(sqrt(unlist(VarCorr(b)[1])),attr(VarCorr(b),"sc"))),
53 |      d=c(coef(d),sqrt(unlist(coef(d, random=TRUE))[c(2,5,1)])),
54 |      e=c(fixef(e),c(sqrt(unlist(VarCorr(e)[1:2])),attr(VarCorr(e),"sc")))
55 | )
56 | 
57 | ## individuals
58 | ## second stage: each record is kept independently with probability 1/2
59 | twinbmi$keep<-rbinom(nrow(twinbmi), 1, .5)
60 | twinsubsample <- subset(twinbmi[insample,], keep==1)
61 | twinsubsample$fpc2<-2
62 | iid<-1:nrow(twinsubsample) ## not a column of twinsubsample; the design formula finds it in the enclosing environment
63 | des2<-svydesign(id=~id+iid,data=twinsubsample, strata=~strata, fpc=~fpc+fpc2)
64 | 
65 | ## environment
66 | A<-svy2lme(bmi ~ age+gender+(1|id), design=des2)
67 | ##lme4::lmer(bmi ~ age+gender+(1|id),data=twinsubsample)
68 | B<-svy2lme(bmi ~ age+gender+(1|id), design=des2,all.pairs=TRUE,subtract.margins=TRUE)
69 | 
70 | ## environment plus additive genetic
71 | D<-svy2relmer(bmi ~ age+gender+(1|id)+(1|id2), design=des2,relmat=list(id=Phi_env,id2=Phi_add))
72 | ##lme4qtl::relmatLmer(bmi ~ age+gender+(1|id)+(1|id2), data=twinsubsample,relmat=list(id=Phi_env,id2=Phi_add))
73 | E<-svy2relmer(bmi ~ age+gender+(1|id)+(1|id2), design=des2,relmat=list(id=Phi_env,id2=Phi_add),all.pairs=TRUE,subtract.margins=TRUE)
74 | 
75 | 
76 | r2<-list(A=c(coef(A),sqrt(unlist(coef(A, random=TRUE))[2:1])),
77 |      B=c(coef(B),sqrt(unlist(coef(B, random=TRUE))[2:1])),
78 |      D=c(coef(D),sqrt(unlist(coef(D, random=TRUE))[c(2,5,1)])),
79 |      E=c(coef(E),sqrt(unlist(coef(E, random=TRUE))[c(2,5,1)]))
80 | )
81 | ## eight named estimate vectors per replicate
82 | c(r1,r2)
83 | }, error=function(e) NULL) ## a failed replicate yields NULL
84 | })
85 | 
86 | save(results, file="twin-sampling.rda") ## written to the current working directory
87 | 


--------------------------------------------------------------------------------
/man/boot2lme.Rd:
--------------------------------------------------------------------------------
  1 | \name{boot2lme}
  2 | \alias{boot2lme}
  3 | \alias{vcov.boot2lme}
  4 | %- Also NEED an '\alias' for EACH other topic documented here.
  5 | \title{
  6 | Resampling variances for svy2lme
  7 | }
  8 | \description{
  9 |   Computes variance estimates for the weighted-pairwise-likelihood
 10 |   linear mixed models fitted by \code{\link{svy2lme}} using replicate
 11 |   weights.  The replicate weights for a pair are obtained by dividing by
 12 |   the sampling weight and then multiplying by the replicate
 13 |   weight. There will be a warning if the ratio of replicate weight to
 14 |   sampling weight differs for observations in the same pair.  
 15 | }
 16 | \usage{
 17 | boot2lme(model, rdesign,  verbose = FALSE)
 18 | \method{vcov}{boot2lme}(object,
 19 |    parameter=c("beta", "theta","s2", "relSD" ,"SD","relVar","fullVar"),
 20 |    ...)
 21 | }
 22 | %- maybe also 'usage' for other objects documented here.
 23 | \arguments{
 24 |   \item{model}{
 25 | A model returned by \code{svy2lme} with the \code{return.devfun=TRUE} option
 26 | }
 27 |   \item{rdesign}{
 28 |   replicate-weights design corresponding to the design used to fit the model, see example
 29 | }
 30 |  
 31 |   \item{verbose}{
 32 | print progress information?
 33 | }
 34 | \item{object}{returned by \code{boot2lme}}
 35 | \item{\dots}{for method compatibility}
 36 | \item{parameter}{Variance matrix for: regression parameters, relative variance
 37 |   parameters on Cholesky square root scale, residual variance, relative
 38 |   standard errors of random effects, standard errors of random effects,
 39 |   entire relative variance matrix, entire variance matrix}
 40 | }
 41 | \details{
 42 | The variance is estimated from the replicates \code{thetastar} and original point estimate \code{theta} as \code{scale*sum(rscales* (thetastar-theta)^2)}. 
 43 | }
 44 | \value{
 45 |  For \code{boot2lme}, an object of class \code{boot2lme} with components
 46 |   \item{theta}{replicates of variance parameters (on Cholesky square
 47 |     root scale)}
 48 |   \item{beta}{replicates of regression parameters}
 49 |   \item{D}{replicates of relative variance matrix}
 50 |   \item{scale,rscales}{from the input}
 51 |   \item{formula}{model formula from the input}
 52 | 
 53 |   For the \code{vcov} method, a variance matrix.
 54 | }
 55 | 
 56 | 
 57 | 
 58 | \examples{
 59 | 
 60 | data(api, package="survey")
 61 | 
 62 | # two-stage cluster sample
 63 | dclus2<-svydesign(id=~dnum+snum, fpc=~fpc1+fpc2, data=apiclus2)
 64 | 
 65 | m0<-svy2lme(api00~(1|dnum)+ell+mobility, design=dclus2,return.devfun=TRUE)
 66 | jkdes<-as.svrepdesign(dclus2, type="mrb")
 67 | jkvar<-boot2lme(m0,jkdes)
 68 | 
 69 | SE(jkvar, "beta")
 70 | SE(jkvar, "SD")
 71 | SE(jkvar,"s2")
 72 | 
 73 | 
 74 | m1<-svy2lme(api00~(1|dnum)+ell+mobility,
 75 | design=dclus2,return.devfun=TRUE, all.pairs=TRUE, subtract.margins=TRUE)
 76 | jk1var<-boot2lme(m1,jkdes)
 77 | 
 78 | SE(jk1var, "beta")
 79 | SE(jk1var, "SD")
 80 | 
 81 | 
 82 | \donttest{
 83 | ##takes a few minutes
 84 | data(pisa)
 85 | 
 86 | pisa$w_condstuwt<-with(pisa, w_fstuwt/wnrschbw)
 87 | pisa$id_student<-1:nrow(pisa)
 88 | 
 89 | dpisa<-survey::svydesign(id=~id_school+id_student, weight=~wnrschbw+w_condstuwt, data=pisa)
 90 | 
 91 | m<-svy2lme(isei~(1+female|id_school)+female+high_school+college+one_for+both_for+test_lang,
 92 | 	design=dpisa, return.devfun=TRUE,method="nested")
 93 | 
 94 | bpisa<-as.svrepdesign(dpisa, type="bootstrap", replicates=100)
 95 | 
 96 | b<-boot2lme(m, bpisa, verbose=TRUE)
 97 | str(b)
 98 | 
 99 | vcov(b,"beta")
100 | vcov(b,"s2")
101 | 
102 | ## SE() inherits the parameter= argument
103 | SE(b,"beta")
104 | SE(b,"theta")
105 | SE(b,"SD")
106 | 
107 | }
108 | }
109 | % Add one or more standard keywords, see file 'KEYWORDS' in the
110 | % R documentation directory.
111 | \keyword{regression}% use one of  RShowDoc("KEYWORDS")
112 | \keyword{survey}% __ONLY ONE__ keyword per line
113 | 


--------------------------------------------------------------------------------
/man/milk_subset.Rd:
--------------------------------------------------------------------------------
 1 | \name{milk_subset}
 2 | \alias{milk_subset}
 3 | \alias{A_gen}
 4 | \docType{data}
 5 | \title{
 6 |   Milk production (subset)
 7 | }
 8 | \description{
 9 | A subset of a dataset from the \code{pedigreemm} package, created as an
10 | example for the \code{lme4qtl} package.  The original data had records
11 | of the milk production of 3397 lactations from first through fifth
12 | parity Holsteins. These were 1,359 cows, daughters of 38 sires in 57
13 | herds. The data was downloaded from the USDA internet site. All
14 | lactation records represent cows with at least 100 days in milk, with an
15 | average of 347 days. Milk yield ranged from 4,065 to 19,345 kg estimated
16 | for 305 days, averaging 11,636 kg. There were 1,314, 1,006, 640, 334 and
17 | 103 records from first through fifth lactation animals.  The
18 | subset is of cows from 3 sires. 
19 | 
20 |   
21 | }
22 | \usage{data("milk_subset")}
23 | \format{
24 |   A data frame with 316 observations on the following 13 variables.
25 |   \describe{
26 |     \item{\code{id}}{numeric identifier of cow}
27 |     \item{\code{lact}}{number of lactation for which production is measured}
28 |     \item{\code{herd}}{a factor indicating the herd}
29 |     \item{\code{sire}}{a factor indicating the sire}
30 |     \item{\code{dim}}{number of days in milk for that lactation}
31 |     \item{\code{milk}}{milk production estimated at 305 days}
32 |     \item{\code{fat}}{fat production estimated at 305 days}
33 |     \item{\code{prot}}{protein production estimated at 305 days}
34 |     \item{\code{scs}}{the somatic cell score}
35 |     \item{\code{sdMilk}}{\code{milk} scaled by cow-specific
36 |       standard deviation}
37 |     \item{\code{herd_id}}{a character vector indicating the herd}
38 |     \item{\code{one}}{a vector of 1s for convenience in weighting}
39 |     \item{\code{one2}}{another vector of 1s for convenience in weighting}
40 |   }
41 | }
42 | \details{
43 | This data example gives noticeably different results for full likelihood
44 | and pairwise likelihood because the model is misspecified.  The best
45 | fitting linear model for the large herd 89 is different, and that herd
46 | gets relatively more weight in the pairwise analysis (because it has
47 | more pairs).
48 | 
49 | }
50 | \source{
51 |   Constructed at \url{https://github.com/variani/lme4qtl/blob/master/vignettes/pedigreemm.Rmd}
52 | }
53 | \references{
54 |    2010. A.I. Vazquez, D.M. Bates, G.J.M. Rosa, D. Gianola and K.A. Weigel.
55 |    Technical Note: An R package for fitting generalized linear mixed models
56 |    in animal breeding. Journal of Animal Science, 88:497-504.
57 |  }
58 | \examples{
59 | data(milk_subset)
60 | herd_des<- svydesign(id = ~herd + id, prob = ~one + one2, data = milk_subset)
61 | lm(sdMilk ~ lact + log(dim),data=milk_subset,subset=herd==89)
62 | lm(sdMilk ~ lact + log(dim),data=milk_subset,subset=herd!=89)
63 | svy2lme(sdMilk ~ lact + log(dim) + (1|herd), design=herd_des,method="nested")
64 | svy2lme(sdMilk ~ lact + log(dim) + (1|herd), design=herd_des,method="general")
65 | 
66 | ## pairwise result is closer to herd 89 than to remainder
67 | lme4::lmer(sdMilk ~ lact + log(dim) + (1|herd), data=milk_subset)
68 | svy2relmer(sdMilk ~ lact + log(dim) + (1|id) + (1|herd), design=herd_des,
69 |     relmat = list(id = A_gen))
70 | 
71 | ## compare to all pairs
72 | svy2lme(sdMilk ~ lact + log(dim) + (1|herd),
73 | design=herd_des,method="general", all.pairs=TRUE)
74 | svy2lme(sdMilk ~ lact + log(dim) + (1|herd),
75 | design=herd_des,method="general", all.pairs=TRUE, subtract.margins=TRUE)
76 | 
77 | }
78 | \keyword{datasets}
79 | 


--------------------------------------------------------------------------------
/man/nzmaths.Rd:
--------------------------------------------------------------------------------
 1 | \name{nzmaths}
 2 | \alias{nzmaths}
 3 | \docType{data}
 4 | \title{
 5 | Maths Performance Data from the PISA 2012 survey in New Zealand
 6 | }
 7 | \description{
 8 | Data on maths performance, gender, some problem-solving variables and some school resource variables.
 9 | }
10 | \usage{data("nzmaths")}
11 | \format{
12 |   A data frame with 4291 observations on the following 26 variables.
13 |   \describe{
14 |     \item{\code{SCHOOLID}}{School ID}
15 |     \item{\code{CNT}}{Country id: a factor with levels \code{New Zealand}}
16 |     \item{\code{STRATUM}}{a factor with levels \code{NZL0101} \code{NZL0102} \code{NZL0202} \code{NZL0203}}
17 |     \item{\code{OECD}}{Is the country in the OECD?}
18 |     \item{\code{STIDSTD}}{Student ID}
19 |     \item{\code{ST04Q01}}{Gender: a factor with levels \code{Female} \code{Male}}
20 |     \item{\code{ST14Q02}}{Mother has university qualifications \code{No} \code{Yes}}
21 |     \item{\code{ST18Q02}}{Father has university qualifications \code{No} \code{Yes}}
22 |     \item{\code{MATHEFF}}{Mathematics Self-Efficacy: numeric vector}
23 |     \item{\code{OPENPS}}{Openness for Problem Solving: numeric vector}
24 |     \item{\code{PV1MATH},\code{PV2MATH},\code{PV3MATH},\code{PV4MATH},\code{PV5MATH} }{'Plausible values' (multiple imputations) for maths performance}
25 |     \item{\code{W_FSTUWT}}{Design weight for student}
26 |     \item{\code{SC35Q02}}{Proportion of maths teachers with professional development in maths in past year}
27 |     \item{\code{PCGIRLS}}{Proportion of girls at the school}
28 |     \item{\code{PROPMA5A}}{Proportion of maths teachers with ISCED 5A (math major)}
29 |     \item{\code{ABGMATH}}{Does the school group maths students: a factor with levels \code{No ability grouping between any classes} \code{One of these forms of ability grouping between classes for s} \code{One of these forms of ability grouping for all classes}}
30 |     \item{\code{SMRATIO}}{Number of students per maths teacher}
31 |     \item{\code{W_FSCHWT}}{Design weight for school}
32 |     \item{\code{condwt}}{Design weight for student given school}
33 |       }
34 | }
35 | 
36 | \source{
37 | A subset extracted from the \code{PISA2012lite} R package, \url{https://github.com/pbiecek/PISA2012lite}
38 | }
39 | \references{
40 | OECD (2013) PISA 2012 Assessment and Analytical Framework: Mathematics, Reading, Science, Problem Solving and Financial Literacy. OECD Publishing.
41 | }
42 | \examples{
43 | data(nzmaths)
44 | 
45 | oo<-options(survey.lonely.psu="average") ## only one PSU in one of the strata
46 | 
47 | des<-svydesign(id=~SCHOOLID+STIDSTD, strata=~STRATUM, nest=TRUE,
48 | 	weights=~W_FSCHWT+condwt, data=nzmaths)
49 | 
50 | ## This example works, but it takes more than five seconds to run, so it
51 | ## has been commented out
52 | ## m1<-svy2lme(PV1MATH~ (1+ ST04Q01 |SCHOOLID)+ST04Q01*(PCGIRLS+SMRATIO)+MATHEFF+OPENPS, design=des)
53 | 
54 | options(oo)
55 | 
56 | }
57 | \keyword{datasets}
58 | 


--------------------------------------------------------------------------------
/man/pisa.Rd:
--------------------------------------------------------------------------------
 1 | \name{pisa}
 2 | \alias{pisa}
 3 | \docType{data}
 4 | \title{
 5 | Data from the PISA international school survey
 6 | }
 7 | \description{
 8 | Data from the PISA survey of schools, obtained from Stata, who obtained it from Rabe-Hesketh & Skrondal. 
 9 | }
10 | \usage{data("pisa")}
11 | \format{
12 |   A data frame with 2069 observations on the following 11 variables.
13 |   \describe{
14 |     \item{\code{female}}{1 for female}
15 |     \item{\code{isei}}{socioeconomic index}
16 |     \item{\code{w_fstuwt}}{student sampling weight (total)}
17 |     \item{\code{wnrschbw}}{school sampling weight}
18 |     \item{\code{high_school}}{1 if highest level of parents' education is high school}
19 |     \item{\code{college}}{1 if highest level of parents' education is college/uni}
20 |     \item{\code{one_for}}{1 if one parent is foreign-born}
21 |     \item{\code{both_for}}{1 if both parents are foreign-born}
22 |     \item{\code{test_lang}}{1 if the test language is spoken at home}
23 |     \item{\code{pass_read}}{1 if the student passed a reading proficiency test}
24 |     \item{\code{id_school}}{school (sampling unit) identifier}
25 |   }
26 | }
27 | 
28 | \source{
29 | Data downloaded from
30 | \url{https://www.stata-press.com/data/r15/pisa2000.dta}
31 | }
32 | \references{
33 | Rabe-Hesketh, S., and A. Skrondal.  2006.  Multilevel modelling of
34 | complex survey data. Journal of the Royal Statistical Society, Series A, 169: 805-827
35 | }
36 | \examples{
37 | data(pisa)
38 | 
39 | ## This model doesn't make a lot of sense, but it's the one in the
40 | ## Stata documentation because the outcome variable is numeric.
41 | 
42 | pisa$w_condstuwt<-with(pisa, w_fstuwt/wnrschbw)
43 | pisa$id_student<-1:nrow(pisa)
44 | 
45 | dpisa<-survey::svydesign(id=~id_school+id_student, weight=~wnrschbw+w_condstuwt, data=pisa)
46 | 
47 | 
48 | svy2lme(isei~(1|id_school)+female+high_school+college+one_for+both_for+test_lang,
49 | 	design=dpisa)
50 | 
51 | 
52 | 
53 | 
54 | }
55 | \keyword{datasets}
56 | 


--------------------------------------------------------------------------------
/man/svy2lme.Rd:
--------------------------------------------------------------------------------
  1 | \name{svy2lme}
  2 | \alias{svy2lme}
  3 | \encoding{utf8}
  4 | \alias{coef.svy2lme}
  5 | %- Also NEED an '\alias' for EACH other topic documented here.
  6 | \title{
  7 | Linear mixed models by pairwise likelihood
  8 | }
  9 | \description{
 10 | Fits linear mixed models to survey data by maximising the profile pairwise composite
 11 | likelihood. 
 12 | }
 13 | \usage{
 14 | svy2lme(formula, design, sterr=TRUE,  return.devfun=FALSE,
 15 | method=c("general","nested"), all.pairs=FALSE, subtract.margins=FALSE)
 16 | \method{coef}{svy2lme}(object,...,random=FALSE)
 17 | }
 18 | %- maybe also 'usage' for other objects documented here.
 19 | \arguments{
 20 |   \item{formula}{
 21 |     Model formula as in the \code{lme4} package}
 22 |   \item{design}{
 23 |     A survey design object produced by \code{survey::svydesign}. The
 24 |     pairwise weights will be computed from this design, which must have
 25 |     separate probabilities or weights for each stage of sampling.
 26 |   }
 27 |   \item{sterr}{
 28 |     Estimate standard errors for fixed effects? Set to \code{FALSE} for
 29 |     greater speed when using resampling to get standard errors. Also,
 30 |     a PPS-without-replacement survey design can't get sandwich standard errors
 31 |     (because fourth-order sampling probabilities would be needed) 
 32 |   }
 33 | 
 34 |   \item{return.devfun}{If \code{TRUE}, return the deviance function as a
 35 |     component of the object. This will increase the memory use
 36 |     substantially, but allows for bootstrapping.}
 37 |   \item{method}{\code{"nested"} requires the model clusters to have a
 38 |     single grouping variable that is the same as the primary sampling
 39 |     unit. It's faster.}
 40 |     \item{all.pairs}{Only with \code{method="general"}, use all pairs
 41 |       rather than just correlated pairs?}
 42 |     \item{subtract.margins}{If \code{TRUE} and \code{all.pairs=TRUE},
 43 |     compute with all pairs by the faster algorithm involving subtraction
 44 |     from the marginal likelihood}
 45 |   \item{object}{\code{svy2lme} object}
 46 |   \item{\dots}{for method compatibility}
 47 |     \item{random}{if \code{TRUE}, the variance components rather than
 48 |     the fixed effects}
 49 | }
 50 | \details{
 51 |   The population pairwise likelihood would be the sum of the
 52 |     loglikelihoods for a pair of observations, taken over all pairs of
 53 |     observations from the same cluster.  This is estimated by taking a
 54 |     weighted sum over pairs in the sample, with the weights being the
 55 |     reciprocals of pairwise sampling probabilities. The advantage over
 56 |     standard weighted pseudolikelihoods is that there is no
 57 |     large-cluster assumption needed and no rescaling of weights. The
 58 |     disadvantage is some loss of efficiency and simpler point
 59 |     estimation.
 60 | 
 61 |     With \code{method="nested"} we have the method of Yi et al
 62 |     (2016). Using \code{method="general"} relaxes the conditions on the
 63 |     design and model. 
 64 |   
 65 |     The code uses \code{lme4::lmer} to parse the formula and produce
 66 |     starting values, profiles out the fixed effects and residual
 67 |     variance, and then uses \code{minqa::bobyqa} to maximise the
 68 |     resulting profile deviance.
 69 | 
 70 |     As with \code{lme4::lmer}, the default is to estimate the
 71 |     correlations of the random effects, since there is typically  no
 72 |     reason to assume these are zero. You can force two random effects to
 73 |     be independent by entering them in separate terms, eg
 74 |     \code{(1|g)+(-1+x|g)} in the model formula asks for a random intercept
 75 |     and a random slope with no random intercept, which will be uncorrelated.
 76 |     
 77 |     The internal parametrisation of the variance components uses the
 78 |     Cholesky decomposition of the relative variance matrix (the variance
 79 |     matrix divided by the residual variance), as in
 80 |     \code{lme4::lmer}. The component \code{object$s2} contains the
 81 |     estimated residual variance and the component \code{object$opt$par}
 82 |     contains the elements of the Cholesky factor in column-major order,
 83 |     omitting any elements that are forced to be zero by requiring
 84 |     independent random effects. 
 85 |     
 86 |     Standard errors of the fixed effects are currently estimated using a
 87 |     "with replacement" approximation, valid when the sampling fraction
 88 |     is small and superpopulation (model, process) inference is
 89 |     intended. The influence functions are added up within
 90 |     cluster, centered within strata, the residuals added up within strata, and then
 91 |     the crossproduct is taken within each stratum. The stratum variance
 92 |     is scaled by \code{ni/(ni-1)} where \code{ni} is the number of PSUs
 93 |     in the stratum, and then added up across strata. When the sampling
 94 |     and model structure are the same, this is the estimator of Yi et al,
 95 |     but it also allows for there to be sampling stages before the stages
 96 |     that are modelled, and for the model and sampling structures to be
 97 |     different.
 98 | 
 99 |     The \code{return.devfun=TRUE} option is useful if you want to
100 |     examine objects that aren't returned as part of the output. For
101 |     example, \code{get("ij", environment(object$devfun))} is the set of
102 |     pairs used in computation. 
103 |   
104 | }
105 | \value{
106 |   \code{svy2lme} returns an object with \code{print}, \code{coef}, and
107 |   \code{vcov} methods.
108 | 
109 |   The \code{coef} method with \code{random=TRUE} returns a two-element
110 |   list: the first element is the estimated residual variance, the second
111 |   is the matrix of estimated variances and covariances of the random effects.
112 |   
113 | }
114 | \references{
115 |   J.N.K. Rao, François Verret and Mike A. Hidiroglou "A weighted composite likelihood approach to inference for two-level models from survey data" Survey Methodology, December 2013  Vol. 39, No. 2, pp. 263-282
116 | 
117 |   Grace Y. Yi, J. N. K. Rao and Haocheng Li "A WEIGHTED COMPOSITE LIKELIHOOD APPROACH FOR ANALYSIS OF SURVEY DATA UNDER TWO-LEVEL MODELS" Statistica Sinica 
118 |   Vol. 26, No. 2 (April 2016), pp. 569-587
119 | }
120 | \author{
121 |   Thomas Lumley
122 | }
123 | \examples{
124 | 
125 | data(api, package="survey")
126 | 
127 | # one-stage cluster sample
128 | dclus1<-svydesign(id=~dnum, weights=~pw, data=apiclus1, fpc=~fpc)
129 | # two-stage cluster sample
130 | dclus2<-svydesign(id=~dnum+snum, fpc=~fpc1+fpc2, data=apiclus2)
131 | 
132 | svy2lme(api00~(1|dnum)+ell+mobility+api99, design=dclus1)
133 | svy2lme(api00~(1|dnum)+ell+mobility+api99, design=dclus2)
134 | svy2lme(api00~(1|dnum)+ell+mobility+api99, design=dclus2,method="nested")
135 | 
136 | lme4::lmer(api00~(1|dnum)+ell+mobility+api99, data=apipop)
137 | 
138 | ## Simulated
139 | 
140 | set.seed(2000-2-29)
141 | 
142 | df<-data.frame(x=rnorm(1000*20),g=rep(1:1000,each=20), t=rep(1:20,1000), id=1:20000)
143 | df$u<-with(df, rnorm(1000)[g])
144 | 
145 | df$y<-with(df, x+u+rnorm(1000,s=2))
146 | 
147 | ## oversample extreme `u` to bias random-intercept variance
148 | pg<-exp(abs(df$u/2)-2.2)[df$t==1]
149 | 
150 | in1<-rbinom(1000,1,pg)==1
151 | in2<-rep(1:5, length(in1))
152 | 
153 | sdf<-subset(df, (g \%in\% (1:1000)[in1]) & (t \%in\% in2))
154 | 
155 | p1<-rep(pg[in1],each=5)
156 | N2<-rep(20,nrow(sdf))
157 | 
158 | ## Population values
159 | lme4::lmer(y~x+(1|g), data=df)
160 | 
161 | ## Naive estimator: higher intercept variance
162 | lme4::lmer(y~x+(1|g), data=sdf)
163 | 
164 | ##pairwise estimator
165 | sdf$w1<-1/p1
166 | sdf$w2<-20/5
167 | 
168 | design<-survey::svydesign(id=~g+id, data=sdf, weights=~w1+w2)
169 | pair<-svy2lme(y~x+(1|g),design=design,method="nested")
170 | pair
171 | 
172 | pair_g<-svy2lme(y~x+(1|g),design=design,method="general")
173 | pair_g
174 | 
175 | all.equal(coef(pair), coef(pair_g))
176 | all.equal(SE(pair), SE(pair_g))
177 | 
178 | 
179 | }
180 | % Add one or more standard keywords, see file 'KEYWORDS' in the
181 | % R documentation directory.
182 | \keyword{regression }% use one of  RShowDoc("KEYWORDS")
183 | \keyword{survey }% __ONLY ONE__ keyword per line
184 | 


--------------------------------------------------------------------------------
/man/svy2relmer.Rd:
--------------------------------------------------------------------------------
  1 | \name{svy2relmer}
  2 | \alias{svy2relmer}
  3 | \encoding{utf8}
  4 | %- Also NEED an '\alias' for EACH other topic documented here.
  5 | \title{
  6 | Linear mixed models with correlated random effects
  7 | }
  8 | \description{
  9 | Fits linear mixed models by maximising the profile pairwise composite
 10 | likelihood. Allows for correlated random effects, eg, for genetic
 11 | relatedness (QTL) models
 12 | }
 13 | \usage{
 14 | svy2relmer(formula, design, sterr=TRUE, return.devfun=FALSE, relmat=NULL,
 15 |  all.pairs=FALSE, subtract.margins=FALSE )
 16 | }
 17 | %- maybe also 'usage' for other objects documented here.
 18 | \arguments{
 19 |   \item{formula}{
 20 |     Model formula as in the \code{lme4} package, or with terms like
 21 |     \code{(1|id)} for correlated random effects together with the
 22 |     \code{relmat} argument.
 23 |   }
 24 |   \item{design}{
 25 |     A survey design object produced by \code{survey::svydesign}. The
 26 |     pairwise weights will be computed from this design, which must have
 27 |     separate probabilities or weights for each stage of sampling.
 28 |   }
 29 |   \item{sterr}{
 30 |     Estimate standard errors for fixed effects? Set to \code{FALSE} for
 31 |     greater speed when using resampling to get standard errors.
 32 |   }
 33 | 
 34 |   \item{return.devfun}{If \code{TRUE}, return the deviance function as a
 35 |     component of the object. This will increase the memory use
 36 |     substantially, but allows for bootstrapping.}
 37 |   \item{relmat}{ Specifies a list of relatedness matrices that corresponds to one or
 38 |     more random-effect groupings (eg \code{(1|id)} in the \code{formula}
 39 |     together with \code{relmat=list(id=Phi)} implies a covariance matrix
 40 |     of \code{Phi} for the random effects before scaling). See Details and
 41 |     the vignettes.  }
 42 |   \item{all.pairs}{Use all pairs rather than just correlated pairs?}
 43 |     \item{subtract.margins}{If \code{TRUE} and \code{all.pairs=TRUE},
 44 |     compute with all pairs by the faster algorithm involving subtraction
 45 |     from the marginal likelihood}
 46 | }
 47 | \details{
 48 | 
 49 |     This function is very similar to \code{\link{svy2lme}} and only the
 50 |     differences are described here.
 51 | 
 52 |     Formula parsing and starting values use code based on the
 53 |     \code{lme4qtl} package.
 54 | 
 55 |     In \code{svy2lme} and \code{lme4::lmer}, the model is based on
 56 |     independent standard Normal random effects that are transformed to
 57 |     give random coefficients that might be correlated within observation
 58 |     but are either identical or independent between observations. In
 59 |     this function, the basic random effects in a term are multiplied by a square
 60 |     root of the \code{relmat} matrix for that term, giving basic random
 61 |     effects whose covariance between observations is proportional to the
 62 |     \code{relmat} matrix. For example, in a quantitative trait locus
 63 |     model in genetics, the matrix would be a genetic relatedness matrix.
 64 | 
 65 |     The  \code{relmat} matrices must have dimnames for matching to the
 66 |     id variable. It is permissible for the  \code{relmat} matrices to
 67 |     be larger than necessary -- eg, containing related units that are
 68 |     not in the sample -- since the dimnames will be used to select the
 69 |     relevant submatrix. 
 70 |     
 71 |     There can be only one random-effect term for each \code{relmat} term. If
 72 |     you need more, make a copy of the term with a different
 73 |     name.   
 74 | 
 75 |     The \code{return.devfun=TRUE} option is useful if you want to
 76 |     examine objects that aren't returned as part of the output. For
 77 |     example, \code{get("ij", environment(object$devfun))} is the set of
 78 |     pairs used in computation. 
 79 |   
 80 | }
 81 | \value{
 82 |   \code{svy2relmer} returns an object with \code{print}, \code{coef}, and
 83 |   \code{vcov} methods.
 84 | 
 85 |   
 86 | }
 87 | \references{
 88 | Ziyatdinov, A., Vázquez-Santiago, M., Brunel, H. et al. lme4qtl: linear mixed models with flexible covariance structure for genetic studies of related individuals. BMC Bioinformatics 19, 68 (2018). \url{https://bmcbioinformatics.biomedcentral.com/articles/10.1186/s12859-018-2057-x}
 89 | }
 90 | \author{
 91 |   Thomas Lumley
 92 | }
 93 | \examples{
 94 | data(milk_subset)
 95 | herd_des<- svydesign(id = ~herd + id, prob = ~one + one2, data = milk_subset)
 96 | 
 97 | svy2lme(sdMilk ~ lact + log(dim) + (1|herd), design=herd_des, method="general")
 98 | 
 99 | svy2relmer(sdMilk ~ lact + log(dim) + (1|id) + (1|herd), design=herd_des,
100 |     relmat = list(id = A_gen))
101 | 
102 | 
103 | }
104 | % Add one or more standard keywords, see file 'KEYWORDS' in the
105 | % R documentation directory.
106 | \keyword{regression }% use one of  RShowDoc("KEYWORDS")
107 | \keyword{survey }% __ONLY ONE__ keyword per line
108 | 


--------------------------------------------------------------------------------