wb.stats: [R] Scanning node statistics from WinBUGS output

> source('c:/users/pbelisle/My Documents/Home/bin/R/fcts/WBStats.R') # load file where wb.stats R function is defined
> u <- wb.stats('c:/users/pbelisle/My Documents/Home/MyProject/WinBUGS/log/mywinbugsoutput.txt', return.as.list=F) # read (all) the node statistics from the cited WinBUGS text output file
> u

	mean	sd	MC error	2.5%	median	97.5%	start	sample
x.p.null[1]	6.5e-01	6.7e-02	1.1e-03	5.2e-01	6.6e-01	7.8e-01	5.0e+03	2.0e+04
x.p.null[2]	5.0e-02	2.7e-02	5.7e-04	6.9e-03	4.7e-02	1.1e-01	5.0e+03	2.0e+04
x.mu[1]	5.5e+00	2.8e-01	1.2e-02	5.0e+00	5.5e+00	6.1e+00	5.0e+03	2.0e+04
x.mu[2]	8.2e+00	2.4e-01	3.3e-03	7.7e+00	8.2e+00	8.7e+00	5.0e+03	2.0e+04
x.mudiff	2.7e+00	3.6e-01	1.1e-02	2.0e+00	2.7e+00	3.4e+00	5.0e+03	2.0e+04
x.sd.between[1]	7.0e-01	3.8e-01	2.5e-02	5.2e-02	7.2e-01	1.4e+00	5.0e+03	2.0e+04
x.sd.between[2]	1.7e+00	1.9e-01	2.1e-03	1.4e+00	1.7e+00	2.1e+00	5.0e+03	2.0e+04
x.sd.within[1]	7.5e-01	3.3e-01	1.6e-02	1.2e-01	7.6e-01	1.4e+00	5.0e+03	2.0e+04
x.sd.within[2]	9.3e-01	8.9e-02	1.3e-03	7.8e-01	9.3e-01	1.1e+00	5.0e+03	2.0e+04
prev	8.2e-01	6.2e-02	1.5e-03	6.9e-01	8.3e-01	9.3e-01	5.0e+03	2.0e+04

# Read the same WinBUGS output file as above, but select only a subset of the nodes found therein
> u <- wb.stats('c:/users/pbelisle/My Documents/Home/MyProject/WinBUGS/log/mywinbugsoutput.txt', nodes=c('x.mudiff', 'prev'), return.as.list=F)
> u

	mean	sd	MC error	2.5%	median	97.5%	start	sample
x.mudiff	2.7e+00	3.6e-01	1.1e-02	2.0e+00	2.7e+00	3.4e+00	5.0e+03	2.0e+04
prev	8.2e-01	6.2e-02	1.5e-03	6.9e-01	8.3e-01	9.3e-01	5.0e+03	2.0e+04

# Read the same WinBUGS output file as above, but select only a subset of the nodes found therein and only a few node statistics; the output is returned as a list, which is the default (return.as.list=TRUE) whenever more than one node statistic is requested
> u <- wb.stats('c:/users/pbelisle/My Documents/Home/MyProject/WinBUGS/log/mywinbugsoutput.txt', nodes=c('prev', 'x.mu'), node.statistics=c('mean', 'median'))
> u

$prev
$prev$mean
[1] 0.82

$prev$median
[1] 0.83

$x.mu
$x.mu$mean
x.mu[1] x.mu[2]
5.5 8.2

$x.mu$median
x.mu[1] x.mu[2]
5.5 8.2

# wb.stats: read the node statistics table found in a WinBUGS text output file.
#
# Arguments:
#   file             path of the WinBUGS text output (log) file to scan.
#   nodes            optional character vector of node names to keep. A name
#                    matches either a full row name (e.g. 'x.mu[2]') or the
#                    part of a row name that precedes '[' (e.g. 'x.mu').
#                    When empty (default), all nodes are kept.
#   node.statistics  names of the statistics (columns) to return, matched
#                    case-insensitively against the eight WinBUGS statistics.
#   return.as.list   if TRUE, return a list with one element per node base
#                    name; if FALSE, return a numeric matrix (nodes in rows,
#                    statistics in columns). Defaults to TRUE when more than
#                    one statistic is requested.
#
# Value:
#   Either a numeric matrix or a list (see return.as.list). In list form each
#   node element is itself a list with one entry per statistic (statistics in
#   sorted order), or a plain numeric vector when a single statistic was
#   requested.
#
# Only lines containing a tab are considered. Lines containing '#' or '/' are
# dropped, and so is any remaining line that does not consist of exactly one
# node name followed by the eight statistics.
wb.stats <- function(file, nodes=character(0),
                     node.statistics=c("mean", "sd", "MC error", "2.5%", "median", "97.5%", "start", "sample"),
                     return.as.list=length(node.statistics)>1)
{
   # Exhaustive list of node stats returned by WinBUGS
   wb.node.statistics <- c("mean", "sd", "MC error", "2.5%", "median", "97.5%", "start", "sample")

   # Validate the requested statistics up front: an unknown name would
   # otherwise silently produce a column of NAs
   w.stats <- match(tolower(node.statistics), tolower(wb.node.statistics))
   if (any(is.na(w.stats)))
   {
     stop("unknown node statistic(s): ",
          paste(node.statistics[is.na(w.stats)], collapse=", "),
          call.=FALSE)
   }

   wblog <- scan(file, sep='\n', what="", quiet=TRUE)
   wblog <- wblog[grepl('\t', wblog)]

   # Remove node stats header line(s) -- if found twice, ignore lines below second occurrence
   median.found <- grep('\\smedian', wblog, perl=TRUE)
   if (length(median.found) > 1) wblog <- wblog[seq_len(median.found[2]-1)]
   # Guard: with no header at all, a negative NA index would wipe out the data
   if (length(median.found) > 0) wblog <- wblog[-median.found[1]]

   # remove lines with comments (possible if output was modified)
   wblog <- wblog[!grepl('#', wblog)]

   wblog <- gsub('\\s+', ' ', wblog, perl=TRUE)
   # remove leading space (anchored, so that a line with no leading space
   # keeps the separator between the node name and its first statistic)
   wblog <- sub('^\\s', '', wblog, perl=TRUE)
   wblog <- wblog[nchar(wblog)>0] # drop empty lines

   # drop lines with /odds ratio/
   wblog <- wblog[!grepl("/", wblog)]

   # Keep only well-formed rows (node name + 8 statistics); other tabbed
   # lines of the log would otherwise misalign the whole table
   n.fields <- length(wb.node.statistics) + 1
   fields <- strsplit(wblog, ' ', fixed=TRUE)
   fields <- fields[vapply(fields, length, integer(1)) == n.fields]

   # as.character() turns the NULL obtained from an empty list into
   # character(0), giving a valid 0-row matrix when no node row was found
   wblog <- matrix(as.character(unlist(fields)), byrow=TRUE, ncol=n.fields)
   nodes.names <- wblog[,1]
   wblog <- matrix(suppressWarnings(as.numeric(wblog[,-1,drop=FALSE])),
                   nrow=nrow(wblog), ncol=length(wb.node.statistics))
   colnames(wblog) <- wb.node.statistics
   rownames(wblog) <- nodes.names

   # Keep only required node statistics
   wblog <- wblog[,w.stats,drop=FALSE]

   if (length(nodes))
   {
     # A requested name matches the full node name or its base name (before '[')
     nodes.names0 <- sub('\\[.*', '', nodes.names, perl=TRUE)
     keep <- (nodes.names0 %in% nodes) | (nodes.names %in% nodes)
     wblog <- wblog[keep,,drop=FALSE]
   }

   if (return.as.list)
   {
     stats <- sort(colnames(wblog))
     n.stats <- length(stats)

     base.names <- sub("\\[.*", "", rownames(wblog), perl=TRUE)
     dimensions <- unique(sort(base.names))

     # lapply copes with zero selected nodes (returns an empty list)
     out <- lapply(dimensions, function(d)
     {
       w <- which(base.names==d)
       my.out <- lapply(stats, function(s) wblog[w, s])

       if (n.stats == 1)
       {
         my.out <- unlist(my.out)
       }
       else
       {
         names(my.out) <- stats
       }

       my.out
     })

     names(out) <- dimensions
   }
   else
   {
     out <- wblog
   }

   out
} # end of wb.stats