## Attach the packages this report needs.  library() is used instead of
## require() so that a missing package stops the run at once; require()
## only returns FALSE (with a warning) and the script would then fail
## later with an unrelated error.
library(Hmisc)
library(plotly)
library(htmlTable)
## Source hreport code directly from local files
## NOTE(review): presumably these define accrualReport(), exReport() and the
## hreport option functions called below -- confirm
source('~/R/hreport/R/Misc.r')
source('~/R/hreport/R/accrualReport.r')
source('~/R/hreport/R/exReport.r')
mu   <- markupSpecs$html   # in Hmisc - HTML markups
frac <- mu$frac
mu$styles()                # define HTML styles, functions
## Generate test data
## Seed the generator so the simulated data set is the same on every run
set.seed(1)
n <- 500
## country is drawn before the raw site number; the site number is then
## prefixed with the first two letters of the country to form the site ID
d <- data.frame(
  country = sample(c('US', 'Canada', 'Spain', 'France', 'Germany'),
                   size = n, replace = TRUE),
  site    = sample(1:10, size = n, replace = TRUE)
)
d[['site']]   <- paste0(substr(d[['country']], 1, 2), d[['site']])
## US and Canada are labelled North America; every other country is Europe
d[['region']] <- factor(ifelse(is.element(d[['country']], c('US', 'Canada')),
                               'North America', 'Europe'))
## Add an enrollment date (edate) and a randomization date (rdate).
## edate is 2005-01-01 plus a rounded gamma draw, shifted 600 days earlier
## for US subjects; rdate follows edate by a rounded uniform(1, 30) draw.
d <- upData(
  d,
  edate = as.Date('2005-01-01') +
          round(rgamma(n, shape = 2, rate = .01)) -
          600 * (country == 'US'),
  rdate = edate + round(runif(n, min = 1, max = 30)),
  print = FALSE
)
## Blank the randomization date where a fresh uniform draw is below 0.5:
## these rows are the non-randomized subjects
d$rdate <- replace(d$rdate, runif(nrow(d)) < 0.5, NA)
# with(d, table(region, country))
## Hand calculation, for US subjects only, of the number randomized per
## month, to compare against the values shown in the report charts
us   <- d[d$country == 'US', , drop = FALSE]
site <- us[['site']]
ed   <- us[['edate']]
rd   <- us[['rdate']]
## Time from each enrollment date to 2007-12-31, in days divided by the
## average month length (365.25 / 12)
months <- difftime(as.Date('2007-12-31'), ed, units = 'days') / (365.25 / 12)
m <- max(months)
## Number randomized divided by the longest elapsed time
a <- (length(rd) - sum(is.na(rd))) / as.numeric(m)   # .8545774 (agrees with chart)
## Per site per month: take the longest elapsed time within each site,
## add these up over sites and use the total as the denominator
maxpersite <- tapply(X = months, INDEX = site, FUN = max)
b <- (length(rd) - sum(is.na(rd))) / sum(maxpersite)
## 0.0864429 = 47 / 543.6715   chart: .08645 (rounded)
## Pretend the official counts of enrolled and randomized subjects are
## larger than the numbers that actually reached the dataset
denom <- c(enrolled   = 1.1 * nrow(d),
           randomized = 10 + sum(!is.na(d[['rdate']])))
sethreportOption(tx.var = 'treat', denom = denom)
## Start the appendix file (holds information such as subject IDs) with
## empty content, so that every later write to it can use append=TRUE
appfile <- gethreportOption('appfile')
cat('', file = appfile)
Introduction
Interactive Graphs
Most of the graphs produced here are semi-interactive. One can hover over elements of graphs with the mouse to have detailed information pop up.
Extended Box Plots
For depicting distributions of continuous variables, many of the following displays use extended box plots, also called box–percentile plots. A prototype, with explanations, is below.
# Draw the prototype extended box plot referred to in the paragraph above;
# bpplt() is called with no arguments
bpplt()

Dot Charts
Dot charts are used to present stratified proportions. In these charts the area of the symbols is proportional to the square root of the denominator. The legend shows representative denominators and their corresponding symbol areas, using denominators that actually occurred in the data and extending from the minimum observed to the maximum observed sample size.
Survival Curves
Graphs containing pairs of Kaplan-Meier survival curves show a shaded region centered at the midpoint of the two survival estimates and having a height equal to the half-width of the approximate 0.95 pointwise confidence interval for the difference of the two survival probabilities. Time points at which the two survival estimates do not touch the shaded region denote approximately significantly different survival estimates, without any multiplicity correction.
Accrual
## Accrual report for the simulated data d.  The left-hand side of the
## formula names the enrollment date (edate) and randomization date (rdate);
## the right-hand side names the region, country and site variables.
accrualReport(enroll(edate) + randomize(rdate) ~
region(region) + country(country) + site(site),
data=d,
dateRange=c('2005-01-01', '2007-12-31'),
## NOTE(review): presumably the target counts for edate and rdate at each of
## the two targetDate values -- confirm against accrualReport
targetN=
data.frame(edate=c(500, 1000), rdate=c(250, 500)),
targetDate=c('2006-01-01', '2007-12-31'),
closeDate='2007-12-31')
Study Numbers
Number
|
Category
|
5
|
Countries
|
50
|
Sites
|
500
|
Participants enrolled
|
260
|
Participants randomized
|
5.2
|
Participants per site
|
50
|
Sites randomizing
|
5.2
|
Subjects randomized per randomizing site
|
55.1
|
Months from first subject randomized (2003-05-29) to 2007-12-31
|
1873.8
|
Site-months for sites randomizing
|
37.5
|
Average months since a site first randomized
|
0.14
|
Participants randomized per site per month
|
15
|
Mean days from enrollment to randomization
|
15
|
Median days from enrollment to randomization
|
∟ Participants enrolled over time
The blue line depicts the cumulative frequency. The thick grayscale line represents targets.
|
Category
|
N
|
Used
|
Enrolled
|
550
|
500
|
|
|
∟ Participants randomized over time
The blue line depicts the cumulative frequency. The thick grayscale line represents targets.
|
Category
|
N
|
Used
|
Enrolled
|
550
|
260
|
Randomized
|
270
|
260
|
|
|
∟ Days from enrollment to randomization
Quartiles and mean number of days by region and country
|
Category
|
N
|
Used
|
Enrolled
|
550
|
260
|
Randomized
|
270
|
260
|
|
|
∟ Number of sites × number of participants
Number of sites having the given number of participants
|
Category
|
N
|
Used
|
Enrolled
|
550
|
260
|
Randomized
|
270
|
260
|
|
|
∟ Participants enrolled by region and country
∟ Participants randomized by region and country
∟ Sites that enrolled by region and country
∟ Sites that randomized by region and country
∟ Fraction of enrolled participants randomized by region and country
∟ Participants randomized per month by region and country
∟ Participants randomized per site per month by region and country
Exclusions
## Add the variables used by the exclusion report: a subject ID, a pending
## indicator, seven binary exclusion indicators (e1-e7), a 'tested' flag
## and a randomized flag.  The arguments are kept in their original order
## so the random draws are consumed in the same sequence.
d <- upData(
  d,
  subjid = seq_len(n),
  pend   = rbinom(n, size = 1, prob = .1),
  e1     = rbinom(n, size = 1, prob = .02),
  e2     = rbinom(n, size = 1, prob = .02),
  e3     = rbinom(n, size = 1, prob = .02),
  ## e4 is set to missing wherever a uniform draw falls below 0.25
  e4     = ifelse(runif(n) < 0.25, NA, rbinom(n, size = 1, prob = .10)),
  tested = rbinom(n, size = 1, prob = .75),
  ## e5 has a value only where tested is non-zero, otherwise NA
  e5     = ifelse(tested, rbinom(n, size = 1, prob = .04), NA),
  e6     = rbinom(n, size = 1, prob = .02),
  e7     = rbinom(n, size = 1, prob = .02),
  rndz   = rbinom(n, size = 1, prob = .75),
  labels = c(e1 = 'Prior MI',
             e2 = 'History of Asthma',
             e3 = 'History of Upper GI Bleeding',
             e4 = 'No Significant CAD',
             e5 = 'Inadequate Renal Function',
             e6 = 'Pneumonia within 6 weeks',
             e7 = 'Prior cardiac surgery'),
  print  = FALSE
)
## Extra per-subject data for subject IDs 1 to 50: a randomly drawn loc
## value for each; passed to exReport() as erdata
erd <- data.frame(
  subjid = seq_len(50),
  loc    = sample(c('gastric', 'lung', 'trachea'), size = 50, replace = TRUE)
)
# To check warning messages: the denom given to sethreportOption does not
# match the counts implied by pend, e1-e7
# Exclusion report: pend is the pending indicator, e1-e7 the exclusions,
# rndz the randomized indicator and subjid the subject ID.  erd is supplied
# as erdata, and whenapp attaches the text 'CCTA done' to e4.
# NOTE(review): cond(e5, 'Tested', tested) presumably restricts e5 to
# subjects with tested set -- confirm against exReport
exReport(~ pending(pend) + e1 + e2 + e3 + e4 + e5 + e6 + e7 +
randomized(rndz) + id(subjid) + cond(e5, 'Tested', tested),
erdata = erd,
whenapp= c(e4='CCTA done'), data=d) #, hc=3.75, h=4)
∟ Cumulative exclusions
Cumulative number of exclusions (\(y\)-axis) and number of additional exclusions after exclusions placed higher, for participants not actually randomized. Exclusions are sorted by descending number of incremental exclusions. 550 participants were enrolled, 12 non-excluded participants are pending randomization, and 20 participants were excluded. 371 participants were randomized. Note: Number of observations (500) does not equal number officially enrolled (550). Note: Number of enrolled (488) minus number excluded (20) does not match official number randomized (270).
◫ Exclusions
Incremental exclusions are those in addition to exclusions in earlier rows. Marginal exclusions are numbers of participants excluded for the indicated reason whether or not they were excluded for other reasons. The three Fractions are based on incremental exclusions.
Exclusions
|
Incremental Exclusions
|
Marginal Exclusions
|
Fraction of Enrolled
|
Fraction of Exclusions
|
Fraction Remaining
|
|
No Significant CAD (CCTA done, n=386)
|
6
|
6
|
0.012
|
0.30
|
0.988
|
Prior Cardiac Surgery
|
4
|
4
|
0.008
|
0.20
|
0.980
|
Inadequate Renal Function / 373
|
3
|
3
|
0.006
|
0.15
|
0.973
|
3⁄367 = 0.008 of Tested
|
Prior MI
|
2
|
3
|
0.004
|
0.10
|
0.969
|
History of Upper GI Bleeding
|
2
|
2
|
0.004
|
0.10
|
0.965
|
Pneumonia within 6 Weeks
|
2
|
2
|
0.004
|
0.10
|
0.961
|
History of Asthma
|
1
|
1
|
0.002
|
0.05
|
0.959
|
Total
|
20
|
|
0.041
|
1.00
|
0.959
|
◫ Exclusions in randomized participants
Frequency of exclusions for participants marked as randomized
Exclusion
|
Frequency
|
Prior MI
|
8
|
History of Asthma
|
7
|
History of Upper GI Bleeding
|
7
|
No Significant CAD
|
42
|
Inadequate Renal Function
|
15
|
Pneumonia within 6 Weeks
|
7
|
Prior Cardiac Surgery
|
8
|
Total Participants with Any Exclusion
|
84
|
▼Click arrow at left to show participant IDs:
Exclusion
|
IDs
|
Prior MI
|
87, 127, 209, 250, 274, 321, 442, 448
|
History of Asthma
|
17, 62, 68, 121, 122, 127, 462
|
History of Upper GI Bleeding
|
64, 202, 307, 310, 330, 449, 462
|
No Significant CAD
|
6, 7, 10, 22, 27, 37, 39, 53, 67, 112, 113, 118, 122, 143, 145, 175, 179, 184, 226, 227, 249, 255, 278, 282, 289, 291, 297, 321, 330, 344, 359, 361, 371, 377, 385, 402, 438, 451, 455, 471, 482, 499
|
Inadequate Renal Function
|
24, 37, 46, 70, 88, 154, 183, 194, 226, 234, 242, 292, 295, 322, 484
|
Pneumonia within 6 Weeks
|
29, 166, 230, 235, 313, 447, 473
|
Prior Cardiac Surgery
|
171, 191, 344, 377, 388, 389, 477, 482
|
▼Click arrow at left to see more information about those participants:
subjid
|
loc
|
6
|
gastric
|
7
|
gastric
|
10
|
trachea
|
17
|
lung
|
22
|
trachea
|
24
|
gastric
|
27
|
lung
|
29
|
trachea
|
37
|
trachea
|
39
|
lung
|
46
|
gastric
|
# Show exclusions in original variable order
# Disabled example (never runs): the same exclusion report, called with
# sort=FALSE and app=FALSE
if (FALSE) {
  exReport(~ pending(pend) + e1 + e2 + e3 + e4 + e5 + e6 + e7 +
             randomized(rndz) + id(subjid) + cond(e5, 'Tested', tested),
           erdata  = erd,
           whenapp = c(e4 = 'CCTA done'),
           data    = d,   # hc=3.75, h=4,
           sort    = FALSE,
           app     = FALSE)
}
