Nothing
rm(list=ls())
library(SEERaBomb)
library(ggplot2)
library(dplyr)
load("~/data/SEER/mrgd/cancDef.RData")
load("~/data/SEER/mrgd/popsae.RData")
(tb=sort(table(canc$cancer),dec=T))
CANCS=c("AML","CML","MDS")
CANCS=names(tb)
CANCS=c("stomach","lung","melanoma","prostate")
CANCS=names(tb)[1:9]
CANCS=c("AML","MDS","CMML","AMLti","APL","MPN","CML") # second cancers of interest
D=canc
mds="clean"
mds="all"
cutyr=2001
if (mds=="clean") D=canc%>%filter(yrdx>=cutyr,cancer%in%CANCS,histo3!=9989) else
D=canc%>%filter(yrdx>=cutyr,cancer%in%CANCS)
D=D%>%mutate(year=yrdx,age=agedx+0.5) #let year=yrdx to match population column below
P=popsae%>%filter(year>=cutyr)
# make them all end at 98.5
D=D%>%filter(age<99)
stdUS=stdUS%>%filter(age<99)
P=P%>%filter(age<99)
r=data.frame(reg=levels(D$reg))
c=data.frame(cancer=CANCS)
cr=merge(c,r)
head(D)
head(P)
range(P$age)
m=D%>%group_by(cancer,db,reg,age)%>%summarize(cases=n())
p=P%>%group_by(db,reg,age)%>%summarise(py=sum(py))
p=left_join(cr,p)
d=left_join(p,m)
d[is.na(d$cases),"cases"]=0 #join left missings where zero's should be, so fix this
head(d)
head(stdUS)
tail(stdUS)
tail(d)
d1=d%>%
group_by(cancer,db,reg,age,add=F)%>%
summarize(cases=sum(cases),py=sum(py)/1e5)%>%
left_join(stdUS)%>%
mutate(ai=cases/py)%>%
summarize(vr=sum(cases*prop^2/py^2),stdIncid=weighted.mean(ai,w=prop),
stdLo=stdIncid-1.96*sqrt(vr),stdHi=stdIncid+1.96*sqrt(vr))
# head(d1)
graphics.off()
if(length(grep("linux",R.Version()$os))) windows <- function( ... ) X11( ... )
if(length(grep("darwin",R.Version()$os))) windows <- function( ... ) quartz( ... )
windows(width=12,height=7)
theme_set(theme_gray(base_size = 12))
# theme_get()
theme_update(
# axis.title = element_text(size = rel(3)),
legend.direction = "horizontal" #, # c(.96, .56),
# plot.margin = unit(c(.5,1,.5,.5),"lines")
)
# theme_get()
head(d1)
ggplot(aes(x=reg,y=stdIncid,col=db),data=d1)+
ylab("Age-adjusted Incidence (Cases/100,000 PY) US2000 Std")+
xlab("SEER Registry") +
ggtitle(paste0("Cancers in ",cutyr,"-2015")) +
geom_errorbar(aes(ymin=stdLo,ymax=stdHi))+
scale_colour_hue("Dataset", breaks = c("73", "92", "00"), labels = c("1973", "1992", "2000"))+
theme(axis.title = element_text(size = rel(1.2)),
legend.position = c(.87, .15),
axis.text.y = element_text(size = rel(1.5)),
plot.title = element_text(size = rel(2)),
axis.title.x = element_text(size = rel(1.7)),
axis.title.y = element_text(size = rel(1.3)),
strip.text = element_text(size = rel(2))
) +
facet_wrap(~cancer)
if (length(CANCS)>3) ggsave("~/Results/SEERaBomb/cancersVsregs.eps") else
ggsave(paste0("~/Results/SEERaBomb/mlVsregsMDS",mds,".eps"))
Any scripts or data that you put into this service are public.
Add the following code to your website.
For more information on customizing the embed code, read Embedding Snippets.