Nothing
mapCancs<-function(D){
ICD9=D$ICD9
# histo2=D$histo2
histo3=D$histo3
cancer=rep("other",dim(D)[1])
cancer[(ICD9==9999)]="unknown"
# cancer[(ICD9<1450)]="l140"
cancer[(ICD9>=2300)&(ICD9<2310)]="giCIS"
cancer[(ICD9>=2310)&(ICD9<2320)]="respCIS"
cancer[(ICD9>=2320)&(ICD9<2330)]="skinCIS"
cancer[(ICD9==2330)]="breastCIS"
cancer[(ICD9==2331)]="cervixCIS"
cancer[(ICD9>=2332)&(ICD9<=2333)]="femGenCIS"
cancer[(ICD9>=2334)&(ICD9<=2336)]="maleGenCIS"
cancer[(ICD9>=2337)&(ICD9<2340)]="guCIS"
cancer[(ICD9>=2340)&(ICD9<2349)]="otherCIS"
cancer[(ICD9>=1400)&(ICD9<1500)]="oral"
cancer[(ICD9>=1500)&(ICD9<=1509)]="esophagus"
cancer[(ICD9>=1510)&(ICD9<=1519)]="stomach"
cancer[(ICD9>=1520)&(ICD9<=1529)]="intestine"
cancer[(ICD9>=1530)&(ICD9<=1539)]="colon"
cancer[(ICD9>=1540)&(ICD9<=1549)]="rectal"
cancer[(ICD9>=1550)&(ICD9<=1559)]="liver"
cancer[(ICD9>=1560)&(ICD9<=1569)]="gallBladder"
cancer[(ICD9>=1570)&(ICD9<=1579)]="pancreas"
cancer[(ICD9>=1580)&(ICD9<=1589)]="peritonium"
cancer[(ICD9>=1590)&(ICD9<=1599)]="GI"
cancer[(ICD9>=1600)&(ICD9<=1609)]="sinus"
cancer[(ICD9>=1610)&(ICD9<=1619)]="larynx"
cancer[(ICD9>=1620)&(ICD9<=1629)]="lung"
cancer[(ICD9==1639)]="pleura"
cancer[(ICD9>=1640)&(ICD9<=1649)]="thymus"
cancer[(ICD9>=1700)&(ICD9<=1709)]="bone"
cancer[(ICD9>=1710)&(ICD9<=1719)]="HnN"
cancer[(ICD9>=1720)&(ICD9<=1729)]="melanoma"
cancer[(ICD9>=1730)&(ICD9<=1739)]="skin"
cancer[(ICD9>=1740)&(ICD9<=1749)]="breast"
cancer[(ICD9==175)|((ICD9>=1750)&(ICD9<=1759))]="breast"
cancer[ICD9==179]="uterus"
cancer[(ICD9>=1800)&(ICD9<=1809)]="cervix"
# cancer[ICD9==181]="pla"
cancer[(ICD9>=1820)&(ICD9<=1829)]="uterus"
cancer[(ICD9>=1830)&(ICD9<=1839)]="ovary"
cancer[(ICD9==2362)]="ovary"
cancer[(ICD9>=1840)&(ICD9<=1849)]="femGen"
cancer[ICD9==185]="prostate"
cancer[(ICD9>=1860)&(ICD9<=1869)]="testes"
cancer[(ICD9>=1870)&(ICD9<=1879)]="maleGen"
cancer[(ICD9>=1880)&(ICD9<=1889)]="bladder"
cancer[(ICD9>=1890)&(ICD9<=1899)]="renal"
cancer[(ICD9>=1900)&(ICD9<=1909)]="eye"
cancer[(ICD9>=1910)&(ICD9<=1919)]="brain"
cancer[(ICD9>=1920)&(ICD9<=1929)]="nerves"
cancer[ICD9==193]="thyroid"
cancer[ICD9==1991]="otherMalig"
# this chunk of ICD9 codes is replaced by cleaner ICD-O3 codes below
# cancer[(ICD9>=2000)&(ICD9<2010)]="NHL"
# cancer[(ICD9>=2010)&(ICD9<2020)]="hodgkin"
# cancer[(ICD9>=2020)&(ICD9<2030)]="NHL"
# cancer[(ICD9>=2030)&(ICD9<2040)]="MM"
# cancer[(ICD9>=2040)&(ICD9<2050)]="ALL"
# cancer[(ICD9>=2050)&(ICD9<2080)]="AML" # same here
# cancer[(ICD9>=2080)&(ICD9<2090)]="OL" #M0 like stuff
# cancer[(ICD9==2387)]="OL"
# clean things with histO3 codes that trump the heme ICD9 codes above
cancer[(histo3>=9590)&(histo3<9600)]="NHL"
# cancer[(histo3>=9650)&(histo3<9670)]="hodgkin"
cancer[(histo3>=9650)&(histo3<9670)]="HL"
cancer[(histo3>=9670)&(histo3<9730)]="NHL"
cancer[(histo3>=9730)&(histo3<9735)]="MM"
cancer[(histo3>=9735)&(histo3<9740)]="NHL"
cancer[(histo3>=9740)&(histo3<=9742)]="MPN" #"mastocytosis"
cancer[(histo3>=9743)&(histo3<9760)]="MPN" # assume histiocytosis is more like MPN than NHL
# cancer[(histo3==9751)]="MPN" #"LCH" lagerhan cell histiocytes are APCs = macrophage like, guessing MPN-like
cancer[(histo3>=9760)&(histo3<=9770)]="MM" # outside of below there are ~20 cases of these
# this cancer[(ICD9>=2730)&(ICD9<2739)]="globinemia" yielded 5080 cases of 9761 and 9762
cancer[(histo3>=9800)&(histo3<9810)]="OL" # takes back 60 AMLs from ICD9 in 9808 and 9809
cancer[histo3==9948]="OL" # aggressive NK leukemia lumped in here
# cancer[(histo3==9812)|(histo3==9806)]="ALLba" #ALL with BCR-ABL (110 cases) 2010-12 + 12 mixed lineage 2011-12
cancer[(histo3>=9810)&(histo3<9840)]="ALL" # take some OL back to ALL
cancer[(histo3==9831)&(D$yrdx>2009)]="LGL" # 9831 is cleanly LGL only starting in 2010
cancer[(histo3==9823)]="CLL" # pull out the CLLs
# cancer[(histo3==9670)]="SLL" # SLL has different risk time course, so better not merge with CLL.
cancer[(histo3==9670)]="CLL" #more 2nd SLL since earlier DX of CLL=> more likely SLL, so better to pool
# Dutch study placed 9800 and 9820 also in CLL, but incidence age responses are clearly different.
cancer[(histo3>=9840)&(histo3<9940)]="AML" # take some OL back to AML, includes next two lines
# cancer[(histo3==9910)]="AML" #AMKL
# cancer[(histo3==9930)]="AML" #myeloid sarcoma (blasts forming tumor outside of marrow ... advanced AML)
cancer[histo3%in%c(9863,9875)]="CML" # take back CMLs
cancer[(histo3==9866)]="APL" # andmake APL exclusive
cancer[histo3%in%c(9865,9869,9871,9896,9897,9911)]="AMLti" # AML by tranlocation or inversion
# t(6,9),inv(3),inv(16),t(8,21),t(9,11),t(1,22)
cancer[(histo3>9979)&(histo3<9990)]="MDS" ##!!!!! tMDS=9987 got mapped in with tAML=9920 starting in 2010
# cancer[(histo3==9987)]="tMDS" ##!!! so we have to pull both out and correct for this
# cancer[(histo3==9920)]="tAML"
# cancer[(histo3==9982)]="RARS" # take out to look for correlations with CLL via SF3B1
# cancer[(histo3==9986)]="MDSdel5q" # take out to look for extra radiation induction (skip: confounded by tMDS)
#9980=RA; 9981=nothing, 9983=RAEB, 9984=RAEB-T transformation (also stopped in 2010),9985=RCMD, 9989=NOS
cancer[(histo3==9940)]="HCL" #hairy cell leukemia was getting into NHL (note: HCL in 20's goes to 9591=NHL)
cancer[(histo3==9945)]="CMML"
# cancer[(histo3==9960)]="MDS" #"CMPD" #this got remapped to mdsMPN = 9975 in 2010
# cancer[(histo3==9975)]="MDS" #"mdsMPN": guessing this is CMML-like, and more MDS-like than MPN-like
cancer[(histo3==9960)]="MPN" #switch to MPN to keep MDS clean
cancer[(histo3==9975)]="MPN" #same here, better keep MDS clean
cancer[(histo3==9946)]="MPN" #"jCMML" these come out of 205.1/CML
cancer[(histo3==9950)]="MPN" #"PV"
cancer[(histo3==9961)]="MPN" #"PMF"
cancer[(histo3==9962)]="MPN" #"ET"
cancer[(histo3==9963)]="MPN" #"CNL"
cancer[(histo3==9964)]="MPN" #"CEL"
cancer[(histo3>=9965)&(histo3<=9967)]="MPN" # GFR mutatants
cancer[(histo3>=9970)&(histo3<=9971)]="NHL" # ICD9 put it mostly there, so sweep stray 1s into it also.
cancer[(histo3==9876)]="MPN" #"aCML"
cancer[histo3==9140]="KS" # overwrite mostly skin as Kaposi Sarcoma (KS)
cancer[(D$seqnum>=60)&(D$seqnum<=88)]="benign" # 88 is benign but unknown sequence
## most of below fall into benign, and most started in 2004.
## Bottomline: Bucket to remove since my codes don't handle such seqnums.
## Complications of handling them include: if I map 60 to 0 and 61 to 1, trouble may come in one caseID havinf 2 seqnum=0 or 1
## rows. I'll leave figuring out how to handle this to someone with real interests in brain tumors.
# cancer[(histo3==9530)]="meningioma" #supposedly malignant, but seqnums >59 confuse this.
# # cancer[(histo3>=9531)&(histo3<=9539)]="meningioma" #benigns, mix in with mal or comment to pool with unknown
# cancer[(histo3==9560)]="schwannoma"
# cancer[(histo3==8272)]="pituitary"
D$cancer=as.factor(cancer)
D
}
Any scripts or data that you put into this service are public.
Add the following code to your website.
For more information on customizing the embed code, read Embedding Snippets.