be$sex<-ifelse(be$sex=="Female",1,ifelse(be$sex=="Male",2,NA))#性別轉換成1和2,缺失的使用NA表示,其他的相同
be$rezult1 <-ifelse(be$rezult1 =="Alive or dead due to cancer",1,ifelse(be$rezult1 =="Dead (attributable to causes other than this cancer dx)",2,NA))
be$status<-ifelse(be$status=="Alive",0,ifelse(be$status=="Dead",1,NA))
be$race<-ifelse(be$race=="White",1,ifelse(be$race=="Black",2,3))
be$Subtype<-recode(be$Subtype,"'HR-/HER2- (Triple Negative)'=1;'HR-/HER2+ (HER2 enriched)'=2;'HR+/HER2- (Luminal A)'=3;'HR+/HER2+ (Luminal B)'=4;else=NA")#這里是4個分類變量,使用ifelse函數套疊胎麻煩,改用car函數
be$nodes[be$nodes=="Blank(s)"]=NA#讓數據中的Blank(s)變為缺失值,下面同理
be$tumor.size[be$tumor.size=="Blank(s)"]=NA
be$extension[be$extension=="Blank(s)"]=NA
be$lymph.nodes[be$lymph.nodes=="Blank(s)"]=NA
be$age<-str_extract(be$age,"\\d+")#把年齡里面的數字提取出來
be$ajcc[be$ajcc=="Blank(s)"]=NA