在 caret 的 train() 中使用 SVM 时出现"选择了未定义的列"错误



需要您帮助解决以下错误。

##Loading Libraries.
library(caret)
library(kernlab)
## Loading the data
# NOTE: the former `rm(list = ls())` was removed. Wiping the global
# environment from inside a script destroys whatever the caller had defined
# and does not give a truly clean session anyway (attached packages and
# options survive). Restart R instead when a clean slate is needed.
set.seed(3421)

# Columns that are dropped while reading (colClasses "NULL" skips a column).
dropped_cols <- c("X6MNTH_FTD", "X6MNTH_LTD", "India3MLtd_TRANS",
                  "Cust_Considered")

# Columns that are read as factors.
factor_cols <- c(
  "Segment", "Store", "DISTINCT_VISITS_BAND", "DISTINCT_MONTH_VISITS",
  "CUST_SALES_BAND", "ITEMS_PER_MONTH_BAND", "VISITS_PER_MONTH_BAND",
  "STAPLES_TRANS", "BDF_TRANS", "HPC_TRANS", "PF_TRANS", "FV_TRANS",
  "PROCESS_FOOD_TRANS", "BREAD_EGGS_TRANS", "FROZEN_TRANS", "MILK_TRANS",
  "LAUNDRY_TRANS", "PC_TRANS", "DISTINCT_CLASSES_BAND", "LAUNDRY_TRANS_1",
  "Cookies_TRANS", "ExoticFruitandVegetables_TRANS", "Healthbiscuit_TRANS",
  "Kellogs_TRANS", "BasmatiRice_TRANS", "Pastry_TRANS", "Dessert_TRANS",
  "Organics_TRANS", "PaperandTissue_TRANS", "Almonds_TRANS", "Pears_TRANS",
  "GingellyOil_TRANS", "Yoghurt_TRANS", "Dove_TRANS", "Mayonnaise_TRANS",
  "PeanutButter_TRANS", "HealthDietFood_TRANS", "OliveOil_TRANS",
  "ShowerGel_TRANS", "ChocolateSpread_TRANS", "Continental_TRANS",
  "GarbageBag_TRANS", "ReadytoEat_TRANS", "ToiletPaper_TRANS", "MOP_TRANS",
  "IceTea_TRANS", "ShowerandBath_TRANS", "CarCare_TRANS", "PetFood_TRANS",
  "Muesli_TRANS", "CottonBall_TRANS", "CannedFood_TRANS",
  "PremiumVegetables_TRANS", "Maybelline_TRANS", "PremixCoffee_TRANS",
  "ImportedCigarettes_TRANS", "MicrowaveItems_TRANS",
  "Housekeeping.Plugin_TRANS", "YogaMat_TRANS", "Moti_TRANS", "Toys_TRANS",
  "Loreal_TRANS", "AdultsBooks_TRANS", "Gala_TRANS", "Revlon_TRANS"
)

# Named colClasses vector: columns not named here keep read.table's
# automatic type detection.
col_classes <- c(
  setNames(rep("NULL", length(dropped_cols)), dropped_cols),
  Customer_No = "character",
  setNames(rep("factor", length(factor_cols)), factor_cols)
)

Extrapolation_Data <- read.table(
  "./Data/Data5/EP_CUST_COMBINED_07042017.txt",
  sep = "|",
  header = TRUE,
  colClasses = col_classes
)
## Dividing the data into train (80%) and test (20%) sets.
# sample() truncates a fractional size; floor() makes that explicit.
n_rows <- nrow(Extrapolation_Data)
indexes <- sample(n_rows, size = floor(0.2 * n_rows), replace = FALSE)
TrainData <- Extrapolation_Data[-indexes, ]
TestData <- Extrapolation_Data[indexes, ]

## Creating new column Segment_C from Segment ("Y" when Segment is "C").
# Levels are fixed explicitly so that both subsets always carry the same
# two levels in the same order, even if one subset happens to contain only
# one of the classes (as.factor() would silently drop the missing level).
TrainData$Segment_C <- factor(ifelse(TrainData$Segment == "C", "Y", "N"),
                              levels = c("N", "Y"))
TestData$Segment_C <- factor(ifelse(TestData$Segment == "C", "Y", "N"),
                             levels = c("N", "Y"))

## Count of missing values in the training data (0 when this was recorded).
sum(is.na(TrainData))
# [1] 0
## Resampling setup.
# Fixes for the "undefined columns selected" error raised by train():
#  * twoClassSummary reads the class-probability column of the first class
#    level from the resampled predictions. Without classProbs = TRUE that
#    column does not exist, which is exactly the `[.data.frame` failure.
#  * twoClassSummary reports ROC/Sens/Spec only, so metric = "Kappa" could
#    not be resolved with it anyway. defaultSummary reports Accuracy and
#    Kappa and needs only the predicted classes.
#    NOTE(review): caret's lssvmPoly does not appear to provide class
#    probabilities, so enabling classProbs is not an option here - confirm
#    against the installed caret version before switching to ROC.
#  * `repeats` only applies to method = "repeatedcv", and a single fold
#    (number = 1) leaves no data to hold out. 10 folds is trainControl's
#    default for cross-validation; lower it if the fit is too slow.
fitControl <- trainControl(method = "repeatedcv",
                           number = 10,
                           repeats = 2,
                           summaryFunction = defaultSummary)

set.seed(10001)

## Least-squares SVM with a polynomial kernel, tuned on Kappa.
SVMFit <- train(Segment_C ~ TENURE + CUST_SALES + VISITS_PER_MONTH +
                  FROZEN_TRANS + MILK_TRANS + PC_TRANS + Cookies_TRANS,
                data = TrainData,
                method = "lssvmPoly",
                trControl = fitControl,
                metric = "Kappa")

错误:

`[.data.frame`(data, , lvls[1]) 中的错误:选择了未定义的列

我错过了什么吗?我的任何变量都不正确吗?

任何帮助都非常感谢。

下面这条语句中的变量名不正确:SVMFit <- train(Segment_C ~ TENURE + CUST_SALES + VISITS_PER_MONTH + FROZEN_TRANS + MILK_TRANS + PC_TRANS + Cookies_TRANS, data = TrainData, method = "lssvmPoly", trControl = fitControl, metric = "Kappa")

原始数据中不包含名为 "TENURE" 的变量。另外,CUST_SALES 和 VISITS_PER_MONTH 在原始数据中的变量名分别是 CUST_SALES_BAND 和 VISITS_PER_MONTH_BAND。

最新更新