-- DTREE_WITH_R: fits an rpart classification tree on the rows of `train`
-- (target column CLASS, every other column used as a predictor) and writes one
-- predicted CLASS label per row of `test` into `result`, keyed by test.ID.
--   IN  train  : rows typed as "CENSUSINCOME" (must contain CLASS)
--   IN  test   : rows typed as "CENSUSINCOME_PREDICT" (must contain ID)
--   OUT result : rows typed as "DTREE_RESULT_R"
--                NOTE(review): assumed to be (ID integer, CLASS string) - confirm
--                against the table type definition, which is not shown here.
DROP PROCEDURE DTREE_WITH_R;
CREATE PROCEDURE DTREE_WITH_R(IN train "CENSUSINCOME", IN test "CENSUSINCOME_PREDICT", OUT result "DTREE_RESULT_R")
LANGUAGE RLANG AS
BEGIN
library(rpart)

# Encode every text column as a factor. Columns that exist in both inputs get
# ONE shared level set (the union of the values seen in train and test), so the
# fitted model and the prediction data agree on the encoding. Without this,
# predict() rejects text columns whose type/levels differ from the ones the
# model was fitted with.
for (col in names(train)) {
    if (is.character(train[[col]]) || is.factor(train[[col]])) {
        if (col %in% names(test)) {
            lv <- sort(unique(c(as.character(train[[col]]), as.character(test[[col]]))))
            train[[col]] <- factor(train[[col]], levels=lv)
            test[[col]] <- factor(test[[col]], levels=lv)
        } else {
            # Train-only text column (e.g. the CLASS target).
            train[[col]] <- factor(train[[col]])
        }
    }
}

# NOTE(review): minsplit is a count of observations, so 0.71 looks unintended;
# kept unchanged to preserve the fitted model - confirm the intended value.
fit <- rpart(CLASS ~ ., method="class", data=train, control=rpart.control(minsplit=0.71))

predicted <- predict(fit, newdata=test, type="class")

# Build the data frame column by column: going through cbind() would create a
# character matrix first and silently turn the numeric ID into text.
result <- data.frame(ID=test$ID, CLASS=as.character(predicted), stringsAsFactors=FALSE)
END;
-- Training table: the same attribute columns as CENSUSINCOME_PREDICT (without
-- ID), plus the CLASS column used as the model target in DTREE_WITH_R.
DROP TABLE CENSUSINCOME;
CREATE TABLE CENSUSINCOME (
    "AGE"                   INT,
    "CLASS_WORKER"          VARCHAR(100),
    "DETAILED_IND_RECODE"   INT,
    "DETAILED_OCC_RECODE"   INT,
    "EDUCATION"             VARCHAR(100),
    "WAGE"                  INT,
    "ENROLL_IN_WK"          VARCHAR(100),
    "MARITAL_STATE"         VARCHAR(100),
    "MAJOR_IND_CODE"        VARCHAR(100),
    "MAJOR_OCC_CODE"        VARCHAR(100),
    "RACE"                  VARCHAR(100),
    "HISPANIC_ORIGIN"       VARCHAR(100),
    "SEX"                   VARCHAR(100),
    "LABOR_UNION"           VARCHAR(100),
    "REASON4UNEMPLOYMENT"   VARCHAR(100),
    "FULLORPARTTIME"        VARCHAR(100),
    "CAPITAL_GAINS"         INT,
    "CAPITAL_LOSSES"        INT,
    "DIVIDENDS_STOCKS"      INT,
    "TAX_FILER"             VARCHAR(100),
    "REGION_PRE_RESIDENCE"  VARCHAR(100),
    "STATE_PRE_RESIDENCE"   VARCHAR(100),
    "HOUSEHOLD_FAMILY"      VARCHAR(100),
    "HOUSEHOLD_SUMMARY"     VARCHAR(100),
    "INSTANCE_WEIGHT"       DOUBLE,
    "MIGRATION_IN_MSA"      VARCHAR(100),
    "MIGRATION_IN_REG"      VARCHAR(100),
    "MIGRATION_CODE_MOVE"   VARCHAR(100),
    "LIVE_IN_HOUSE_ONE_AGO" VARCHAR(100),
    "PREV_SUNBELT"          VARCHAR(100),
    "NUM_PERSONS"           INT,
    "FAMILY_MEM_UNDER_18"   VARCHAR(100),
    "COUNTRY_BIRTH_FATHER"  VARCHAR(100),
    "COUNTRY_BIRTH_MOTHER"  VARCHAR(100),
    "COUNTRY_BIRTH_SELF"    VARCHAR(100),
    "CITIZENSHIP"           VARCHAR(100),
    "OWN_BUSINESS"          INT,
    "FILL_INC"              VARCHAR(100),
    "VETERANS"              INT,
    "WEEKS_IN_YEARS"        INT,
    "YEAR"                  INT,
    "CLASS"                 VARCHAR(100)
);
-- Prediction input table: an ID column followed by the same attribute columns
-- as CENSUSINCOME, without the CLASS column.
DROP TABLE CENSUSINCOME_PREDICT;
CREATE TABLE CENSUSINCOME_PREDICT (
    "ID"                    INT,
    "AGE"                   INT,
    "CLASS_WORKER"          VARCHAR(100),
    "DETAILED_IND_RECODE"   INT,
    "DETAILED_OCC_RECODE"   INT,
    "EDUCATION"             VARCHAR(100),
    "WAGE"                  INT,
    "ENROLL_IN_WK"          VARCHAR(100),
    "MARITAL_STATE"         VARCHAR(100),
    "MAJOR_IND_CODE"        VARCHAR(100),
    "MAJOR_OCC_CODE"        VARCHAR(100),
    "RACE"                  VARCHAR(100),
    "HISPANIC_ORIGIN"       VARCHAR(100),
    "SEX"                   VARCHAR(100),
    "LABOR_UNION"           VARCHAR(100),
    "REASON4UNEMPLOYMENT"   VARCHAR(100),
    "FULLORPARTTIME"        VARCHAR(100),
    "CAPITAL_GAINS"         INT,
    "CAPITAL_LOSSES"        INT,
    "DIVIDENDS_STOCKS"      INT,
    "TAX_FILER"             VARCHAR(100),
    "REGION_PRE_RESIDENCE"  VARCHAR(100),
    "STATE_PRE_RESIDENCE"   VARCHAR(100),
    "HOUSEHOLD_FAMILY"      VARCHAR(100),
    "HOUSEHOLD_SUMMARY"     VARCHAR(100),
    "INSTANCE_WEIGHT"       DOUBLE,
    "MIGRATION_IN_MSA"      VARCHAR(100),
    "MIGRATION_IN_REG"      VARCHAR(100),
    "MIGRATION_CODE_MOVE"   VARCHAR(100),
    "LIVE_IN_HOUSE_ONE_AGO" VARCHAR(100),
    "PREV_SUNBELT"          VARCHAR(100),
    "NUM_PERSONS"           INT,
    "FAMILY_MEM_UNDER_18"   VARCHAR(100),
    "COUNTRY_BIRTH_FATHER"  VARCHAR(100),
    "COUNTRY_BIRTH_MOTHER"  VARCHAR(100),
    "COUNTRY_BIRTH_SELF"    VARCHAR(100),
    "CITIZENSHIP"           VARCHAR(100),
    "OWN_BUSINESS"          INT,
    "FILL_INC"              VARCHAR(100),
    "VETERANS"              INT,
    "WEEKS_IN_YEARS"        INT,
    "YEAR"                  INT
);
以上是用到的两张表。
执行时报错,提示表中所有类型为 VARCHAR 的列都与 fit 不匹配……
该怎么整理一下数据呢?


雷达卡


京公网安备 11010802022788号







