我正在估计一个多经济的logit模型,并想报告边际效应。我遇到了一个困难,因为当我使用更大版本的模型时,我会出错。
这里是一个可重复的例子。下面的代码有两个协变量,工作正常。
library(mlogit)
df = data.frame(c(0,1,1,2,0,1,0), c(1,6,7,4,2,2,1), c(683,276,756,487,776,100,982))
colnames(df) <- c('y', 'col1', 'col3')
df$col2<-df$col1^2
mydata = df
mldata <- mlogit.data(mydata, choice="y", shape="wide")
mlogit.model1 <- mlogit(y ~ 1| col1+col2, data=mldata)
m <- mlogit(y ~ 1| col1+col2, data = mldata)
z <- with(mldata, data.frame(col1 = tapply(col1, index(m)$alt, mean),
col2 = tapply(col2, index(m)$alt, mean) ) )
effects(mlogit.model1, covariate = "col1", data = z)现在,当我有三个协变量时:
mlogit.model1 <- mlogit(y ~ 1| col1+col2+col3, data=mldata)
m <- mlogit(y ~ 1| col1+col2+col3, data = mldata)
z <- with(mldata, data.frame(col1 = tapply(col1, index(m)$alt, mean),
col2 = tapply(col2, index(m)$alt, mean),
col3 = tapply(col3, index(m)$alt, mean) ) )
effects(mlogit.model1, covariate = "col1", data = z)最后一行给出了以下错误:
if中的错误(% c(1,3)中的rhs%){:参数长度为零
但如果我跑了
effects(mlogit.model1, covariate = "col3", data = z)然后,它可以给出col3的边际效应。为什么不给出col1的边际效应?
请注意,所有列都不包含NULLs,且长度相同。有人能解释一下这种行为的原因吗?
发布于 2017-04-15 15:45:59
我的感觉是,这可能会帮助你找到一个解决方案。
参考资料:http://www.talkstats.com/showthread.php/44314-calculate-marginal-effects-using-mlogit-package
> methods(effects)
[1] effects.glm* effects.lm* effects.mlogit*
see '?methods' for accessing help and source code
Note: Non-visible functions are asterisked解释:
需要在effects.mlogit源代码中进行一点转换。
在第16行中,您应该将"cov.list <- lapply(attr(cov.list(Object),“rhs ",as.character)”替换为"cov.list <- strsplit(as.character(as.character(cov.list(Object),"rhs")),“+”,as.character=TRUE。
修正结果:
> effects(mlogit.model1, covariate = "col1", data = z)
0 1 2
-4.135459e-01 4.135459e-01 9.958986e-12
> myeffects(mlogit.model2, covariate = "col1", data = z2)
0 1 2
1.156729129 -1.157014778 0.000285649 代码
require(mlogit)
myeffects<-function (object, covariate = NULL, type = c("aa", "ar", "rr",
"ra"), data = NULL, ...)
{
type <- match.arg(type)
if (is.null(data)) {
P <- predict(object, returnData = TRUE)
data <- attr(P, "data")
attr(P, "data") <- NULL
}
else P <- predict(object, data)
newdata <- data
J <- length(P)
alt.levels <- names(P)
pVar <- substr(type, 1, 1)
xVar <- substr(type, 2, 2)
cov.list <- strsplit(as.character(attr(formula(object), "rhs")), " + ", fixed = TRUE)
rhs <- sapply(cov.list, function(x) length(na.omit(match(x,
covariate))) > 0)
rhs <- (1:length(cov.list))[rhs]
eps <- 1e-05
if (rhs %in% c(1, 3)) {
if (rhs == 3) {
theCoef <- paste(alt.levels, covariate, sep = ":")
theCoef <- coef(object)[theCoef]
}
else theCoef <- coef(object)[covariate]
me <- c()
for (l in 1:J) {
newdata[l, covariate] <- data[l, covariate] + eps
newP <- predict(object, newdata)
me <- rbind(me, (newP - P)/eps)
newdata <- data
}
if (pVar == "r")
me <- t(t(me)/P)
if (xVar == "r")
me <- me * matrix(rep(data[[covariate]], J), J)
dimnames(me) <- list(alt.levels, alt.levels)
}
if (rhs == 2) {
newdata[, covariate] <- data[, covariate] + eps
newP <- predict(object, newdata)
me <- (newP - P)/eps
if (pVar == "r")
me <- me/P
if (xVar == "r")
me <- me * data[[covariate]]
names(me) <- alt.levels
}
me
}
df = data.frame(c(0,1,1,2,0,1,0), c(1,6,7,4,2,2,1), c(683,276,756,487,776,100,982))
colnames(df) <- c('y', 'col1', 'col3')
df$col2<-df$col1^2
mydata = df
mldata <- mlogit.data(mydata, choice="y", shape="wide")
mlogit.model1 <- mlogit(y ~ 1| col1+col2, data=mldata)
m <- mlogit(y ~ 1| col1+col2, data = mldata)
z <- with(mldata, data.frame(col1 = tapply(col1, index(m)$alt, mean),
col2 = tapply(col2, index(m)$alt, mean) ) )
mldata2 <- mlogit.data(mydata, choice="y", shape="wide")
mlogit.model2 <- mlogit(y ~ 1| col1+col2+col3, data=mldata2)
m2 <- mlogit(y ~ 1| col1+col2+col3, data = mldata2)
z2 <- with(mldata, data.frame(col1 = tapply(col1, index(m2)$alt, mean),
col2 = tapply(col2, index(m2)$alt, mean),
col3 = tapply(col3, index(m2)$alt, mean) ) )
effects(mlogit.model1, covariate = "col1", data = z)
myeffects(mlogit.model2, covariate = "col1", data = z2)https://stackoverflow.com/questions/43346473
复制相似问题