Problem with setx and character variables - Zelig

10 May 2004

I'm trying to replicate the results of Fearon and Laitin's "Ethnicity,
Insurgency, and Civil War" using their replication data (search for
repdata.zip on Laitin's web site). The replication exposed an annoying
problem with setx() and sim() when using model = "logit":

Error in setx.default(z.out.my) : character is not a supported variable type
(use factor or numeric).

It would be nice if Zelig could just convert character variables to factors
(or otherwise convert the data as appropriate) instead of stopping.

###
### Stephen Purpura
###
###
# Print numbers with 3 significant digits and set a scientific-notation
# penalty of 12 so that fixed notation is preferred in printed output.
options(digits=3,scipen=12)
library(car)
library(lattice)
library(modreg)
library(foreign)
library(Zelig)

#########################################################################
###
### http://www.stanford.edu/group/ethnic/publicdata/publicdata.html
###
### 
# Directory that holds the replication data set (repdata.dta).
# NOTE(review): this path is machine-specific; change it before running the
# script on another computer.
wd <- "z:/Documents and Settings/Steve/My Documents/UW POLS503/Assignment 2"
setwd(wd)

# Read the Stata replication file into a data frame.
f.laitin <- read.dta("repdata.dta")

# Recode the onset value 4 to 0 *inside the data frame*.
# Previously the recode was done after attach(), which only changed a global
# copy of `onset`; every zelig(..., data = f.laitin) call below still saw the
# value 4, so as.factor(onset) produced a third level.
# %in% is used instead of == so that missing values are never selected.
f.laitin$onset[f.laitin$onset %in% 4] <- 0

# Attach only after recoding so that the bare variable names used further
# down (onset, ethonset, ...) refer to the recoded data as well.
attach(f.laitin)

###
### Table 1, column 1 of the paper: logit of onset
###
z.out.1 <- zelig(
  formula = as.factor(onset) ~ warl + gdpenl + lpopl1 + lmtnest + ncontig +
    Oil + nwstate + instab + polity2l + ethfrac + relfrac,
  model = "logit",
  data = f.laitin
)
summary(z.out.1)

# Turn the linear predictor into a probability and divide by 0.5 before
# truncating, so probabilities below 0.5 become 0 and those from 0.5 up
# (below 1) become 1.
pred.1 <- trunc(plogis(predict(z.out.1)) / .5)

# Same classification with the inverse logit written out by hand, then
# cross-tabulated against the response stored in the fitted object.
pred <- trunc((1 / (1 + exp(-predict(z.out.1)))) / .5)
table(pred, z.out.1$y)

###
### Table 1, column 2: logit of ethonset
### TODO: if second > .049999
###
z.out.2 <- zelig(
  formula = as.factor(ethonset) ~ warl + gdpenl + lpopl1 + lmtnest +
    ncontig + Oil + nwstate + instab + polity2l + ethfrac + relfrac,
  model = "logit",
  data = f.laitin
)
summary(z.out.2)

###
### Table 1, column 3: logit of onset with anocl and deml in place of polity2l
###
z.out.3 <- zelig(
  formula = as.factor(onset) ~ warl + gdpenl + lpopl1 + lmtnest + ncontig +
    Oil + nwstate + instab + anocl + deml + ethfrac + relfrac,
  model = "logit",
  data = f.laitin
)
summary(z.out.3)

###
### Table 1, column 4: logit of emponset on the emp* covariates
###
z.out.4 <- zelig(
  formula = as.factor(emponset) ~ empwarl + empgdpenl + emplpopl +
    emplmtnest + empncontig + Oil + nwstate + instab + empethfrac,
  model = "logit",
  data = f.laitin
)
summary(z.out.4)

###
### Table 1, column 5: logit of cowonset, with cowwarl as the prior-war term
###
z.out.5 <- zelig(
  formula = as.factor(cowonset) ~ cowwarl + gdpenl + lpopl1 + lmtnest +
    ncontig + Oil + nwstate + instab + anocl + deml + ethfrac + relfrac,
  model = "logit",
  data = f.laitin
)
summary(z.out.5)

#### Dependent variables for the logit models
# The major onset variables are:
#   onset, ethonset, emponset, colonset, cowonset, sdonset
#
# Tabulate each one first; exclude = NULL keeps missing values in the counts.

table(onset, exclude = NULL)
table(ethonset, exclude = NULL)
table(emponset, exclude = NULL)
table(colonset, exclude = NULL)
table(sdonset, exclude = NULL)
table(cowonset, exclude = NULL)

###
### Our variable: a combined indicator built from all six onset variables
###

# Work on copies (m.*) and set every value above 1 to 0, one variable at a
# time.
m.onset <- onset
m.onset[m.onset > 1] <- 0

m.ethonset <- ethonset
m.ethonset[m.ethonset > 1] <- 0

m.emponset <- emponset
m.emponset[m.emponset > 1] <- 0

m.cowonset <- cowonset
m.cowonset[m.cowonset > 1] <- 0

m.colonset <- colonset
m.colonset[m.colonset > 1] <- 0

m.sdonset <- sdonset
m.sdonset[m.sdonset > 1] <- 0

# colonset and cowonset contain NA. Build clean 0/1 vectors that are 1 only
# where the recoded value equals 1 and 0 everywhere else (including NA), then
# use them in place of the originals and check the result.
ccolonset <- as.numeric(m.colonset %in% 1)
ccowonset <- as.numeric(m.cowonset %in% 1)
m.colonset <- ccolonset
m.cowonset <- ccowonset
table(m.colonset, exclude = NULL)
table(m.cowonset, exclude = NULL)

# Combined indicator: TRUE when any of the six recoded variables is non-zero.
myonset <- m.onset | m.ethonset | m.emponset | m.cowonset | m.colonset |
  m.sdonset

# Counts for each component and for the combined indicator.
table(m.onset)
table(m.ethonset)
table(m.emponset)
table(m.cowonset)
table(m.colonset)
table(m.sdonset)

table(myonset)

###
### Logit of the combined onset indicator, then simulated quantities
###

# setx() stopped with "character is not a supported variable type (use factor
# or numeric)" when the model was fitted with data = f.laitin.
# NOTE(review): presumably setx() inspects every column of the model's data
# frame and f.laitin holds character columns that are not in the model --
# confirm against the installed Zelig version.
# Work around it by fitting on a data frame that contains only the variables
# in the formula, with the response stored as a numeric 0/1 column.
model.vars <- c("warl", "gdpenl", "lpopl1", "lmtnest", "ncontig", "Oil",
                "nwstate", "instab", "polity2l", "ethfrac", "relfrac",
                "anocl", "deml")
f.my <- f.laitin[, model.vars]
f.my$myonset <- as.numeric(myonset)

# Should any predictor itself be stored as character, turn it into a factor,
# which is what the error message asks for.
is.chr <- vapply(f.my, is.character, logical(1))
f.my[is.chr] <- lapply(f.my[is.chr], factor)

z.out.my <- zelig(
  formula = myonset ~ warl + gdpenl + lpopl1 + lmtnest + ncontig + Oil +
    nwstate + instab + polity2l + ethfrac + relfrac + anocl + deml,
  model = "logit",
  data = f.my
)
summary(z.out.my)

# Save the coefficients; the full element name avoids relying on partial
# matching of `$coeff`.
write.table(z.out.my$coefficients, file = "myonset.csv", sep = ",",
            col.names = NA)

# Set explanatory variables to setx()'s defaults, simulate, and inspect.
x.out <- setx(z.out.my)
s.out <- sim(z.out.my, x = x.out)
summary(s.out)
plot(s.out)

-
Zelig Mailing List, served by Harvard-MIT Data Center
Send messages: zelig(a)latte.harvard.edu
[un]subscribe Options: http://lists.hmdc.harvard.edu/?info=zelig
Zelig program information: http://gking.harvard.edu/zelig/