Hi,
I am trying to impute missing values from UCR crime data using a chained equation model with linear regression. However, the model generates negative crime values that are implausible. Thus, it would be really helpful if someone could suggest how to address this issue. This is my first time imputing for missing values, so it would be really helpful if someone could respond.
mi set wide
mi register imputed Murder Manslaughter Rape Robbery Assault Burglary Larceny_Theft Vehicle_Theft Other_Assault Arson Forgery Fraud Embezzlement Stolen_Property Vandalism Weapons Prostitution Drugs_Offenses Drugs_Sale Drugs_Possesion DUI Disorderly
mi impute chained (regress) Murder Manslaughter Rape Robbery Assault Burglary Larceny_Theft ///
Vehicle_Theft Other_Assault Arson Forgery Fraud Embezzlement Stolen_Property Vandalism Weapons ///
Prostitution Drugs_Offenses Drugs_Sale Drugs_Possesion DUI Disorderly ///
= Tot_Officers Tot_Civ_Emp Unemp_Rate Avg_Weekly_Wage GDP_PerCap Male_Perc Hispanic_Perc Black_Perc Age_1624_Perc, add(20) rseed(12345) nolegend noisily noimputed force bootstrap
local vars "Murder Manslaughter Rape Robbery Assault Burglary Larceny_Theft Vehicle_Theft Other_Assault Arson Forgery Fraud Embezzlement Stolen_Property Vandalism Weapons Prostitution Drugs_Offenses Drugs_Sale Drugs_Possesion DUI Disorderly"
foreach var of local vars {
egen `var'_ImpMean = rowmean(_1_`var'-_20_`var')
}
input float ori str9 ORI double fips str20 state str33 county float year double(Murder _1_Murder) float Murder_ImpMean
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 1990 0 0 0
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 1990 0 0 0
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 1990 1 1 1
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 1991 0 0 0
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 1991 0 0 0
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 1991 0 0 0
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 1992 0 0 0
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 1992 0 0 0
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 1992 0 0 0
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 1993 0 0 0
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 1993 0 0 0
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 1993 0 0 0
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 1994 0 0 0
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 1994 0 0 0
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 1994 0 0 0
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 1995 0 0 0
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 1995 0 0 0
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 1995 0 0 0
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 1996 0 0 0
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 1996 1 1 1
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 1996 0 0 0
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 1997 0 0 0
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 1997 0 0 0
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 1997 0 0 0
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 1998 0 0 0
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 1998 0 0 0
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 1998 1 1 1
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 1999 0 0 0
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 1999 0 0 0
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 1999 0 0 0
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 2000 1 1 1
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 2000 0 0 0
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 2000 0 0 0
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 2001 0 0 0
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 2001 0 0 0
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 2001 1 1 1
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 2002 1 1 1
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 2002 0 0 0
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 2002 0 0 0
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 2003 0 0 0
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 2003 0 0 0
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 2003 0 0 0
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 2004 0 0 0
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 2004 0 0 0
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 2004 0 0 0
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 2005 1 1 1
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 2005 0 0 0
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 2005 . -8.090556023485881 -3.029669
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 2006 . 1.9373855949781276 -2.501579
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 2006 0 0 0
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 2006 0 0 0
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 2007 1 1 1
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 2007 0 0 0
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 2007 0 0 0
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 2008 1 1 1
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 2008 0 0 0
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 2008 0 0 0
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 2009 0 0 0
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 2009 0 0 0
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 2009 0 0 0
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 2010 0 0 0
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 2010 0 0 0
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 2010 0 0 0
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 2011 . -1.0829318935674845 -1.9352152
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 2011 . -7.027801633499241 -.6673061
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 2011 . 1.1019194333660172 3.181552
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 2012 . -6.335854940855695 -.07712661
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 2012 . -9.159714860346124 .8726751
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 2012 . 2.9786409098697253 -.017971981
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 2013 . -3.053980170947446 -.15758996
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 2013 . -2.067913775015881 .13371472
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 2013 . -.9866195381136287 -.25479743
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 2014 0 0 0
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 2014 0 0 0
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 2014 0 0 0
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 2015 0 0 0
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 2015 0 0 0
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 2015 3 3 3
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 2016 0 0 0
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 2016 0 0 0
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 2016 0 0 0
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 2017 0 0 0
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 2017 1 1 1
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 2017 0 0 0
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 2018 0 0 0
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 2018 0 0 0
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 2018 0 0 0
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 2019 1 1 1
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 2019 1 1 1
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 2019 0 0 0
12 "AL00600" 1005 "ALABAMA" "BARBOUR" 1990 3 3 3
12 "AL00600" 1005 "ALABAMA" "BARBOUR" 1991 2 2 2
12 "AL00600" 1005 "ALABAMA" "BARBOUR" 1992 0 0 0
12 "AL00600" 1005 "ALABAMA" "BARBOUR" 1993 1 1 1
12 "AL00600" 1005 "ALABAMA" "BARBOUR" 1994 0 0 0
12 "AL00600" 1005 "ALABAMA" "BARBOUR" 1995 0 0 0
12 "AL00600" 1005 "ALABAMA" "BARBOUR" 1996 0 0 0
12 "AL00600" 1005 "ALABAMA" "BARBOUR" 1997 . -.8895328461551177 2.080324
12 "AL00600" 1005 "ALABAMA" "BARBOUR" 1998 . 4.434697612914603 1.965525
12 "AL00600" 1005 "ALABAMA" "BARBOUR" 1999 1 1 1
end
I am trying to impute missing values from UCR crime data using a chained equation model with linear regression. However, the model generates negative crime values that are implausible. Thus, it would be really helpful if someone could suggest how to address this issue. This is my first time imputing for missing values, so it would be really helpful if someone could respond.
mi set wide
mi register imputed Murder Manslaughter Rape Robbery Assault Burglary Larceny_Theft Vehicle_Theft Other_Assault Arson Forgery Fraud Embezzlement Stolen_Property Vandalism Weapons Prostitution Drugs_Offenses Drugs_Sale Drugs_Possesion DUI Disorderly
mi impute chained (regress) Murder Manslaughter Rape Robbery Assault Burglary Larceny_Theft ///
Vehicle_Theft Other_Assault Arson Forgery Fraud Embezzlement Stolen_Property Vandalism Weapons ///
Prostitution Drugs_Offenses Drugs_Sale Drugs_Possesion DUI Disorderly ///
= Tot_Officers Tot_Civ_Emp Unemp_Rate Avg_Weekly_Wage GDP_PerCap Male_Perc Hispanic_Perc Black_Perc Age_1624_Perc, add(20) rseed(12345) nolegend noisily noimputed force bootstrap
local vars "Murder Manslaughter Rape Robbery Assault Burglary Larceny_Theft Vehicle_Theft Other_Assault Arson Forgery Fraud Embezzlement Stolen_Property Vandalism Weapons Prostitution Drugs_Offenses Drugs_Sale Drugs_Possesion DUI Disorderly"
foreach var of local vars {
egen `var'_ImpMean = rowmean(_1_`var'-_20_`var')
}
input float ori str9 ORI double fips str20 state str33 county float year double(Murder _1_Murder) float Murder_ImpMean
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 1990 0 0 0
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 1990 0 0 0
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 1990 1 1 1
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 1991 0 0 0
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 1991 0 0 0
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 1991 0 0 0
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 1992 0 0 0
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 1992 0 0 0
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 1992 0 0 0
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 1993 0 0 0
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 1993 0 0 0
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 1993 0 0 0
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 1994 0 0 0
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 1994 0 0 0
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 1994 0 0 0
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 1995 0 0 0
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 1995 0 0 0
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 1995 0 0 0
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 1996 0 0 0
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 1996 1 1 1
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 1996 0 0 0
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 1997 0 0 0
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 1997 0 0 0
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 1997 0 0 0
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 1998 0 0 0
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 1998 0 0 0
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 1998 1 1 1
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 1999 0 0 0
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 1999 0 0 0
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 1999 0 0 0
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 2000 1 1 1
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 2000 0 0 0
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 2000 0 0 0
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 2001 0 0 0
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 2001 0 0 0
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 2001 1 1 1
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 2002 1 1 1
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 2002 0 0 0
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 2002 0 0 0
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 2003 0 0 0
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 2003 0 0 0
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 2003 0 0 0
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 2004 0 0 0
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 2004 0 0 0
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 2004 0 0 0
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 2005 1 1 1
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 2005 0 0 0
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 2005 . -8.090556023485881 -3.029669
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 2006 . 1.9373855949781276 -2.501579
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 2006 0 0 0
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 2006 0 0 0
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 2007 1 1 1
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 2007 0 0 0
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 2007 0 0 0
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 2008 1 1 1
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 2008 0 0 0
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 2008 0 0 0
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 2009 0 0 0
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 2009 0 0 0
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 2009 0 0 0
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 2010 0 0 0
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 2010 0 0 0
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 2010 0 0 0
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 2011 . -1.0829318935674845 -1.9352152
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 2011 . -7.027801633499241 -.6673061
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 2011 . 1.1019194333660172 3.181552
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 2012 . -6.335854940855695 -.07712661
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 2012 . -9.159714860346124 .8726751
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 2012 . 2.9786409098697253 -.017971981
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 2013 . -3.053980170947446 -.15758996
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 2013 . -2.067913775015881 .13371472
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 2013 . -.9866195381136287 -.25479743
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 2014 0 0 0
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 2014 0 0 0
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 2014 0 0 0
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 2015 0 0 0
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 2015 0 0 0
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 2015 3 3 3
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 2016 0 0 0
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 2016 0 0 0
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 2016 0 0 0
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 2017 0 0 0
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 2017 1 1 1
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 2017 0 0 0
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 2018 0 0 0
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 2018 0 0 0
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 2018 0 0 0
11 "AL00508" 1003 "ALABAMA" "BALDWIN" 2019 1 1 1
10 "AL00505" 1003 "ALABAMA" "BALDWIN" 2019 1 1 1
9 "AL00501" 1003 "ALABAMA" "BALDWIN" 2019 0 0 0
12 "AL00600" 1005 "ALABAMA" "BARBOUR" 1990 3 3 3
12 "AL00600" 1005 "ALABAMA" "BARBOUR" 1991 2 2 2
12 "AL00600" 1005 "ALABAMA" "BARBOUR" 1992 0 0 0
12 "AL00600" 1005 "ALABAMA" "BARBOUR" 1993 1 1 1
12 "AL00600" 1005 "ALABAMA" "BARBOUR" 1994 0 0 0
12 "AL00600" 1005 "ALABAMA" "BARBOUR" 1995 0 0 0
12 "AL00600" 1005 "ALABAMA" "BARBOUR" 1996 0 0 0
12 "AL00600" 1005 "ALABAMA" "BARBOUR" 1997 . -.8895328461551177 2.080324
12 "AL00600" 1005 "ALABAMA" "BARBOUR" 1998 . 4.434697612914603 1.965525
12 "AL00600" 1005 "ALABAMA" "BARBOUR" 1999 1 1 1
end
Comment