# orig-data/SwissPop.R

library(pxR)
# Build the SwissPop data frame from the PX source file and store it in
# data/SwissPop.rda.

# Read the PX file and flatten it into a data frame.
px_table <- as.data.frame(read.px("orig-data/px-d-40-1A01.px"))

# Rows of interest carry a Region label that starts with six literal dots
# followed by digits. The second pattern splits such a label into the digit
# run (group 1) and the text after the separating space (group 2).
region_filter <- "^[.][.][.][.][.][.]([0-9]+).*$"
region_parts <- "^[.][.][.][.][.][.]([0-9]+) (.*)$"

# grepl() never returns NA, so plain logical indexing is sufficient here.
is_selected <- grepl(region_filter, px_table$Region)
selected <- px_table[is_selected, , drop = FALSE]

# Derive the numeric ID and the name from the Region label.
with_ids <- transform(
  selected,
  MunicipalityID = as.numeric(gsub(region_parts, "\\1", Region)),
  MunicipalityName = gsub(region_parts, "\\2", Region)
)

# Discard the "Total" household-size rows (rows where the comparison is NA
# are discarded too), then remove "Total" from the factor levels.
not_total <- with_ids$Haushaltsgrösse != "Total"
by_size <- with_ids[not_total & !is.na(not_total), , drop = FALSE]
size_levels <- setdiff(levels(by_size$Haushaltsgrösse), "Total")
by_size$Haushaltsgrösse <- factor(by_size$Haushaltsgrösse, levels = size_levels)

# Assemble the final table with English column names.
SwissPop <- with(
  by_size,
  data.frame(
    Year = Jahr,
    MunicipalityID = kimisc::ofactor(MunicipalityID),
    MunicipalityName = kimisc::ofactor(MunicipalityName),
    HouseholdSize = Haushaltsgrösse,
    Households = value
  )
)

# Sanity check: the integer codes of the ID factor and of the name factor must
# agree on every row.
# NOTE(review): this presumably verifies a one-to-one ID/name mapping, relying
# on how kimisc::ofactor() orders its levels -- confirm against kimisc docs.
with(SwissPop, stopifnot(as.numeric(MunicipalityID) == as.numeric(MunicipalityName)))

# Sort, persist, and show a quick overview of the result.
SwissPop <- plyr::arrange(SwissPop, Year, HouseholdSize, MunicipalityID)
save(SwissPop, file = "data/SwissPop.rda", compress = "xz")
summary(SwissPop)
str(SwissPop)
# nattimmis/Swiss-Communes-Statistical-Data documentation built on May 22, 2019, 3:52 p.m.