MCMCsarpy.R

library("graph")
library("Rgraphviz")
library("RBGL")
library("dplyr")

getBoundary <- function(subgraph, graph) {
    bdy <- unique(unlist(graph::boundary(subgraph, graph)))
    return(bdy)
    ## returns boundary of subgraph in graph as R char vector in
    ## future, add some error checking for argument types
}

getSarpyPrecincts <- function(precList) {
    sarpyBoundary <- precList[!(precList %in% c("lanc", "doug"))]
    return(sarpyBoundary)
    ## returns list (char vector) of precincts stricly in Sarpy Cty in
    ## future, add some error checking for argument types
}

makeNewCongDist <- function(sarpyPrecincts, vertexDelete, vertexAdd, county) {
    newSarpyPrecincts <- c(sarpyPrecincts[-match(vertexDelete, sarpyPrecincts)], 
        vertexAdd, county)
    newCongDist <- graph::subGraph(newSarpyPrecincts, gSarpy)
    return(newCongDist)
}

vEccentricity <- function(graph, vertex) {
    ve <- max(RBGL::dijkstra.sp(graph, start = vertex)$distances)
    return(ve)
    ## returns integer, longest shortest-path from vertex to every
    ## other vertex in graph in future, add some error checking for
    ## argument types
}

gDiameter <- function(graph) {
    d <- max(RBGL::johnson.all.pairs.sp(graph))
    return(d)
    ## returns integer, greatest distance between any pair of vertices
    ## in graph in future, add some error checking for argument types
}

contiguous <- function(graph) {
    isconnected <- length(RBGL::connectedComp(graph)) == 1
    return(isconnected)
    ## returns logical (boolean), TRUE if single connected component
    ## in future, add some error checking for argument types
}

## The following are compactness measures for the originally
## constituted congressional districts My goal is to have trial
## districts to have no greater eccentricities or diameters by using
## these functions to measure against the base.
## Positive is bad (low probability of choosing),
## negative is good (higher prob of choosing)

eccenDiff <- function(graph1, graph2) {
    BASEVECCENCD1 <- 7
    BASEVECCENCD2 <- 4
    totalVEccen <-
              (vEccentricity(graph1, "lanc") - BASEVECCENCD1) +
              (vEccentricity(graph2, "doug") - BASEVECCENCD2)
    return(totalVEccen)
}

diamDiff <- function(graph1, graph2) {
    BASEGDIAMCD1 <- 7
    BASEGDIAMCD2 <- 6
    totalGDiam <- (gDiameter(graph1) - BASEGDIAMCD1) + 
        (gDiameter(graph2) - BASEGDIAMCD2)
    return(totalGDiam)
}

energy <- function(b, w, graph1, graph2) {
    e <-
        exp( -b * (eccenDiff(graph1, graph2) +
                      w * diamDiff(graph1, graph2)))
    return(e)
}

Q <- function(E,F) {
    ## Note that transition probability only depend on the number of
    ## precincts in the FROM state, it's uniform across all TO states
    bdyCongDist1 <-
        getSarpyPrecincts(getBoundary(E, gSarpy))  # in CongDist2
    bdyCongDist2 <-
        getSarpyPrecincts(getBoundary(F, gSarpy))  # in CongDist1
    q <- 1/( length(bdyCongDist1) * length(bdyCongDist2) )
    return(q)
}
    
acceptance <- function(b, Eprime, Fprime, E, F) {
    ratio <- 
        (energy(b, 2, Eprime, Fprime) * Q(Eprime, Fprime))/
        (energy(b, 2, E, F) * Q(E, F))
    accep <- min(c(1, ratio))
    return(accep)
}


sarpyAdj <- as.matrix(read.table("sarpy_adj.txt"))
# n x 2 edgelist matrix, not adjacency matrix!
gSarpy <- ftM2graphNEL(sarpyAdj, edgemode = "undirected")

cd1Prec <- c("p1", "p2", "p3", "p4", "p5", "p6", "p7", "p8",
             "p9", "p10", "p11", "p12", "p13", "p16", "p17",
             "p18", "p20", "p21", "p22", "p24", "p25", "p26", 
             "lanc")
cd2Prec <- setdiff(nodes(gSarpy), cd1Prec)
congDist1 <- subGraph(cd1Prec, gSarpy)
congDist2 <- subGraph(cd2Prec, gSarpy)

Elec2018 <- read.csv("Elec2018.csv")

elecOutcomes <- data.frame(mcStep = 0,
                           cd2DEM = 121770, cd2REP = 126715,
                           winner = as.character("R"),
                           vEccCD1 = 7, vEccCD2 = 4,
                           gDiamCD1 = 7, gDiam = 6,
                           rePart = 0)

for (b in seq(0, 1, 0.25) ) { 
 for (mcStep in 1:100) {


     rePartitionTrial <- 1

     bdyCongDist1 <-
         getSarpyPrecincts(getBoundary(congDist1, gSarpy))  # in CongDist2
     bdyCongDist2 <-
         getSarpyPrecincts(getBoundary(congDist2, gSarpy))  # in CongDist1

     repeat { # rePartition Trial

                                         # randomly select a boundary precinct for each Cong District
         precFromCongDist1 <- sample(bdyCongDist2, 1)
         precFromCongDist2 <- sample(bdyCongDist1, 1)


         newCongDist1 <-
             makeNewCongDist(getSarpyPrecincts(nodes(congDist1)),
                             precFromCongDist1, precFromCongDist2,
                             "lanc")
         newCongDist2 <-
             makeNewCongDist(getSarpyPrecincts(nodes(congDist2)),
                             precFromCongDist2, precFromCongDist1,
                             "doug")

         rePartitionTrial <- rePartitionTrial + 1 

         if (contiguous(newCongDist1) && contiguous(newCongDist2)) {
             u <- runif(1)               #1 sample from default [0,1]
             p <- acceptance(b, newCongDist1, newCongDist2, congDist1, congDist2)
             if (u <= p) {
                 congDist1 <- newCongDist1
                 congDist2 <- newCongDist2

                 break
             }
         }

         if (rePartitionTrial == 150) {
             cat("rePartition Trials reached 150 without new partition\n")
         }

     }    

     if (b == 1.0) {
         outcome <- filter(Elec2018, prec %in% nodes(congDist2)) %>%
             group_by(party) %>% 
             summarise(newelec = sum(as.integer(votes)))

         winner < if ( as.integer(outcome[2, 2]) > as.integer(outcome[1, 2]) ) {
                       "R" } else {
                               "D"
                           }
         elecOutcomes <-
             rbind(elecOutcomes,
                   setNames(c(mcStep,
                              as.integer(outcome[1, 2]),
                              as.integer(outcome[2, 2]),
                              winner,
                              vEccentricity(congDist1, "lanc"),
                              vEccentricity(congDist2, "doug"),
                              gDiameter(congDist1),
                              gDiameter(congDist2),
                              rePartitionTrial),
                            names(elecOutcomes)))
     }
 }
}