# install.packages('network', .libPaths(), repos='http://cran.us.r-project.org')
# install.packages('ergm', .libPaths(), repos='http://cran.us.r-project.org')
# install.packages('devtools', .libPaths(), repos='http://cran.us.r-project.org')


devtools::install_github('tedhchen/ergmWorkshopTools')


library(ergm)
library(ergmWorkshopTools)


# Load the adjacency-matrix version of the data and open its help page.
data(mid_mat)
?mid_mat


# Visual check of the adjacency matrix.
# checkmat is presumably a utility from ergmWorkshopTools -- confirm.
options(repr.plot.width = 10, repr.plot.height = 10)
checkmat(mid_mat)


# Help page for the network constructor used below.
?network


# Build an undirected network object from the adjacency matrix and print it.
# FALSE is spelled out because `F` is an ordinary, reassignable variable.
nw <- network(mid_mat, directed = FALSE)
nw


# Single-panel plot; the seed is set right before plotting so the figure
# is reproducible.
options(repr.plot.width = 10, repr.plot.height = 10)
par(mfrow = c(1, 1))
set.seed(210615)
plot(nw)


# Build a second undirected network, this time from the edgelist data.
# FALSE is spelled out because `F` is an ordinary, reassignable variable.
data(mid_edgelist)
nw.b <- network(mid_edgelist, directed = FALSE)
nw.b


# Side-by-side comparison of the matrix-based and edgelist-based networks.
# The seed is set once, before the first plot; the second plot continues
# the same random stream.
options(repr.plot.width = 20, repr.plot.height = 10)
par(mfrow = c(1, 2))
set.seed(210615)
plot(nw)
plot(nw.b)


# Node attribute table: one row per actor, row names identify the actors.
data(mid_node_attr)
head(mid_node_attr)
?mid_node_attr


# Empty adjacency matrix with one row and one column per actor.
# The size is taken from the attribute table instead of a hard-coded count,
# so it always agrees with the dimnames.
mat <- matrix(0,
              ncol = nrow(mid_node_attr),
              nrow = nrow(mid_node_attr),
              dimnames = list(row.names(mid_node_attr), row.names(mid_node_attr)))
mat[1:10, 1:10]


# Fill in both (i, j) and (j, i) for every edgelist row, since the network
# is undirected. seq_len() keeps the loop from running when the edgelist
# has zero rows (1:0 would iterate over c(1, 0)).
for (i in seq_len(nrow(mid_edgelist))) {
    mat[mid_edgelist[i, 1], mid_edgelist[i, 2]] <- 1
    mat[mid_edgelist[i, 2], mid_edgelist[i, 1]] <- 1
}


# Compare the hand-built matrix with the packaged adjacency matrix.
options(repr.plot.width = 14, repr.plot.height = 7)
par(mfrow = c(1, 2))
checkmat(mat)
checkmat(mid_mat)

# Print the network object again before adding attributes.
nw


# Vertex names currently stored on the network.
nw %v% 'vertex.names'


# Attach the 'dem' column of the attribute table as a vertex attribute.
# NOTE(review): this assumes the rows of mid_node_attr are in the same order
# as the network's vertices -- confirm.
nw %v% 'dem' <- mid_node_attr$'dem'
nw


nw %v% 'dem'


# Colour vertices by the 'dem' attribute (2 where it is truthy, 1 otherwise).
# The layout is reset to a single panel first: an earlier section sets
# par(mfrow = c(1, 2)), which would otherwise carry over when this file is
# run as one script.
options(repr.plot.width = 10, repr.plot.height = 10)
par(mfrow = c(1, 1))
set.seed(210615)
plot(nw, vertex.col = ifelse(nw %v% 'dem', 2, 1))
legend('bottomright', legend = c('Democracy', 'Nondemocracy'), fill = c(2, 1), bty = 'n', cex = 1.1)


# Dyadic covariates stored as separate matrices.
data(contig)
data(joint_dem)


# Plot each covariate matrix as its own undirected network, side by side.
# FALSE is spelled out because `F` is an ordinary, reassignable variable.
options(repr.plot.width = 16, repr.plot.height = 8)
par(mfrow = c(1, 2))
set.seed(210615)
plot(network(contig, directed = FALSE), sub = 'Contiguity', cex.sub = 2)
plot(network(joint_dem, directed = FALSE), sub = 'Joint-Democracy', cex.sub = 2)


# Help index of the model terms available to ergm.
help('ergm-terms')


# Keyword search over the available terms.
search.ergmTerms(keyword = 'transitive')


# Baseline model with only node- and dyad-level terms.
m0 <- ergm(
    nw ~ edges + nodefactor('dem') + edgecov(joint_dem)
)
summary(m0)


# Extract the response, predictor matrix, and weights for the same formula.
dyad_df <- ergmMPLE(
    nw ~ edges + nodefactor('dem') + edgecov(joint_dem)
)
dyad_df$predictor


# Weighted logistic regression on those dyad-level data, without an extra
# intercept (-1), for comparison with summary(m0).
mple_logit <- glm(
    dyad_df$response ~ dyad_df$predictor - 1,
    weights = dyad_df$weights,
    family = 'binomial'
)
summary(mple_logit)


# First attempt at a degree effect, using kstar(2).
# NOTE(review): the accompanying notebook text suggests this specification
# is shown as a problematic fit; m1 is overwritten by the next call.
m1 <- ergm(nw ~ edges + nodefactor('dem') + edgecov(joint_dem) + kstar(2), control = control.ergm(seed = 210616))


# Same model with the geometrically weighted degree term instead.
# TRUE is spelled out because `T` is an ordinary, reassignable variable.
m1 <- ergm(nw ~ edges + nodefactor('dem') + edgecov(joint_dem) + gwdegree(decay = 0, fixed = TRUE), control = control.ergm(seed = 210616))


summary(m1)


# Add triadic closure, first with the raw triangle count.
# NOTE(review): the notebook text reports degeneracy for this fit; m2 is
# overwritten by the next call.
m2 <- ergm(nw ~ edges + nodefactor('dem') + edgecov(joint_dem) + gwdegree(decay = 0, fixed = TRUE) + triangle, control = control.ergm(seed = 210616))


# Replace triangle with the geometrically weighted edgewise shared partner term.
m2 <- ergm(nw ~ edges + nodefactor('dem') + edgecov(joint_dem) + gwdegree(decay = 0, fixed = TRUE) + gwesp(decay = 0, fixed = TRUE), control = control.ergm(seed = 210616))


summary(m2)


# Directed network built from a 10 x 10 all-ones matrix, used to show how
# the gwesp statistic responds to different decay values.
# TRUE is spelled out because `T` is an ordinary, reassignable variable.
tenclique <- network(matrix(1, ncol = 10, nrow = 10), directed = TRUE)
options(repr.plot.width = 7, repr.plot.height = 7)
# Reset to a single panel: an earlier section sets par(mfrow = c(1, 2)),
# which would otherwise carry over when this file is run as one script.
par(mfrow = c(1, 1))
set.seed(210615)
plot(tenclique)


# Network statistics for gwesp at several fixed decay values, next to the
# edge and transitive-triple counts.
summary(tenclique ~ edges + gwesp(0, fixed = TRUE) + gwesp(0.5, fixed = TRUE) + gwesp(1, fixed = TRUE) + gwesp(2, fixed = TRUE) + gwesp(5, fixed = TRUE) + gwesp(10, fixed = TRUE) + ttriple)


# Same specification as m2 but with the gwdegree decay raised from 0 to 0.2.
m2.b <- ergm(nw ~ edges + nodefactor('dem') + edgecov(joint_dem) + gwdegree(decay = 0.2, fixed = TRUE) + gwesp(decay = 0, fixed = TRUE), control = control.ergm(seed = 210616))


summary(m2.b)


# Goodness of fit for m2, with a fixed seed for the GOF control settings.
m2fit <- gof(
    m2,
    control = control.gof.ergm(seed = 210616)
)
m2fit


# Show the GOF panels for m2 in a single row.
options(repr.plot.width = 32, repr.plot.height = 8)
par(mfrow = c(1, 4))
plot(m2fit)


# Same check for m1, for comparison with m2.
m1fit <- gof(
    m1,
    control = control.gof.ergm(seed = 210616)
)
options(repr.plot.width = 32, repr.plot.height = 8)
par(mfrow = c(1, 4))
plot(m1fit)


# Bring the m2 output up again for interpretation.
summary(m2)


# Three-node example: node 1 is tied to nodes 2 and 3; the (2, 3) dyad is empty.
# TRUE/FALSE are spelled out because `T`/`F` are ordinary, reassignable variables.
tri <- matrix(c(0, 1, 1,
                1, 0, 0,
                1, 0, 0), byrow = TRUE, ncol = 3)
nw.tri <- network(tri, directed = FALSE)
# Nodes 2 and 3 get dem = 1, node 1 gets dem = 0.
nw.tri %v% 'dem' <- c(0, 1, 1)
# Dyadic covariate that is 1 only on the (2, 3) dyad.
jd.tri <- matrix(c(0, 0, 0,
                   0, 0, 1,
                   0, 1, 0), byrow = TRUE, ncol = 3)
options(repr.plot.width = 10, repr.plot.height = 10)
# Reset to a single panel: an earlier section sets par(mfrow = c(1, 4)),
# which would otherwise carry over when this file is run as one script.
par(mfrow = c(1, 1))
set.seed(210615)
plot(nw.tri, vertex.col = ifelse(nw.tri %v% 'dem', 2, 1), displaylabels = TRUE)


# Predictor matrix for the m2 specification on this small network.
ergmMPLE(nw.tri ~ edges + nodefactor('dem') + edgecov(jd.tri) + gwdegree(decay = 0, fixed = TRUE) + gwesp(decay = 0, fixed = TRUE))$predictor


round(coefficients(m2), 2)


# Inverse-logit of the log-odds.
# NOTE(review): -1.76 is presumably computed by hand from the rounded m2
# coefficients above -- confirm it still matches after any refit.
plogis(-1.76)


# Refit the m2 specification with explicit MCMC settings and without
# evaluating the log-likelihood during fitting.
# TRUE/FALSE are spelled out because `T`/`F` are ordinary, reassignable variables.
m2.c <- ergm(nw ~ edges + nodefactor('dem') + edgecov(joint_dem) + gwdegree(decay = 0, fixed = TRUE) + gwesp(decay = 0, fixed = TRUE),
             eval.loglik = FALSE,
             control = control.ergm(seed = 210615,
                                    MCMC.burnin = 50000,
                                    MCMC.samplesize = 2500,
                                    MCMC.interval = 2500,
                                    parallel = 0))


# With eval.loglik = FALSE the summary has no likelihood-based statistics.
summary(m2.c)


# Compute the log-likelihood afterwards and store it on the fitted model.
m2.c <- logLik(m2.c, add = TRUE)


summary(m2.c)


# MCMC diagnostics for the default-settings fit ...
options(repr.plot.width = 20, repr.plot.height = 10)
mcmc.diagnostics(m2)


# ... and for the fit with the explicit MCMC settings.
options(repr.plot.width = 20, repr.plot.height = 10)
mcmc.diagnostics(m2.c)

nodes with degree:	0	1	2
w/o (2,3) edge	0	2	1
w/ (2,3) edge	0	0	3

1. Preparation¶

First, we install the required packages.¶

We have a workshop package that contains the data we will be working with and some utility functions.¶

Next, we load the libraries.¶

2. Building our networks¶

First, load the data.¶

Next, we use the network function to create a network object.¶

There are different ways network data is usually stored.¶

We need to be careful when working with them.¶

What's the difference?¶

Where are the isolates?¶

When working with this kind of data, we have to make sure we have a full list of the actors in the network.

Let's manually make the adjacency matrix from the edgelist.¶

Let's get back to working with our network.¶

Let's work with vertex attributes.¶

We can look at how democracies and nondemocracies differ in conflict behavior.¶

Red nodes are democracies and black are nondemocracies.¶

Edge attributes can also be specified in a similar way but it's easier to just use a separate matrix.¶

3. Specifying the ERGM¶

Let's take a look at the basic function for ERGM fitting: ergm.¶

What are the ERGM terms that we can use?¶

3.1 ERGM Terms¶

3.2 Starting to fit an ERGM¶

We start with some node and dyad variables.¶

Let's compare it with the logistic regression.¶

They are exactly the same.¶

Let's move to some network effects.¶

What happened here?¶

So instead, we can use alternative network statistics designed to address these problems.¶

References:¶

Looks like it converged.¶

Let's also add the triadic closure effect before looking at the model in more detail.¶

Again, seems like we have degeneracy.¶

Looks like it converged.¶

3.2.1 Let's consider model fit, degeneracy, and decay parameters¶

How to understand the decay parameters?¶

Reference:¶

This is easiest to demonstrate using the gwesp.¶

What happened?¶

Let's look at a real example using our MIDs network.¶

Slightly increasing the decay value improved fit and didn't run into degeneracy issues.¶

3.3 Assessing ERGM fit¶

Back to our MIDs model; it seems like our model converged, but we should still check the fit using simulations.¶

What are we looking at?¶

But it helps to compare.¶

3.4 Interpreting the ERGM output¶

Let's bring up the model output again.¶

At the network level:¶

At the dyad level:¶

$P(y_{ij} = 1 \mid Y, \boldsymbol{\theta}) = \operatorname{logit}^{-1}\left(\sum_{r=1}^{k} \theta_r \, \delta_r^{(ij)}(Y)\right)$

Let's illustrate using a simple example and the same coefficients.¶

What's the probability of a tie forming on the empty dyad (2,3) if this network has the same generative features as our conflict network?

There are two types of dyads here:¶

Adding an edge on the (2,3) dyad will add...¶

Why does gwdegree not change?¶

Calculate the log-odds.¶

Calculate the corresponding probability.¶

At the block level:¶

Reference:¶

3.5 ERGM Settings¶

Let's conclude this section by looking at some settings and useful things to do.¶

We don't get any likelihood-based statistics. We can follow the instructions to add them.¶

Increasing the MCMC samples can improve our estimates.¶

4. Resources and References¶

Packages¶

References¶

5. Questions or comments?¶

Please visit the Github repository for this notebook.¶

Or email me at ted.hsuanyun.chen@gmail.com.¶

Next, we use the `network` function to create a network object.¶

Let's take a look at the basic function for ERGM fitting: `ergm`.¶

This is easiest to demonstrate using the `gwesp`.¶

Why does `gwdegree` not change?¶