From 2faa43c2fdf34022734335ef320713de8bc97abe Mon Sep 17 00:00:00 2001 From: "Pavel N. Krivitsky" Date: Thu, 28 Nov 2024 21:58:02 +1100 Subject: [PATCH] Implemented Projection() operator, .project.net() auxiliary, and Proj1() and Proj2() aliases to evaluate statistics on a network constructed by projecting a bipartite network. --- DESCRIPTION | 1 + R/InitErgmTerm.projection.R | 93 ++++++++++++++++++ man/Project-ergmTerm-36962a06.Rd | 36 +++++++ src/changestats_projection.c | 153 +++++++++++++++++++++++++++++ tests/testthat/test-term-project.R | 29 ++++++ 5 files changed, 312 insertions(+) create mode 100644 R/InitErgmTerm.projection.R create mode 100644 man/Project-ergmTerm-36962a06.Rd create mode 100644 src/changestats_projection.c create mode 100644 tests/testthat/test-term-project.R diff --git a/DESCRIPTION b/DESCRIPTION index a89fa7bfb..fede22b0d 100644 --- a/DESCRIPTION +++ b/DESCRIPTION @@ -84,6 +84,7 @@ Collate: 'InitErgmTerm.indices.R' 'InitErgmTerm.interaction.R' 'InitErgmTerm.operator.R' + 'InitErgmTerm.projection.R' 'InitErgmTerm.spcache.R' 'InitErgmTerm.test.R' 'InitErgmTerm.transitiveties.R' diff --git a/R/InitErgmTerm.projection.R b/R/InitErgmTerm.projection.R new file mode 100644 index 000000000..e541f61d4 --- /dev/null +++ b/R/InitErgmTerm.projection.R @@ -0,0 +1,93 @@ +# File R/InitErgmTerm.projection.R in package ergm, part of the +# Statnet suite of packages for network analysis, https://statnet.org . +# +# This software is distributed under the GPL-3 license. It is free, +# open source, and has the attribution requirements (GPL Section 7) at +# https://statnet.org/attribution . +# +# Copyright 2003-2024 Statnet Commons +################################################################################ +#' @templateVar name Project +#' @title Evaluation on a projection of a bipartite network +#' +#' @description This operator on a bipartite network evaluates the +#' formula on the undirected, valued network constructed by +#' projecting it onto its specified mode. `Proj1(formula)` and +#' `Proj2(formula)` are aliases for `Project(formula, 1)` and +#' `Project(formula, 2)`, respectively. +#' +#' @usage +#' # binary: Project(formula, mode) +#' @template ergmTerm-formula +#' @param mode the mode onto which to project: 1 or 2 +#' +#' @template ergmTerm-general +#' +#' @concept operator +#' @concept bipartite +InitErgmTerm.Project <- function(nw, arglist, ...){ + a <- check.ErgmTerm(nw, arglist, bipartite = TRUE, + varnames = c("formula", "mode"), + vartypes = c("formula", "numeric"), + defaultvalues = list(NULL, NULL), + required = c(TRUE, TRUE)) + + bip <- as.integer(nw %n% "bipartite") + n <- as.integer(network.size(nw)) + + mode <- a$mode + if(! mode %in% 1:2) ergm_Init_error(sQuote("mode"), " must be 1 or 2.") + + ### Construct an empty network with the correct structure. + pnw <- nw + pnw %n% "bipartite" <- FALSE + pnw[,] <- 0 + pnw <- switch(mode, + get.inducedSubgraph(pnw, seq_len(bip)), + get.inducedSubgraph(pnw, bip + seq_len(n-bip))) + pnw %ergmlhs% "response" <- structure("w", valued = TRUE) + + m <- ergm_model(a$formula, pnw, ..., offset.decorate=FALSE) + ergm_no_ext.encode(m) + + auxiliaries <- trim_env(~.project.net(mode), "mode") + + c(list(name="on_proj_net", iinputs = mode, + submodel = m, dependence = TRUE, + auxiliaries=auxiliaries), + wrap.ergm_model(m, pnw, ergm_mk_std_op_namewrap(paste0('Proj', mode)))) +} + +#' @templateVar name Project +#' @template ergmTerm-rdname +#' @aliases Proj1-ergmTerm +#' @usage +#' # binary: Proj1(formula) +InitErgmTerm.Proj1 <- function(nw, arglist, ...){ + arglist[["mode"]] <- 1L + f <- InitErgmTerm.Project + f(nw, arglist, ...) +} + +#' @templateVar name Project +#' @template ergmTerm-rdname +#' @aliases Proj2-ergmTerm +#' @usage +#' # binary: Proj2(formula) +InitErgmTerm.Proj2 <- function(nw, arglist, ...){ + arglist[["mode"]] <- 2L + f <- InitErgmTerm.Project + f(nw, arglist, ...) +} + +InitErgmTerm..project.net <- function(nw, arglist, ...){ + a <- check.ErgmTerm(nw, arglist, bipartite = TRUE, + varnames = c("mode"), + vartypes = c("numeric"), + defaultvalues = list(NULL), + required = c(TRUE)) + + mode <- a$mode + if(! mode %in% 1:2) ergm_Init_error(sQuote("mode"), " must be 1 or 2.") + list(name=paste0("_proj_net"), iinputs = mode, coef.names = c(), dependence=TRUE) +} diff --git a/man/Project-ergmTerm-36962a06.Rd b/man/Project-ergmTerm-36962a06.Rd new file mode 100644 index 000000000..cb7e9f0c3 --- /dev/null +++ b/man/Project-ergmTerm-36962a06.Rd @@ -0,0 +1,36 @@ +% Generated by roxygen2: do not edit by hand +% Please edit documentation in R/InitErgmTerm.projection.R +\name{Project-ergmTerm} +\alias{Project-ergmTerm} +\alias{InitErgmTerm.Project} +\alias{InitErgmTerm.Proj1} +\alias{Proj1-ergmTerm} +\alias{InitErgmTerm.Proj2} +\alias{Proj2-ergmTerm} +\title{Evaluation on a projection of a bipartite network} +\usage{ +# binary: Project(formula, mode) + +# binary: Proj1(formula) + +# binary: Proj2(formula) +} +\arguments{ +\item{formula}{a one-sided \code{\link[=ergm]{ergm()}}-style formula with the terms to be evaluated} + +\item{mode}{the mode onto which to project: 1 or 2} +} +\description{ +This operator on a bipartite network evaluates the +formula on the undirected, valued network constructed by +projecting it onto its specified mode. \code{Proj1(formula)} and +\code{Proj2(formula)} are aliases for \code{Project(formula, 1)} and +\code{Project(formula, 2)}, respectively. +} +\seealso{ +\code{\link{ergmTerm}} for index of model terms currently visible to the package. + +\Sexpr[results=rd,stage=render]{ergm:::.formatTermKeywords("ergmTerm", "Project", "subsection")} +} +\concept{bipartite} +\concept{operator} diff --git a/src/changestats_projection.c b/src/changestats_projection.c new file mode 100644 index 000000000..6d7d32fee --- /dev/null +++ b/src/changestats_projection.c @@ -0,0 +1,153 @@ +/* File src/changestats_projection.c in package ergm, part of the + * Statnet suite of packages for network analysis, https://statnet.org . + * + * This software is distributed under the GPL-3 license. It is free, + * open source, and has the attribution requirements (GPL Section 7) at + * https://statnet.org/attribution . + * + * Copyright 2003-2024 Statnet Commons + */ +#define STRICT_Wt_HEADERS +#include "ergm_wtchangestat_operator.h" +#include "ergm_changestat_operator.h" +#include "ergm_storage.h" + +typedef struct { + WtModel *m; + Vertex *t, *h; + double *w; +} StoreWtModelAndWtChanges; + + +I_CHANGESTAT_FN(i_on_proj_net){ + GET_AUX_STORAGE(WtNetwork, pnwp); + ALLOC_STORAGE(1, StoreWtModelAndWtChanges, storage); + // No need to allocate it: we are only storing a pointer to a model. + storage->m = WtModelInitialize(getListElement(mtp->R, "submodel"), mtp->ext_state, pnwp, FALSE); + + /* WtSELECT_C_OR_D_BASED_ON_SUBMODEL(storage->m); */ + WtDELETE_IF_UNUSED_IN_SUBMODEL(x_func, storage->m); + WtDELETE_IF_UNUSED_IN_SUBMODEL(z_func, storage->m); + + unsigned int mode = IINPUT_PARAM[0], + maxchanges = mode == 1 ? BIPARTITE-1 : N_NODES-BIPARTITE-1; + + storage->t = R_Calloc(maxchanges, Vertex); + storage->h = R_Calloc(maxchanges, Vertex); + storage->w = R_Calloc(maxchanges, double); +} + +/* TODO: A d_function? */ + +C_CHANGESTAT_FN(c_on_proj_net){ + GET_AUX_STORAGE(WtNetwork, pnwp); + GET_STORAGE(StoreWtModelAndWtChanges, storage); + + int echange = edgestate ? -1 : 1; + + unsigned int nt = 0, mode = IINPUT_PARAM[0]; + + switch(mode){ + case 1: + EXEC_THROUGH_FINEDGES(head, e, tail2, { + if(tail!=tail2){ + storage->t[nt] = MIN(tail, tail2); + storage->h[nt] = MAX(tail, tail2); + storage->w[nt] = WtGETWT(tail, tail2, pnwp) + echange; + nt++; + } + }); break; + case 2: + EXEC_THROUGH_FOUTEDGES(tail, e, head2, { + if(head!=head2){ + storage->t[nt] = MIN(head-BIPARTITE, head2-BIPARTITE); + storage->h[nt] = MAX(head-BIPARTITE, head2-BIPARTITE); + storage->w[nt] = WtGETWT(head-BIPARTITE, head2-BIPARTITE, pnwp) + echange; + nt++; + } + }); break; + default: error("We should never be here."); + } + + WtChangeStats(nt, storage->t, storage->h, storage->w, pnwp, storage->m); + + memcpy(CHANGE_STAT, storage->m->workspace, N_CHANGE_STATS*sizeof(double)); +} + +Z_CHANGESTAT_FN(z_on_proj_net){ + GET_AUX_STORAGE(WtNetwork, pnwp); + GET_STORAGE(StoreWtModelAndWtChanges, storage) + + WtZStats(pnwp, storage->m, FALSE); + + memcpy(CHANGE_STAT, storage->m->workspace, N_CHANGE_STATS*sizeof(double)); +} + +X_CHANGESTAT_FN(x_on_proj_net){ + GET_AUX_STORAGE(WtNetwork, pnwp); + GET_STORAGE(StoreWtModelAndWtChanges, storage); + ModelTerm *_mymtp = mtp; + WtSEND_X_SIGNAL_INTO(pnwp, storage->m, NULL, _mymtp->dstats, type, data); +} + +F_CHANGESTAT_FN(f_on_proj_net){ + GET_AUX_STORAGE(WtNetwork, pnwp); + GET_STORAGE(StoreWtModelAndWtChanges, storage); + + R_Free(storage->t); + R_Free(storage->h); + R_Free(storage->w); + WtModelDestroy(pnwp, storage->m); +} + + + +I_CHANGESTAT_FN(i__proj_net){ + unsigned int mode = IINPUT_PARAM[0]; + + WtNetwork *pnwp = AUX_STORAGE = WtNetworkInitialize(NULL, NULL, NULL, 0, mode == 1 ? BIPARTITE : N_NODES - BIPARTITE, DIRECTED, FALSE, FALSE, 0, NULL); + + switch(mode){ + case 1: + EXEC_THROUGH_NET_EDGES_PRE(tail, head, e1, { + EXEC_THROUGH_FINEDGES(head, e2, tail2, { + if(tail < tail2) + WtSETWT(tail, tail2, WtGETWT(tail, tail2, pnwp) + 1, pnwp); + }); + }); break; + case 2: + EXEC_THROUGH_NET_EDGES_PRE(tail, head, e1, { + EXEC_THROUGH_FOUTEDGES(tail, e2, head2, { + if(head < head2) + WtSETWT(head-BIPARTITE, head2-BIPARTITE, WtGETWT(head-BIPARTITE, head2-BIPARTITE, pnwp) + 1, pnwp); + }); + }); break; + default: error("We should never be here."); + } +} + +U_CHANGESTAT_FN(u__proj_net){ + GET_AUX_STORAGE(WtNetwork, pnwp); + int echange = edgestate ? -1 : 1; + unsigned int mode = IINPUT_PARAM[0]; + + switch(mode){ + case 1: + EXEC_THROUGH_FINEDGES(head, e, tail2, { + if(tail!=tail2) + WtSETWT(tail, tail2, WtGETWT(tail, tail2, pnwp) + echange, pnwp); + }); break; + case 2: + EXEC_THROUGH_FOUTEDGES(tail, e, head2, { + if(head!=head2) + WtSETWT(head-BIPARTITE, head2-BIPARTITE, WtGETWT(head-BIPARTITE, head2-BIPARTITE, pnwp) + echange, pnwp); + }); break; + default: error("We should never be here."); + } +} + +F_CHANGESTAT_FN(f__proj_net){ + GET_AUX_STORAGE(WtNetwork, pnwp); + WtNetworkDestroy(pnwp); + AUX_STORAGE = NULL; +} diff --git a/tests/testthat/test-term-project.R b/tests/testthat/test-term-project.R new file mode 100644 index 000000000..54c27ec3a --- /dev/null +++ b/tests/testthat/test-term-project.R @@ -0,0 +1,29 @@ +n <- 20 +b <- 5 + +nw0 <- network.initialize(n, bipartite = b, directed = FALSE) +nw0 %v% "b1" <- c(rnorm(b), rep(NA, n-b)) +nw0 %v% "b2" <- c(rep(NA, b), rnorm(n-b)) +nw1 <- simulate(nw0 ~ edges, coef = 0) +nw2 <- simulate(nw0 ~ edges, coef = 0) +m1 <- as.matrix(nw1) +m2 <- as.matrix(nw2) + +nw1.absdiff.b1 <- sum(abs(outer(na.omit(nw1 %v% "b1"), na.omit(nw1 %v% "b1"), FUN = "-")) * tcrossprod(m1))/2 +nw1.absdiff.b2 <- sum(abs(outer(na.omit(nw1 %v% "b2"), na.omit(nw1 %v% "b2"), FUN = "-")) * crossprod(m1))/2 +nw2.absdiff.b1 <- sum(abs(outer(na.omit(nw2 %v% "b1"), na.omit(nw2 %v% "b1"), FUN = "-")) * tcrossprod(m2))/2 +nw2.absdiff.b2 <- sum(abs(outer(na.omit(nw2 %v% "b2"), na.omit(nw2 %v% "b2"), FUN = "-")) * crossprod(m2))/2 + +f <- nw1 ~ Project(~ absdiff("b1"), 1) + Proj1(~absdiff("b1")) + Project(~absdiff("b2"), 2) + Proj2(~absdiff("b2")) + +test_that("Projection(), Proj1(), and Proj2() summary", { + expect_equal(summary(f), + c(`Proj1~absdiff.sum.b1` = nw1.absdiff.b1, `Proj1~absdiff.sum.b1` = nw1.absdiff.b1, + `Proj2~absdiff.sum.b2` = nw1.absdiff.b2, `Proj2~absdiff.sum.b2` = nw1.absdiff.b2)) +}) + +test_that("Projection(), Proj1(), and Proj2() change", { + changes <- as.matrix(xor(nw1, nw2), matrix.type = "edgelist") + expect_equal(c(ergm.godfather(f, changes = changes)), + rep(c(nw2.absdiff.b1, nw2.absdiff.b2), each = 2)) +})