From 7260d62cf6f1470584753f76970d19664638eeed Mon Sep 17 00:00:00 2001 From: Johannes Hostert Date: Wed, 27 Jan 2021 11:32:08 +0000 Subject: [PATCH] Add methods to add vertex attributes for mail/issue/pr count for issue #188 Signed-off-by: Johannes Hostert --- util-networks-covariates.R | 249 +++++++++++++++++++++++++++++++++++++ util-split.R | 4 +- 2 files changed, 251 insertions(+), 2 deletions(-) diff --git a/util-networks-covariates.R b/util-networks-covariates.R index 1aa00603..dc7eac97 100644 --- a/util-networks-covariates.R +++ b/util-networks-covariates.R @@ -345,6 +345,255 @@ add.vertex.attribute.commit.count.helper = function(list.of.networks, project.da return(nets.with.attr) } + +## * Mail count ---------------------------------------------------------- + +#' Add mail-count attribute based on the total number of mails send where the person represented by the vertex is the author +#' +#' @param list.of.networks The network list +#' @param project.data The project data +#' @param name The attribute name to add [default: "mail.count"] +#' @param aggregation.level Determines the data to use for the attribute calculation. +#' One of \code{"range"}, \code{"cumulative"}, \code{"all.ranges"}, +#' \code{"project.cumulative"}, \code{"project.all.ranges"}, and +#' \code{"complete"}. See \code{split.data.by.networks} for +#' more details. [default: "range"] +#' @param default.value The default value to add if a vertex has no matching value [default: 0L] +#' +#' @return A list of networks with the added attribute +add.vertex.attribute.mail.count = function(list.of.networks, project.data, + name = "mail.count", + aggregation.level = c("range", "cumulative", "all.ranges", + "project.cumulative", "project.all.ranges", + "complete"), + default.value = 0L) { + nets.with.attr = add.vertex.attribute.commit.count.helper( + list.of.networks, project.data, name, aggregation.level, + default.value, get.author.mail.count, "author.name" + ) + + return(nets.with.attr) +} +#' Add mail-count attribute based on the number of mail threads participated in where the person represented by the vertex is the author +#' +#' @param list.of.networks The network list +#' @param project.data The project data +#' @param name The attribute name to add [default: "mail.thread.count"] +#' @param aggregation.level Determines the data to use for the attribute calculation. +#' One of \code{"range"}, \code{"cumulative"}, \code{"all.ranges"}, +#' \code{"project.cumulative"}, \code{"project.all.ranges"}, and +#' \code{"complete"}. See \code{split.data.by.networks} for +#' more details. [default: "range"] +#' @param default.value The default value to add if a vertex has no matching value [default: 0L] +#' +#' @return A list of networks with the added attribute +add.vertex.attribute.mail.thread.count = function(list.of.networks, project.data, + name = "mail.thread.count", + aggregation.level = c("range", "cumulative", "all.ranges", + "project.cumulative", "project.all.ranges", + "complete"), + default.value = 0L) { + nets.with.attr = add.vertex.attribute.commit.count.helper( + list.of.networks, project.data, name, aggregation.level, + default.value, get.author.mail.thread.count, "author.name" + ) + + return(nets.with.attr) +} + +## * Issue count -------------------------------------------------------------- + +#' Add issues-count attribute based on the number of issues participated in where the person represented by the vertex is the author +#' +#' @param list.of.networks The network list +#' @param project.data The project data +#' @param name The attribute name to add [default: "issues.count"] +#' @param aggregation.level Determines the data to use for the attribute calculation. +#' One of \code{"range"}, \code{"cumulative"}, \code{"all.ranges"}, +#' \code{"project.cumulative"}, \code{"project.all.ranges"}, and +#' \code{"complete"}. See \code{split.data.by.networks} for +#' more details. [default: "range"] +#' @param default.value The default value to add if a vertex has no matching value [default: 0L] +#' +#' @return A list of networks with the added attribute +add.vertex.attribute.issue.count = function(list.of.networks, project.data, + name = "issues.count", + aggregation.level = c("range", "cumulative", "all.ranges", + "project.cumulative", "project.all.ranges", + "complete"), + default.value = 0L) { + nets.with.attr = add.vertex.attribute.commit.count.helper( + list.of.networks, project.data, name, aggregation.level, + default.value, get.author.issues.count, "author.name" + ) + + return(nets.with.attr) +} + +#' Add issues-count attribute based on the number of issues participated by commenting in where the person represented by the vertex is the author +#' +#' @param list.of.networks The network list +#' @param project.data The project data +#' @param name The attribute name to add [default: "issues.count.by.commenting"] +#' @param aggregation.level Determines the data to use for the attribute calculation. +#' One of \code{"range"}, \code{"cumulative"}, \code{"all.ranges"}, +#' \code{"project.cumulative"}, \code{"project.all.ranges"}, and +#' \code{"complete"}. See \code{split.data.by.networks} for +#' more details. [default: "range"] +#' @param default.value The default value to add if a vertex has no matching value [default: 0L] +#' +#' @return A list of networks with the added attribute +add.vertex.attribute.issue.count.by.commenting = function(list.of.networks, project.data, + name = "issues.count.by.commenting", + aggregation.level = c("range", "cumulative", "all.ranges", + "project.cumulative", "project.all.ranges", + "complete"), + default.value = 0L) { + nets.with.attr = add.vertex.attribute.commit.count.helper( + list.of.networks, project.data, name, aggregation.level, + default.value, get.author.issues.commented.in.count, "author.name" + ) + + return(nets.with.attr) +} + +#' Add issues-count attribute based on the number of issues participated by commenting in where the person represented by the vertex is the author +#' +#' @param list.of.networks The network list +#' @param project.data The project data +#' @param name The attribute name to add [default: "issue.comment.count"] +#' @param aggregation.level Determines the data to use for the attribute calculation. +#' One of \code{"range"}, \code{"cumulative"}, \code{"all.ranges"}, +#' \code{"project.cumulative"}, \code{"project.all.ranges"}, and +#' \code{"complete"}. See \code{split.data.by.networks} for +#' more details. [default: "range"] +#' @param default.value The default value to add if a vertex has no matching value [default: 0L] +#' +#' @return A list of networks with the added attribute +add.vertex.attribute.issue.comment.count = function(list.of.networks, project.data, + name = "issue.comment.count", + aggregation.level = c("range", "cumulative", "all.ranges", + "project.cumulative", "project.all.ranges", + "complete"), + default.value = 0L) { + nets.with.attr = add.vertex.attribute.commit.count.helper( + list.of.networks, project.data, name, aggregation.level, + default.value, get.author.issue.comments.count, "author.name" + ) + + return(nets.with.attr) +} + +## * Pull request count ------------------------------------------------------------- + +#' Add PR-count attribute based on the number of PR created where the person represented by the vertex is the author +#' +#' @param list.of.networks The network list +#' @param project.data The project data +#' @param name The attribute name to add [default: "pull.request.creation.count"] +#' @param aggregation.level Determines the data to use for the attribute calculation. +#' One of \code{"range"}, \code{"cumulative"}, \code{"all.ranges"}, +#' \code{"project.cumulative"}, \code{"project.all.ranges"}, and +#' \code{"complete"}. See \code{split.data.by.networks} for +#' more details. [default: "range"] +#' @param default.value The default value to add if a vertex has no matching value [default: 0L] +#' +#' @return A list of networks with the added attribute +add.vertex.attribute.pull.request.creation.count = function(list.of.networks, project.data, + name = "pull.request.creation.count", + aggregation.level = c("range", "cumulative", "all.ranges", + "project.cumulative", "project.all.ranges", + "complete"), + default.value = 0L) { + nets.with.attr = add.vertex.attribute.commit.count.helper( + list.of.networks, project.data, name, aggregation.level, + default.value, get.author.pull.requests.created.count, "author.name" + ) + + return(nets.with.attr) +} + +#' Add PR-count attribute based on the number of PRs participated in where the person represented by the vertex is the author +#' +#' @param list.of.networks The network list +#' @param project.data The project data +#' @param name The attribute name to add [default: "mail.thread.count"] +#' @param aggregation.level Determines the data to use for the attribute calculation. +#' One of \code{"range"}, \code{"cumulative"}, \code{"all.ranges"}, +#' \code{"project.cumulative"}, \code{"project.all.ranges"}, and +#' \code{"complete"}. See \code{split.data.by.networks} for +#' more details. [default: "range"] +#' @param default.value The default value to add if a vertex has no matching value [default: 0L] +#' +#' @return A list of networks with the added attribute +add.vertex.attribute.pull.request.count = function(list.of.networks, project.data, + name = "pull.request.count", + aggregation.level = c("range", "cumulative", "all.ranges", + "project.cumulative", "project.all.ranges", + "complete"), + default.value = 0L) { + nets.with.attr = add.vertex.attribute.commit.count.helper( + list.of.networks, project.data, name, aggregation.level, + default.value, get.author.pull.requests.count, "author.name" + ) + + return(nets.with.attr) +} + +#' Add PR-count attribute based on the number of PRs commits were added to where the person represented by the vertex is the author +#' +#' @param list.of.networks The network list +#' @param project.data The project data +#' @param name The attribute name to add [default: "mail.thread.count"] +#' @param aggregation.level Determines the data to use for the attribute calculation. +#' One of \code{"range"}, \code{"cumulative"}, \code{"all.ranges"}, +#' \code{"project.cumulative"}, \code{"project.all.ranges"}, and +#' \code{"complete"}. See \code{split.data.by.networks} for +#' more details. [default: "range"] +#' @param default.value The default value to add if a vertex has no matching value [default: 0L] +#' +#' @return A list of networks with the added attribute +add.vertex.attribute.pull.request.count.by.commits = function(list.of.networks, project.data, + name = "pull.request.count.by.commits", + aggregation.level = c("range", "cumulative", "all.ranges", + "project.cumulative", "project.all.ranges", + "complete"), + default.value = 0L) { + nets.with.attr = add.vertex.attribute.commit.count.helper( + list.of.networks, project.data, name, aggregation.level, + default.value, get.author.pull.requests.commited.in.count, "author.name" + ) + + return(nets.with.attr) +} + +#' Add PR-comment-count attribute based on the number of PRs comments written where the person represented by the vertex is the author +#' +#' @param list.of.networks The network list +#' @param project.data The project data +#' @param name The attribute name to add [default: "mail.thread.count"] +#' @param aggregation.level Determines the data to use for the attribute calculation. +#' One of \code{"range"}, \code{"cumulative"}, \code{"all.ranges"}, +#' \code{"project.cumulative"}, \code{"project.all.ranges"}, and +#' \code{"complete"}. See \code{split.data.by.networks} for +#' more details. [default: "range"] +#' @param default.value The default value to add if a vertex has no matching value [default: 0L] +#' +#' @return A list of networks with the added attribute +add.vertex.attribute.pull.request.count.by.commits = function(list.of.networks, project.data, + name = "pull.request.comments", + aggregation.level = c("range", "cumulative", "all.ranges", + "project.cumulative", "project.all.ranges", + "complete"), + default.value = 0L) { + nets.with.attr = add.vertex.attribute.commit.count.helper( + list.of.networks, project.data, name, aggregation.level, + default.value, get.author.pull.request.comments.count, "author.name" + ) + + return(nets.with.attr) +} + ## * Meta-data ------------------------------------------------------------- #' Add author email attribute diff --git a/util-split.R b/util-split.R index 2d7f1531..a6f99116 100644 --- a/util-split.R +++ b/util-split.R @@ -63,7 +63,7 @@ split.data.time.based = function(project.data, time.period = "3 months", bins = data = list( commits = project.data$get.commits(), mails = project.data$get.mails(), - issues = project.data$get.issues() + issues = project.data$get.issues.unfiltered() ) split.data = names(data) names(split.data) = split.data @@ -237,7 +237,7 @@ split.data.activity.based = function(project.data, activity.type = c("commits", data = list( commits = project.data$get.commits(), mails = project.data$get.mails(), - issues = project.data$get.issues() + issues = project.data$get.issues.unfiltered() ) ## define ID columns for mails and commits