Merge pull request #25 from R-Computing-Lab/dev_main

1.2.1 update
R-Computing-Lab · Mar 26, 2024 · 781c972 · 781c972
2 parents 813ad8a + ea8c077
commit 781c972
Show file tree

Hide file tree

Showing 24 changed files with 431 additions and 47 deletions.
diff --git a/.Rbuildignore b/.Rbuildignore
@@ -3,6 +3,8 @@
 ^LICENSE\.md$
 ^R/\.Rhistory$
 ^R/paper$
+^checkParents\.X
+^test-clean\.X
 CITATION.cff$
 ^doc$
 ^data-raw$

diff --git a/.github/workflows/R-CMD-dev_maincheck.yaml b/.github/workflows/R-CMD-dev_maincheck.yaml
@@ -33,22 +33,22 @@ jobs:
     steps:
       - uses: actions/checkout@v3
 
-      - uses: r-lib/actions/setup-pandoc@v2
+      - uses: r-lib/actions/setup-pandoc@v3
 
-      - uses: r-lib/actions/setup-r@v2
+      - uses: r-lib/actions/setup-r@v3
         with:
           r-version: ${{ matrix.config.r }}
           rtools-version: ${{ matrix.config.rtools }}
           http-user-agent: ${{ matrix.config.http-user-agent }}
           use-public-rspm: true
 
-      - uses: r-lib/actions/setup-r-dependencies@v2
+      - uses: r-lib/actions/setup-r-dependencies@v3
         with:
           cache-version: 3
           extra-packages: |
             any::rcmdcheck
           upgrade: 'TRUE'
           needs: check
-      - uses: r-lib/actions/check-r-package@v2
+      - uses: r-lib/actions/check-r-package@v3
         with:
           upload-snapshots: true
diff --git a/.gitignore b/.gitignore
@@ -4,13 +4,9 @@ R/plane.txt
 R/.Rhistory
 .Rhistory
 paper/paper.html
-inst/doc
-/doc/
 /Meta/
 *.knit.md
 vignettes/articles/paper.html
 BGmisc.code-workspace
-.lintr
-
 tests/testthat/Rplots.pdf
-docs
+
diff --git a/.lintr b/.lintr
@@ -0,0 +1,2 @@
+linters: linters_with_defaults(line_length_linter(120),commented_code_linter = NULL,object_name_linter = object_name_linter(styles = c("snake_case", "symbols"))) # see vignette("lintr")
+encoding: "UTF-8"
diff --git a/CODE_OF_CONDUCT.md b/CODE_OF_CONDUCT.md
@@ -60,7 +60,7 @@ representative at an online or offline event.
 
 Instances of abusive, harassing, or otherwise unacceptable behavior may be
 reported to the community leaders responsible for enforcement at
-[email protected].
+[[email protected]](mailto:[email protected]).
 All complaints will be reviewed and investigated promptly and fairly.
 
 All community leaders are obligated to respect the privacy and security of the
@@ -116,13 +116,13 @@ the community.
 
 This Code of Conduct is adapted from the [Contributor Covenant][homepage],
 version 2.0, available at
-https://www.contributor-covenant.org/version/2/0/code_of_conduct.html.
+<https://www.contributor-covenant.org/version/2/0/code_of_conduct.html>.
 
 Community Impact Guidelines were inspired by [Mozilla's code of conduct
 enforcement ladder](https://github.com/mozilla/diversity).
 
 [homepage]: https://www.contributor-covenant.org
 
 For answers to common questions about this code of conduct, see the FAQ at
-https://www.contributor-covenant.org/faq. Translations are available at
-https://www.contributor-covenant.org/translations.
+<https://www.contributor-covenant.org/faq>. Translations are available at
+<https://www.contributor-covenant.org/translations>.
diff --git a/DESCRIPTION b/DESCRIPTION
@@ -1,17 +1,17 @@
 Package: BGmisc
 Title: An R Package for Extended Behavior Genetics Analysis
-Version: 1.2.0
+Version: 1.2.1
 Authors@R: c(
-    person("S. Mason", "Garrison", , "[email protected]", role = c("aut", "cre"),
+    person("S. Mason", "Garrison", , email= "[email protected]", role = c("aut", "cre"),
            comment = c(ORCID = "0000-0002-4804-6003")),
     person(c("Michael", "D."), "Hunter", role = "aut",
            comment = c(ORCID = "0000-0002-3651-6709")),
     person("Xuanyu", "Lyu", role = "aut",
            comment = c(ORCID = "0000-0002-2841-5529")),
-    person(c("Rachel", "N."), "Good", role = "ctb",
-           comment = c(ORCID = "0000-0000-0000-0000")),
-    person(c("Jonathan", "D."), "Trattner", role = "aut",
-           comment = c(ORCID = "0000-0002-1097-7603")),
+    person(c("Rachel", "N."), "Good", role = "ctb"),
+    person(c("Jonathan", "D."), "Trattner", role = "aut", email = "[email protected]", 
+           comment = c(ORCID = "0000-0002-1097-7603",
+                       url = "https://www.jdtrat.com/")),
     person(c("S.", "Alexandra"), "Burt", role = "aut",
            comment = c(ORCID = "0000-0001-5538-7431"))
   )

diff --git a/NEWS.md b/NEWS.md
@@ -1,3 +1,8 @@
+# BGmisc 1.2.1
+
+* Added alternative transpose options for the matrix
+* Added generalization of Falconer's formula
+
 # BGmisc 1.2.0
 
 * Added numerous code checks, increased code coverage to 85%

diff --git a/R/checkParents.X b/R/checkParents.X
@@ -0,0 +1,154 @@
+# Challenge: Missing parents: If one parent is missing and the other one isn't, this needs to be handled somehow. Firstly, I think it can cause certain ways of estimating relatedness to give wrong numbers. And secondly, it requires us to make guesses in cases where e.g. two people have the same mother and missing fathers: They could then be either half-sibs, if the missing fathers are different people, or full sibs if not. This then also affects relatedness for their descendants.
+
+#' Validates and Optionally Repairs Parent IDs in a Pedigree Dataframe
+#'
+#' This function takes a pedigree object and performs two main tasks:
+#' 1. Checks for the validity of parent IDs, specifically looking for instances where only one parent ID is missing.
+#' 2. Optionally repairs the missing parent IDs based on a specified logic.
+#'
+#' @param ped A dataframe representing the pedigree data with columns 'ID', 'dadID', and 'momID'.
+#' @param verbose A logical flag indicating whether to print progress and validation messages to the console.
+#' @param repair A logical flag indicating whether to attempt repairs on missing parent IDs.
+#'
+#' @return Depending on the value of `repair`, either a list containing validation results or a repaired dataframe is returned.
+#' @examples
+#' \dontrun{
+#' ped <- data.frame(ID = 1:4, dadID = c(NA, 1, 1, 2), momID = c(NA, NA, 2, 2))
+#' checkParentIDs(ped, verbose = TRUE, repair = FALSE)
+#' }
+#' @export
+checkParentIDs <- function(ped, verbose = FALSE, repair = FALSE) {
+  # Standardize column names in the input dataframe
+  ped <- standardize_colnames(ped)
+
+  # Initialize a list to store validation results
+  validation_results <- list()
+
+  if (verbose) {
+    cat("Step 1: Checking for missing parents...\n")
+  }
+
+  # Identify missing fathers and mothers
+  missing_fathers <- ped$ID[which(is.na(ped$dadID) & !is.na(ped$momID))]
+  missing_mothers <- ped$ID[which(!is.na(ped$dadID) & is.na(ped$momID))]
+
+  # Update the validation_results list
+  if (length(missing_fathers) > 0) {
+    validation_results$missing_fathers <- missing_fathers
+  }
+  if (length(missing_mothers) > 0) {
+    validation_results$missing_mothers <- missing_mothers
+  }
+
+  # If no missing parents are found
+  if (length(validation_results) == 0) {
+    if (verbose) {
+      cat("No missing single parents found.\n")
+    }
+    validation_results$missing_parents <- FALSE
+  }
+  # If missing parents are found
+  else {
+    if (verbose) {
+      cat("Missing single parents found.\n")
+    }
+    validation_results$missing_parents <- TRUE
+  }
+
+  if (verbose) {
+    cat("Step 2: Determining the if moms are the same sex and dads are same sex\n")
+  }
+
+  # Determine the most frequent sex for moms and dads
+  most_frequent_sex_mom <- names(sort(table(ped$sex[ped$ID %in% ped$momID]), decreasing = TRUE))[1]
+  most_frequent_sex_dad <- names(sort(table(ped$sex[ped$ID %in% ped$dadID]), decreasing = TRUE))[1]
+
+  # are all moms/dads the same sex?
+  validation_results$mom_sex <- unique(ped$sex[ped$ID %in% ped$momID])
+  validation_results$dad_sex <- unique(ped$sex[ped$ID %in% ped$dadID])
+
+  # Store the most frequent sex for moms and dads
+  if (is.numeric(ped$sex)) {
+    validation_results$female_var <- as.numeric(most_frequent_sex_mom)
+    validation_results$male_var <- as.numeric(most_frequent_sex_dad)
+  } else if (is.character(ped$sex) | is.factor(ped$sex)) {
+    validation_results$female_var <- most_frequent_sex_mom
+    validation_results$male_var <- most_frequent_sex_dad
+  } else {
+    print("You should never see this. If you do, then you have a problem with the data type of the sex variable")
+  }
+
+  # verbose
+  if (length(validation_results$mom_sex) == 1) {
+    if (verbose) {
+      cat(paste0(
+        "All moms are '",
+        validation_results$female_var,
+        "'.\n"
+      ))
+    }
+    validation_results$female_moms <- TRUE
+  } else {
+    validation_results$female_moms <- FALSE
+  }
+
+  if (length(validation_results$dad_sex) == 1) {
+    if (verbose) {
+      cat(paste0(
+        "All dads are '",
+        validation_results$male_var,
+        "'.\n"
+      ))
+    }
+    validation_results$male_dads <- TRUE
+  } else {
+    validation_results$male_dads <- FALSE
+  }
+  # Check for inconsistent gender roles
+  wrong_sex_moms <- ped$ID[which(ped$sex[ped$ID %in% ped$momID] != validation_results$female_var)]
+  wrong_sex_dads <- ped$ID[which(ped$sex[ped$ID %in% ped$dadID] != validation_results$male_var)]
+
+
+
+  # Are any parents in both momID and dadID?
+  momdad <- intersect(ped$dadID, ped$momID)
+  if (length(momdad) > 0) {
+    validation_results$parents_in_both <- momdad
+  }
+
+
+  male_moms <- ped$ID[which(ped$dadID & !is.na(ped$momID))]
+
+  if (repair) {
+    if (verbose) {
+      cat("Validation Results:\n")
+      print(validation_results)
+      cat("Step 2: Attempting to repair missing parents...\n")
+    }
+    cat("REPAIR IN EARLY ALPHA\n")
+    # Initialize a list to track changes made during repair
+    changes <- list()
+
+    # [Insert logic to repair parent IDs here]
+
+    # Update the pedigree dataframe after repair
+    repaired_ped <- ped
+
+    if (verbose) {
+      cat("Changes Made:\n")
+      print(changes)
+    }
+    return(repaired_ped)
+  } else {
+    return(validation_results)
+  }
+}
+#' Repair Parent IDs
+#'
+#' This function repairs parent IDs in a pedigree.
+#' @param ped A pedigree object
+#' @param verbose A logical indicating whether to print progress messages
+#' @return A corrected pedigree
+repairParentIDs <- function(ped, verbose = FALSE) {
+  checkParentIDs(ped = ped, verbose = verbose, repair = TRUE)
+}
diff --git a/R/convertPedigree.R b/R/convertPedigree.R
@@ -9,6 +9,8 @@
 #' @param gc logical. If TRUE, do frequent garbage collection via \code{\link{gc}} to save memory
 #' @param flatten.diag logical. If TRUE, overwrite the diagonal of the final relatedness matrix with ones
 #' @param standardize.colnames logical. If TRUE, standardize the column names of the pedigree dataset
+#' @param tcross.alt.crossprod logical. If TRUE, use alternative method of using Crossprod function for computing the transpose
+#' @param tcross.alt.star logical. If TRUE, use alternative method of using \%\*\% for computing the transpose
 #' @param ... additional arguments to be passed to \code{\link{ped2com}}
 #' @details The algorithms and methodologies used in this function are further discussed and exemplified in the vignette titled "examplePedigreeFunctions".
 #' @export
@@ -20,6 +22,8 @@ ped2com <- function(ped, component,
                     gc = FALSE,
                     flatten.diag = FALSE,
                     standardize.colnames = TRUE,
+                    tcross.alt.crossprod = FALSE,
+                    tcross.alt.star = FALSE,
                     ...) {
   # Validate the 'component' argument and match it against predefined choices
   component <- match.arg(tolower(component),
@@ -169,7 +173,15 @@ ped2com <- function(ped, component,
   if (verbose) {
     cat("Doing tcrossprod\n")
   }
-  r <- Matrix::tcrossprod(r2)
+  if(tcross.alt.crossprod){
+    cat("Doing alt tcrossprod crossprod t \n")
+    r <-    crossprod(t(as.matrix(r2)))
+    }else if(tcross.alt.star){
+	  cat("Doing alt tcrossprod %*% t \n")
+     r <-       r2 %*% t(as.matrix(r2))
+  }else{
+     r <- Matrix::tcrossprod(r2)
+  }
   if (component == "generation") {
     return(gen)
   } else {
@@ -194,15 +206,19 @@ ped2com <- function(ped, component,
 
 #' @export
 #'
-ped2add <- function(ped, max.gen = Inf, sparse = FALSE, verbose = FALSE, gc = FALSE, flatten.diag = FALSE) {
+ped2add <- function(ped, max.gen = Inf, sparse = FALSE, verbose = FALSE, gc = FALSE, flatten.diag = FALSE, standardize.colnames = TRUE,
+                    tcross.alt.crossprod = FALSE, tcross.alt.star = FALSE) {
   ped2com(
     ped = ped,
     max.gen = max.gen,
     sparse = sparse,
     verbose = verbose,
     gc = gc,
     component = "additive",
-    flatten.diag = flatten.diag
+    flatten.diag = flatten.diag,
+    standardize.colnames = standardize.colnames,
+    tcross.alt.crossprod = tcross.alt.crossprod,
+    tcross.alt.star = tcross.alt.star
   )
 }
 
@@ -212,35 +228,38 @@ ped2add <- function(ped, max.gen = Inf, sparse = FALSE, verbose = FALSE, gc = FA
 #' @export
 #' @aliases ped2mt
 #'
-ped2mit <- ped2mt <- function(ped, max.gen = Inf, sparse = FALSE, verbose = FALSE, gc = FALSE, flatten.diag = FALSE) {
+ped2mit <- ped2mt <- function(ped, max.gen = Inf, sparse = FALSE, verbose = FALSE, gc = FALSE, flatten.diag = FALSE, standardize.colnames = TRUE, tcross.alt.crossprod = FALSE, tcross.alt.star = FALSE) {
   ped2com(
     ped = ped,
     max.gen = max.gen,
     sparse = sparse,
     verbose = verbose,
     gc = gc,
     component = "mitochondrial",
-    flatten.diag = flatten.diag
+    flatten.diag = flatten.diag,
+    standardize.colnames = standardize.colnames,
+    tcross.alt.crossprod = tcross.alt.crossprod,
+    tcross.alt.star = tcross.alt.star
   )
 }
 
-
-
-
 #' Take a pedigree and turn it into a common nuclear environmental relatedness matrix
 #' @inheritParams ped2com
 #' @details The algorithms and methodologies used in this function are further discussed and exemplified in the vignette titled "examplePedigreeFunctions".
 #' @export
 #'
-ped2cn <- function(ped, max.gen = Inf, sparse = FALSE, verbose = FALSE, gc = FALSE, flatten.diag = FALSE) {
+ped2cn <- function(ped, max.gen = Inf, sparse = FALSE, verbose = FALSE, gc = FALSE, flatten.diag = FALSE, standardize.colnames = TRUE, tcross.alt.crossprod = FALSE, tcross.alt.star = FALSE) {
   ped2com(
     ped = ped,
     max.gen = max.gen,
     sparse = sparse,
     verbose = verbose,
     gc = gc,
     component = "common nuclear",
-    flatten.diag = flatten.diag
+    flatten.diag = flatten.diag,
+    standardize.colnames = standardize.colnames,
+    tcross.alt.crossprod = tcross.alt.crossprod,
+    tcross.alt.star = tcross.alt.star
   )
 }
Original file line number	Diff line number	Diff line change
		@@ -0,0 +1,2 @@
		linters: linters_with_defaults(line_length_linter(120),commented_code_linter = NULL,object_name_linter = object_name_linter(styles = c("snake_case", "symbols"))) # see vignette("lintr")
		encoding: "UTF-8"