amices · stefvanbuuren · Sep 11, 2023 · Sep 11, 2023 · Sep 12, 2023 · Sep 13, 2023
diff --git a/DESCRIPTION b/DESCRIPTION
@@ -100,3 +100,4 @@ BugReports: https://github.com/amices/mice/issues
 LinkingTo: cpp11, Rcpp
 License: GPL (>= 2)
 RoxygenNote: 7.2.3
+Roxygen: list(markdown = TRUE)
diff --git a/NAMESPACE b/NAMESPACE
@@ -65,10 +65,12 @@ export(cc)
 export(cci)
 export(complete)
 export(construct.blocks)
+export(construct.parcel)
 export(convergence)
 export(densityplot)
 export(estimice)
 export(extractBS)
+export(f2p)
 export(fico)
 export(filter)
 export(fix.coef)
@@ -90,8 +92,10 @@ export(is.mitml.result)
 export(lm.mids)
 export(make.blocks)
 export(make.blots)
+export(make.dots)
 export(make.formulas)
 export(make.method)
+export(make.parcel)
 export(make.post)
 export(make.predictorMatrix)
 export(make.visitSequence)
@@ -148,6 +152,7 @@ export(nelsonaalen)
 export(nic)
 export(nimp)
 export(norm.draw)
+export(p2f)
 export(parlmice)
 export(pool)
 export(pool.compare)
@@ -158,6 +163,7 @@ export(pool.syn)
 export(pool.table)
 export(quickpred)
 export(rbind)
+export(remove.rhs.variables)
 export(squeeze)
 export(stripplot)
 export(supports.transparent)
@@ -256,6 +262,7 @@ importFrom(stats,spline)
 importFrom(stats,summary.glm)
 importFrom(stats,terms)
 importFrom(stats,update)
+importFrom(stats,update.formula)
 importFrom(stats,var)
 importFrom(stats,vcov)
 importFrom(tidyr,complete)

diff --git a/NEWS.md b/NEWS.md
@@ -1,3 +1,33 @@
+## New behaviours
+
+1. Prevention of `NA` propagation by removing incomplete predictors. This version detects when a predictor contains missing values that are not imputed. To prevent `NA` propagation, `mice()` takes the following actions: 1) removes incomplete predictor(s) from the RHS, 2) adds incomplete predictor(s) to formulas `(var ~ 1)` and block components, sets `method[var] = ""`, and sets the `predictorMatrix` column and row to zero.
+
+2. The `predictorMatrix` input can be a square submatrix of the full `predictorMatrix`. `mice()` will augment `predictorMatrix` to the full matrix and always return a p * p named matrix corresponding to the p columns in the data. The inactive variables will have zero columns and rows.
+
+3. The `predictorMatrix` input may be unnamed if its size is p * p. For any other size, an unnamed matrix generates an error.
+
+
+## Changes 
+
+- Performs stricter checks on zero rows in predictorMatrix under empty imputation method
+- Adds support for a tiny `predictorMatrix`
+- Solves bug in f2p()
+- Adds new function `remove.rhs.variables()`
+- Adds a `validate.mids()` check at exit that errors if `rownames(predictorMatrix)` differ from `colnames(data)`. Some more output tests need to be added.
+- Removes code designed to work specifically with a non-square `predictorMatrix`
+- Generates an error if `predictorMatrix` has fewer rows than length of `blocks`
+
+## New exit checks
+
+- `rownames(predictorMatrix)` must match `colnames(data)`
+- length of `formulas` and `blocks` must be equal
+- length of `formulas` and `method` must be equal
+- length of `blots` and `method` must be equal
+- length of `method` vector cannot exceed number of variables
+- length of `imp` and number of variables must be equal
+
+## Other fixes
+
 * Prepares for the deprecation of the `blocks` argument at various places
 * Removes the need for `blocks` in `initialize_chain()`
 * In `rbind()`, when formulas are concatenated and duplicate names are found, also rename the duplicated variables in formulas by their new name

diff --git a/R/D1.R b/R/D1.R
@@ -2,25 +2,25 @@
 #'
 #' The D1-statistics is the multivariate Wald test.
 #'
-#' @param fit1 An object of class \code{mira}, produced by \code{with()}.
-#' @param fit0 An object of class \code{mira}, produced by \code{with()}. The
-#' model in \code{fit0} is a nested within \code{fit1}. The default null
-#' model \code{fit0 = NULL} compares \code{fit1} to the intercept-only model.
+#' @param fit1 An object of class `mira`, produced by `with()`.
+#' @param fit0 An object of class `mira`, produced by `with()`. The
+#' model in `fit0` is nested within `fit1`. The default null
+#' model `fit0 = NULL` compares `fit1` to the intercept-only model.
 #' @param dfcom A single number denoting the
-#' complete-data degrees of freedom of model \code{fit1}. If not specified,
-#' it is set equal to \code{df.residual} of model \code{fit1}. If that cannot
+#' complete-data degrees of freedom of model `fit1`. If not specified,
+#' it is set equal to `df.residual` of model `fit1`. If that cannot
 #' be done, the procedure assumes (perhaps incorrectly) a large sample.
 #' @param df.com Deprecated
 #' @note Warning: `D1()` assumes that the order of the variables is the
 #' same in different models. See
-#' \url{https://github.com/amices/mice/issues/420} for details.
+#' <https://github.com/amices/mice/issues/420> for details.
 #' @references
 #' Li, K. H., T. E. Raghunathan, and D. B. Rubin. 1991.
 #' Large-Sample Significance Levels from Multiply Imputed Data Using
 #' Moment-Based Statistics and an F Reference Distribution.
-#' \emph{Journal of the American Statistical Association}, 86(416): 1065–73.
+#' *Journal of the American Statistical Association*, 86(416): 1065–73.
 #'
-#' \url{https://stefvanbuuren.name/fimd/sec-multiparameter.html#sec:wald}
+#' <https://stefvanbuuren.name/fimd/sec-multiparameter.html#sec:wald>
 #' @examples
 #' # Compare two linear models:
 #' imp <- mice(nhanes2, seed = 51009, print = FALSE)
@@ -34,7 +34,7 @@
 #' fit0 <- with(imp, glm(gen > levels(gen)[1] ~ hgt + hc, family = binomial))
 #' D1(fit1, fit0)
 #' }
-#' @seealso \code{\link[mitml]{testModels}}
+#' @seealso [mitml::testModels()]
 #' @export
 D1 <- function(fit1, fit0 = NULL, dfcom = NULL, df.com = NULL) {
   install.on.demand("mitml")

diff --git a/R/D2.R b/R/D2.R
@@ -7,13 +7,13 @@
 #' @inheritParams mitml::testModels
 #' @note Warning: `D2()` assumes that the order of the variables is the
 #' same in different models. See
-#' \url{https://github.com/amices/mice/issues/420} for details.
+#' <https://github.com/amices/mice/issues/420> for details.
 #' @references
 #' Li, K. H., X. L. Meng, T. E. Raghunathan, and D. B. Rubin. 1991.
 #' Significance Levels from Repeated p-Values with Multiply-Imputed Data.
-#' \emph{Statistica Sinica} 1 (1): 65–92.
+#' *Statistica Sinica* 1 (1): 65–92.
 #'
-#' \url{https://stefvanbuuren.name/fimd/sec-multiparameter.html#sec:chi}
+#' <https://stefvanbuuren.name/fimd/sec-multiparameter.html#sec:chi>
 #' @examples
 #' # Compare two linear models:
 #' imp <- mice(nhanes2, seed = 51009, print = FALSE)
@@ -27,7 +27,7 @@
 #' fit0 <- with(imp, glm(gen > levels(gen)[1] ~ hgt + hc, family = binomial))
 #' D2(fit1, fit0)
 #' }
-#' @seealso \code{\link[mitml]{testModels}}
+#' @seealso [mitml::testModels()]
 #' @export
 D2 <- function(fit1, fit0 = NULL, use = "wald") {
   install.on.demand("mitml")

diff --git a/R/D3.R b/R/D3.R
@@ -3,34 +3,34 @@
 #' The D3-statistic is a likelihood-ratio test statistic.
 #'
 #' @details
-#' The \code{D3()} function implement the LR-method by
+#' The `D3()` function implements the LR-method by
 #' Meng and Rubin (1992). The implementation of the method relies
-#' on the \code{broom} package, the standard \code{update} mechanism
-#' for statistical models in \code{R} and the \code{offset} function.
+#' on the `broom` package, the standard `update` mechanism
+#' for statistical models in `R` and the `offset` function.
 #'
-#' The function calculates \code{m} repetitions of the full
+#' The function calculates `m` repetitions of the full
 #' (or null) models, calculates the mean of the estimates of the
 #' (fixed) parameter coefficients \eqn{\beta}. For each imputed
 #' imputed dataset, it calculates the likelihood for the model with
 #' the parameters constrained to \eqn{\beta}.
 #'
-#' The \code{mitml::testModels()} function offers similar functionality
-#' for a subset of statistical models. Results of \code{mice::D3()} and
-#' \code{mitml::testModels()} differ in multilevel models because the
-#' \code{testModels()} also constrains the variance components parameters.
+#' The `mitml::testModels()` function offers similar functionality
+#' for a subset of statistical models. Results of `mice::D3()` and
+#' `mitml::testModels()` differ in multilevel models because the
+#' `testModels()` also constrains the variance components parameters.
 #' For more details on
 #'
-#' @seealso \code{\link{fix.coef}}
+#' @seealso [fix.coef()]
 #' @inheritParams D1
-#' @return An object of class \code{mice.anova}
+#' @return An object of class `mice.anova`
 #' @references
 #' Meng, X. L., and D. B. Rubin. 1992.
 #' Performing Likelihood Ratio Tests with Multiply-Imputed Data Sets.
-#' \emph{Biometrika}, 79 (1): 103–11.
+#' *Biometrika*, 79 (1): 103–11.
 #'
-#' \url{https://stefvanbuuren.name/fimd/sec-multiparameter.html#sec:likelihoodratio}
+#' <https://stefvanbuuren.name/fimd/sec-multiparameter.html#sec:likelihoodratio>
 #'
-#' \url{http://bbolker.github.io/mixedmodels-misc/glmmFAQ.html#setting-residual-variances-to-a-fixed-value-zero-or-other}
+#' <http://bbolker.github.io/mixedmodels-misc/glmmFAQ.html#setting-residual-variances-to-a-fixed-value-zero-or-other>
 #' @examples
 #' # Compare two linear models:
 #' imp <- mice(nhanes2, seed = 51009, print = FALSE)