easystats
diff --git a/‎DESCRIPTION
Lines changed: 2 additions & 1 deletion b/‎DESCRIPTION
Lines changed: 2 additions & 1 deletion
diff --git a/‎NAMESPACE
Lines changed: 1 addition & 0 deletions b/‎NAMESPACE
Lines changed: 1 addition & 0 deletions
diff --git a/‎NEWS.md
Lines changed: 9 additions & 0 deletions b/‎NEWS.md
Lines changed: 9 additions & 0 deletions
diff --git a/‎R/factor_analysis.R
Lines changed: 53 additions & 2 deletions b/‎R/factor_analysis.R
Lines changed: 53 additions & 2 deletions
diff --git a/‎R/principal_components.R
Lines changed: 41 additions & 24 deletions b/‎R/principal_components.R
Lines changed: 41 additions & 24 deletions
diff --git a/‎R/utils_pca_efa.R
Lines changed: 18 additions & 13 deletions b/‎R/utils_pca_efa.R
Lines changed: 18 additions & 13 deletions
diff --git a/‎man/get_scores.Rd
Lines changed: 14 additions & 9 deletions b/‎man/get_scores.Rd
Lines changed: 14 additions & 9 deletions
@@ -110,6 +110,7 @@ Suggests:
     cluster,
     cobalt,
     coda,
+    correlation,
     coxme,
     cplm,
     curl,
@@ -228,4 +229,4 @@ Config/testthat/parallel: true
 Config/Needs/website: easystats/easystatstemplate
 Config/Needs/check: stan-dev/cmdstanr
 Config/rcmdcheck/ignore-inconsequential-notes: true
-Remotes: easystats/insight, easystats/bayestestR
+Remotes: easystats/insight, easystats/bayestestR, easystats/correlation
@@ -151,6 +151,7 @@ S3method(equivalence_test,rma)
 S3method(equivalence_test,wbm)
 S3method(equivalence_test,zeroinfl)
 S3method(factor_analysis,data.frame)
+S3method(factor_analysis,matrix)
 S3method(factor_scores,fa)
 S3method(factor_scores,omega)
 S3method(factor_scores,parameters_efa)
 
@@ -4,13 +4,22 @@
 
 * The `standardize` argument in `factor_analysis()` now defaults to `FALSE`.
 
+* The `rotation` argument in `factor_analysis()` now defaults to `"oblimin"`,
+  because the former default of `"none"` rarely makes sense in the context of
+  factor analysis. If you want to use no rotation, please set `rotation =
+  "none"`.
+
 * The `cor` argument in `n_factors()` was renamed to `correlation_matrix`. In
   `factor_analysis()`, the `cor` argument was removed entirely to avoid a naming
   collision with the `cor` argument of `psych::fa()`. Users can now pass `cor`
   through to `psych::fa()` when calling `factor_analysis()`.
 
 ## Changes
 
+* `factor_analysis()` gets a `.matrix` method, including the argument `n_obs`
+  (either a single number of observations or a matrix of pairwise sample
+  sizes), to compute a factor analysis for a correlation or covariance matrix.
+
 * New function `factor_scores()` to extract factor scores from EFA (`psych::fa()`
   or `factor_analysis()`).
 
 
@@ -9,7 +9,8 @@ factor_analysis <- function(x, ...) {
 #' @export
 factor_analysis.data.frame <- function(x,
                                        n = "auto",
-                                       rotation = "none",
+                                       rotation = "oblimin",
+                                       factor_method = "minres",
                                        sort = FALSE,
                                        threshold = NULL,
                                        standardize = FALSE,
@@ -31,7 +32,7 @@ factor_analysis.data.frame <- function(x,
 
   # FA
   out <- model_parameters(
-    psych::fa(x, nfactors = n, rotate = rotation, ...),
+    psych::fa(x, nfactors = n, rotate = rotation, fm = factor_method, ...),
     threshold = threshold,
     sort = sort,
     ...
@@ -42,6 +43,56 @@ factor_analysis.data.frame <- function(x,
 }
 
 
+#' @rdname principal_components
+#' @export
+factor_analysis.matrix <- function(x,
+                                   n = "auto",
+                                   rotation = "oblimin",
+                                   factor_method = "minres",
+                                   n_obs = NULL,
+                                   sort = FALSE,
+                                   threshold = NULL,
+                                   standardize = FALSE,
+                                   ...) {
+  # A square input is taken to be a correlation matrix. Without the number
+  # of observations we refuse to continue and tell the user what to supply.
+  if (is.null(n_obs) && nrow(x) == ncol(x)) {
+    insight::format_error(
+      "You provided a square matrix, which is assumed to be a correlation matrix. Please specify the number of observations with `n_obs`. If your matrix is not a correlation matrix, please provide a data frame instead."
+    )
+  }
+
+  # `n_obs` may be a single number or a matrix of pairwise sample sizes.
+  # The scalar goes to `n.obs`, the matrix goes to `np.obs`. Whenever no
+  # scalar is available, `n.obs` is set to `NA` (the default of that
+  # argument in `psych::fa()`) instead of our own `NULL` default, to avoid
+  # errors.
+  pairwise_n <- NULL
+  if (is.matrix(n_obs)) {
+    # the matrix of sample sizes has to line up cell by cell with `x`
+    if (nrow(n_obs) != nrow(x) || ncol(n_obs) != ncol(x)) {
+      insight::format_error(
+        "The provided `n_obs` matrix must have the same dimensions as the input matrix."
+      )
+    }
+    pairwise_n <- n_obs
+    n_obs <- NA
+  } else if (is.null(n_obs)) {
+    n_obs <- NA
+  }
+
+  # the data frame method does the actual work; sample size information is
+  # forwarded under the argument names `n.obs` and `np.obs`
+  factor_analysis.data.frame(
+    x,
+    n = n,
+    rotation = rotation,
+    factor_method = factor_method,
+    sort = sort,
+    threshold = threshold,
+    standardize = standardize,
+    n.obs = n_obs,
+    np.obs = pairwise_n,
+    ...
+  )
+}
+
+
 # Checks whether `rotation` names one of the oblique rotations. The comparison
 # is case-insensitive, so both sides are lower-cased: the candidate list
 # contains mixed-case names ("bentlerQ", "geominQ") that a lower-cased input
 # could otherwise never match.
 #
 # @param rotation Rotation name (character string) or `NULL`.
 # @return `TRUE` if `rotation` is one of the listed oblique rotations,
 #   `FALSE` otherwise (including for `NULL`).
 .is_oblique_rotation <- function(rotation) {
   oblique_rotations <- c(
     "promax", "oblimin", "simplimax", "bentlerQ", "geominQ", "biquartimin",
     "cluster"
   )
   !is.null(rotation) && tolower(rotation) %in% tolower(oblique_rotations)
 }
@@ -1,12 +1,12 @@
 #' Principal Component Analysis (PCA) and Factor Analysis (FA)
 #'
-#' The functions `principal_components()` and `factor_analysis()` can
-#' be used to perform a principal component analysis (PCA) or a factor analysis
-#' (FA). They return the loadings as a data frame, and various methods and
-#' functions are available to access / display other information (see the
-#' Details section).
+#' The functions `principal_components()` and `factor_analysis()` can be used to
+#' perform a principal component analysis (PCA) or a factor analysis (FA). They
+#' return the loadings as a data frame, and various methods and functions are
+#' available to access / display other information (see the 'Details' section).
 #'
-#' @param x A data frame or a statistical model.
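+#' @param x A data frame or a statistical model. For `factor_analysis()`, can
+#'   also be a matrix (e.g. a correlation matrix, see `n_obs`). For
+#'   `closest_component()` and `rotated_data()`, the output of the
+#'   `principal_components()` function.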
 #' @param n Number of components to extract. If `n="all"`, then `n` is set as
 #'   the number of variables minus 1 (`ncol(x)-1`). If `n="auto"` (default) or
 #'   `n=NULL`, the number of components is selected through [`n_factors()`]
@@ -19,12 +19,29 @@
 #' @param rotation If not `"none"`, the PCA / FA will be computed using the
 #'   **psych** package. Possible options include `"varimax"`, `"quartimax"`,
 #'   `"promax"`, `"oblimin"`, `"simplimax"`, or `"cluster"` (and more). See
-#'   [`psych::fa()`] for details.
+#'   [`psych::fa()`] for details. The default is `"none"` for PCA, and
+#'   `"oblimin"` for FA.
+#' @param factor_method The factoring method to be used. Passed to the `fm`
+#'   argument in `psych::fa()`. Defaults to `"minres"` (minimum residual). Other
+#'   options include `"uls"`, `"ols"`, `"wls"`, `"gls"`, `"ml"`, `"minchi"`,
+#'   `"minrank"`, `"old.min"`, and `"alpha"`. See `?psych::fa` for details.
 #' @param sparse Whether to compute sparse PCA (SPCA, using [`sparsepca::spca()`]).
 #'   SPCA attempts to find sparse loadings (with few nonzero values), which improves
 #'   interpretability and avoids overfitting. Can be `TRUE` or `"robust"` (see
 #'   [`sparsepca::robspca()`]).
 #' @param sort Sort the loadings.
+#' @param n_obs An integer or a matrix.
+#'   - **Integer:** Number of observations in the original data set if `x` is a
+#'     correlation matrix. Required to compute correct fit indices.
+#'   - **Matrix:** A matrix where each cell `[i, j]` specifies the number of
+#'     pairwise complete observations used to compute the correlation between
+#'     variable `i` and variable `j` in the input `x`. It is crucial when `x` is
+#'     a correlation matrix (rather than raw data), especially if that matrix
+#'     was derived from a dataset containing missing values using pairwise
+#'     deletion. Providing a matrix allows `psych::fa()` to accurately calculate
+#'     statistical measures, such as chi-square fit statistics, by accounting
+#'     for the varying sample sizes that contribute to each individual
+#'     correlation coefficient.
 #' @param threshold A value between 0 and 1 indicates which (absolute) values
 #'   from the loadings should be removed. An integer higher than 1 indicates the
 #'   n strongest loadings to retain. Can also be `"max"`, in which case it will
@@ -46,7 +63,6 @@
 #'   with missing values from the original data, hence the number of rows of
 #'   predicted data and original data is equal.
 #' @param ... Arguments passed to or from other methods.
-#' @param pca_results The output of the `principal_components()` function.
 #' @param digits Argument for `print()`, indicates the number of digits
 #'   (rounding) to be used.
 #' @param labels Argument for `print()`, character vector of same length as
@@ -83,7 +99,7 @@
 #'   values, so it matches the original data frame.
 #'
 #' - `performance::item_omega()` is a convenient wrapper around `psych::omega()`,
-#'   which provides some additioal methods to work seamleassly within the
+#'   which provides some additional methods to work seamlessly within the
 #'   *easystats* framework.
 #'
 #' - [`performance::check_normality()`] checks residuals from objects returned
@@ -134,14 +150,15 @@
 #'
 #' ## Computing Item Scores
 #' Use [`get_scores()`] to compute scores for the "subscales" represented by the
-#' extracted principal components. `get_scores()` takes the results from
-#' `principal_components()` and extracts the variables for each component found
-#' by the PCA. Then, for each of these "subscales", raw means are calculated
-#' (which equals adding up the single items and dividing by the number of items).
-#' This results in a sum score for each component from the PCA, which is on the
-#' same scale as the original, single items that were used to compute the PCA.
-#' One can also use `predict()` to back-predict scores for each component,
-#' to which one can provide `newdata` or a vector of `names` for the components.
+#' extracted principal components or factors. `get_scores()` takes the results
+#' from `principal_components()` or `factor_analysis()` and extracts the
+#' variables for each component found by the PCA. Then, for each of these
+#' "subscales", row means are calculated (which equals adding up the single
+#' items and dividing by the number of items). This results in a sum score for
+#' each component from the PCA, which is on the same scale as the original,
+#' single items that were used to compute the PCA. One can also use `predict()`
+#' to back-predict scores for each component, to which one can provide `newdata`
+#' or a vector of `names` for the components.
 #'
 #' ## Explained Variance and Eigenvalues
 #' Use `summary()` to get the Eigenvalues and the explained variance for each
@@ -213,9 +230,9 @@
 #'
 #' # Factor Analysis (FA) ------------------------
 #'
-#' factor_analysis(mtcars[, 1:7], n = "all", threshold = 0.2)
-#' factor_analysis(mtcars[, 1:7], n = 2, rotation = "oblimin", threshold = "max", sort = TRUE)
-#' factor_analysis(mtcars[, 1:7], n = 2, threshold = 2, sort = TRUE)
+#' factor_analysis(mtcars[, 1:7], n = "all", threshold = 0.2, rotation = "Promax")
+#' factor_analysis(mtcars[, 1:7], n = 2, threshold = "max", sort = TRUE)
+#' factor_analysis(mtcars[, 1:7], n = 2, rotation = "none", threshold = 2, sort = TRUE)
 #'
 #' efa <- factor_analysis(mtcars[, 1:5], n = 2)
 #' summary(efa)
@@ -234,9 +251,9 @@ principal_components <- function(x, ...) {
 
 #' @rdname principal_components
 #' @export
-rotated_data <- function(pca_results, verbose = TRUE) {
-  original_data <- attributes(pca_results)$dataset
-  rotated_matrix <- insight::get_predicted(attributes(pca_results)$model)
+rotated_data <- function(x, verbose = TRUE) {
+  original_data <- attributes(x)$dataset
+  rotated_matrix <- insight::get_predicted(attributes(x)$model)
   out <- NULL
 
   if (is.null(original_data) || is.null(rotated_matrix)) {
@@ -246,7 +263,7 @@ rotated_data <- function(pca_results, verbose = TRUE) {
     return(NULL)
   }
 
-  compl_cases <- attributes(pca_results)$complete_cases
+  compl_cases <- attributes(x)$complete_cases
   if (is.null(compl_cases) && nrow(original_data) != nrow(rotated_matrix)) {
     if (verbose) {
       insight::format_warning("Could not retrieve information about missing data.")
 
@@ -1,10 +1,12 @@
-#' Get Scores from Principal Component Analysis (PCA)
+#' Get Scores from Principal Component or Factor Analysis (PCA/FA)
 #'
 #' `get_scores()` takes `n_items` amount of items that load the most
 #' (either by loading cutoff or number) on a component, and then computes their
-#' average.
+#' average. This results in a sum score for each component from the PCA/FA,
+#' which is on the same scale as the original, single items that were used to
+#' compute the PCA/FA.
 #'
-#' @param x An object returned by [principal_components()].
+#' @param x An object returned by [principal_components()] or [factor_analysis()].
 #' @param n_items Number of required (i.e. non-missing) items to build the sum
 #' score for an observation. If an observation has more missing values than
 #' `n_items` in all items of a (sub) scale, `NA` is returned for that
@@ -19,15 +21,18 @@
 #' @details
 #' `get_scores()` takes the results from [`principal_components()`] or
 #' [`factor_analysis()`] and extracts the variables for each component found by
-#' the PCA. Then, for each of these "subscales", row means are calculated (which
-#' equals adding up the single items and dividing by the number of items). This
-#' results in a sum score for each component from the PCA, which is on the same
-#' scale as the original, single items that were used to compute the PCA.
+#' the PCA/FA. Then, for each of these "subscales", row means are calculated
+#' (which equals adding up the single items and dividing by the number of
+#' items). This results in a sum score for each component from the PCA/FA, which
+#' is on the same scale as the original, single items that were used to compute
+#' the PCA/FA.
 #'
 #' @return A data frame with subscales, which are average sum scores for all
-#'   items from each component.
+#' items from each component or factor.
 #'
-#' @seealso [`principal_components()`]
+#' @seealso Functions to carry out a PCA ([`principal_components()`]) or
+#' a FA ([`factor_analysis()`]). [`factor_scores()`] extracts factor scores
+#' from an FA object.
 #'
 #' @examplesIf insight::check_if_installed("psych", quietly = TRUE)
 #' pca <- principal_components(mtcars[, 1:7], n = 2, rotation = "varimax")
@@ -596,11 +601,11 @@ sort.parameters_pca <- sort.parameters_efa
 
 #' @rdname principal_components
 #' @export
-closest_component <- function(pca_results) {
-  if ("closest_component" %in% names(attributes(pca_results))) {
-    attributes(pca_results)$closest_component
+closest_component <- function(x) {
+  if ("closest_component" %in% names(attributes(x))) {
+    attributes(x)$closest_component
   } else {
-    .closest_component(pca_results)
+    .closest_component(x)
   }
 }