From 4eab9b868d962639420b0509b8226b80a1b64f9d Mon Sep 17 00:00:00 2001 From: leifeld Date: Mon, 19 Aug 2024 21:55:23 +0200 Subject: [PATCH 01/11] Updated GitHub actions --- ...ild-and-check.yml => build-check-test.yml} | 180 +++++------------- 1 file changed, 45 insertions(+), 135 deletions(-) rename .github/workflows/{build-and-check.yml => build-check-test.yml} (52%) diff --git a/.github/workflows/build-and-check.yml b/.github/workflows/build-check-test.yml similarity index 52% rename from .github/workflows/build-and-check.yml rename to .github/workflows/build-check-test.yml index 4caf6570..fee3c9e8 100644 --- a/.github/workflows/build-and-check.yml +++ b/.github/workflows/build-check-test.yml @@ -1,102 +1,19 @@ -name: build +name: build-check-test on: [push, pull_request, workflow_dispatch] jobs: - install-system-dependencies: - runs-on: ubuntu-latest - steps: - - uses: actions/checkout@v3 - - - name: Restore System Dependencies Cache - uses: actions/cache@v3 - id: system-deps-cache - with: - path: | - /usr/local/texlive - /usr/local/bin/pandoc - /usr/local/texlive/texmf-var - /usr/local/texlive/tlpkg/texlive.tlpdb - key: ${{ runner.os }}-system-deps-v1 - - - name: Install System Dependencies - if: steps.system-deps-cache.outputs.cache-hit != 'true' - run: | - sudo apt-get update - sudo apt-get install -y texlive-latex-base texlive-latex-recommended texlive-latex-extra texlive-fonts-recommended texlive-bibtex-extra - - install-r-dependencies: - runs-on: ${{ matrix.config.os }} - name: ${{ matrix.config.os }} (${{ matrix.config.r }}) - strategy: - fail-fast: false - matrix: - config: - - {os: macOS-latest, r: 'release'} - - {os: windows-latest, r: 'release'} - - {os: ubuntu-latest, r: 'devel', http-user-agent: 'release'} - - {os: ubuntu-latest, r: 'release'} - - {os: ubuntu-latest, r: 'oldrel-1'} - env: - GITHUB_PAT: ${{ secrets.GITHUB_TOKEN }} - R_KEEP_PKG_SOURCE: yes - steps: - - uses: actions/checkout@v3 - - uses: actions/cache@v3 - id: r-packages-cache - 
with: - path: | - ~/.cache/R - /usr/local/texlive - /usr/local/bin/pandoc - /usr/local/texlive/texmf-var - key: ${{ runner.os }}-r-${{ hashFiles('**/DESCRIPTION') }}-v1 - - - uses: r-lib/actions/setup-r@v2 - - - uses: r-lib/actions/setup-r-dependencies@v2 - with: - cache-version: 2 - working-directory: rDNA/rDNA - extra-packages: | - any::devtools - any::testthat - any::roxygen2 - any::ggplot2 - any::roxygen2 - any::igraph - any::ggraph - any::askpass - any::cluster - any::sna - any::ggrepel - any::coda - any::MCMCpack - any::tidygraph - any::heatmaply - any::factoextra - any::MASS - any::pbmcapply - Bibliography: - needs: install-system-dependencies runs-on: ubuntu-latest steps: - uses: actions/checkout@v3 - uses: r-lib/actions/setup-tinytex@v2 - - uses: gradle/wrapper-validation-action@v1 - - name: Restore System Dependencies - uses: actions/cache@v3 - with: - path: | - /usr/local/texlive - /usr/local/bin/pandoc - /usr/local/texlive/texmf-var - /usr/local/texlive/tlpkg/texlive.tlpdb - key: ${{ runner.os }}-system-deps-v1 - - name: Restore pandoc - uses: actions/cache@v3 + - name: Install LaTeX packages + run: tlmgr install urlbst + + - uses: gradle/wrapper-validation-action@v1 + - uses: actions/cache@v3 id: pandoc with: path: pandoc-2.19.2-1 @@ -117,8 +34,10 @@ jobs: - name: Setup Gradle uses: gradle/gradle-build-action@v2.4.2 + - name: Execute Gradle build for bibliography - run: ./gradlew :bibliography:build --info --stacktrace + run: ./gradlew :bibliography:build + - name: Store artifacts uses: actions/upload-artifact@v3 with: @@ -148,31 +67,22 @@ jobs: name: DNA path: build/*.jar + rDNA: - needs: [DNA, install-system-dependencies, install-r-dependencies] runs-on: ubuntu-latest steps: - uses: actions/checkout@v3 + - uses: r-lib/actions/setup-r@v2 - - name: Restore System Dependencies - uses: actions/cache@v3 - with: - path: | - /usr/local/texlive - /usr/local/bin/pandoc - /usr/local/texlive/texmf-var - /usr/local/texlive/tlpkg/texlive.tlpdb - key: ${{ 
runner.os }}-system-deps-v1 - - name: Restore R Packages - uses: actions/cache@v3 - with: - path: ~/.cache/R - key: ${{ runner.os }}-r-${{ hashFiles('**/DESCRIPTION') }}-v1 + - uses: gradle/wrapper-validation-action@v1 + - name: Setup Gradle uses: gradle/gradle-build-action@v2.4.2 + - name: Execute Gradle build for rDNA run: ./gradlew :rDNA:build + - name: Store artifacts uses: actions/upload-artifact@v3 with: @@ -181,8 +91,9 @@ jobs: rDNA-check: runs-on: ${{ matrix.config.os }} - needs: [DNA, install-system-dependencies, install-r-dependencies] + name: ${{ matrix.config.os }} (${{ matrix.config.r }}) + strategy: fail-fast: false matrix: @@ -192,40 +103,26 @@ jobs: - {os: ubuntu-latest, r: 'devel', http-user-agent: 'release'} - {os: ubuntu-latest, r: 'release'} - {os: ubuntu-latest, r: 'oldrel-1'} + env: GITHUB_PAT: ${{ secrets.GITHUB_TOKEN }} R_KEEP_PKG_SOURCE: yes + steps: - uses: actions/checkout@v3 + - uses: r-lib/actions/setup-r@v2 with: r-version: ${{ matrix.config.r }} http-user-agent: ${{ matrix.config.http-user-agent }} use-public-rspm: true - - name: Restore System Dependencies - uses: actions/cache@v3 - with: - path: | - /usr/local/texlive - /usr/local/bin/pandoc - /usr/local/texlive/texmf-var - /usr/local/texlive/tlpkg/texlive.tlpdb - key: ${{ runner.os }}-system-deps-v1 - - name: Restore R Packages - uses: actions/cache@v3 - with: - path: ~/.cache/R - key: ${{ runner.os }}-r-${{ hashFiles('**/DESCRIPTION') }}-v1 - - uses: gradle/wrapper-validation-action@v1 - - name: Setup Gradle - uses: gradle/gradle-build-action@v2.4.2 - - name: Execute Gradle build for rDNA - run: ./gradlew :rDNA:build + - uses: r-lib/actions/setup-r-dependencies@v2 with: extra-packages: any::rcmdcheck needs: check working-directory: rDNA/rDNA + - uses: r-lib/actions/check-r-package@v2 with: working-directory: rDNA/rDNA @@ -233,24 +130,37 @@ jobs: rDNA-test: runs-on: ubuntu-latest - needs: [DNA, install-system-dependencies, install-r-dependencies] steps: - uses: actions/checkout@v3 
- uses: r-lib/actions/setup-r@v2 - - name: Restore System Dependencies - uses: actions/cache@v3 - with: - path: | - /usr/local/texlive - /usr/local/bin/pandoc - /usr/local/texlive/texmf-var - /usr/local/texlive/tlpkg/texlive.tlpdb - key: ${{ runner.os }}-system-deps-v1 + - name: Restore R Packages uses: actions/cache@v3 with: path: ~/.cache/R key: ${{ runner.os }}-r-${{ hashFiles('**/DESCRIPTION') }}-v1 + + - uses: r-lib/actions/setup-r-dependencies@v2 + with: + cache-version: 2 + working-directory: rDNA/rDNA + extra-packages: | + any::ggplot2 + any::roxygen2 + any::igraph + any::ggraph + any::askpass + any::cluster + any::sna + any::ggrepel + any::coda + any::MCMCpack + any::tidygraph + any::heatmaply + any::factoextra + any::MASS + any::pbmcapply + - uses: gradle/wrapper-validation-action@v1 - name: Setup Gradle uses: gradle/gradle-build-action@v2.4.2 From d78a4ec7e969b4a37f2fadf1a6a3cda8e2cd20dd Mon Sep 17 00:00:00 2001 From: leifeld Date: Mon, 19 Aug 2024 22:07:59 +0200 Subject: [PATCH 02/11] Updated GitHub actions --- .github/workflows/build-check-test.yml | 26 +++++++++++++++++++++++--- 1 file changed, 23 insertions(+), 3 deletions(-) diff --git a/.github/workflows/build-check-test.yml b/.github/workflows/build-check-test.yml index fee3c9e8..1a0c9f4f 100644 --- a/.github/workflows/build-check-test.yml +++ b/.github/workflows/build-check-test.yml @@ -75,6 +75,19 @@ jobs: - uses: r-lib/actions/setup-r@v2 + - name: Restore R Packages + uses: actions/cache@v3 + with: + path: ~/.cache/R + key: ${{ runner.os }}-r-${{ hashFiles('**/DESCRIPTION') }}-v1 + + - uses: r-lib/actions/setup-r-dependencies@v2 + with: + cache-version: 2 + working-directory: rDNA/rDNA + extra-packages: | + any::roxygen2 + - uses: gradle/wrapper-validation-action@v1 - name: Setup Gradle @@ -117,11 +130,18 @@ jobs: http-user-agent: ${{ matrix.config.http-user-agent }} use-public-rspm: true + - name: Restore R Packages + uses: actions/cache@v3 + with: + path: ~/.cache/R + key: ${{ runner.os 
}}-r-${{ hashFiles('**/DESCRIPTION') }}-v1 + - uses: r-lib/actions/setup-r-dependencies@v2 with: - extra-packages: any::rcmdcheck - needs: check + cache-version: 2 working-directory: rDNA/rDNA + extra-packages: | + any::rcmdcheck - uses: r-lib/actions/check-r-package@v2 with: @@ -145,8 +165,8 @@ jobs: cache-version: 2 working-directory: rDNA/rDNA extra-packages: | + any::covr any::ggplot2 - any::roxygen2 any::igraph any::ggraph any::askpass From 2d274adfb1048d8ca14cd6c713c049dc28067b55 Mon Sep 17 00:00:00 2001 From: leifeld Date: Mon, 19 Aug 2024 22:26:45 +0200 Subject: [PATCH 03/11] Updated GitHub actions --- .github/workflows/build-check-test.yml | 21 +++++++++++++++++---- 1 file changed, 17 insertions(+), 4 deletions(-) diff --git a/.github/workflows/build-check-test.yml b/.github/workflows/build-check-test.yml index 1a0c9f4f..4e07254a 100644 --- a/.github/workflows/build-check-test.yml +++ b/.github/workflows/build-check-test.yml @@ -79,20 +79,26 @@ jobs: uses: actions/cache@v3 with: path: ~/.cache/R - key: ${{ runner.os }}-r-${{ hashFiles('**/DESCRIPTION') }}-v1 + key: ${{ runner.os }}-r-rDNA-${{ hashFiles('**/DESCRIPTION') }}-v1 - uses: r-lib/actions/setup-r-dependencies@v2 with: cache-version: 2 working-directory: rDNA/rDNA extra-packages: | - any::roxygen2 + any::roxygen2 - uses: gradle/wrapper-validation-action@v1 - name: Setup Gradle uses: gradle/gradle-build-action@v2.4.2 + - name: Restore Gradle Cache + uses: actions/cache@v3 + with: + path: ~/.gradle/caches + key: ${{ runner.os }}-gradle-${{ hashFiles('**/build.gradle') }}-v1 + - name: Execute Gradle build for rDNA run: ./gradlew :rDNA:build @@ -134,7 +140,7 @@ jobs: uses: actions/cache@v3 with: path: ~/.cache/R - key: ${{ runner.os }}-r-${{ hashFiles('**/DESCRIPTION') }}-v1 + key: ${{ runner.os }}-r-rDNA-check-${{ hashFiles('**/DESCRIPTION') }}-v1 - uses: r-lib/actions/setup-r-dependencies@v2 with: @@ -158,7 +164,7 @@ jobs: uses: actions/cache@v3 with: path: ~/.cache/R - key: ${{ runner.os }}-r-${{ 
hashFiles('**/DESCRIPTION') }}-v1 + key: ${{ runner.os }}-r-rDNA-test-${{ hashFiles('**/DESCRIPTION') }}-v1 - uses: r-lib/actions/setup-r-dependencies@v2 with: @@ -182,6 +188,13 @@ jobs: any::pbmcapply - uses: gradle/wrapper-validation-action@v1 + + - name: Restore Gradle Cache + uses: actions/cache@v3 + with: + path: ~/.gradle/caches + key: ${{ runner.os }}-gradle-${{ hashFiles('**/build.gradle') }}-v1 + - name: Setup Gradle uses: gradle/gradle-build-action@v2.4.2 - name: Execute Gradle build for rDNA From 87721a48b26ade386fe208f3e57fd6c537b532cd Mon Sep 17 00:00:00 2001 From: leifeld Date: Mon, 19 Aug 2024 22:53:32 +0200 Subject: [PATCH 04/11] Updated GitHub actions and gradle for testing --- .github/workflows/build-check-test.yml | 61 ++++++++---------------- rDNA/build.gradle | 8 +--- rDNA/rDNA/tests/testthat/test-backbone.R | 10 ---- 3 files changed, 20 insertions(+), 59 deletions(-) diff --git a/.github/workflows/build-check-test.yml b/.github/workflows/build-check-test.yml index 4e07254a..1a78947a 100644 --- a/.github/workflows/build-check-test.yml +++ b/.github/workflows/build-check-test.yml @@ -154,55 +154,32 @@ jobs: working-directory: rDNA/rDNA upload-snapshots: true - rDNA-test: + rDNA-coverage: + needs: rDNA runs-on: ubuntu-latest steps: - uses: actions/checkout@v3 + + - uses: actions/download-artifact@v3 + with: + name: rDNA + - uses: r-lib/actions/setup-r@v2 + with: + r-version: release - name: Restore R Packages uses: actions/cache@v3 with: path: ~/.cache/R - key: ${{ runner.os }}-r-rDNA-test-${{ hashFiles('**/DESCRIPTION') }}-v1 + key: ${{ runner.os }}-r-rDNA-coverage-${{ hashFiles('**/DESCRIPTION') }}-v1 - - uses: r-lib/actions/setup-r-dependencies@v2 - with: - cache-version: 2 - working-directory: rDNA/rDNA - extra-packages: | - any::covr - any::ggplot2 - any::igraph - any::ggraph - any::askpass - any::cluster - any::sna - any::ggrepel - any::coda - any::MCMCpack - any::tidygraph - any::heatmaply - any::factoextra - any::MASS - any::pbmcapply - - 
- uses: gradle/wrapper-validation-action@v1 - - - name: Restore Gradle Cache - uses: actions/cache@v3 - with: - path: ~/.gradle/caches - key: ${{ runner.os }}-gradle-${{ hashFiles('**/build.gradle') }}-v1 - - - name: Setup Gradle - uses: gradle/gradle-build-action@v2.4.2 - - name: Execute Gradle build for rDNA - run: ./gradlew :rDNA:build - - name: Execute Gradle rDNATest Task - run: ./gradlew :rDNA:rDNATest - - name: Store test results - uses: actions/upload-artifact@v3 - with: - name: rDNA-Test-Results - path: build/reports/tests + - name: Install Dependencies + run: | + install.packages('remotes') + remotes::install_deps(dependencies = TRUE) + install.packages('covr') + + - name: Run Coverage + run: | + Rscript -e 'pkg_tarball <- list.files(pattern = "*.tar.gz", full.names = TRUE); covr::codecov(path = pkg_tarball)' diff --git a/rDNA/build.gradle b/rDNA/build.gradle index 86f78796..513400bb 100644 --- a/rDNA/build.gradle +++ b/rDNA/build.gradle @@ -112,13 +112,7 @@ task rDNATest(dependsOn: [rDNADocument, copyRPackageSourcesToBuildDir, copyJarIn commandLine 'R', '-e', 'devtools::test()' } - // Run code coverage using covr::codecov() on the package source directory - exec { - workingDir tempDir.absolutePath - commandLine 'R', '-e', 'covr::codecov()' - } - - println "R package testing and code coverage completed." + println "R package testing completed." println "Deleting temporary directory..." delete tempDir println "Temporary directory deleted." 
diff --git a/rDNA/rDNA/tests/testthat/test-backbone.R b/rDNA/rDNA/tests/testthat/test-backbone.R index 290cd09b..c956804c 100644 --- a/rDNA/rDNA/tests/testthat/test-backbone.R +++ b/rDNA/rDNA/tests/testthat/test-backbone.R @@ -2,7 +2,6 @@ context("backbone") test_that("Penalized backbone works", { testthat::skip_on_cran() - testthat::skip_on_ci() samp <- dna_sample() dna_init() dna_openDatabase(samp, coderId = 1, coderPassword = "sample") @@ -40,7 +39,6 @@ test_that("Penalized backbone works", { test_that("Plot method works for backbones with penalty", { testthat::skip_on_cran() - testthat::skip_on_ci() samp <- dna_sample() dna_openDatabase(samp, coderId = 1, coderPassword = "sample") b <- dna_backbone(method = "penalty", @@ -66,7 +64,6 @@ test_that("Plot method works for backbones with penalty", { test_that("Autoplot method works for backbones with penalty", { testthat::skip_on_cran() - testthat::skip_on_ci() samp <- dna_sample() dna_openDatabase(samp, coderId = 1, coderPassword = "sample") b <- dna_backbone(method = "penalty", @@ -89,7 +86,6 @@ test_that("Autoplot method works for backbones with penalty", { test_that("Fixed backbone works", { testthat::skip_on_cran() - testthat::skip_on_ci() samp <- dna_sample() dna_openDatabase(samp, coderId = 1, coderPassword = "sample") b <- dna_backbone(method = "fixed", @@ -126,7 +122,6 @@ test_that("Fixed backbone works", { test_that("Plot method works for fixed backbone size", { testthat::skip_on_cran() - testthat::skip_on_ci() samp <- dna_sample() dna_openDatabase(samp, coderId = 1, coderPassword = "sample") b <- dna_backbone(method = "fixed", @@ -152,7 +147,6 @@ test_that("Plot method works for fixed backbone size", { test_that("Autoplot method works for backbones with fixed size", { testthat::skip_on_cran() - testthat::skip_on_ci() samp <- dna_sample() dna_openDatabase(samp, coderId = 1, coderPassword = "sample") b <- dna_backbone(method = "fixed", @@ -175,7 +169,6 @@ test_that("Autoplot method works for backbones with 
fixed size", { test_that("Nested backbone works", { testthat::skip_on_cran() - testthat::skip_on_ci() samp <- dna_sample() dna_openDatabase(samp, coderId = 1, coderPassword = "sample") b <- dna_backbone(method = "nested", @@ -203,7 +196,6 @@ test_that("Nested backbone works", { test_that("Plot method works for nested backbone", { testthat::skip_on_cran() - testthat::skip_on_ci() samp <- dna_sample() dna_openDatabase(samp, coderId = 1, coderPassword = "sample") b <- dna_backbone(method = "nested", @@ -227,7 +219,6 @@ test_that("Plot method works for nested backbone", { test_that("Autoplot method works for nested backbones", { testthat::skip_on_cran() - testthat::skip_on_ci() samp <- dna_sample() dna_openDatabase(samp, coderId = 1, coderPassword = "sample") b <- dna_backbone(method = "nested", @@ -247,7 +238,6 @@ test_that("Autoplot method works for nested backbones", { test_that("Evaluate backbone solution works", { testthat::skip_on_cran() - testthat::skip_on_ci() samp <- dna_sample() dna_openDatabase(samp, coderId = 1, coderPassword = "sample") b <- dna_evaluateBackboneSolution( From 82cc74a263857180bcadc722ca3889c30b122919 Mon Sep 17 00:00:00 2001 From: leifeld Date: Mon, 19 Aug 2024 23:06:11 +0200 Subject: [PATCH 05/11] Updated GitHub actions --- .github/workflows/build-check-test.yml | 55 ++++++++++++++++-------- rDNA/rDNA/tests/testthat/test-backbone.R | 10 +++++ 2 files changed, 46 insertions(+), 19 deletions(-) diff --git a/.github/workflows/build-check-test.yml b/.github/workflows/build-check-test.yml index 1a78947a..c31e7e5e 100644 --- a/.github/workflows/build-check-test.yml +++ b/.github/workflows/build-check-test.yml @@ -154,32 +154,49 @@ jobs: working-directory: rDNA/rDNA upload-snapshots: true - rDNA-coverage: - needs: rDNA + rDNA-test: runs-on: ubuntu-latest steps: - uses: actions/checkout@v3 - - - uses: actions/download-artifact@v3 - with: - name: rDNA - - uses: r-lib/actions/setup-r@v2 - with: - r-version: release - name: Restore R Packages uses: 
actions/cache@v3 with: path: ~/.cache/R - key: ${{ runner.os }}-r-rDNA-coverage-${{ hashFiles('**/DESCRIPTION') }}-v1 - - - name: Install Dependencies - run: | - install.packages('remotes') - remotes::install_deps(dependencies = TRUE) - install.packages('covr') + key: ${{ runner.os }}-r-rDNA-test-${{ hashFiles('**/DESCRIPTION') }}-v1 - - name: Run Coverage - run: | - Rscript -e 'pkg_tarball <- list.files(pattern = "*.tar.gz", full.names = TRUE); covr::codecov(path = pkg_tarball)' + - uses: r-lib/actions/setup-r-dependencies@v2 + with: + cache-version: 2 + working-directory: rDNA/rDNA + extra-packages: | + any::covr + any::ggplot2 + any::igraph + any::ggraph + any::askpass + any::cluster + any::sna + any::ggrepel + any::coda + any::MCMCpack + any::tidygraph + any::heatmaply + any::factoextra + any::MASS + any::pbmcapply + - uses: gradle/wrapper-validation-action@v1 + + - name: Restore Gradle Cache + uses: actions/cache@v3 + with: + path: ~/.gradle/caches + key: ${{ runner.os }}-gradle-${{ hashFiles('**/build.gradle') }}-v1 + + - name: Setup Gradle + uses: gradle/gradle-build-action@v2.4.2 + - name: Execute Gradle build for rDNA + run: ./gradlew :rDNA:build + - name: Execute Gradle rDNATest Task + run: ./gradlew :rDNA:rDNATest \ No newline at end of file diff --git a/rDNA/rDNA/tests/testthat/test-backbone.R b/rDNA/rDNA/tests/testthat/test-backbone.R index c956804c..290cd09b 100644 --- a/rDNA/rDNA/tests/testthat/test-backbone.R +++ b/rDNA/rDNA/tests/testthat/test-backbone.R @@ -2,6 +2,7 @@ context("backbone") test_that("Penalized backbone works", { testthat::skip_on_cran() + testthat::skip_on_ci() samp <- dna_sample() dna_init() dna_openDatabase(samp, coderId = 1, coderPassword = "sample") @@ -39,6 +40,7 @@ test_that("Penalized backbone works", { test_that("Plot method works for backbones with penalty", { testthat::skip_on_cran() + testthat::skip_on_ci() samp <- dna_sample() dna_openDatabase(samp, coderId = 1, coderPassword = "sample") b <- dna_backbone(method = 
"penalty", @@ -64,6 +66,7 @@ test_that("Plot method works for backbones with penalty", { test_that("Autoplot method works for backbones with penalty", { testthat::skip_on_cran() + testthat::skip_on_ci() samp <- dna_sample() dna_openDatabase(samp, coderId = 1, coderPassword = "sample") b <- dna_backbone(method = "penalty", @@ -86,6 +89,7 @@ test_that("Autoplot method works for backbones with penalty", { test_that("Fixed backbone works", { testthat::skip_on_cran() + testthat::skip_on_ci() samp <- dna_sample() dna_openDatabase(samp, coderId = 1, coderPassword = "sample") b <- dna_backbone(method = "fixed", @@ -122,6 +126,7 @@ test_that("Fixed backbone works", { test_that("Plot method works for fixed backbone size", { testthat::skip_on_cran() + testthat::skip_on_ci() samp <- dna_sample() dna_openDatabase(samp, coderId = 1, coderPassword = "sample") b <- dna_backbone(method = "fixed", @@ -147,6 +152,7 @@ test_that("Plot method works for fixed backbone size", { test_that("Autoplot method works for backbones with fixed size", { testthat::skip_on_cran() + testthat::skip_on_ci() samp <- dna_sample() dna_openDatabase(samp, coderId = 1, coderPassword = "sample") b <- dna_backbone(method = "fixed", @@ -169,6 +175,7 @@ test_that("Autoplot method works for backbones with fixed size", { test_that("Nested backbone works", { testthat::skip_on_cran() + testthat::skip_on_ci() samp <- dna_sample() dna_openDatabase(samp, coderId = 1, coderPassword = "sample") b <- dna_backbone(method = "nested", @@ -196,6 +203,7 @@ test_that("Nested backbone works", { test_that("Plot method works for nested backbone", { testthat::skip_on_cran() + testthat::skip_on_ci() samp <- dna_sample() dna_openDatabase(samp, coderId = 1, coderPassword = "sample") b <- dna_backbone(method = "nested", @@ -219,6 +227,7 @@ test_that("Plot method works for nested backbone", { test_that("Autoplot method works for nested backbones", { testthat::skip_on_cran() + testthat::skip_on_ci() samp <- dna_sample() 
dna_openDatabase(samp, coderId = 1, coderPassword = "sample") b <- dna_backbone(method = "nested", @@ -238,6 +247,7 @@ test_that("Autoplot method works for nested backbones", { test_that("Evaluate backbone solution works", { testthat::skip_on_cran() + testthat::skip_on_ci() samp <- dna_sample() dna_openDatabase(samp, coderId = 1, coderPassword = "sample") b <- dna_evaluateBackboneSolution( From fa0865a7390594cb559878bcc31d2a3dd9383905 Mon Sep 17 00:00:00 2001 From: leifeld Date: Mon, 19 Aug 2024 23:17:03 +0200 Subject: [PATCH 06/11] Updated GitHub actions --- .github/workflows/build-check-test.yml | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/.github/workflows/build-check-test.yml b/.github/workflows/build-check-test.yml index c31e7e5e..1a946be8 100644 --- a/.github/workflows/build-check-test.yml +++ b/.github/workflows/build-check-test.yml @@ -199,4 +199,6 @@ jobs: - name: Execute Gradle build for rDNA run: ./gradlew :rDNA:build - name: Execute Gradle rDNATest Task - run: ./gradlew :rDNA:rDNATest \ No newline at end of file + run: | + export CI=false + ./gradlew :rDNA:rDNATest \ No newline at end of file From e23a2d709d5f29b367a6dfbbdd9376da316acdf8 Mon Sep 17 00:00:00 2001 From: leifeld Date: Mon, 19 Aug 2024 23:32:32 +0200 Subject: [PATCH 07/11] Updated GitHub actions and updated dna_jar --- .github/workflows/build-check-test.yml | 51 +---------- rDNA/rDNA/R/rDNA.R | 121 ++++--------------------- 2 files changed, 17 insertions(+), 155 deletions(-) diff --git a/.github/workflows/build-check-test.yml b/.github/workflows/build-check-test.yml index 1a946be8..1ad7fc70 100644 --- a/.github/workflows/build-check-test.yml +++ b/.github/workflows/build-check-test.yml @@ -152,53 +152,4 @@ jobs: - uses: r-lib/actions/check-r-package@v2 with: working-directory: rDNA/rDNA - upload-snapshots: true - - rDNA-test: - runs-on: ubuntu-latest - steps: - - uses: actions/checkout@v3 - - uses: r-lib/actions/setup-r@v2 - - - name: Restore R Packages - uses: 
actions/cache@v3 - with: - path: ~/.cache/R - key: ${{ runner.os }}-r-rDNA-test-${{ hashFiles('**/DESCRIPTION') }}-v1 - - - uses: r-lib/actions/setup-r-dependencies@v2 - with: - cache-version: 2 - working-directory: rDNA/rDNA - extra-packages: | - any::covr - any::ggplot2 - any::igraph - any::ggraph - any::askpass - any::cluster - any::sna - any::ggrepel - any::coda - any::MCMCpack - any::tidygraph - any::heatmaply - any::factoextra - any::MASS - any::pbmcapply - - uses: gradle/wrapper-validation-action@v1 - - - name: Restore Gradle Cache - uses: actions/cache@v3 - with: - path: ~/.gradle/caches - key: ${{ runner.os }}-gradle-${{ hashFiles('**/build.gradle') }}-v1 - - - name: Setup Gradle - uses: gradle/gradle-build-action@v2.4.2 - - name: Execute Gradle build for rDNA - run: ./gradlew :rDNA:build - - name: Execute Gradle rDNATest Task - run: | - export CI=false - ./gradlew :rDNA:rDNATest \ No newline at end of file + upload-snapshots: true \ No newline at end of file diff --git a/rDNA/rDNA/R/rDNA.R b/rDNA/rDNA/R/rDNA.R index c6b04f5d..c2587f05 100644 --- a/rDNA/rDNA/R/rDNA.R +++ b/rDNA/rDNA/R/rDNA.R @@ -101,26 +101,20 @@ dna_getHeadlessDna <- function() { dnaEnvironment[["dna"]]$headlessDna } -#' Identify and/or download and install the correct DNA jar file -#' -#' Identify and/or download and install the correct DNA jar file. -#' -#' rDNA requires the installation of a DNA jar file to run properly. While it is -#' possible to store the jar file in the respective working directory, it is -#' preferable to install it in the rDNA library installation directory under -#' \code{java/}. The \code{dna_jar} function attempts to find the version of the -#' jar file that matches the installed \pkg{rDNA} version in the \code{java/} -#' sub-directory of the package library path and return the jar file name -#' including its full path. If this fails, it will try to find the jar file in -#' the current working directory and return its file name. 
If this fails as -#' well, it will attempt to download the matching jar file from GitHub and store -#' it in the library path and return its file name. If this fails, it will -#' attempt to store the downloaded jar file in the working directory and return -#' its file name. If this fails as well, it will clone the current DNA master -#' code from GitHub to a local temporary directory, build the jar file from -#' source, and attempt to store the built jar file in the library path or, if -#' this fails, in the working directory and return the file name of the jar -#' file. If all of this fails, an error message is thrown. +#' Find the DNA jar file +#' +#' Find the DNA jar file in the library path or working directory. +#' +#' rDNA requires the installation of a DNA jar file to run properly. The jar +#' file is shipped with the rDNA package and is installed in the \code{java/} +#' directory of the package installation directory in the R library tree. The +#' version number of the jar file and the rDNA package must match for DNA and +#' rDNA to be able to work together. The \code{dna_jar} function looks for +#' the jar file in the package installation directory sub-directory and +#' returns its file name with its absolute path. If it cannot be found in the +#' installation directory, the function looks in the current working +#' directory. The function is also called by \code{\link{dna_init}} if the +#' location of the jar file is not provided explicitly. #' #' @return The file name of the jar file that matches the installed \pkg{rDNA} #' version, including full path. 
@@ -164,91 +158,8 @@ dna_jar <- function() { } }, error = function(e) {success <- FALSE}) - # try to download from GitHub release directory to library path - tryCatch({ - rdna_dir <- dirname(system.file(".", package = "rDNA")) - f <- paste0("https://github.com/leifeld/dna/releases/download/v", v, "/dna-", v, ".jar") - dest <- paste0(rdna_dir, "/java/dna-", v, ".jar") - targetdir <- paste0(rdna_dir, "/java/") - dir.create(targetdir, recursive = TRUE, showWarnings = FALSE) - suppressWarnings(download.file(url = f, - destfile = dest, - mode = "wb", - cacheOK = FALSE, - quiet = TRUE)) - if (file.exists(dest)) { - message("Jar file downloaded from GitHub to library path.") - return(dest) - } - }, error = function(e) {success <- FALSE}) - - # try to download from GitHub release directory to working directory - tryCatch({ - rdna_dir <- dirname(system.file(".", package = "rDNA")) - f <- paste0("https://github.com/leifeld/dna/releases/download/v", v, "/dna-", v, ".jar") - dest <- paste0(getwd(), "/dna-", v, ".jar") - suppressWarnings(download.file(url = f, - destfile = dest, - mode = "wb", - cacheOK = FALSE, - quiet = TRUE)) - if (file.exists(dest)) { - message("Jar file downloaded from GitHub to working directory.") - return(dest) - } - }, error = function(e) {success <- FALSE}) - - # try to download and build from source - tryCatch({ - td <- tempdir() - dest <- paste0(td, "/master.zip") - suppressWarnings(download.file(url = "https://github.com/leifeld/dna/archive/master.zip", - destfile = dest, - mode = "wb", - cacheOK = FALSE, - quiet = TRUE)) - unzip(zipfile = dest, overwrite = TRUE, exdir = td) - output <- file.remove(dest) - gradle <- paste0(td, "/dna-master/gradlew") - Sys.chmod(gradle, mode = "0777", use_umask = TRUE) - oldwd <- getwd() - setwd(paste0(td, "/dna-master/")) - system(paste0(gradle, " build"), ignore.stdout = TRUE, ignore.stderr = TRUE) - setwd(oldwd) - builtjar <- paste0(td, "/dna-master/dna/build/libs/dna-", v, ".jar") - if (file.exists(builtjar)) { 
- message("DNA source code downloaded and jar file built successfully.") - } - }, error = function(e) {success <- FALSE}) - - # try to copy built jar to library path - tryCatch({ - targetdir <- paste0(find.package("rDNA"), "/java/") - dir.create(targetdir, recursive = TRUE, showWarnings = FALSE) - dest <- paste0(targetdir, "dna-", v, ".jar") - file.copy(from = builtjar, to = targetdir) - if (file.exists(dest)) { - unlink(paste0(td, "/dna-master"), recursive = TRUE) - message("Jar file copied to library path.") - return(dest) - } - }, error = function(e) {success <- FALSE}) - - # try to copy built jar to working directory - tryCatch({ - dest <- paste0(getwd(), "/dna-", v, ".jar") - file.copy(from = builtjar, to = dest) - if (file.exists(dest)) { - unlink(paste0(td, "/dna-master"), recursive = TRUE) - message("Jar file copied to working directory.") - return(dest) - } - }, error = function(e) {success <- FALSE}) - - stop("DNA jar file could not be identified or downloaded. Please download ", - "the DNA jar file matching the version number of rDNA and store it in ", - "the java/ sub-directory of your rDNA library installation path or in ", - "your working directory. Your current rDNA version is ", v, ".") + stop("DNA jar file could not be found in the library path or working " + "directory. 
Your current rDNA version is ", v, ".") } #' Provides a small sample database From 19b5b59ecc6368901c4d249a56e569a05524caf8 Mon Sep 17 00:00:00 2001 From: leifeld Date: Mon, 19 Aug 2024 23:47:09 +0200 Subject: [PATCH 08/11] Updated dna_jar --- rDNA/rDNA/R/rDNA.R | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/rDNA/rDNA/R/rDNA.R b/rDNA/rDNA/R/rDNA.R index c2587f05..7a93ee6a 100644 --- a/rDNA/rDNA/R/rDNA.R +++ b/rDNA/rDNA/R/rDNA.R @@ -158,7 +158,7 @@ dna_jar <- function() { } }, error = function(e) {success <- FALSE}) - stop("DNA jar file could not be found in the library path or working " + stop("DNA jar file could not be found in the library path or working ", "directory. Your current rDNA version is ", v, ".") } From 35c7665d6a0e0272cde86fe568272a3abbc5b0b9 Mon Sep 17 00:00:00 2001 From: leifeld Date: Mon, 19 Aug 2024 23:56:22 +0200 Subject: [PATCH 09/11] Split rDNA code into multiple R files --- rDNA/rDNA/R/dna_backbone.R | 759 +++++ rDNA/rDNA/R/dna_barplot.R | 530 ++++ rDNA/rDNA/R/dna_multiclust.R | 1190 ++++++++ rDNA/rDNA/R/dna_network.R | 1166 ++++++++ rDNA/rDNA/R/dna_phaseTransitions.R | 643 +++++ rDNA/rDNA/R/rDNA.R | 4308 ---------------------------- 6 files changed, 4288 insertions(+), 4308 deletions(-) create mode 100644 rDNA/rDNA/R/dna_backbone.R create mode 100644 rDNA/rDNA/R/dna_barplot.R create mode 100644 rDNA/rDNA/R/dna_multiclust.R create mode 100644 rDNA/rDNA/R/dna_network.R create mode 100644 rDNA/rDNA/R/dna_phaseTransitions.R diff --git a/rDNA/rDNA/R/dna_backbone.R b/rDNA/rDNA/R/dna_backbone.R new file mode 100644 index 00000000..e5db7878 --- /dev/null +++ b/rDNA/rDNA/R/dna_backbone.R @@ -0,0 +1,759 @@ +#' Compute and retrieve the backbone and redundant set +#' +#' Compute and retrieve the backbone and redundant set of a discourse network. 
+#' +#' The dna_backbone function applies a simulated annealing algorithm to the +#' discourse network to partition the set of second-mode entities (e.g., +#' concepts) into a backbone set and a complementary redundant set. Three +#' methods are available: +#' \itemize{ +#' \item A simulated annealing algorithm with a penalty. You can play with +#' different penalties and see how they affect the size of your backbone +#' set. +#' \item A modified simulated annealing algorithm for a fixed number of +#' backbone entities to retain. This is computationally simpler, but you +#' have to know how large the set should be. +#' \item A fast and greedy nested algorithm, which evaluates all possible +#' fixed backbone solutions, i.e., for all sizes, and provides a nested +#' hierarchy of entities on the second mode. This algorithm may stay below +#' the optimum and is only an approximation but provides insights into the +#' hierarchy of concepts and their relative importance. +#' } +#' +#' The \code{autoplot} function requires the ggplot2 package and can plot +#' algorithm diagnostics and the hierarchy of entities as a dendrogram, +#' depending on the method that was chosen. The \code{plot} function can do the +#' same thing, just using base plots, not ggplot2. +#' +#' The \code{dna_evaluateBackboneSolution} function computes the spectral loss +#' for an arbitrary backbone and its complement, the redundant set, specified by +#' the user. For example, the user can evaluate how much structure would be lost +#' if the second mode was composed only of the concepts provided to this +#' function. This can be used to compare how useful different codebook models +#' are. The penalty parameter \code{p} applies a penalty factor to the spectral +#' loss. The default value of \code{0} switches off the penalty as it is usually +#' not needed to evaluate a specific solution. The backbone set can be supplied +#' as a vector of character objects, for example concepts. 
+#' +#' @param method The backbone algorithm used to compute the results. Several +#' methods are available: +#' \itemize{ +#' \item \code{"nested"}: A relatively fast, deterministic algorithm that +#' produces the full hierarchy of entities. It starts with a complete +#' backbone set resembling the full network. There are as many iterations +#' as entities on the second mode. In each iteration, the entity whose +#' removal would yield the smallest backbone loss is moved from the +#' backbone set into the redundant set, and the (unpenalized) spectral +#' loss is recorded. This creates a solution for all backbone sizes, where +#' each backbone set is fully nested in the next larger backbone set. The +#' solution usually resembles an unconstrained solution where nesting is +#' not required, but in some cases the loss of a non-nested solution may be +#' larger at a given level or number of elements in the backbone set. +#' \item \code{"fixed"}: Simulated annealing with a fixed number of elements +#' in the backbone set (i.e., only lateral changes are possible) and +#' without penalty. This method may yield more optimal solutions than the +#' nested algorithm because it does not require a strict hierarchy. +#' However, it produces an approximation of the global optimum and is +#' slower than the nested method. With this method, you can specify that +#' backbone set should have, for example, exactly 10 concepts. Then fewer +#' iterations are necessary than with the penalty method because the search +#' space is smaller. The backbone set size is defined in the +#' \code{"backboneSize"} argument. +#' \item \code{"penalty"}: Simulated annealing with a variable number of +#' elements in the backbone set. The solution is stabilized by a penalty +#' parameter (see \code{"penalty"} argument). 
This algorithm takes longest +#' to compute for a single solution, and it is only an approximation, but +#' it considers slightly larger or smaller backbone sets if the solution is +#' better, thus this algorithm adds some flexibility. It requires more +#' iterations than the fixed method for achieving the same quality. +#' } +#' @param backboneSize The number of elements in the backbone set, as a fixed +#' parameter. Only used when \code{method = "fixed"}. +#' @param penalty The penalty parameter for large backbone sets. The larger the +#' value, the more strongly larger backbone sets are punished and the smaller +#' the resulting backbone is. Try out different values to find the right size +#' of the backbone set. Reasonable values could be \code{2.5}, \code{5}, +#' \code{7.5}, or \code{12}, for example. The minimum is \code{0.0}, which +#' imposes no penalty on the size of the backbone set and produces a redundant +#' set with only one element. Start with \code{0.0} if you want to weed out a +#' single concept and subsequently increase the penalty to include more items +#' in the redundant set and shrink the backbone further. Only used when +#' \code{method = "penalty"}. +#' @param iterations The number of iterations of the simulated annealing +#' algorithm. More iterations take more time but may lead to better +#' optimization results. Only used when \code{method = "penalty"} or +#' \code{method = "fixed"}. +#' @param qualifierAggregation The aggregation rule for the \code{qualifier} +#' variable. 
This must be \code{"ignore"} (for ignoring the qualifier +#' variable), \code{"congruence"} (for recording a network tie only if both +#' nodes have the same qualifier value in the binary case or for recording the +#' similarity between the two nodes on the qualifier variable in the integer +#' case), \code{"conflict"} (for recording a network tie only if both nodes +#' have a different qualifier value in the binary case or for recording the +#' distance between the two nodes on the qualifier variable in the integer +#' case), or \code{"subtract"} (for subtracting the conflict tie value from +#' the congruence tie value in each dyad; note that negative values will be +#' replaced by \code{0} in the backbone calculation). +#' @param normalization Normalization of edge weights. Valid settings are +#' \code{"no"} (for switching off normalization), \code{"average"} (for +#' average activity normalization), \code{"jaccard"} (for Jaccard coefficient +#' normalization), and \code{"cosine"} (for cosine similarity normalization). +#' @param fileFormat An optional file format specification for saving the +#' backbone results to a file instead of returning an object. Valid values +#' are \code{"json"}, \code{"xml"}, and \code{NULL} (for returning the results +#' instead of writing them to a file). 
+#' @inheritParams dna_network +#' +#' @examples +#' \dontrun{ +#' dna_init() +#' dna_sample() +#' dna_openDatabase("sample.dna", coderId = 1, coderPassword = "sample") +#' +#' # compute backbone and redundant set using penalised spectral loss +#' b <- dna_backbone(method = "penalty", +#' penalty = 3.5, +#' iterations = 10000, +#' variable1 = "organization", +#' variable2 = "concept", +#' qualifier = "agreement", +#' qualifierAggregation = "subtract", +#' normalization = "average") +#' +#' b # display main results +#' +#' # extract results from the object +#' b$backbone # show the set of backbone concepts +#' b$redundant # show the set of redundant concepts +#' b$unpenalized_backbone_loss # spectral loss between full and backbone network +#' b$unpenalized_redundant_loss # spectral loss of redundant network +#' b$backbone_network # show the backbone network +#' b$redundant_network # show the redundant network +#' b$full_network # show the full network +#' +#' # plot diagnostics with base R +#' plot(b, ma = 500) +#' +#' # arrange plots in a 2 x 2 view +#' par(mfrow = c(2, 2)) +#' plot(b) +#' +#' # plot diagnostics with ggplot2 +#' library("ggplot2") +#' p <- autoplot(b) +#' p +#' +#' # pick a specific diagnostic +#' p[[3]] +#' +#' # use the patchwork package to arrange the diagnostics in a single plot +#' library("patchwork") +#' new_plot <- p[[1]] + p[[2]] + p[[3]] + p[[4]] +#' new_plot & theme_grey() + theme(legend.position = "bottom") +#' +#' # use the gridExtra package to arrange the diagnostics in a single plot +#' library("gridExtra") +#' grid.arrange(p[[1]], p[[2]], p[[3]], p[[4]]) +#' +#' # compute backbone with fixed size (here: 4 concepts) +#' b <- dna_backbone(method = "fixed", +#' backboneSize = 4, +#' iterations = 2000, +#' variable1 = "organization", +#' variable2 = "concept", +#' qualifier = "agreement", +#' qualifierAggregation = "subtract", +#' normalization = "average") +#' b +#' +#' # compute backbone with a nested structure and plot dendrogram +#' 
b <- dna_backbone(method = "nested", +#' variable1 = "organization", +#' variable2 = "concept", +#' qualifier = "agreement", +#' qualifierAggregation = "subtract", +#' normalization = "average") +#' b +#' plot(b) +#' autoplot(b) +#' } +#' +#' @author Philip Leifeld, Tim Henrichsen +#' +#' @rdname dna_backbone +#' @importFrom rJava .jarray +#' @importFrom rJava .jcall +#' @importFrom rJava .jnull +#' @importFrom rJava J +#' @export +dna_backbone <- function(method = "nested", + backboneSize = 1, + penalty = 3.5, + iterations = 10000, + statementType = "DNA Statement", + variable1 = "organization", + variable1Document = FALSE, + variable2 = "concept", + variable2Document = FALSE, + qualifier = "agreement", + qualifierDocument = FALSE, + qualifierAggregation = "subtract", + normalization = "average", + duplicates = "document", + start.date = "01.01.1900", + stop.date = "31.12.2099", + start.time = "00:00:00", + stop.time = "23:59:59", + excludeValues = list(), + excludeAuthors = character(), + excludeSources = character(), + excludeSections = character(), + excludeTypes = character(), + invertValues = FALSE, + invertAuthors = FALSE, + invertSources = FALSE, + invertSections = FALSE, + invertTypes = FALSE, + fileFormat = NULL, + outfile = NULL) { + + # wrap the vectors of exclude values for document variables into Java arrays + excludeAuthors <- .jarray(excludeAuthors) + excludeSources <- .jarray(excludeSources) + excludeSections <- .jarray(excludeSections) + excludeTypes <- .jarray(excludeTypes) + + # compile exclude variables and values vectors + dat <- matrix("", nrow = length(unlist(excludeValues)), ncol = 2) + count <- 0 + if (length(excludeValues) > 0) { + for (i in 1:length(excludeValues)) { + if (length(excludeValues[[i]]) > 0) { + for (j in 1:length(excludeValues[[i]])) { + count <- count + 1 + dat[count, 1] <- names(excludeValues)[i] + dat[count, 2] <- excludeValues[[i]][j] + } + } + } + var <- dat[, 1] + val <- dat[, 2] + } else { + var <- character() + val 
<- character() + } + var <- .jarray(var) # array of variable names of each excluded value + val <- .jarray(val) # array of values to be excluded + + # encode R NULL as Java null value if necessary + if (is.null(qualifier) || is.na(qualifier)) { + qualifier <- .jnull(class = "java/lang/String") + } + if (is.null(fileFormat)) { + fileFormat <- .jnull(class = "java/lang/String") + } + if (is.null(outfile)) { + outfile <- .jnull(class = "java/lang/String") + } + + # call rBackbone function to compute results + .jcall(dnaEnvironment[["dna"]]$headlessDna, + "V", + "rBackbone", + method, + as.integer(backboneSize), + as.double(penalty), + as.integer(iterations), + statementType, + variable1, + variable1Document, + variable2, + variable2Document, + qualifier, + qualifierDocument, + qualifierAggregation, + normalization, + duplicates, + start.date, + stop.date, + start.time, + stop.time, + var, + val, + excludeAuthors, + excludeSources, + excludeSections, + excludeTypes, + invertValues, + invertAuthors, + invertSources, + invertSections, + invertTypes, + outfile, + fileFormat + ) + + exporter <- .jcall(dnaEnvironment[["dna"]]$headlessDna, "Lexport/Exporter;", "getExporter") # get a reference to the Exporter object, in which results are stored + if (!is.null(outfile) && !is.null(fileFormat) && is.character(outfile) && is.character(fileFormat) && fileFormat %in% c("json", "xml")) { + message("File exported.") + } else if (method[1] %in% c("penalty", "fixed")) { + result <- .jcall(exporter, "Lexport/SimulatedAnnealingBackboneResult;", "getSimulatedAnnealingBackboneResult", simplify = TRUE) + # create a list with various results + l <- list() + l$penalty <- .jcall(result, "D", "getPenalty") + if (method[1] == "fixed") { + l$backbone_size <- as.integer(backboneSize) + } else { + l$backbone_size <- as.integer(NA) + } + l$iterations <- .jcall(result, "I", "getIterations") + l$backbone <- .jcall(result, "[S", "getBackboneEntities") + l$redundant <- .jcall(result, "[S", 
"getRedundantEntities") + l$unpenalized_backbone_loss <- .jcall(result, "D", "getUnpenalizedBackboneLoss") + l$unpenalized_redundant_loss <- .jcall(result, "D", "getUnpenalizedRedundantLoss") + rn <- .jcall(result, "[S", "getLabels") + + # store the three matrices in the result list + fullmat <- .jcall(result, "[[D", "getFullNetwork", simplify = TRUE) + rownames(fullmat) <- rn + colnames(fullmat) <- rn + l$full_network <- fullmat + backbonemat <- .jcall(result, "[[D", "getBackboneNetwork", simplify = TRUE) + rownames(backbonemat) <- rn + colnames(backbonemat) <- rn + l$backbone_network <- backbonemat + redundantmat <- .jcall(result, "[[D", "getRedundantNetwork", simplify = TRUE) + rownames(redundantmat) <- rn + colnames(redundantmat) <- rn + l$redundant_network <- redundantmat + + # store diagnostics per iteration as a data frame + d <- data.frame(iteration = 1:.jcall(result, "I", "getIterations"), + temperature = .jcall(result, "[D", "getTemperature"), + acceptance_prob = .jcall(result, "[D", "getAcceptanceProbability"), + acceptance = .jcall(result, "[I", "getAcceptance"), + penalized_backbone_loss = .jcall(result, "[D", "getPenalizedBackboneLoss"), + proposed_backbone_size = .jcall(result, "[I", "getProposedBackboneSize"), + current_backbone_size = .jcall(result, "[I", "getCurrentBackboneSize"), + optimal_backbone_size = .jcall(result, "[I", "getOptimalBackboneSize"), + acceptance_ratio_ma = .jcall(result, "[D", "getAcceptanceRatioMovingAverage")) + + l$diagnostics <- d + + # store start date/time, end date/time, number of statements, call, and class label in each network matrix + start <- as.POSIXct(.jcall(result, "J", "getStart"), origin = "1970-01-01") # add the start date/time of the result as an attribute to the matrices + attributes(l$full_network)$start <- start + attributes(l$backbone_network)$start <- start + attributes(l$redundant_network)$start <- start + stop <- as.POSIXct(.jcall(result, "J", "getStop"), origin = "1970-01-01") # add the end date/time 
of the result as an attribute to the matrices + attributes(l$full_network)$stop <- stop + attributes(l$backbone_network)$stop <- stop + attributes(l$redundant_network)$stop <- stop + attributes(l$full_network)$numStatements <- .jcall(result, "I", "getNumStatements") # add the number of filtered statements the matrix is based on as an attribute to the matrix + attributes(l$full_network)$call <- match.call() + attributes(l$backbone_network)$call <- match.call() + attributes(l$redundant_network)$call <- match.call() + attributes(l)$method <- method[1] + class(l$full_network) <- c("dna_network_onemode", class(l$full_network)) + class(l$backbone_network) <- c("dna_network_onemode", class(l$backbone_network)) + class(l$redundant_network) <- c("dna_network_onemode", class(l$redundant_network)) + class(l) <- c("dna_backbone", class(l)) + return(l) + } else if (method[1] == "nested") { + result <- .jcall(exporter, "Lexport/NestedBackboneResult;", "getNestedBackboneResult", simplify = TRUE) + d <- data.frame(i = .jcall(result, "[I", "getIteration"), + entity = .jcall(result, "[S", "getEntities"), + backboneLoss = .jcall(result, "[D", "getBackboneLoss"), + redundantLoss = .jcall(result, "[D", "getRedundantLoss"), + statements = .jcall(result, "[I", "getNumStatements")) + rownames(d) <- NULL + attributes(d)$numStatementsFull <- .jcall(result, "I", "getNumStatementsFull") + attributes(d)$start <- as.POSIXct(.jcall(result, "J", "getStart"), origin = "1970-01-01") # add the start date/time of the result as an attribute + attributes(d)$stop <- as.POSIXct(.jcall(result, "J", "getStop"), origin = "1970-01-01") # add the end date/time of the result as an attribute + attributes(d)$method <- "nested" + class(d) <- c("dna_backbone", class(d)) + return(d) + } +} + +#' @rdname dna_backbone +#' @param x A \code{"dna_backbone"} object. +#' @param trim Number of maximum characters to display in entity labels. 
Labels +#' with more characters are truncated, and the last character is replaced by +#' an asterisk (\code{*}). +#' @export +print.dna_backbone <- function(x, trim = 50, ...) { + method <- attributes(x)$method + cat(paste0("Backbone method: ", method, ".\n\n")) + if (method %in% c("penalty", "fixed")) { + if (method == "penalty") { + cat(paste0("Penalty: ", x$penalty, ". Iterations: ", x$iterations, ".\n\n")) + } else { + cat(paste0("Backbone size: ", x$backbone_size, ". Iterations: ", x$iterations, ".\n\n")) + } + cat(paste0("Backbone set (loss: ", round(x$unpenalized_backbone_loss, 4), "):\n")) + cat(paste(1:length(x$backbone), x$backbone), sep = "\n") + cat(paste0("\nRedundant set (loss: ", round(x$unpenalized_redundant_loss, 4), "):\n")) + cat(paste(1:length(x$redundant), x$redundant), sep = "\n") + } else if (method == "nested") { + x2 <- x + x2$entity <- sapply(x2$entity, function(r) if (nchar(r) > trim) paste0(substr(r, 1, trim - 1), "*") else r) + print(as.data.frame(x2), row.names = FALSE) + } +} + +#' @param ma Number of iterations to compute moving average. +#' @rdname dna_backbone +#' @importFrom graphics lines +#' @importFrom stats filter +#' @importFrom rlang .data +#' @export +plot.dna_backbone <- function(x, ma = 500, ...) 
{ + + if (attr(x, "method") != "nested") { + # temperature and acceptance probability + plot(x = x$diagnostics$iteration, + y = x$diagnostics$temperature, + col = "red", + type = "l", + lwd = 3, + xlab = "Iteration", + ylab = "Acceptance probability", + main = "Temperature and acceptance probability") + # note that better solutions are coded as -1 and need to be skipped: + lines(x = x$diagnostics$iteration[x$diagnostics$acceptance_prob >= 0], + y = x$diagnostics$acceptance_prob[x$diagnostics$acceptance_prob >= 0]) + + # spectral distance between full network and backbone network per iteration + bb_loss <- stats::filter(x$diagnostics$penalized_backbone_loss, + rep(1 / ma, ma), + sides = 1) + if (attributes(x)$method == "penalty") { + yl <- "Penalized backbone loss" + ti <- "Penalized spectral backbone distance" + } else { + yl <- "Backbone loss" + ti <- "Spectral backbone distance" + } + plot(x = x$diagnostics$iteration, + y = bb_loss, + type = "l", + xlab = "Iteration", + ylab = yl, + main = ti) + + # number of concepts in the backbone solution per iteration + current_size_ma <- stats::filter(x$diagnostics$current_backbone_size, + rep(1 / ma, ma), + sides = 1) + optimal_size_ma <- stats::filter(x$diagnostics$optimal_backbone_size, + rep(1 / ma, ma), + sides = 1) + plot(x = x$diagnostics$iteration, + y = current_size_ma, + ylim = c(min(c(current_size_ma, optimal_size_ma), na.rm = TRUE), + max(c(current_size_ma, optimal_size_ma), na.rm = TRUE)), + type = "l", + xlab = "Iteration", + ylab = paste0("Number of elements (MA, last ", ma, ")"), + main = "Backbone size (red = best)") + lines(x = x$diagnostics$iteration, y = optimal_size_ma, col = "red") + + # ratio of recent acceptances + accept_ratio <- stats::filter(x$diagnostics$acceptance, + rep(1 / ma, ma), + sides = 1) + plot(x = x$diagnostics$iteration, + y = accept_ratio, + type = "l", + xlab = "Iteration", + ylab = paste("Acceptance ratio in the last", ma, "iterations"), + main = "Acceptance ratio") + } else { # 
create hclust object + # define merging pattern: negative numbers are leaves, positive are merged clusters + merges_clust <- matrix(nrow = nrow(x) - 1, ncol = 2) + + merges_clust[1,1] <- -nrow(x) + merges_clust[1,2] <- -(nrow(x) - 1) + + for (i in 2:(nrow(x) - 1)) { + merges_clust[i, 1] <- -(nrow(x) - i) + merges_clust[i, 2] <- i - 1 + } + + # Initialize empty object + a <- list() + + # Add merges + a$merge <- merges_clust + + # Define merge heights + a$height <- x$backboneLoss[1:nrow(x) - 1] + + # Order of leaves + a$order <- 1:nrow(x) + + # Labels of leaves + a$labels <- rev(x$entity) + + # Define hclust class + class(a) <- "hclust" + + plot(a, ylab = "") + } +} + +#' @rdname dna_backbone +#' @param object A \code{"dna_backbone"} object. +#' @param ... Additional arguments. +#' @importFrom ggplot2 autoplot +#' @importFrom ggplot2 ggplot +#' @importFrom ggplot2 aes +#' @importFrom ggplot2 geom_line +#' @importFrom ggplot2 ylab +#' @importFrom ggplot2 xlab +#' @importFrom ggplot2 ggtitle +#' @importFrom ggplot2 theme_bw +#' @importFrom ggplot2 theme +#' @importFrom ggplot2 coord_flip +#' @importFrom ggplot2 scale_x_continuous +#' @importFrom ggplot2 scale_y_continuous +#' @importFrom rlang .data +#' @export +autoplot.dna_backbone <- function(object, ..., ma = 500) { + if (attr(object, "method") != "nested") { + bd <- object$diagnostics + bd$bb_loss <- stats::filter(bd$penalized_backbone_loss, rep(1 / ma, ma), sides = 1) + bd$current_size_ma <- stats::filter(bd$current_backbone_size, rep(1 / ma, ma), sides = 1) + bd$optimal_size_ma <- stats::filter(bd$optimal_backbone_size, rep(1 / ma, ma), sides = 1) + bd$accept_ratio <- stats::filter(bd$acceptance, rep(1 / ma, ma), sides = 1) + + # temperature and acceptance probability + g_accept <- ggplot2::ggplot(bd, ggplot2::aes(y = .data[["temperature"]], x = .data[["iteration"]])) + + ggplot2::geom_line(color = "#a50f15") + + ggplot2::geom_line(data = bd[bd$acceptance_prob >= 0, ], + ggplot2::aes(y = 
.data[["acceptance_prob"]], x = .data[["iteration"]])) + + ggplot2::ylab("Acceptance probability") + + ggplot2::xlab("Iteration") + + ggplot2::ggtitle("Temperature and acceptance probability") + + ggplot2::theme_bw() + + # spectral distance between full network and backbone network per iteration + if (attributes(object)$method == "penalty") { + yl <- "Penalized backbone loss" + ti <- "Penalized spectral backbone distance" + } else { + yl <- "Backbone loss" + ti <- "Spectral backbone distance" + } + g_loss <- ggplot2::ggplot(bd, ggplot2::aes(y = .data[["bb_loss"]], x = .data[["iteration"]])) + + ggplot2::geom_line() + + ggplot2::ylab(yl) + + ggplot2::xlab("Iteration") + + ggplot2::ggtitle(ti) + + ggplot2::theme_bw() + + # number of concepts in the backbone solution per iteration + d <- data.frame(iteration = rep(bd$iteration, 2), + size = c(bd$current_size_ma, bd$optimal_size_ma), + Criterion = c(rep("Current iteration", nrow(bd)), + rep("Best solution", nrow(bd)))) + g_size <- ggplot2::ggplot(d, ggplot2::aes(y = .data[["size"]], x = .data[["iteration"]], color = .data[["Criterion"]])) + + ggplot2::geom_line() + + ggplot2::ylab(paste0("Number of elements (MA, last ", ma, ")")) + + ggplot2::xlab("Iteration") + + ggplot2::ggtitle("Backbone size") + + ggplot2::theme_bw() + + ggplot2::theme(legend.position = "bottom") + + # ratio of recent acceptances + g_ar <- ggplot2::ggplot(bd, ggplot2::aes(y = .data[["accept_ratio"]], x = .data[["iteration"]])) + + ggplot2::geom_line() + + ggplot2::ylab(paste("Acceptance ratio in the last", ma, "iterations")) + + ggplot2::xlab("Iteration") + + ggplot2::ggtitle("Acceptance ratio") + + ggplot2::theme_bw() + + # wrap in list + plots <- list(g_accept, g_loss, g_size, g_ar) + return(plots) + } else { # create hclust object + # define merging pattern: negative numbers are leaves, positive are merged clusters + merges_clust <- matrix(nrow = nrow(object) - 1, ncol = 2) + + merges_clust[1,1] <- -nrow(object) + merges_clust[1,2] <- 
-(nrow(object) - 1) + + for (i in 2:(nrow(object) - 1)) { + merges_clust[i, 1] <- -(nrow(object) - i) + merges_clust[i, 2] <- i - 1 + } + + # Initialize empty object + a <- list() + + # Add merges + a$merge <- merges_clust + + # Define merge heights + a$height <- object$backboneLoss[1:nrow(object) - 1] + height <- a$height + + # Order of leaves + a$order <- 1:nrow(object) + + # Labels of leaves + a$labels <- rev(object$entity) + + # Define hclust class + class(a) <- "hclust" + + # ensure ggraph is installed, otherwise throw error (better than importing it to avoid hard dependency) + if (!requireNamespace("ggraph", quietly = TRUE)) { + stop("The 'ggraph' package is required for plotting nested backbone dendrograms with 'ggplot2' but was not found. Consider installing it.") + } + + g_clust <- ggraph::ggraph(graph = a, + layout = "dendrogram", + circular = FALSE, + height = height) + # TODO @Tim: "height" does not seem to exist + ggraph::geom_edge_elbow() + + ggraph::geom_node_point(aes(filter = .data[["leaf"]])) + + ggplot2::theme_bw() + + ggplot2::theme(panel.border = element_blank(), + axis.title = element_blank(), + panel.grid.major = element_blank(), + panel.grid.minor = element_blank(), + axis.line = element_blank(), + axis.text.y = element_text(size = 6), + axis.ticks.y = element_blank()) + + ggplot2::scale_x_continuous(breaks = seq(0, nrow(object) - 1, by = 1), + labels = rev(object$entity)) + + ggplot2::scale_y_continuous(expand = c(0, 0.01)) + + ggplot2::coord_flip() + + return(g_clust) + } +} + +#' @param backboneEntities A vector of character values to be included in the +#' backbone. The function will compute the spectral loss between the full +#' network and the network composed only of those entities on the second mode +#' that are contained in this vector. +#' @param p The penalty parameter. The default value of \code{0} means no +#' penalty for backbone size is applied. 
#' @inheritParams dna_backbone
#' @return A vector with two numeric values: the backbone and redundant loss.
#'
#' @examples
#' \dontrun{
#' dna_init()
#' dna_sample()
#' dna_openDatabase("sample.dna", coderId = 1, coderPassword = "sample")
#'
#' dna_evaluateBackboneSolution(
#'   c("There should be legislation to regulate emissions.",
#'     "Emissions legislation should regulate CO2.")
#' )
#' }
#'
#' @rdname dna_backbone
#' @importFrom rJava .jarray
#' @importFrom rJava .jcall
#' @importFrom rJava .jnull
#' @export
dna_evaluateBackboneSolution <- function(backboneEntities,
                                         p = 0,
                                         statementType = "DNA Statement",
                                         variable1 = "organization",
                                         variable1Document = FALSE,
                                         variable2 = "concept",
                                         variable2Document = FALSE,
                                         qualifier = "agreement",
                                         qualifierDocument = FALSE,
                                         qualifierAggregation = "subtract",
                                         normalization = "average",
                                         duplicates = "document",
                                         start.date = "01.01.1900",
                                         stop.date = "31.12.2099",
                                         start.time = "00:00:00",
                                         stop.time = "23:59:59",
                                         excludeValues = list(),
                                         excludeAuthors = character(),
                                         excludeSources = character(),
                                         excludeSections = character(),
                                         excludeTypes = character(),
                                         invertValues = FALSE,
                                         invertAuthors = FALSE,
                                         invertSources = FALSE,
                                         invertSections = FALSE,
                                         invertTypes = FALSE) {

  # The document-level exclusion criteria are handed to Java as string arrays.
  excludeAuthors <- .jarray(excludeAuthors)
  excludeSources <- .jarray(excludeSources)
  excludeSections <- .jarray(excludeSections)
  excludeTypes <- .jarray(excludeTypes)

  # Flatten the named list of excluded values into two parallel character
  # vectors: one with the variable name per excluded value, one with the
  # value itself. Empty list elements contribute nothing.
  if (length(excludeValues) > 0) {
    var <- rep(names(excludeValues), vapply(excludeValues, length, integer(1)))
    val <- as.character(unlist(excludeValues, use.names = FALSE))
  } else {
    var <- character()
    val <- character()
  }
  var <- .jarray(var) # array of variable names of each excluded value
  val <- .jarray(val) # array of values to be excluded

  # An absent qualifier is encoded as a Java null String.
  if (is.null(qualifier) || is.na(qualifier)) {
    qualifier <- .jnull(class = "java/lang/String")
  }

  # Delegate the evaluation to the Java backend; it returns a double array
  # of length two with the backbone loss and the redundant loss.
  result <- .jcall(dnaEnvironment[["dna"]]$headlessDna,
                   "[D",
                   "rEvaluateBackboneSolution",
                   .jarray(backboneEntities),
                   as.integer(p),
                   statementType,
                   variable1,
                   variable1Document,
                   variable2,
                   variable2Document,
                   qualifier,
                   qualifierDocument,
                   qualifierAggregation,
                   normalization,
                   duplicates,
                   start.date,
                   stop.date,
                   start.time,
                   stop.time,
                   var,
                   val,
                   excludeAuthors,
                   excludeSources,
                   excludeSections,
                   excludeTypes,
                   invertValues,
                   invertAuthors,
                   invertSources,
                   invertSections,
                   invertTypes
  )
  names(result) <- c("backbone loss", "redundant loss")
  return(result)
}

#' Generate the data necessary for creating a barplot for a variable
#'
#' Generate the data necessary for creating a barplot for a variable.
#'
#' Create a \code{dna_barplot} object, which contains a data frame with
#' entity value frequencies grouped by the levels of a qualifier variable.
#' The qualifier variable is optional.
#'
#' @param variable The variable for which the barplot will be generated. There
#' will be one bar per entity label of this variable.
#' @param qualifier A boolean (binary) or integer variable to group the value
#' frequencies by. Can be \code{NULL} to skip the grouping.
#' @inheritParams dna_network
#'
#' @examples
#' \dontrun{
#' dna_init()
#' dna_sample()
#' dna_openDatabase("sample.dna", coderId = 1, coderPassword = "sample")
#'
#' # compute barplot data
#' b <- dna_barplot(statementType = "DNA Statement",
#'                  variable = "concept",
#'                  qualifier = "agreement")
#' b
#' }
#'
#' @author Philip Leifeld
#'
#' @rdname dna_barplot
#' @importFrom rJava .jarray
#' @importFrom rJava .jcall
#' @importFrom rJava .jevalArray
#' @importFrom rJava .jnull
#' @importFrom rJava is.jnull
#' @export
dna_barplot <- function(statementType = "DNA Statement",
                        variable = "concept",
                        qualifier = "agreement",
                        duplicates = "document",
                        start.date = "01.01.1900",
                        stop.date = "31.12.2099",
                        start.time = "00:00:00",
                        stop.time = "23:59:59",
                        excludeValues = list(),
                        excludeAuthors = character(),
                        excludeSources = character(),
                        excludeSections = character(),
                        excludeTypes = character(),
                        invertValues = FALSE,
                        invertAuthors = FALSE,
                        invertSources = FALSE,
                        invertSections = FALSE,
                        invertTypes = FALSE) {

  # The document-level exclusion criteria are handed to Java as string arrays.
  excludeAuthors <- .jarray(excludeAuthors)
  excludeSources <- .jarray(excludeSources)
  excludeSections <- .jarray(excludeSections)
  excludeTypes <- .jarray(excludeTypes)

  # Flatten the named list of excluded values into two parallel character
  # vectors: one with the variable name per excluded value, one with the
  # value itself. Empty list elements contribute nothing.
  if (length(excludeValues) > 0) {
    var <- rep(names(excludeValues), vapply(excludeValues, length, integer(1)))
    val <- as.character(unlist(excludeValues, use.names = FALSE))
  } else {
    var <- character()
    val <- character()
  }
  var <- .jarray(var) # array of variable names of each excluded value
  val <- .jarray(val) # array of values to be excluded

  # An absent qualifier is encoded as a Java null String.
  if (is.null(qualifier) || is.na(qualifier)) {
    qualifier <- .jnull(class = "java/lang/String")
  }

  # Compute the barplot data in the Java backend.
  barplotData <- .jcall(dnaEnvironment[["dna"]]$headlessDna,
                        "Lexport/BarplotResult;",
                        "rBarplotData",
                        statementType,
                        variable,
                        qualifier,
                        duplicates,
                        start.date,
                        stop.date,
                        start.time,
                        stop.time,
                        var,
                        val,
                        excludeAuthors,
                        excludeSources,
                        excludeSections,
                        excludeTypes,
                        invertValues,
                        invertAuthors,
                        invertSources,
                        invertSections,
                        invertTypes,
                        simplify = TRUE)

  # Entity attributes arrive as a Java String[][]; convert to an R matrix.
  entityAttributes <- .jcall(barplotData, "[[Ljava/lang/String;", "getAttributes")
  entityAttributes <- t(sapply(entityAttributes, .jevalArray))

  # Frequency counts per entity and qualifier level, also as a matrix.
  counts <- .jcall(barplotData, "[[I", "getCounts")
  counts <- t(sapply(counts, .jevalArray))
  if (nrow(counts) < nrow(entityAttributes)) {
    # single-level case: sapply collapsed the dimensions; undo the transpose
    counts <- t(counts)
  }

  results <- data.frame(.jcall(barplotData, "[S", "getValues"),
                        counts,
                        entityAttributes)

  # Qualifier levels become the count column names; without a qualifier
  # there is a single "Frequency" column and no stored levels.
  intValues <- .jcall(barplotData, "[I", "getIntValues")
  intColNames <- intValues
  if (is.jnull(qualifier)) {
    intValues <- integer(0)
    intColNames <- "Frequency"
  }

  attributeVariables <- .jcall(barplotData, "[S", "getAttributeVariables")

  colnames(results) <- c("Entity", intColNames, attributeVariables)

  attributes(results)$variable <- .jcall(barplotData, "S", "getVariable")
  attributes(results)$intValues <- intValues
  attributes(results)$attributeVariables <- attributeVariables

  class(results) <- c("dna_barplot", class(results))

  return(results)
}

#' Print a \code{dna_barplot} object
#'
#' Show details of a \code{dna_barplot} object.
#'
#' Print the data frame returned by the \code{\link{dna_barplot}} function.
#'
#' @param x A \code{dna_barplot} object, as returned by the
#' \code{\link{dna_barplot}} function.
#' @param trim Number of maximum characters to display in entity labels.
#' Entities with more characters are truncated, and the last character is
#' replaced by an asterisk (\code{*}).
#' @param attr Display attributes, such as the name of the variable and the
#' levels of the qualifier variable if available.
#' @param ... Additional arguments. Currently not in use.
#'
#' @author Philip Leifeld
#'
#' @rdname dna_barplot
#' @export
print.dna_barplot <- function(x, trim = 30, attr = TRUE, ...) {
  out <- x
  # Optionally show the variable name and the qualifier levels stored as
  # attributes on the object before printing the data frame itself.
  if (isTRUE(attr)) {
    cat("Variable:", attr(out, "variable"))
    qualifierLevels <- attr(out, "intValues")
    if (length(qualifierLevels) > 0) {
      cat(".\nQualifier levels:", paste(qualifierLevels, collapse = ", "))
    } else {
      cat(".\nNo qualifier variable")
    }
    cat(".\n")
  }
  # Truncate long entity labels to 'trim' characters, marking truncation
  # with a trailing asterisk.
  out$Entity <- vapply(out$Entity,
                       function(entity) {
                         if (nchar(entity) > trim) {
                           paste0(substr(entity, 1, trim - 1), "*")
                         } else {
                           entity
                         }
                       },
                       character(1))
  class(out) <- "data.frame"
  print(out)
}

#' Plot \code{dna_barplot} object.
#'
#' Plot a barplot generated from \code{\link{dna_barplot}}.
#'
#' This function plots \code{dna_barplot} objects generated by the
#' \code{\link{dna_barplot}} function. It plots agreement and disagreement with
#' DNA statements for different entities such as \code{"concept"},
#' \code{"organization"}, or \code{"person"}. Colors can be modified before
#' plotting (see examples).
#'
#' @param object A \code{dna_barplot} object.
#' @param ... Additional arguments; currently not in use.
#' @param lab.pos,lab.neg Names for (dis-)agreement labels.
#' @param lab Should (dis-)agreement labels and title be displayed?
#' @param colors If \code{TRUE}, the \code{Colors} column in the
#' \code{dna_barplot} object will be used to fill the bars. Also accepts
#' character objects matching one of the attribute variables of the
#' \code{dna_barplot} object.
#' @param fontSize Text size in pt.
#' @param barWidth Thickness of the bars. Bars will touch when set to \code{1}.
#' When set to \code{0.5}, space between two bars is the same as thickness of
#' bars.
#' @param axisWidth Thickness of the x-axis which separates agreement from
#' disagreement.
#' @param truncate Sets the number of characters to which axis labels should be
+#' @param exclude.min Reduces the plot to entities with a minimum frequency of +#' statements. +#' +#' @examples +#' \dontrun{ +#' dna_init() +#' dna_sample() +#' +#' dna_openDatabase("sample.dna", coderId = 1, coderPassword = "sample") +#' +#' # compute barplot data +#' b <- dna_barplot(statementType = "DNA Statement", +#' variable = "concept", +#' qualifier = "agreement") +#' +#' # plot barplot with ggplot2 +#' library("ggplot2") +#' autoplot(b) +#' +#' # use entity colours (here: colors of organizations as an illustration) +#' b <- dna_barplot(statementType = "DNA Statement", +#' variable = "organization", +#' qualifier = "agreement") +#' autoplot(b, colors = TRUE) +#' +#' # edit the colors before plotting +#' b$Color[b$Type == "NGO"] <- "red" # change NGO color to red +#' b$Color[b$Type == "Government"] <- "blue" # change government color to blue +#' autoplot(b, colors = TRUE) +#' +#' # use an attribute, such as type, to color the bars +#' autoplot(b, colors = "Type") + +#' scale_colour_manual(values = "black") +#' +#' # replace colors for the three possible actor types with custom colors +#' autoplot(b, colors = "Type") + +#' scale_fill_manual(values = c("red", "blue", "green")) + +#' scale_colour_manual(values = "black") +#' } +#' +#' @author Johannes B. 
Gruber, Tim Henrichsen
#'
#' @rdname dna_barplot
#' @importFrom ggplot2 autoplot
#' @importFrom ggplot2 ggplot
#' @importFrom ggplot2 aes
#' @importFrom ggplot2 geom_line
#' @importFrom ggplot2 theme_minimal
#' @importFrom ggplot2 theme
#' @importFrom ggplot2 geom_bar
#' @importFrom ggplot2 position_stack
#' @importFrom ggplot2 coord_flip
#' @importFrom ggplot2 element_blank
#' @importFrom ggplot2 element_text
#' @importFrom ggplot2 scale_color_identity
#' @importFrom ggplot2 scale_fill_identity
#' @importFrom ggplot2 geom_text
#' @importFrom ggplot2 .pt
#' @importFrom ggplot2 annotate
#' @importFrom ggplot2 scale_x_discrete
#' @importFrom utils stack
#' @importFrom grDevices col2rgb
#' @importFrom rlang .data
#' @export
autoplot.dna_barplot <- function(object,
                                 ...,
                                 lab.pos = "Agreement",
                                 lab.neg = "Disagreement",
                                 lab = TRUE,
                                 colors = FALSE,
                                 fontSize = 12,
                                 barWidth = 0.6,
                                 axisWidth = 1.5,
                                 truncate = 40,
                                 exclude.min = NULL) {

  # Validate the input object and the plotting options.
  if (!("dna_barplot" %in% class(object))) {
    stop("Invalid data object. Please compute a dna_barplot object via the ",
         "dna_barplot function before plotting.")
  }

  if (!("Entity" %in% colnames(object))) {
    stop("dna_barplot object does not have a \'Entity\' variable. Please ",
         "compute a new dna_barplot object via the dna_barplot function before",
         " plotting.")
  }

  if (isTRUE(colors) & !("Color" %in% colnames(object)) |
      is.character(colors) & !(colors %in% colnames(object))) {
    colors <- FALSE
    warning("No color variable found in dna_barplot object. Colors will be",
            " ignored.")
  }

  if (!is.numeric(truncate)) {
    truncate <- Inf
    warning("No numeric value provided for trimming of entities. Truncation ",
            "will be ignored.")
  }

  # Get qualifier values
  w <- attr(object, "intValues")

  if (!all(w %in% colnames(object))) {
    stop("dna_barplot object does not include all qualifier values of the ",
         "statement type. Please compute a new dna_barplot object via the ",
         "dna_barplot function.")
  }

  # Check if qualifier is binary
  binary <- all(w %in% c(0, 1))

  # Compute total values per entity
  object$sum <- rowSums(object[, colnames(object) %in% w])

  # Exclude entities below the minimum number of statements, if requested
  if (is.numeric(exclude.min)) {
    if (exclude.min > max(object$sum)) {
      exclude.min <- NULL
      warning("Value provided in exclude.min is higher than maximum frequency ",
              "of entity (", max(object$sum), "). Will ignore exclude.min.")
    } else {
      object <- object[object$sum >= exclude.min, ]
    }
  }

  # Stack agreement and disagreement into long format (one row per entity
  # and qualifier level)
  object2 <- cbind(object$Entity, utils::stack(object, select = colnames(object) %in% w))
  colnames(object2) <- c("entity", "frequency", "agreement")

  object <- object[order(object$sum, decreasing = TRUE), ]

  object2$entity <- factor(object2$entity, levels = rev(object$Entity))

  # Get colors
  if (isTRUE(colors)) {
    object2$color <- object$Color[match(object2$entity, object$Entity)]
    object2$text_color <- "black"
    # Change text color to white for dark bar colors. BUG FIX: the original
    # used sum() over the whole 3 x n RGB matrix, producing a single scalar
    # instead of one perceived-luminance value per bar. col2rgb() returns one
    # column per color, so the ITU-R BT.601 weights (299, 587, 114) recycle
    # down the rows and colSums() yields the per-color weighted sum.
    luminance <- colSums(grDevices::col2rgb(object2$color) * c(299, 587, 114)) / 1000
    object2$text_color[luminance < 123] <- "white"
  } else if (is.character(colors)) {
    object2$color <- object[, colors][match(object2$entity, object$Entity)]
    object2$text_color <- "black"
  } else {
    object2$color <- "white"
    object2$text_color <- "black"
  }

  if (binary) {
    # setting disagreement as -1 instead of 0
    object2$agreement <- ifelse(object2$agreement == 0, -1, 1)
    # recode frequency in positive and negative
    object2$frequency <- object2$frequency * as.integer(object2$agreement)

    # generate position of bar labels, at least 0.5 away from the bar end
    offset <- (max(object2$frequency) + abs(min(object2$frequency))) * 0.05
    offset <- ifelse(offset < 0.5, 0.5, offset) # offset should be at least 0.5
    if (offset > abs(min(object2$frequency))) {
      offset <- abs(min(object2$frequency))
    }
    if (offset > max(object2$frequency)) {
      offset <- abs(min(object2$frequency))
    }
    object2$pos <- ifelse(object2$frequency > 0,
                          object2$frequency + offset,
                          object2$frequency - offset)

    # move 0 labels to the other side of the axis where necessary
    object2$pos[object2$frequency == 0] <- ifelse(object2$agreement[object2$frequency == 0] == 1,
                                                  object2$pos[object2$frequency == 0] * -1,
                                                  object2$pos[object2$frequency == 0])
    object2$label <- as.factor(abs(object2$frequency))
  } else {
    object2$count <- object2$frequency
    # set frequency of negative qualifiers to negative values
    object2$frequency <- ifelse(as.numeric(as.character(object2$agreement)) >= 0, object2$frequency,
                                object2$frequency * -1)
    # remove zero frequencies
    object2 <- object2[object2$frequency != 0, ]
    # generate position of bar labels
    object2$pos <- ifelse(object2$frequency > 0,
                          1.1,
                          -0.1)
    # Add labels of the form "count x level"
    object2$label <- paste(object2$count, object2$agreement, sep = " x ")
  }

  # Axis geometry: offset for the (dis-)agreement annotations and the
  # vertical intercept line separating agreement from disagreement
  offset <- (max(object2$frequency) + abs(min(object2$frequency))) * 0.05
  offset <- ifelse(offset < 0.5, 0.5, offset)
  yintercepts <- data.frame(x = c(0.5, length(unique(object2$entity)) + 0.5),
                            y = c(0, 0))
  high <- yintercepts$x[2] + 0.25

  object2 <- object2[order(as.numeric(as.character(object2$agreement)),
                           decreasing = FALSE), ]
  object2$agreement <- factor(object2$agreement, levels = w)

  # Plot
  g <- ggplot2::ggplot(object2,
                       ggplot2::aes(x = .data[["entity"]],
                                    y = .data[["frequency"]],
                                    fill = .data[["agreement"]],
                                    group = .data[["agreement"]],
                                    label = .data[["label"]]))
  if (binary) { # Bars for the binary case
    g <- g + ggplot2::geom_bar(ggplot2::aes(fill = .data[["color"]],
                                            color = .data[["text_color"]]),
                               stat = "identity",
                               width = barWidth,
                               show.legend = FALSE)
    # For the integer case with positive and negative values
  } else if (max(w) > 0 & min(w) < 0) {
    g <- g + ggplot2::geom_bar(ggplot2::aes(fill = .data[["color"]],
                                            color = .data[["text_color"]]),
                               stat = "identity",
                               width = barWidth,
                               show.legend = FALSE,
                               data = object2[as.numeric(as.character(object2$agreement)) >= 0, ],
                               position = ggplot2::position_stack(reverse = TRUE)) +
      ggplot2::geom_bar(ggplot2::aes(fill = .data[["color"]],
                                     color = .data[["text_color"]]),
                        stat = "identity",
                        width = barWidth,
                        show.legend = FALSE,
                        data = object2[as.numeric(as.character(object2$agreement)) < 0, ])
    # For the integer case with positive values only
  } else if (min(w) >= 0) {
    g <- g + ggplot2::geom_bar(ggplot2::aes(fill = .data[["color"]],
                                            color = .data[["text_color"]]),
                               stat = "identity",
                               width = barWidth,
                               show.legend = FALSE,
                               position = ggplot2::position_stack(reverse = TRUE))
    # For the integer case with negative values only
  } else {
    g <- g + ggplot2::geom_bar(ggplot2::aes(fill = .data[["color"]],
                                            color = .data[["text_color"]]),
                               stat = "identity",
                               width = barWidth,
                               show.legend = FALSE)
  }
  g <- g + ggplot2::coord_flip() +
    ggplot2::theme_minimal() +
    # Add intercept line
    ggplot2::geom_line(ggplot2::aes(x = .data[["x"]], y = .data[["y"]]),
                       data = yintercepts,
                       linewidth = axisWidth,
                       inherit.aes = FALSE) +
    # Remove all panel grids, axis titles and axis ticks and text for x-axis
    ggplot2::theme(panel.grid.major = ggplot2::element_blank(),
                   panel.grid.minor = ggplot2::element_blank(),
                   axis.title = ggplot2::element_blank(),
                   axis.ticks.y = ggplot2::element_blank(),
                   axis.text.x = ggplot2::element_blank(),
                   axis.text.y = ggplot2::element_text(size = fontSize))
  if (is.logical(colors)) {
    # literal color values are used as-is rather than mapped through a scale
    g <- g + ggplot2::scale_fill_identity() +
      ggplot2::scale_color_identity()
  }
  if (binary) { # Add entity labels for binary case
    g <- g +
      ggplot2::geom_text(ggplot2::aes(x = .data[["entity"]],
                                      y = .data[["pos"]],
                                      label = .data[["label"]]),
                         size = (fontSize / ggplot2::.pt),
                         inherit.aes = FALSE,
                         data = object2)
    # Add entity labels for integer case with positive and negative values
  } else if (max(w) > 0 & min(w) < 0) {
    g <- g +
      ggplot2::geom_text(ggplot2::aes(color = .data[["text_color"]]),
                         size = (fontSize / ggplot2::.pt),
                         position = ggplot2::position_stack(vjust = 0.5, reverse = TRUE),
                         inherit.aes = TRUE,
                         data = object2[object2$frequency >= 0, ]) +
      ggplot2::geom_text(ggplot2::aes(color = .data[["text_color"]]),
                         size = (fontSize / ggplot2::.pt),
                         position = ggplot2::position_stack(vjust = 0.5),
                         inherit.aes = TRUE,
                         data = object2[object2$frequency < 0, ])
    # Add entity labels for integer case with positive values only
  } else if (min(w) >= 0) {
    g <- g +
      ggplot2::geom_text(ggplot2::aes(color = .data[["text_color"]]),
                         size = (fontSize / ggplot2::.pt),
                         position = ggplot2::position_stack(vjust = 0.5, reverse = TRUE),
                         inherit.aes = TRUE)
  } else {
    g <- g +
      ggplot2::geom_text(ggplot2::aes(color = .data[["text_color"]]),
                         size = (fontSize / ggplot2::.pt),
                         position = ggplot2::position_stack(vjust = 0.5),
                         inherit.aes = TRUE)
  }
  if (lab) { # Add (dis-)agreement labels
    g <- g +
      ggplot2::annotate("text",
                        x = high,
                        y = offset * 2,
                        hjust = 0,
                        label = lab.pos,
                        size = (fontSize / ggplot2::.pt)) +
      ggplot2::annotate("text",
                        x = high,
                        y = 0 - offset * 2,
                        hjust = 1,
                        label = lab.neg,
                        size = (fontSize / ggplot2::.pt)) +
      # Truncate labels of entities
      ggplot2::scale_x_discrete(labels = sapply(as.character(object2$entity), function(e) if (nchar(e) > truncate) paste0(substr(e, 1, truncate - 1), "*") else e),
                                expand = c(0, 2, 0, 2),
                                limits = levels(object2$entity))
  } else {
    g <- g +
      # Truncate labels of entities
      ggplot2::scale_x_discrete(labels = sapply(as.character(object2$entity), function(e) if (nchar(e) > truncate) paste0(substr(e, 1, truncate - 1), "*") else e),
                                limits = levels(object2$entity))
  }
  return(g)
}
+#' Compute multiple cluster solutions for a discourse network +#' +#' Compute multiple cluster solutions for a discourse network. +#' +#' This function applies a number of different graph clustering techniques to +#' a discourse network dataset. The user provides many of the same arguments as +#' in the \code{\link{dna_network}} function and a few additional arguments that +#' determine which kinds of clustering methods should be used and how. In +#' particular, the \code{k} argument can be \code{0} (for arbitrary numbers of +#' clusters) or any positive integer value (e.g., \code{2}, for constraining the +#' number of clusters to exactly \code{k} groups). This is useful for assessing +#' the polarization of a discourse network. +#' +#' In particular, the function can be used to compute the maximal modularity of +#' a smoothed time series of discourse networks using the \code{timeWindow} and +#' \code{windowSize} arguments for a given \code{k} across a number of +#' clustering methods. +#' +#' It is also possible to switch off all but one clustering method using the +#' respective arguments and carry out a simple cluster analysis with the method +#' of choice for a certain time span of the discourse network, without any time +#' window options. +#' +#' @param saveObjects Store the original output of the respective clustering +#' method in the \code{cl} slot of the return object? If \code{TRUE}, one +#' cluster object per time point will be saved, for all time points for which +#' network data are available. At each time point, only the cluster object +#' with the highest modularity score will be saved, all others discarded. The +#' \code{max_mod} slot of the object contains additional information on which +#' measure was saved at each time point and what the corresponding modularity +#' score is. +#' @param k The number of clusters to compute. 
This constrains the choice of +#' clustering methods because some methods require a predefined \code{k} while +#' other methods do not. To permit arbitrary numbers of clusters, depending on +#' the respective algorithm (or the value of modularity in some cases), choose +#' \code{k = 0}. This corresponds to the theoretical notion of +#' "multipolarization". For "bipolarization", choose \code{k = 2} in order to +#' constrain the cluster solutions to exactly two groups. +#' @param k.max If \code{k = 0}, there can be arbitrary numbers of clusters. In +#' this case, \code{k.max} sets the maximal number of clusters that can be +#' identified. +#' @param single Include hierarchical clustering with single linkage in the pool +#' of clustering methods? The \code{\link[stats]{hclust}} function from +#' the \pkg{stats} package is applied to Jaccard distances in the affiliation +#' network for this purpose. Only valid if \code{k > 1}. +#' @param average Include hierarchical clustering with average linkage in the +#' pool of clustering methods? The \code{\link[stats]{hclust}} function from +#' the \pkg{stats} package is applied to Jaccard distances in the affiliation +#' network for this purpose. Only valid if \code{k > 1}. +#' @param complete Include hierarchical clustering with complete linkage in the +#' pool of clustering methods? The \code{\link[stats]{hclust}} function from +#' the \pkg{stats} package is applied to Jaccard distances in the affiliation +#' network for this purpose. Only valid if \code{k > 1}. +#' @param ward Include hierarchical clustering with Ward's algorithm in the +#' pool of clustering methods? The \code{\link[stats]{hclust}} function from +#' the \pkg{stats} package is applied to Jaccard distances in the affiliation +#' network for this purpose. If \code{k = 0} is selected, different solutions +#' with varying \code{k} are attempted, and the solution with the highest +#' modularity is retained. 
+#' @param kmeans Include k-means clustering in the pool of clustering methods? +#' The \code{\link[stats]{kmeans}} function from the \pkg{stats} package is +#' applied to Jaccard distances in the affiliation network for this purpose. +#' If \code{k = 0} is selected, different solutions with varying \code{k} are +#' attempted, and the solution with the highest modularity is retained. +#' @param pam Include partitioning around medoids in the pool of clustering +#' methods? The \code{\link[cluster]{pam}} function from the \pkg{cluster} +#' package is applied to Jaccard distances in the affiliation network for this +#' purpose. If \code{k = 0} is selected, different solutions with varying +#' \code{k} are attempted, and the solution with the highest modularity is +#' retained. +#' @param equivalence Include equivalence clustering (as implemented in the +#' \code{\link[sna]{equiv.clust}} function in the \pkg{sna} package), based on +#' shortest path distances between nodes (as implemented in the +#' \code{\link[sna]{sedist}} function in the \pkg{sna} package) in the +#' positive subtract network? If \code{k = 0} is selected, different solutions +#' with varying \code{k} are attempted, and the solution with the highest +#' modularity is retained. +#' @param concor_one Include CONvergence of iterative CORrelations (CONCOR) in +#' the pool of clustering methods? The algorithm is applied to the positive +#' subtract network to identify \code{k = 2} clusters. The method is omitted +#' if \code{k != 2}. +#' @param concor_two Include CONvergence of iterative CORrelations (CONCOR) in +#' the pool of clustering methods? The algorithm is applied to the affiliation +#' network to identify \code{k = 2} clusters. The method is omitted +#' if \code{k != 2}. +#' @param louvain Include the Louvain community detection algorithm in the pool +#' of clustering methods? 
The \code{\link[igraph]{cluster_louvain}} function +#' in the \pkg{igraph} package is applied to the positive subtract network for +#' this purpose. +#' @param fastgreedy Include the fast and greedy community detection algorithm +#' in the pool of clustering methods? The +#' \code{\link[igraph]{cluster_fast_greedy}} function in the \pkg{igraph} +#' package is applied to the positive subtract network for this purpose. +#' @param walktrap Include the Walktrap community detection algorithm +#' in the pool of clustering methods? The +#' \code{\link[igraph]{cluster_walktrap}} function in the \pkg{igraph} +#' package is applied to the positive subtract network for this purpose. +#' @param leading_eigen Include the leading eigenvector community detection +#' algorithm in the pool of clustering methods? The +#' \code{\link[igraph]{cluster_leading_eigen}} function in the \pkg{igraph} +#' package is applied to the positive subtract network for this purpose. +#' @param edge_betweenness Include the edge betweenness community detection +#' algorithm by Girvan and Newman in the pool of clustering methods? The +#' \code{\link[igraph]{cluster_edge_betweenness}} function in the \pkg{igraph} +#' package is applied to the positive subtract network for this purpose. +#' @param infomap Include the infomap community detection algorithm +#' in the pool of clustering methods? The +#' \code{\link[igraph]{cluster_infomap}} function in the \pkg{igraph} +#' package is applied to the positive subtract network for this purpose. +#' @param label_prop Include the label propagation community detection algorithm +#' in the pool of clustering methods? The +#' \code{\link[igraph]{cluster_label_prop}} function in the \pkg{igraph} +#' package is applied to the positive subtract network for this purpose. +#' @param spinglass Include the spinglass community detection algorithm +#' in the pool of clustering methods? 
The +#' \code{\link[igraph]{cluster_spinglass}} function in the \pkg{igraph} +#' package is applied to the positive subtract network for this purpose. Note +#' that this method is disabled by default because it is relatively slow. +#' @inheritParams dna_network +#' +#' @return The function creates a \code{dna_multiclust} object, which contains +#' the following items: +#' \describe{ +#' \item{k}{The number of clusters determined by the user.} +#' \item{cl}{Cluster objects returned by the respective cluster function. If +#' multiple methods are used, this returns the object with the highest +#' modularity.} +#' \item{max_mod}{A data frame with one row per time point (that is, only one +#' row in the default case and multiple rows if time windows are used) and +#' the maximal modularity for the given time point across all cluster +#' methods.} +#' \item{modularity}{A data frame with the modularity values for all separate +#' cluster methods and all time points.} +#' \item{membership}{A large data frame with all nodes' membership information +#' for each time point and each clustering method.} +#' } +#' +#' @author Philip Leifeld +#' +#' @examples +#' \dontrun{ +#' library("rDNA") +#' dna_init() +#' samp <- dna_sample() +#' dna_openDatabase(samp, coderId = 1, coderPassword = "sample") +#' +#' # example 1: compute 12 cluster solutions for one time point +#' mc1 <- dna_multiclust(variable1 = "organization", +#' variable2 = "concept", +#' qualifier = "agreement", +#' duplicates = "document", +#' k = 0, # flexible numbers of clusters +#' saveObjects = TRUE) # retain hclust object +#' +#' mc1$modularity # return modularity scores for 12 clustering methods +#' mc1$max_mod # return the maximal value of the 12, along with dates +#' mc1$memberships # return cluster memberships for all 12 cluster methods +#' plot(mc1$cl[[1]]) # plot hclust dendrogram +#' +#' # example 2: compute only Girvan-Newman edge betweenness with two clusters +#' set.seed(12345) +#' mc2 <- 
dna_multiclust(k = 2, +#' single = FALSE, +#' average = FALSE, +#' complete = FALSE, +#' ward = FALSE, +#' kmeans = FALSE, +#' pam = FALSE, +#' equivalence = FALSE, +#' concor_one = FALSE, +#' concor_two = FALSE, +#' louvain = FALSE, +#' fastgreedy = FALSE, +#' walktrap = FALSE, +#' leading_eigen = FALSE, +#' edge_betweenness = TRUE, +#' infomap = FALSE, +#' label_prop = FALSE, +#' spinglass = FALSE) +#' mc2$memberships # return membership in two clusters +#' mc2$modularity # return modularity of the cluster solution +#' +#' # example 3: smoothed modularity using time window algorithm +#' mc3 <- dna_multiclust(k = 2, +#' timeWindow = "events", +#' windowSize = 28) +#' mc3$max_mod # maximal modularity and method per time point +#' } +#' +#' @rdname dna_multiclust +#' @importFrom stats as.dist cor hclust cutree kmeans +#' @export +dna_multiclust <- function(statementType = "DNA Statement", + variable1 = "organization", + variable1Document = FALSE, + variable2 = "concept", + variable2Document = FALSE, + qualifier = "agreement", + duplicates = "include", + start.date = "01.01.1900", + stop.date = "31.12.2099", + start.time = "00:00:00", + stop.time = "23:59:59", + timeWindow = "no", + windowSize = 100, + excludeValues = list(), + excludeAuthors = character(), + excludeSources = character(), + excludeSections = character(), + excludeTypes = character(), + invertValues = FALSE, + invertAuthors = FALSE, + invertSources = FALSE, + invertSections = FALSE, + invertTypes = FALSE, + saveObjects = FALSE, + k = 0, + k.max = 5, + single = TRUE, + average = TRUE, + complete = TRUE, + ward = TRUE, + kmeans = TRUE, + pam = TRUE, + equivalence = TRUE, + concor_one = TRUE, + concor_two = TRUE, + louvain = TRUE, + fastgreedy = TRUE, + walktrap = TRUE, + leading_eigen = TRUE, + edge_betweenness = TRUE, + infomap = TRUE, + label_prop = TRUE, + spinglass = FALSE) { + + # check dependencies + if (!requireNamespace("igraph", quietly = TRUE)) { # version 0.8.1 required for edge betweenness 
to work fine. + stop("The 'dna_multiclust' function requires the 'igraph' package to be installed.\n", + "To do this, enter 'install.packages(\"igraph\")'.") + } else if (packageVersion("igraph") < "0.8.1" && edge_betweenness) { + warning("Package version of 'igraph' < 0.8.1. If edge betweenness algorithm encounters an empty network matrix, this will let R crash. See here: https://github.com/igraph/rigraph/issues/336. Consider updating 'igraph' to the latest version.") + } + if (pam && !requireNamespace("cluster", quietly = TRUE)) { + pam <- FALSE + warning("Argument 'pam = TRUE' requires the 'cluster' package, which is not installed.\nSetting 'pam = FALSE'. Consider installing the 'cluster' package.") + } + if (equivalence && !requireNamespace("sna", quietly = TRUE)) { + equivalence <- FALSE + warning("Argument 'equivalence = TRUE' requires the 'sna' package, which is not installed.\nSetting 'equivalence = FALSE'. Consider installing the 'sna' package.") + } + + # check argument validity + if (is.null(k) || is.na(k) || !is.numeric(k) || length(k) > 1 || is.infinite(k) || k < 0) { + stop("'k' must be a non-negative integer number. Can be 0 for flexible numbers of clusters.") + } + if (is.null(k.max) || is.na(k.max) || !is.numeric(k.max) || length(k.max) > 1 || is.infinite(k.max) || k.max < 1) { + stop("'k.max' must be a positive integer number.") + } + if (k == 1) { + k <- 0 + warning("'k' must be 0 (for arbitrary numbers of clusters) or larger than 1 (to constrain number of clusters). 
Using 'k = 0'.") + } + + # determine what kind of two-mode network to create + if (is.null(qualifier) || is.na(qualifier) || !is.character(qualifier)) { + qualifierAggregation <- "ignore" + } else { + v <- dna_getVariables(statementType = statementType) + if (v$type[v$label == qualifier] == "boolean") { + qualifierAggregation <- "combine" + } else { + qualifierAggregation <- "subtract" + } + } + + nw_aff <- dna_network(networkType = "twomode", + statementType = statementType, + variable1 = variable1, + variable1Document = variable1Document, + variable2 = variable2, + variable2Document = variable2Document, + qualifier = qualifier, + qualifierAggregation = qualifierAggregation, + normalization = "no", + duplicates = duplicates, + start.date = start.date, + stop.date = stop.date, + start.time = start.time, + stop.time = stop.time, + timeWindow = timeWindow, + windowSize = windowSize, + excludeValues = excludeValues, + excludeAuthors = excludeAuthors, + excludeSources = excludeSources, + excludeSections = excludeSections, + excludeTypes = excludeTypes, + invertValues = invertValues, + invertAuthors = invertAuthors, + invertSources = invertSources, + invertSections = invertSections, + invertTypes = invertTypes) + nw_sub <- dna_network(networkType = "onemode", + statementType = statementType, + variable1 = variable1, + variable1Document = variable1Document, + variable2 = variable2, + variable2Document = variable2Document, + qualifier = qualifier, + qualifierAggregation = "subtract", + normalization = "average", + duplicates = duplicates, + start.date = start.date, + stop.date = stop.date, + start.time = start.time, + stop.time = stop.time, + timeWindow = timeWindow, + windowSize = windowSize, + excludeValues = excludeValues, + excludeAuthors = excludeAuthors, + excludeSources = excludeSources, + excludeSections = excludeSections, + excludeTypes = excludeTypes, + invertValues = invertValues, + invertAuthors = invertAuthors, + invertSources = invertSources, + 
invertSections = invertSections, + invertTypes = invertTypes) + + if (timeWindow == "no") { + dta <- list() + dta$networks <- list(nw_sub) + nw_sub <- dta + dta <- list() + dta$networks <- list(nw_aff) + nw_aff <- dta + } + + obj <- list() + if (isTRUE(saveObjects)) { + obj$cl <- list() + } + dta_dat <- list() + dta_mem <- list() + dta_mod <- list() + counter <- 1 + if ("dna_network_onemode_timewindows" %in% class(nw_sub)) { + num_networks <- length(nw_sub) + } else { + num_networks <- 1 + } + for (i in 1:num_networks) { + + # prepare dates + if (timeWindow == "no") { + dta_dat[[i]] <- data.frame(i = i, + start = attributes(nw_sub$networks[[i]])$start, + stop = attributes(nw_sub$networks[[i]])$stop) + } else { + dta_dat[[i]] <- data.frame(i = i, + start.date = attributes(nw_sub[[i]])$start, + middle.date = attributes(nw_sub[[i]])$middle, + stop.date = attributes(nw_sub[[i]])$stop) + } + + # prepare two-mode network + if ("dna_network_onemode_timewindows" %in% class(nw_sub)) { + x <- nw_aff[[i]] + } else { + x <- nw_aff$networks[[i]] + } + if (qualifierAggregation == "combine") { + combined <- cbind(apply(x, 1:2, function(x) ifelse(x %in% c(1, 3), 1, 0)), + apply(x, 1:2, function(x) ifelse(x %in% c(2, 3), 1, 0))) + } else { + combined <- x + } + combined <- combined[rowSums(combined) > 0, , drop = FALSE] + rn <- rownames(combined) + + # Jaccard distances for two-mode network (could be done using vegdist function in vegan package, but saving the dependency) + combined <- matrix(as.integer(combined > 0), nrow = nrow(combined)) # probably not necessary, but ensure it's an integer matrix + intersections <- tcrossprod(combined) # compute intersections using cross-product + row_sums <- rowSums(combined) # compute row sums + unions <- matrix(outer(row_sums, row_sums, `+`), ncol = length(row_sums)) - intersections # compute unions + jaccard_similarities <- intersections / unions # calculate Jaccard similarities + jaccard_similarities[is.nan(jaccard_similarities)] <- 0 # 
avoid division by zero + jaccard_distances <- 1 - jaccard_similarities # convert to Jaccard distances + rownames(jaccard_distances) <- rn # re-attach the row names + jac <- stats::as.dist(jaccard_distances) # convert to dist object + + # prepare one-mode network + if ("dna_network_onemode_timewindows" %in% class(nw_sub)) { + y <- nw_sub[[i]] + } else { + y <- nw_sub$networks[[i]] + } + y[y < 0] <- 0 + class(y) <- "matrix" + g <- igraph::graph_from_adjacency_matrix(y, mode = "undirected", weighted = TRUE) + + if (nrow(combined) > 1) { + counter_current <- 1 + current_cl <- list() + current_mod <- numeric() + + # Hierarchical clustering with single linkage + if (isTRUE(single) && k > 1) { + try({ + suppressWarnings(cl <- stats::hclust(jac, method = "single")) + mem <- stats::cutree(cl, k = k) + dta_mem[[counter]] <- data.frame(i = rep(i, length(mem)), + method = rep("Hierarchical (Single)", length(mem)), + node = rownames(x), + cluster = mem, + stringsAsFactors = FALSE) + dta_mod[[counter]] <- data.frame(i = i, + method = "Hierarchical (Single)", + k = k, + modularity = igraph::modularity(x = g, membership = mem), + stringsAsFactors = FALSE) + if (isTRUE(saveObjects)) { + current_cl[[counter_current]] <- cl + current_mod[counter_current] <- dta_mod[[counter]]$modularity[nrow(dta_mod[[counter]])] + counter_current <- counter_current + 1 + } + counter <- counter + 1 + }, silent = TRUE) + } + + # Hierarchical clustering with single linkage with optimal k + if (isTRUE(single) && k < 2) { + try({ + suppressWarnings(cl <- stats::hclust(jac, method = "single")) + opt_k <- lapply(2:k.max, function(x) { + mem <- stats::cutree(cl, k = x) + mod <- igraph::modularity(x = g, membership = mem) + return(list(mem = mem, mod = mod)) + }) + mod <- sapply(opt_k, function(x) x$mod) + kk <- which.max(mod) + mod <- max(mod) + mem <- opt_k[[kk]]$mem + dta_mem[[counter]] <- data.frame(i = rep(i, length(mem)), + method = rep("Hierarchical (Single)", length(mem)), + node = rownames(x), + 
cluster = mem, + stringsAsFactors = FALSE) + dta_mod[[counter]] <- data.frame(i = i, + method = "Hierarchical (Single)", + k = kk + 1, # add one because the series started with k = 2 + modularity = mod, + stringsAsFactors = FALSE) + if (isTRUE(saveObjects)) { + current_cl[[counter_current]] <- cl + current_mod[counter_current] <- dta_mod[[counter]]$modularity[nrow(dta_mod[[counter]])] + counter_current <- counter_current + 1 + } + counter <- counter + 1 + }, silent = TRUE) + } + + # Hierarchical clustering with average linkage + if (isTRUE(average) && k > 1) { + try({ + suppressWarnings(cl <- stats::hclust(jac, method = "average")) + mem <- stats::cutree(cl, k = k) + dta_mem[[counter]] <- data.frame(i = rep(i, length(mem)), + method = rep("Hierarchical (Average)", length(mem)), + node = rownames(x), + cluster = mem, + stringsAsFactors = FALSE) + dta_mod[[counter]] <- data.frame(i = i, + method = "Hierarchical (Average)", + k = k, + modularity = igraph::modularity(x = g, membership = mem), + stringsAsFactors = FALSE) + if (isTRUE(saveObjects)) { + current_cl[[counter_current]] <- cl + current_mod[counter_current] <- dta_mod[[counter]]$modularity[nrow(dta_mod[[counter]])] + counter_current <- counter_current + 1 + } + counter <- counter + 1 + }, silent = TRUE) + } + + # Hierarchical clustering with average linkage with optimal k + if (isTRUE(average) && k < 2) { + try({ + suppressWarnings(cl <- stats::hclust(jac, method = "average")) + opt_k <- lapply(2:k.max, function(x) { + mem <- stats::cutree(cl, k = x) + mod <- igraph::modularity(x = g, membership = mem) + return(list(mem = mem, mod = mod)) + }) + mod <- sapply(opt_k, function(x) x$mod) + kk <- which.max(mod) + mod <- max(mod) + mem <- opt_k[[kk]]$mem + dta_mem[[counter]] <- data.frame(i = rep(i, length(mem)), + method = rep("Hierarchical (Average)", length(mem)), + node = rownames(x), + cluster = mem, + stringsAsFactors = FALSE) + dta_mod[[counter]] <- data.frame(i = i, + method = "Hierarchical (Average)", + k 
= kk + 1, # add one because the series started with k = 2 + modularity = mod, + stringsAsFactors = FALSE) + if (isTRUE(saveObjects)) { + current_cl[[counter_current]] <- cl + current_mod[counter_current] <- dta_mod[[counter]]$modularity[nrow(dta_mod[[counter]])] + counter_current <- counter_current + 1 + } + counter <- counter + 1 + }, silent = TRUE) + } + + # Hierarchical clustering with complete linkage + if (isTRUE(complete) && k > 1) { + try({ + suppressWarnings(cl <- stats::hclust(jac, method = "complete")) + mem <- stats::cutree(cl, k = k) + dta_mem[[counter]] <- data.frame(i = rep(i, length(mem)), + method = rep("Hierarchical (Complete)", length(mem)), + node = rownames(x), + cluster = mem, + stringsAsFactors = FALSE) + dta_mod[[counter]] <- data.frame(i = i, + method = "Hierarchical (Complete)", + k = k, + modularity = igraph::modularity(x = g, membership = mem), + stringsAsFactors = FALSE) + if (isTRUE(saveObjects)) { + current_cl[[counter_current]] <- cl + current_mod[counter_current] <- dta_mod[[counter]]$modularity[nrow(dta_mod[[counter]])] + counter_current <- counter_current + 1 + } + counter <- counter + 1 + }, silent = TRUE) + } + + # Hierarchical clustering with complete linkage with optimal k + if (isTRUE(complete) && k < 2) { + try({ + suppressWarnings(cl <- stats::hclust(jac, method = "complete")) + opt_k <- lapply(2:k.max, function(x) { + mem <- stats::cutree(cl, k = x) + mod <- igraph::modularity(x = g, membership = mem) + return(list(mem = mem, mod = mod)) + }) + mod <- sapply(opt_k, function(x) x$mod) + kk <- which.max(mod) + mod <- max(mod) + mem <- opt_k[[kk]]$mem + dta_mem[[counter]] <- data.frame(i = rep(i, length(mem)), + method = rep("Hierarchical (Complete)", length(mem)), + node = rownames(x), + cluster = mem, + stringsAsFactors = FALSE) + dta_mod[[counter]] <- data.frame(i = i, + method = "Hierarchical (Complete)", + k = kk + 1, # add one because the series started with k = 2 + modularity = mod, + stringsAsFactors = FALSE) + if 
(isTRUE(saveObjects)) { + current_cl[[counter_current]] <- cl + current_mod[counter_current] <- dta_mod[[counter]]$modularity[nrow(dta_mod[[counter]])] + counter_current <- counter_current + 1 + } + counter <- counter + 1 + }, silent = TRUE) + } + + # Hierarchical clustering with the Ward algorithm + if (isTRUE(ward) && k > 1) { + try({ + suppressWarnings(cl <- stats::hclust(jac, method = "ward.D2")) + mem <- stats::cutree(cl, k = k) + dta_mem[[counter]] <- data.frame(i = rep(i, length(mem)), + method = rep("Hierarchical (Ward)", length(mem)), + node = rownames(x), + cluster = mem, + stringsAsFactors = FALSE) + dta_mod[[counter]] <- data.frame(i = i, + method = "Hierarchical (Ward)", + k = k, + modularity = igraph::modularity(x = g, membership = mem), + stringsAsFactors = FALSE) + if (isTRUE(saveObjects)) { + current_cl[[counter_current]] <- cl + current_mod[counter_current] <- dta_mod[[counter]]$modularity[nrow(dta_mod[[counter]])] + counter_current <- counter_current + 1 + } + counter <- counter + 1 + }, silent = TRUE) + } + + # Hierarchical clustering with the Ward algorithm with optimal k + if (isTRUE(ward) && k < 2) { + try({ + suppressWarnings(cl <- stats::hclust(jac, method = "ward.D2")) + opt_k <- lapply(2:k.max, function(x) { + mem <- stats::cutree(cl, k = x) + mod <- igraph::modularity(x = g, membership = mem) + return(list(mem = mem, mod = mod)) + }) + mod <- sapply(opt_k, function(x) x$mod) + kk <- which.max(mod) + mod <- max(mod) + mem <- opt_k[[kk]]$mem + dta_mem[[counter]] <- data.frame(i = rep(i, length(mem)), + method = rep("Hierarchical (Ward)", length(mem)), + node = rownames(x), + cluster = mem, + stringsAsFactors = FALSE) + dta_mod[[counter]] <- data.frame(i = i, + method = "Hierarchical (Ward)", + k = kk + 1, # add one because the series started with k = 2 + modularity = mod, + stringsAsFactors = FALSE) + if (isTRUE(saveObjects)) { + current_cl[[counter_current]] <- cl + current_mod[counter_current] <- 
dta_mod[[counter]]$modularity[nrow(dta_mod[[counter]])] + counter_current <- counter_current + 1 + } + counter <- counter + 1 + }, silent = TRUE) + } + + # k-means + if (isTRUE(kmeans) && k > 1) { + try({ + suppressWarnings(cl <- stats::kmeans(jac, centers = k)) + mem <- cl$cluster + dta_mem[[counter]] <- data.frame(i = rep(i, length(mem)), + method = rep("k-Means", length(mem)), + node = rownames(x), + cluster = mem, + stringsAsFactors = FALSE) + dta_mod[[counter]] <- data.frame(i = i, + method = "k-Means", + k = k, + modularity = igraph::modularity(x = g, membership = mem), + stringsAsFactors = FALSE) + if (isTRUE(saveObjects)) { + current_cl[[counter_current]] <- cl + current_mod[counter_current] <- dta_mod[[counter]]$modularity[nrow(dta_mod[[counter]])] + counter_current <- counter_current + 1 + } + counter <- counter + 1 + }, silent = TRUE) + } + + # k-means with optimal k + if (isTRUE(kmeans) && k < 2) { + try({ + opt_k <- lapply(2:k.max, function(x) { + suppressWarnings(cl <- stats::kmeans(jac, centers = x)) + mem <- cl$cluster + mod <- igraph::modularity(x = g, membership = mem) + return(list(cl = cl, mem = mem, mod = mod)) + }) + mod <- sapply(opt_k, function(x) x$mod) + kk <- which.max(mod) + mod <- max(mod) + mem <- opt_k[[kk]]$mem + dta_mem[[counter]] <- data.frame(i = rep(i, length(mem)), + method = rep("k-Means", length(mem)), + node = rownames(x), + cluster = mem, + stringsAsFactors = FALSE) + dta_mod[[counter]] <- data.frame(i = i, + method = "k-Means", + k = kk + 1, # add one because the series started with k = 2 + modularity = mod, + stringsAsFactors = FALSE) + if (isTRUE(saveObjects)) { + cl <- opt_k[[kk]]$cl + current_cl[[counter_current]] <- cl + current_mod[counter_current] <- dta_mod[[counter]]$modularity[nrow(dta_mod[[counter]])] + counter_current <- counter_current + 1 + } + counter <- counter + 1 + }, silent = TRUE) + } + + # pam + if (isTRUE(pam) && k > 1) { + try({ + suppressWarnings(cl <- cluster::pam(jac, k = k)) + mem <- cl$cluster + 
dta_mem[[counter]] <- data.frame(i = rep(i, length(mem)), + method = rep("Partitioning around Medoids", length(mem)), + node = rownames(x), + cluster = mem, + stringsAsFactors = FALSE) + dta_mod[[counter]] <- data.frame(i = i, + method = "Partitioning around Medoids", + k = k, + modularity = igraph::modularity(x = g, membership = mem), + stringsAsFactors = FALSE) + if (isTRUE(saveObjects)) { + current_cl[[counter_current]] <- cl + current_mod[counter_current] <- dta_mod[[counter]]$modularity[nrow(dta_mod[[counter]])] + counter_current <- counter_current + 1 + } + counter <- counter + 1 + }, silent = TRUE) + } + + # pam with optimal k + if (isTRUE(pam) && k < 2) { + try({ + opt_k <- lapply(2:k.max, function(x) { + suppressWarnings(cl <- cluster::pam(jac, k = x)) + mem <- cl$cluster + mod <- igraph::modularity(x = g, membership = mem) + return(list(cl = cl, mem = mem, mod = mod)) + }) + mod <- sapply(opt_k, function(x) x$mod) + kk <- which.max(mod) + mod <- max(mod) + mem <- opt_k[[kk]]$mem + dta_mem[[counter]] <- data.frame(i = rep(i, length(mem)), + method = rep("Partitioning around Medoids", length(mem)), + node = rownames(x), + cluster = mem, + stringsAsFactors = FALSE) + dta_mod[[counter]] <- data.frame(i = i, + method = "Partitioning around Medoids", + k = kk + 1, # add one because the series started with k = 2 + modularity = mod, + stringsAsFactors = FALSE) + if (isTRUE(saveObjects)) { + cl <- opt_k[[kk]]$cl + current_cl[[counter_current]] <- cl + current_mod[counter_current] <- dta_mod[[counter]]$modularity[nrow(dta_mod[[counter]])] + counter_current <- counter_current + 1 + } + counter <- counter + 1 + }, silent = TRUE) + } + + # Equivalence clustering + if (isTRUE(equivalence) && k > 1) { + try({ + suppressWarnings(cl <- sna::equiv.clust(y, equiv.dist = sna::sedist(y, method = "euclidean"))) + mem <- stats::cutree(cl$cluster, k = k) + dta_mem[[counter]] <- data.frame(i = rep(i, length(mem)), + method = rep("Equivalence", length(mem)), + node = rownames(x), 
+ cluster = mem, + stringsAsFactors = FALSE) + dta_mod[[counter]] <- data.frame(i = i, + method = "Equivalence", + k = k, + modularity = igraph::modularity(x = g, membership = mem), + stringsAsFactors = FALSE) + if (isTRUE(saveObjects)) { + current_cl[[counter_current]] <- cl + current_mod[counter_current] <- dta_mod[[counter]]$modularity[nrow(dta_mod[[counter]])] + counter_current <- counter_current + 1 + } + counter <- counter + 1 + }, silent = TRUE) + } + + # Equivalence clustering with optimal k + if (isTRUE(equivalence) && k < 2) { + try({ + suppressWarnings(cl <- sna::equiv.clust(y, equiv.dist = sna::sedist(y, method = "euclidean"))) + opt_k <- lapply(2:k.max, function(x) { + mem <- stats::cutree(cl$cluster, k = x) + mod <- igraph::modularity(x = g, membership = mem) + return(list(mem = mem, mod = mod)) + }) + mod <- sapply(opt_k, function(x) x$mod) + kk <- which.max(mod) + mod <- max(mod) + mem <- opt_k[[kk]]$mem + dta_mem[[counter]] <- data.frame(i = rep(i, length(mem)), + method = rep("Equivalence", length(mem)), + node = rownames(x), + cluster = mem, + stringsAsFactors = FALSE) + dta_mod[[counter]] <- data.frame(i = i, + method = "Equivalence", + k = kk + 1, # add one because the series started with k = 2 + modularity = mod, + stringsAsFactors = FALSE) + if (isTRUE(saveObjects)) { + current_cl[[counter_current]] <- cl + current_mod[counter_current] <- dta_mod[[counter]]$modularity[nrow(dta_mod[[counter]])] + counter_current <- counter_current + 1 + } + counter <- counter + 1 + }, silent = TRUE) + } + + # CONCOR based on the positive subtract network + if (isTRUE(concor_one) && k %in% c(0, 2)) { + try({ + suppressWarnings(mi <- stats::cor(y)) + iter <- 1 + while (any(abs(mi) <= 0.999) & iter <= 50) { + mi[is.na(mi)] <- 0 + mi <- stats::cor(mi) + iter <- iter + 1 + } + mem <- ((mi[, 1] > 0) * 1) + 1 + dta_mem[[counter]] <- data.frame(i = rep(i, length(mem)), + method = rep("CONCOR (One-Mode)", length(mem)), + node = rownames(x), + cluster = mem, + 
stringsAsFactors = FALSE) + dta_mod[[counter]] <- data.frame(i = i, + method = "CONCOR (One-Mode)", + k = 2, + modularity = igraph::modularity(x = g, membership = mem), + stringsAsFactors = FALSE) + if (isTRUE(saveObjects)) { + current_cl[[counter_current]] <- mem + current_mod[counter_current] <- dta_mod[[counter]]$modularity[nrow(dta_mod[[counter]])] + counter_current <- counter_current + 1 + } + counter <- counter + 1 + }, silent = TRUE) + } + + # CONCOR based on the combined affiliation network + if (isTRUE(concor_two) && k %in% c(0, 2)) { + try({ + suppressWarnings(mi <- stats::cor(t(combined))) + iter <- 1 + while (any(abs(mi) <= 0.999) & iter <= 50) { + mi[is.na(mi)] <- 0 + mi <- stats::cor(mi) + iter <- iter + 1 + } + mem <- ((mi[, 1] > 0) * 1) + 1 + dta_mem[[counter]] <- data.frame(i = rep(i, length(mem)), + method = rep("CONCOR (Two-Mode)", length(mem)), + node = rownames(x), + cluster = mem, + stringsAsFactors = FALSE) + dta_mod[[counter]] <- data.frame(i = i, + method = "CONCOR (Two-Mode)", + k = 2, + modularity = igraph::modularity(x = g, membership = mem), + stringsAsFactors = FALSE) + if (isTRUE(saveObjects)) { + current_cl[[counter_current]] <- mem + current_mod[counter_current] <- dta_mod[[counter]]$modularity[nrow(dta_mod[[counter]])] + counter_current <- counter_current + 1 + } + counter <- counter + 1 + }, silent = TRUE) + } + + # Louvain clustering + if (isTRUE(louvain) && k < 2) { + try({ + suppressWarnings(cl <- igraph::cluster_louvain(g)) + mem <- igraph::membership(cl) + dta_mem[[counter]] <- data.frame(i = rep(i, length(mem)), + method = rep("Louvain", length(mem)), + node = rownames(x), + cluster = as.numeric(mem), + stringsAsFactors = FALSE) + dta_mod[[counter]] <- data.frame(i = i, + method = "Louvain", + k = max(as.numeric(mem)), + modularity = igraph::modularity(x = g, membership = mem), + stringsAsFactors = FALSE) + if (isTRUE(saveObjects)) { + current_cl[[counter_current]] <- cl + current_mod[counter_current] <- 
dta_mod[[counter]]$modularity[nrow(dta_mod[[counter]])] + counter_current <- counter_current + 1 + } + counter <- counter + 1 + }, silent = TRUE) + } + + # Fast & Greedy community detection (with or without cut) + if (isTRUE(fastgreedy)) { + try({ + suppressWarnings(cl <- igraph::cluster_fast_greedy(g, merges = TRUE)) + if (k == 0) { + mem <- igraph::membership(cl) + } else { + mem <- suppressWarnings(igraph::cut_at(cl, no = k)) + if ((k + 1) %in% as.numeric(mem)) { + stop() + } + } + dta_mem[[counter]] <- data.frame(i = rep(i, length(mem)), + method = rep("Fast & Greedy", length(mem)), + node = rownames(x), + cluster = as.numeric(mem), + stringsAsFactors = FALSE) + dta_mod[[counter]] <- data.frame(i = i, + method = "Fast & Greedy", + k = ifelse(k == 0, max(as.numeric(mem)), k), + modularity = igraph::modularity(x = g, membership = mem), + stringsAsFactors = FALSE) + if (isTRUE(saveObjects)) { + current_cl[[counter_current]] <- cl + current_mod[counter_current] <- dta_mod[[counter]]$modularity[nrow(dta_mod[[counter]])] + counter_current <- counter_current + 1 + } + counter <- counter + 1 + }, silent = TRUE) + } + + # Walktrap community detection (with or without cut) + if (isTRUE(walktrap)) { + try({ + suppressWarnings(cl <- igraph::cluster_walktrap(g, merges = TRUE)) + if (k == 0) { + mem <- igraph::membership(cl) + } else { + mem <- suppressWarnings(igraph::cut_at(cl, no = k)) + if ((k + 1) %in% as.numeric(mem)) { + stop() + } + } + dta_mem[[counter]] <- data.frame(i = rep(i, length(mem)), + method = rep("Walktrap", length(mem)), + node = rownames(x), + cluster = as.numeric(mem), + stringsAsFactors = FALSE) + dta_mod[[counter]] <- data.frame(i = i, + method = "Walktrap", + k = ifelse(k == 0, max(as.numeric(mem)), k), + modularity = igraph::modularity(x = g, membership = mem), + stringsAsFactors = FALSE) + if (isTRUE(saveObjects)) { + current_cl[[counter_current]] <- cl + current_mod[counter_current] <- dta_mod[[counter]]$modularity[nrow(dta_mod[[counter]])] + 
counter_current <- counter_current + 1 + } + counter <- counter + 1 + }, silent = TRUE) + } + + # Leading Eigenvector community detection (only without cut) + if (isTRUE(leading_eigen) && k < 2) { # it *should* work with cut_at because is.hierarchical(cl) returns TRUE, but it never works... + try({ + suppressWarnings(cl <- igraph::cluster_leading_eigen(g)) + mem <- igraph::membership(cl) + dta_mem[[counter]] <- data.frame(i = rep(i, length(mem)), + method = rep("Leading Eigenvector", length(mem)), + node = rownames(x), + cluster = as.numeric(mem), + stringsAsFactors = FALSE) + dta_mod[[counter]] <- data.frame(i = i, + method = "Leading Eigenvector", + k = max(as.numeric(mem)), + modularity = igraph::modularity(x = g, membership = mem), + stringsAsFactors = FALSE) + if (isTRUE(saveObjects)) { + current_cl[[counter_current]] <- cl + current_mod[counter_current] <- dta_mod[[counter]]$modularity[nrow(dta_mod[[counter]])] + counter_current <- counter_current + 1 + } + counter <- counter + 1 + }, silent = TRUE) + } + + # Edge Betweenness community detection (with or without cut) + if (isTRUE(edge_betweenness)) { + try({ + suppressWarnings(cl <- igraph::cluster_edge_betweenness(g, merges = TRUE)) + if (k == 0) { + mem <- igraph::membership(cl) + } else { + mem <- suppressWarnings(igraph::cut_at(cl, no = k)) + if ((k + 1) %in% as.numeric(mem)) { + stop() + } + } + dta_mem[[counter]] <- data.frame(i = rep(i, length(mem)), + method = rep("Edge Betweenness", length(mem)), + node = rownames(x), + cluster = as.numeric(mem), + stringsAsFactors = FALSE) + dta_mod[[counter]] <- data.frame(i = i, + method = "Edge Betweenness", + k = ifelse(k == 0, max(as.numeric(mem)), k), + modularity = igraph::modularity(x = g, membership = mem), + stringsAsFactors = FALSE) + if (isTRUE(saveObjects)) { + current_cl[[counter_current]] <- cl + current_mod[counter_current] <- dta_mod[[counter]]$modularity[nrow(dta_mod[[counter]])] + counter_current <- counter_current + 1 + } + counter <- counter + 1 
+ }, silent = TRUE) + } + + # Infomap community detection + if (isTRUE(infomap) && k < 2) { + try({ + suppressWarnings(cl <- igraph::cluster_infomap(g)) + mem <- igraph::membership(cl) + dta_mem[[counter]] <- data.frame(i = rep(i, length(mem)), + method = rep("Infomap", length(mem)), + node = rownames(x), + cluster = as.numeric(mem), + stringsAsFactors = FALSE) + dta_mod[[counter]] <- data.frame(i = i, + method = "Infomap", + k = max(as.numeric(mem)), + modularity = igraph::modularity(x = g, membership = mem), + stringsAsFactors = FALSE) + if (isTRUE(saveObjects)) { + current_cl[[counter_current]] <- cl + current_mod[counter_current] <- dta_mod[[counter]]$modularity[nrow(dta_mod[[counter]])] + counter_current <- counter_current + 1 + } + counter <- counter + 1 + }, silent = TRUE) + } + + # Label Propagation community detection + if (isTRUE(label_prop) && k < 2) { + try({ + suppressWarnings(cl <- igraph::cluster_label_prop(g)) + mem <- igraph::membership(cl) + dta_mem[[counter]] <- data.frame(i = rep(i, length(mem)), + method = rep("Label Propagation", length(mem)), + node = rownames(x), + cluster = as.numeric(mem), + stringsAsFactors = FALSE) + dta_mod[[counter]] <- data.frame(i = i, + method = "Label Propagation", + k = max(as.numeric(mem)), + modularity = igraph::modularity(x = g, membership = mem), + stringsAsFactors = FALSE) + if (isTRUE(saveObjects)) { + current_cl[[counter_current]] <- cl + current_mod[counter_current] <- dta_mod[[counter]]$modularity[nrow(dta_mod[[counter]])] + counter_current <- counter_current + 1 + } + counter <- counter + 1 + }, silent = TRUE) + } + + # Spinglass community detection + if (isTRUE(spinglass) && k < 2) { + try({ + suppressWarnings(cl <- igraph::cluster_spinglass(g)) + mem <- igraph::membership(cl) + dta_mem[[counter]] <- data.frame(i = rep(i, length(mem)), + method = rep("Spinglass", length(mem)), + node = rownames(x), + cluster = as.numeric(mem), + stringsAsFactors = FALSE) + dta_mod[[counter]] <- data.frame(i = i, + 
method = "Spinglass", + k = max(as.numeric(mem)), + modularity = igraph::modularity(x = g, membership = mem), + stringsAsFactors = FALSE) + if (isTRUE(saveObjects)) { + current_cl[[counter_current]] <- cl + current_mod[counter_current] <- dta_mod[[counter]]$modularity[nrow(dta_mod[[counter]])] + counter_current <- counter_current + 1 + } + counter <- counter + 1 + }, silent = TRUE) + } + + # retain cluster object where modularity was maximal + if (isTRUE(saveObjects) && length(current_cl) > 0) { + obj$cl[[i]] <- current_cl[[which.max(current_mod)]] + } + } + } + obj$cl <- obj$cl[!sapply(obj$cl, is.null)] # remove NULL objects that may occur when the network is empty + obj$k <- k + obj$max_mod <- do.call(rbind, dta_dat) + memberships <- do.call(rbind, dta_mem) + rownames(memberships) <- NULL + obj$memberships <- memberships + obj$modularity <- do.call(rbind, dta_mod) + if (nrow(obj$modularity) == 0) { + stop("No output rows. Either you switched all clustering methods off, or all methods you used produced errors.") + } + obj$max_mod <- obj$max_mod[obj$max_mod$i %in% obj$modularity$i, ] # remove date entries where the network is empty + obj$max_mod$max_mod <- sapply(obj$max_mod$i, function(x) max(obj$modularity$modularity[obj$modularity$i == x], na.rm = TRUE)) # attach max_mod to $max_mod + # attach max_method to $max_mod + obj$max_mod$max_method <- sapply(obj$max_mod$i, + function(x) obj$modularity$method[obj$modularity$i == x & obj$modularity$modularity == max(obj$modularity$modularity[obj$modularity$i == x], na.rm = TRUE)][1]) + # attach k to max_mod + obj$max_mod$k <- sapply(obj$max_mod$i, function(x) max(obj$modularity$k[obj$modularity$i == x], na.rm = TRUE)) + + # diagnostics + if (isTRUE(single) && !"Hierarchical (Single)" %in% obj$modularity$method && k > 1) { + warning("'single' omitted due to an unknown problem.") + } + if (isTRUE(average) && !"Hierarchical (Average)" %in% obj$modularity$method && k > 1) { + warning("'average' omitted due to an unknown 
problem.") + } + if (isTRUE(complete) && !"Hierarchical (Complete)" %in% obj$modularity$method && k > 1) { + warning("'complete' omitted due to an unknown problem.") + } + if (isTRUE(ward) && !"Hierarchical (Ward)" %in% obj$modularity$method) { + warning("'ward' omitted due to an unknown problem.") + } + if (isTRUE(kmeans) && !"k-Means" %in% obj$modularity$method) { + warning("'kmeans' omitted due to an unknown problem.") + } + if (isTRUE(pam) && !"Partitioning around Medoids" %in% obj$modularity$method) { + warning("'pam' omitted due to an unknown problem.") + } + if (isTRUE(equivalence) && !"Equivalence" %in% obj$modularity$method) { + warning("'equivalence' omitted due to an unknown problem.") + } + if (isTRUE(concor_one) && !"CONCOR (One-Mode)" %in% obj$modularity$method && k %in% c(0, 2)) { + warning("'concor_one' omitted due to an unknown problem.") + } + if (isTRUE(concor_two) && !"CONCOR (Two-Mode)" %in% obj$modularity$method && k %in% c(0, 2)) { + warning("'concor_two' omitted due to an unknown problem.") + } + if (isTRUE(louvain) && !"Louvain" %in% obj$modularity$method && k < 2) { + warning("'louvain' omitted due to an unknown problem.") + } + if (isTRUE(fastgreedy) && !"Fast & Greedy" %in% obj$modularity$method) { + warning("'fastgreedy' omitted due to an unknown problem.") + } + if (isTRUE(walktrap) && !"Walktrap" %in% obj$modularity$method) { + warning("'walktrap' omitted due to an unknown problem.") + } + if (isTRUE(leading_eigen) && !"Leading Eigenvector" %in% obj$modularity$method && k < 2) { + warning("'leading_eigen' omitted due to an unknown problem.") + } + if (isTRUE(edge_betweenness) && !"Edge Betweenness" %in% obj$modularity$method) { + warning("'edge_betweenness' omitted due to an unknown problem.") + } + if (isTRUE(infomap) && !"Infomap" %in% obj$modularity$method && k < 2) { + warning("'infomap' omitted due to an unknown problem.") + } + if (isTRUE(label_prop) && !"Label Propagation" %in% obj$modularity$method && k < 2) { + 
warning("'label_prop' omitted due to an unknown problem.") + } + if (isTRUE(spinglass) && !"Spinglass" %in% obj$modularity$method && k < 2) { + warning("'spinglass' omitted due to an unknown problem.") + } + + class(obj) <- "dna_multiclust" + return(obj) +} + +#' Print the summary of a \code{dna_multiclust} object +#' +#' Show details of a \code{dna_multiclust} object. +#' +#' Print abbreviated contents for the slots of a \code{dna_multiclust} object, +#' which can be created using the \link{dna_multiclust} function. +#' +#' @param x A \code{dna_multiclust} object. +#' @param ... Further options (currently not used). +#' +#' @author Philip Leifeld +#' +#' @rdname dna_multiclust +#' @importFrom utils head +#' @export +print.dna_multiclust <- function(x, ...) { + cat(paste0("$k\n", x$k, "\n")) + if ("cl" %in% names(x)) { + cat(paste0("\n$cl\n", length(x$cl), " cluster object(s) embedded.\n")) + } + cat("\n$max_mod\n") + print(utils::head(x$max_mod)) + if (nrow(x$max_mod) > 6) { + cat(paste0("[... ", nrow(x$max_mod), " rows]\n")) + } + cat("\n$modularity\n") + print(utils::head(x$modularity)) + if (nrow(x$modularity) > 6) { + cat(paste0("[... ", nrow(x$modularity), " rows]\n")) + } + cat("\n$memberships\n") + print(utils::head(x$memberships)) + if (nrow(x$memberships) > 6) { + cat(paste0("[... ", nrow(x$memberships), " rows]\n")) + } +} \ No newline at end of file diff --git a/rDNA/rDNA/R/dna_network.R b/rDNA/rDNA/R/dna_network.R new file mode 100644 index 00000000..2fbfeac0 --- /dev/null +++ b/rDNA/rDNA/R/dna_network.R @@ -0,0 +1,1166 @@ +#' Compute and retrieve a network +#' +#' Compute and retrieve a network from DNA. +#' +#' This function serves to compute a one-mode or two-mode network or an event +#' list in DNA and retrieve it as a matrix or data frame, respectively. The +#' arguments resemble the export options in DNA. 
It is also possible to compute +#' a temporal sequence of networks using the moving time window approach, in +#' which case the networks are retrieved as a list of matrices. +#' +#' @param networkType The kind of network to be computed. Can be +#' \code{"twomode"}, \code{"onemode"}, or \code{"eventlist"}. +#' @param statementType The name of the statement type in which the variable +#' of interest is nested. For example, \code{"DNA Statement"}. +#' @param variable1 The first variable for network construction. In a one-mode +#' network, this is the variable for both the rows and columns. In a +#' two-mode network, this is the variable for the rows only. In an event +#' list, this variable is only used to check for duplicates (depending on +#' the setting of the \code{duplicates} argument). +#' @param variable1Document A boolean value indicating whether the first +#' variable is at the document level (i.e., \code{"author"}, +#' \code{"source"}, \code{"section"}, \code{"type"}, \code{"id"}, or +#' \code{"title"}). +#' @param variable2 The second variable for network construction. In a one-mode +#' network, this is the variable over which the ties are created. For +#' example, if an organization x organization network is created, and ties +#' in this network indicate co-reference to a concept, then the second +#' variable is the \code{"concept"}. In a two-mode network, this is the +#' variable used for the columns of the network matrix. In an event list, +#' this variable is only used to check for duplicates (depending on the +#' setting of the \code{duplicates} argument). +#' @param variable2Document A boolean value indicating whether the second +#' variable is at the document level (i.e., \code{"author"}, +#' \code{"source"}, \code{"section"}, \code{"type"}, \code{"id"}, or +#' \code{"title"} +#' @param qualifier The qualifier variable. In a one-mode network, this +#' variable can be used to count only congruence or conflict ties. 
For
+#'   example, in an organization x organization network via common concepts,
+#'   a binary \code{"agreement"} qualifier could be used to record only ties
+#'   where both organizations have a positive stance on the concept or where
+#'   both organizations have a negative stance on the concept. With an
+#'   integer qualifier, the tie weight between the organizations would be
+#'   proportional to the similarity or distance between the two organizations
+#'   on the scale of the integer variable. With a short text variable as a
+#'   qualifier, agreement on common categorical values of the qualifier is
+#'   required, for example a tie is established (or a tie weight increased) if
+#'   two actors both refer to the same value on the second variable AND match on
+#'   the categorical qualifier, for example the type of referral.
+#'
+#'   In a two-mode network, the qualifier variable can be used to retain only
+#'   positive or only negative statements or subtract negative from positive
+#'   mentions. All of this depends on the setting of the
+#'   \code{qualifierAggregation} argument. For event lists, the qualifier
+#'   variable is only used for filtering out duplicates (depending on the
+#'   setting of the \code{duplicates} argument).
+#'
+#'   The qualifier can also be \code{NULL}, in which case it is ignored, meaning
+#'   that values in \code{variable1} and \code{variable2} are unconditionally
+#'   associated with each other in the network when they co-occur. This is
+#'   identical to selecting a qualifier variable and setting
+#'   \code{qualifierAggregation = "ignore"}.
+#' @param qualifierDocument A boolean value indicating whether the qualifier
+#'   variable is at the document level (i.e., \code{"author"},
+#'   \code{"source"}, \code{"section"}, \code{"type"}, \code{"id"}, or
+#'   \code{"title"}).
+#' @param qualifierAggregation The aggregation rule for the \code{qualifier}
+#'   variable. 
In one-mode networks, this must be \code{"ignore"} (for
+#'   ignoring the qualifier variable), \code{"congruence"} (for recording a
+#'   network tie only if both nodes have the same qualifier value in the
+#'   binary case or for recording the similarity between the two nodes on the
+#'   qualifier variable in the integer case), \code{"conflict"} (for
+#'   recording a network tie only if both nodes have a different qualifier
+#'   value in the binary case or for recording the distance between the two
+#'   nodes on the qualifier variable in the integer case), or
+#'   \code{"subtract"} (for subtracting the conflict tie value from the
+#'   congruence tie value in each dyad). In two-mode networks, this must be
+#'   \code{"ignore"}, \code{"combine"} (for creating multiplex combinations,
+#'   e.g., 1 for positive, 2 for negative, and 3 for mixed), or
+#'   \code{"subtract"} (for subtracting negative from positive ties). In event
+#'   lists, this setting is ignored.
+#' @param normalization Normalization of edge weights. Valid settings for
+#'   one-mode networks are \code{"no"} (for switching off normalization),
+#'   \code{"average"} (for average activity normalization), \code{"jaccard"}
+#'   (for Jaccard coefficient normalization), and \code{"cosine"} (for
+#'   cosine similarity normalization). Valid settings for two-mode networks
+#'   are \code{"no"}, \code{"activity"} (for activity normalization), and
+#'   \code{"prominence"} (for prominence normalization).
+#' @param isolates Should all nodes of the respective variable be included in
+#'   the network matrix (\code{isolates = TRUE}), or should only those nodes
+#'   be included that are active in the current time period and are not
+#'   excluded (\code{isolates = FALSE})?
+#' @param duplicates Setting for excluding duplicate statements before network
+#'   construction. 
Valid settings are \code{"include"} (for including all +#' statements in network construction), \code{"document"} (for counting +#' only one identical statement per document), \code{"week"} (for counting +#' only one identical statement per calendar week), \code{"month"} (for +#' counting only one identical statement per calendar month), \code{"year"} +#' (for counting only one identical statement per calendar year), and +#' \code{"acrossrange"} (for counting only one identical statement across +#' the whole time range). +#' @param start.date The start date for network construction in the format +#' \code{"dd.mm.yyyy"}. All statements before this date will be excluded. +#' @param start.time The start time for network construction on the specified +#' \code{start.date}. All statements before this time on the specified date +#' will be excluded. +#' @param stop.date The stop date for network construction in the format +#' \code{"dd.mm.yyyy"}. All statements after this date will be excluded. +#' @param stop.time The stop time for network construction on the specified +#' \code{stop.date}. All statements after this time on the specified date +#' will be excluded. +#' @param timeWindow Possible values are \code{"no"}, \code{"events"}, +#' \code{"seconds"}, \code{"minutes"}, \code{"hours"}, \code{"days"}, +#' \code{"weeks"}, \code{"months"}, and \code{"years"}. If \code{"no"} is +#' selected (= the default setting), no time window will be used. If any of +#' the time units is selected, a moving time window will be imposed, and +#' only the statements falling within the time period defined by the window +#' will be used to create the network. The time window will then be moved +#' forward by one time unit at a time, and a new network with the new time +#' boundaries will be created. This is repeated until the end of the overall +#' time span is reached. All time windows will be saved as separate +#' networks in a list. 
The duration of each time window is defined by the
+#'   \code{windowSize} argument. For example, this could be used to create a
+#'   time window of 6 months which moves forward by one month each time, thus
+#'   creating time windows that overlap by five months. If \code{"events"} is
+#'   used instead of a natural time unit, the time window will comprise
+#'   exactly as many statements as defined in the \code{windowSize} argument.
+#'   However, if the start or end statement falls on a date and time where
+#'   multiple events happen, those additional events that occur simultaneously
+#'   are included because there is no other way to decide which of the
+#'   statements should be selected. Therefore the window size is sometimes
+#'   extended when the start or end point of a time window is ambiguous in
+#'   event time.
+#' @param windowSize The number of time units of which a moving time window is
+#'   comprised. This can be the number of statement events, the number of days
+#'   etc., as defined in the \code{"timeWindow"} argument.
+#' @param kernel Use kernel smoothing for computing time windows? This option
+#'   only matters if the \code{timeWindow} argument has a value other than
+#'   \code{"no"} or \code{"events"}. The default value \code{kernel = "no"}
+#'   switches off kernel smoothing, which means all statements within a time
+#'   window are weighted equally. Other values down-weight statements the
+#'   farther they are temporally away from the mid-point of the time window.
+#'   Several kernel smoothing functions are available, similar to kernel density
+#'   estimation: \code{"uniform"} is similar to \code{"no"} and weights all
+#'   statements with a value of \code{0.5}. \code{"gaussian"} uses a standard
+#'   normal distribution as a kernel smoother. \code{"epanechnikov"} uses an
+#'   Epanechnikov kernel smoother. \code{"triangular"} uses a triangular kernel
+#'   function. If in doubt, do not use kernel smoothing. 
+#' @param excludeValues A list of named character vectors that contains entries +#' which should be excluded during network construction. For example, +#' \code{list(concept = c("A", "B"), organization = c("org A", "org B"))} +#' would exclude all statements containing concepts "A" or "B" or +#' organizations "org A" or "org B" when the network is constructed. This +#' is irrespective of whether these values appear in \code{variable1}, +#' \code{variable2}, or the \code{qualifier}. Note that only variables at +#' the statement level can be used here. There are separate arguments for +#' excluding statements nested in documents with certain meta-data. +#' @param excludeAuthors A character vector of authors. If a statement is +#' nested in a document where one of these authors is set in the "Author" +#' meta-data field, the statement is excluded from network construction. +#' @param excludeSources A character vector of sources. If a statement is +#' nested in a document where one of these sources is set in the "Source" +#' meta-data field, the statement is excluded from network construction. +#' @param excludeSections A character vector of sections. If a statement is +#' nested in a document where one of these sections is set in the "Section" +#' meta-data field, the statement is excluded from network construction. +#' @param excludeTypes A character vector of types. If a statement is +#' nested in a document where one of these types is set in the "Type" +#' meta-data field, the statement is excluded from network construction. +#' @param invertValues A boolean value indicating whether the entries provided +#' by the \code{excludeValues} argument should be excluded from network +#' construction (\code{invertValues = FALSE}) or if they should be the only +#' values that should be included during network construction +#' (\code{invertValues = TRUE}). 
+#' @param invertAuthors A boolean value indicating whether the entries provided +#' by the \code{excludeAuthors} argument should be excluded from network +#' construction (\code{invertAuthors = FALSE}) or if they should be the +#' only values that should be included during network construction +#' (\code{invertAuthors = TRUE}). +#' @param invertSources A boolean value indicating whether the entries provided +#' by the \code{excludeSources} argument should be excluded from network +#' construction (\code{invertSources = FALSE}) or if they should be the +#' only values that should be included during network construction +#' (\code{invertSources = TRUE}). +#' @param invertSections A boolean value indicating whether the entries +#' provided by the \code{excludeSections} argument should be excluded from +#' network construction (\code{invertSections = FALSE}) or if they should +#' be the only values that should be included during network construction +#' (\code{invertSections = TRUE}). +#' @param invertTypes A boolean value indicating whether the entries provided +#' by the \code{excludeTypes} argument should be excluded from network +#' construction (\code{invertTypes = FALSE}) or if they should be the +#' only values that should be included during network construction +#' (\code{invertTypes = TRUE}). +#' @param fileFormat An optional file format specification for saving the +#' resulting network(s) to a file instead of returning an object. Valid values +#' are \code{"csv"} (for network matrices or event lists), \code{"dl"} (for +#' UCINET DL full-matrix files), and \code{"graphml"} (for visone .graphml +#' files). +#' @param outfile An optional output file name for saving the resulting +#' network(s) to a file instead of returning an object. 
+#' +#' @examples +#' \dontrun{ +#' dna_init() +#' dna_sample() +#' dna_openDatabase("sample.dna", coderId = 1, coderPassword = "sample") +#' nw <- dna_network(networkType = "onemode", +#' variable1 = "organization", +#' variable2 = "concept", +#' qualifier = "agreement", +#' qualifierAggregation = "congruence", +#' normalization = "average", +#' excludeValues = list("concept" = +#' c("There should be legislation to regulate emissions."))) +#' } +#' +#' @author Philip Leifeld +#' +#' @family networks +#' +#' @importFrom rJava .jarray +#' @importFrom rJava .jcall +#' @importFrom rJava .jnull +#' @importFrom rJava J +#' @export +dna_network <- function(networkType = "twomode", + statementType = "DNA Statement", + variable1 = "organization", + variable1Document = FALSE, + variable2 = "concept", + variable2Document = FALSE, + qualifier = "agreement", + qualifierDocument = FALSE, + qualifierAggregation = "ignore", + normalization = "no", + isolates = FALSE, + duplicates = "include", + start.date = "01.01.1900", + stop.date = "31.12.2099", + start.time = "00:00:00", + stop.time = "23:59:59", + timeWindow = "no", + windowSize = 100, + kernel = "no", + excludeValues = list(), + excludeAuthors = character(), + excludeSources = character(), + excludeSections = character(), + excludeTypes = character(), + invertValues = FALSE, + invertAuthors = FALSE, + invertSources = FALSE, + invertSections = FALSE, + invertTypes = FALSE, + fileFormat = NULL, + outfile = NULL) { + + # wrap the vectors of exclude values for document variables into Java arrays + excludeAuthors <- .jarray(excludeAuthors) + excludeSources <- .jarray(excludeSources) + excludeSections <- .jarray(excludeSections) + excludeTypes <- .jarray(excludeTypes) + + # compile exclude variables and values vectors + dat <- matrix("", nrow = length(unlist(excludeValues)), ncol = 2) + count <- 0 + if (length(excludeValues) > 0) { + for (i in 1:length(excludeValues)) { + if (length(excludeValues[[i]]) > 0) { + for (j in 
1:length(excludeValues[[i]])) { + count <- count + 1 + dat[count, 1] <- names(excludeValues)[i] + dat[count, 2] <- excludeValues[[i]][j] + } + } + } + var <- dat[, 1] + val <- dat[, 2] + } else { + var <- character() + val <- character() + } + var <- .jarray(var) # array of variable names of each excluded value + val <- .jarray(val) # array of values to be excluded + + # encode R NULL as Java null value if necessary + if (is.null(qualifier) || is.na(qualifier)) { + qualifier <- .jnull(class = "java/lang/String") + } + if (is.null(fileFormat)) { + fileFormat <- .jnull(class = "java/lang/String") + } + if (is.null(outfile)) { + outfile <- .jnull(class = "java/lang/String") + } + + # call rNetwork function to compute results + .jcall(dna_getHeadlessDna(), + "V", + "rNetwork", + networkType, + statementType, + variable1, + variable1Document, + variable2, + variable2Document, + qualifier, + qualifierDocument, + qualifierAggregation, + normalization, + isolates, + duplicates, + start.date, + stop.date, + start.time, + stop.time, + timeWindow, + as.integer(windowSize), + kernel, + var, + val, + excludeAuthors, + excludeSources, + excludeSections, + excludeTypes, + invertValues, + invertAuthors, + invertSources, + invertSections, + invertTypes, + outfile, + fileFormat + ) + + exporter <- .jcall(dna_getHeadlessDna(), "Lexport/Exporter;", "getExporter") # get a reference to the Exporter object, in which results are stored + + if (networkType == "eventlist") { # assemble an event list in the form of a data frame of filtered statements + f <- J(exporter, "getFilteredStatements", simplify = TRUE) # array list of filtered export statements; use J because array list return type not recognized using .jcall + l <- list() # create a list for filtered statements, later to be converted to data frame, with one row per statement + for (i in seq(.jcall(f, "I", "size")) - 1) { # loop through filtered statements, starting at 0 + fi <- f$get(as.integer(i)) # retrieve filtered statement i + 
row <- list() # each filtered export statement is represented by a list, with multiple slots for the variables etc. + row$statement_id <- .jcall(fi, "I", "getId") # store the statement ID + row$time <- .jcall(fi, "J", "getDateTimeLong") # store the date/time in seconds since 1 January 1970; will be converted to POSIXct later because the conversion to data frame otherwise converts it back to long anyway + values <- J(fi, "getValues") # array list of variables with values; use J instead of .jcall because array list return type not recognized using .jcall + for (j in seq(.jcall(values, "I", "size")) - 1) { # loop through the variables + vi <- values$get(as.integer(j)) # save variable/value j temporarily to access its contents + dataType <- .jcall(vi, "S", "getDataType") # the data type of value j + if (dataType == "long text") { + row[[.jcall(vi, "S", "getKey")]] <- .jcall(vi, "S", "getValue") # store as character object under variable name if long text + } else if (dataType == "short text") { + row[[.jcall(vi, "S", "getKey")]] <- vi$getValue()$getValue() # extract character object from Entity object and store under variable name if short text + } else { + row[[.jcall(vi, "S", "getKey")]] <- vi$getValue() # store as integer under variable name if boolean or integer data type + } + } + row$start_position <- .jcall(fi, "I", "getStart") # store start caret in document text + row$stop_position <- .jcall(fi, "I", "getStop") # store end caret in document text + row$text <- .jcall(fi, "S", "getText") # text of the statement between start and end caret + row$coder <- .jcall(fi, "I", "getCoderId") # store coder ID; the user can merge this with other coder details like name and color later if needed + row$document_id <- .jcall(fi, "I", "getDocumentId") # store the document ID of the document the statement is contained in + row$document_title <- .jcall(fi, "S", "getTitle") # store the document title + row$document_author <- .jcall(fi, "S", "getAuthor") # store the document 
author + row$document_source <- .jcall(fi, "S", "getSource") # store the document source + row$document_section <- .jcall(fi, "S", "getSection") # store the document section + row$document_type <- .jcall(fi, "S", "getType") # store the document type + l[[i + 1]] <- row # add the row to the list + } + d <- do.call(rbind.data.frame, l) # convert the list of lists to data frame + d$time <- as.POSIXct(d$time, origin = "1970-01-01 00:00:00") # convert long date/time to POSIXct + return(d) + } else { # assemble a one-mode or two-mode matrix with attributes or a list of matrices (if time window) + m <- .jcall(exporter, "[Lexport/Matrix;", "getMatrixResultsArray") # get list of Matrix objects from Exporter object + l <- list() # create a list in which each result is stored; can be of length 1 if no time window is used + for (t in 1:length(m)) { # loop through the matrices + mat <- .jcall(m[[t]], "[[D", "getMatrix", simplify = TRUE) # get the resulting matrix at step t as a double[][] object and save as matrix + rownames(mat) <- .jcall(m[[t]], "[S", "getRowNames", simplify = TRUE) # add the row names to the matrix + colnames(mat) <- .jcall(m[[t]], "[S", "getColumnNames", simplify = TRUE) # add the column names to the matrix + attributes(mat)$start <- as.POSIXct(.jcall(m[[t]], "J", "getStartLong"), origin = "1970-01-01") # add the start date/time of the result as an attribute to the matrix + attributes(mat)$stop <- as.POSIXct(.jcall(m[[t]], "J", "getStopLong"), origin = "1970-01-01") # add the end date/time of the result as an attribute to the matrix + if (length(m) > 1) { + attributes(mat)$middle <- as.POSIXct(.jcall(m[[t]], "J", "getDateTimeLong"), origin = "1970-01-01") # add the mid-point date/time around which the time window is centered if the time window algorithm was used + } + attributes(mat)$numStatements <- .jcall(m[[t]], "I", "getNumStatements") # add the number of filtered statements the matrix is based on as an attribute to the matrix + attributes(mat)$call <- 
match.call() # add the arguments of the call as an attribute to the matrix + class(mat) <- c(paste0("dna_network_", networkType), class(mat)) # add "dna_network_onemode" or "dna_network_twomode" as a class label in addition to "matrix" + l[[t]] <- mat # add the matrix to the list + } + if (length(m) == 1) { + return(l[[1]]) # return the first matrix in the list if no time window was used + } else { + attributes(l)$call <- match.call() # add arguments of the call as an attribute also to the list, not just each network matrix + class(l) <- c(paste0("dna_network_", networkType, "_timewindows"), class(l)) # add "dna_network_onemode_timewindows" or "dna_network_twomode_timewindows" to class label + return(l) # return the list of network matrices + } + } +} + +#' Convert a \code{dna_network_onemode} object to a matrix +#' +#' Convert a \code{dna_network_onemode} object to a matrix. +#' +#' Remove the attributes and \code{"dna_network_onemode"} class label from a +#' \code{dna_network_onemode} object and return it as a numeric matrix. +#' +#' @param x The \code{dna_network_onemode} object, as returned by the +#' \code{\link{dna_network}} function. +#' @param ... Additional arguments. Currently not in use. +#' +#' @author Philip Leifeld +#' +#' @family networks +#' +#' @export +as.matrix.dna_network_onemode <- function(x, ...) { + attr(x, "start") <- NULL + attr(x, "stop") <- NULL + attr(x, "numStatements") <- NULL + attr(x, "call") <- NULL + attr(x, "class") <- NULL + return(x) +} + +#' Convert a \code{dna_network_twomode} object to a matrix +#' +#' Convert a \code{dna_network_twomode} object to a matrix. +#' +#' Remove the attributes and \code{"dna_network_twomode"} class label from a +#' \code{dna_network_twomode} object and return it as a numeric matrix. +#' +#' @param x The \code{dna_network_twomode} object, as returned by the +#' \code{\link{dna_network}} function. +#' @param ... Additional arguments. Currently not in use. 
+#' +#' @author Philip Leifeld +#' +#' @family networks +#' +#' @export +as.matrix.dna_network_twomode <- as.matrix.dna_network_onemode + +#' Print a \code{dna_network_onemode} object +#' +#' Show details of a \code{dna_network_onemode} object. +#' +#' Print a one-mode network matrix and its attributes. +#' +#' @param x A \code{dna_network_onemode} object, as returned by the +#' \code{\link{dna_network}} function. +#' @param trim Number of maximum characters to display in row and column labels +#' of the matrix. Labels with more characters are truncated, and the last +#' character is replaced by an asterisk (\code{*}). +#' @param attr Display attributes, such as the start and stop date and time, the +#' number of statements on which the matrix is based, the function call and +#' arguments on which the network matrix is based, and the full labels without +#' truncation. +#' @param ... Additional arguments. Currently not in use. +#' +#' @author Philip Leifeld +#' +#' @family networks +#' +#' @export +print.dna_network_onemode <- function(x, trim = 5, attr = TRUE, ...) 
{ + rn <- rownames(x) + cn <- colnames(x) + rownames(x) <- sapply(rownames(x), function(r) if (nchar(r) > trim) paste0(substr(r, 1, trim - 1), "*") else r) + colnames(x) <- sapply(colnames(x), function(r) if (nchar(r) > trim) paste0(substr(r, 1, trim - 1), "*") else r) + x <- round(x, 2) + if ("dna_network_onemode" %in% class(x)) { + onemode <- TRUE + class(x) <- class(x)[class(x) != "dna_network_onemode"] + } else { + onemode <- FALSE + class(x) <- class(x)[class(x) != "dna_network_twomode"] + } + start <- attr(x, "start") + attr(x, "start") <- NULL + stop <- attr(x, "stop") + attr(x, "stop") <- NULL + ns <- attr(x, "numStatements") + attr(x, "numStatements") <- NULL + cl <- deparse(attr(x, "call")) + attr(x, "call") <- NULL + attr(x, "class") <- NULL + print(x) + if (attr) { + cat("\nStart:", as.character(start)) + cat("\nStop: ", as.character(stop)) + cat("\nStatements:", ns) + cat("\nCall:", trimws(cl)) + if (onemode) { + cat("\n\nLabels:\n") + cat(paste(1:length(rn), rn), sep = "\n") + } else { + cat("\n\nRow labels:\n") + cat(paste(1:length(rn), rn), sep = "\n") + cat("\nColumn labels:\n") + cat(paste(1:length(cn), cn), sep = "\n") + } + } +} + +#' Print a \code{dna_network_twomode} object +#' +#' Show details of a \code{dna_network_twomode} object. +#' +#' Print a two-mode network matrix and its attributes. +#' +#' @inheritParams print.dna_network_onemode +#' +#' @author Philip Leifeld +#' +#' @family networks +#' +#' @export +print.dna_network_twomode <- print.dna_network_onemode + +#' Plot networks created using rDNA. +#' +#' Plot a network generated using \code{\link{dna_network}}. +#' +#' These functions plot \code{dna_network_onemode} and +#' \code{dna_network_onemode} objects generated by the \code{\link{dna_network}} +#' function. In order to use this function, please install the \code{igraph} and +#' \code{ggraph} packages. Different layouts for one- and two-mode networks are +#' available. +#' +#' @param object A \code{dna_network} object. 
+#' @param ... Additional arguments; currently not in use. +#' @param atts A \code{dna_attributes} object generated by +#' \code{\link{dna_getAttributes}}. Provide this object and matching +#' attributes when plotting custom node colors, node labels and/or node sizes. +#' @param layout The type of node layout to use. The following layouts are +#' available from the \code{igraph} and \code{ggraph} packages at the time of +#' writing: +#' \itemize{ +#' \item \code{"stress"} (the default layout) +#' \item \code{"bipartite"} (only for two-mode networks) +#' \item \code{"backbone"} +#' \item \code{"circle"} +#' \item \code{"dh"} +#' \item \code{"drl"} +#' \item \code{"fr"} +#' \item \code{"gem"} +#' \item \code{"graphopt"} +#' \item \code{"kk"} +#' \item \code{"lgl"} +#' \item \code{"mds"} +#' \item \code{"nicely"} +#' \item \code{"randomly"} +#' \item \code{"star"} +#' } +#' See \link[ggraph]{layout_tbl_graph_igraph} for the current list of layouts. +#' @param edge_size_range Two values indicating the minimum and maximum value +#' to scale edge widths. +#' @param edge_color Provide the name of a color for edge colors. The default +#' \code{"NULL"} colors edges in line with the specified +#' \code{qualifierAggregation} in \code{\link{dna_network}}. +#' @param edge_alpha Takes numeric values to control the alpha-transparency of +#' edges. Possible values range from \code{0} (fully transparent) to \code{1} +#' (fully visible). +#' @param node_size Takes positive numeric values to control the size of nodes. +#' Also accepts numeric values matching an attribute of the \code{atts} object +#' (see examples). +#' @param node_colors Provide the name of a color or use an attribute from the +#' \code{atts} object for node colors (see examples). Defaults to +#' \code{"black"}. +#' @param node_label If \code{TRUE}, the row names (in a one-mode network) or +#' the row and column names (in a two-mode network) of the network matrix are +#' used for node labels. 
Also accepts character objects matching one of the +#' attribute variables of the \code{atts} object (see examples). \code{FALSE} +#' turns off node labels. +#' @param font_size Controls the font size of the node labels. +#' @param truncate Sets the number of characters to which node labels should be +#' truncated. +#' @param threshold Minimum threshold for which edges should be plotted. +#' @param giant_component Only plot the giant component (the biggest connected +#' cluster) of the network. Defaults to \code{FALSE}. +#' @param exclude_isolates Exclude isolates (nodes with no connection to other +#' nodes) from the plot. Defaults to \code{FALSE}. +#' @param max_overlaps Value to exclude node labels that overlap with too many +#' other node labels (see \code{\link[ggrepel]{geom_label_repel}}. Defaults +#' to \code{10}. +#' @param seed Numeric value passed to \link{set.seed}. Ensures that plots are +#' reproducible. +#' +#' @examples +#' \dontrun{ +#' dna_init() +#' dna_sample() +#' dna_openDatabase("sample.dna", coderId = 1, coderPassword = "sample") +#' +#' ## one-mode network examples +#' +#' # compute network matrix (subtract + normalization) +#' nw <- dna_network(networkType = "onemode", +#' qualifierAggregation = "subtract", +#' normalization = "average") +#' +#' # plot network +#' library("ggplot2") +#' autoplot(nw) +#' +#' # plot only positively weighted edges +#' autoplot(nw, threshold = 0) +#' +#' # congruence network +#' nw <- dna_network(networkType = "onemode", +#' qualifierAggregation = "congruence", +#' excludeValues = list("concept" = +#' c("There should be legislation to regulate emissions."))) +#' autoplot(nw) +#' +#' # use entity colors (here: colors of organizations) from attributes +#' atts <- dna_getAttributes(variableId = 2) +#' autoplot(nw, atts = atts, node_colors = "color", layout = "fr") +#' +#' # use colors from attributes (after editing some of them) +#' atts$color[atts$Type == "NGO"] <- "red" # change NGO color to red +#' 
atts$color[atts$Type == "Government"] <- "blue" # change government to blue +#' autoplot(nw, atts = atts, node_colors = "color") # plot with custom colors +#' +#' # use an attribute, such as type, to plot node labels +#' autoplot(nw, atts = atts, node_label = "Type") +#' +#' # plot node sizes according to the number of statements of entities; +#' # first, compute additional matrix to calculate the number of statements +#' nw_freq <- dna_network(networkType = "twomode", +#' qualifierAggregation = "ignore", +#' normalization = "no") +#' # then add frequency of statements as an attribute +#' atts$freq <- rowSums(nw_freq)[match(atts$value, rownames(nw_freq))] +#' # plot network with node sizes matching statement frequencies +#' autoplot(nw, atts = atts, node_size = "freq", node_colors = "color") +#' +#' # use igraph community detection for identification of network clusters; +#' # remove negative edge weights +#' nw[nw < 0] <- 0 +#' # convert dna_network to igraph object +#' graph <- igraph::graph_from_adjacency_matrix(nw, +#' mode = "undirected", +#' weighted = TRUE, +#' diag = FALSE, +#' add.colnames = NULL, +#' add.rownames = NA) +#' # compute communities using igraph cluster algorithms +#' # (here: fast and greedy as an illustration)) +#' com <- igraph::cluster_fast_greedy(graph) +#' # add node community membership as an attribute +#' atts$membership <- com$membership[match(atts$value, com$names)] +#' # use community membership as node color +#' autoplot(nw, atts = atts, node_colors = "membership") +#' # or plot ellipses using ggforce package +#' library("ggforce") +#' autoplot(nw, atts = atts, node_colors = "color") + +#' geom_mark_ellipse(aes(x = x, +#' y = y, +#' group = com$membership, +#' fill = com$membership), +#' show.legend = FALSE) +#' +#' # add legend to the network plot (here: colors mapped to type attribute) +#' autoplot(nw, atts = atts, node_colors = "color") + +#' scale_color_identity(name = "", +#' labels = c("Government", "NGO", "Business"), +#' 
guide = "legend") + +#' theme(legend.position = "bottom", # change legend position +#' legend.text = element_text(size = 10)) # change legend font size +#' +#' ## two-mode network examples +#' +#' # compute two-mode network and plot it +#' nw <- dna_network(networkType = "twomode", +#' qualifierAggregation = "combine") +#' library("ggplot2") +#' autoplot(nw) +#' +#' # use entity colours (here: colors of organizations); +#' # first, retrieve attributes for first-mode entities (organizations) +#' atts <- dna_getAttributes(variableId = 2) +#' # then, retrieve attributes for second-mode entities (concepts) +#' atts2 <- dna_getAttributes(variableId = 3) +#' # combine both attribute objects +#' atts <- rbind(atts, atts2) +#' # plot the network using the attributes of both variables +#' autoplot(nw, +#' atts = atts, +#' node_colors = "color", +#' layout = "bipartite", +#' max_overlaps = 20) +#' # edit the colors before plotting +#' atts$color[atts$Type == "NGO"] <- "red" # change NGO color to red +#' atts$color[atts$Type == "Government"] <- "blue" # government actors in blue +#' # plot the network with custom colors +#' autoplot(nw, atts = atts, node_colors = "color") +#' +#' # use an attribute, such as type, to plot node labels +#' nw <- dna_network(networkType = "twomode", +#' qualifierAggregation = "subtract", +#' normalization = "activity") +#' autoplot(nw, atts = atts, node_label = "Type") +#' +#' # plot node sizes according the number of statements of entities; +#' # first, compute network matrix for plotting +#' nw <- dna_network(networkType = "twomode", +#' qualifierAggregation = "subtract", +#' normalization = "activity") +#' # compute dna_attributes objects +#' atts <- dna_getAttributes(variableId = 2) +#' atts2 <- dna_getAttributes(variableId = 3) +#' # compute additional matrix to calculate the number of statements +#' nw_freq <- dna_network(networkType = "twomode", +#' qualifierAggregation = "ignore", +#' normalization = "no") +#' # add frequency of 
statements as attribute +#' # compute statement frequencies of first-mode entities +#' atts$freq <- rowSums(nw_freq)[match(atts$value, rownames(nw_freq))] +#' # compute statement frequencies of second-mode entities +#' atts2$freq <- colSums(nw_freq)[match(atts2$value, colnames(nw_freq))] +#' # combine both attribute objects +#' atts <- rbind(atts, atts2) +#' # plot network with node sizes matching statement frequencies +#' autoplot(nw, atts = atts, node_size = "freq", node_colors = "color") +#' +#' # use igraph community detection for identification of network clusters +#' nw <- dna_network(networkType = "twomode", +#' qualifierAggregation = "subtract", +#' normalization = "activity") +#' # compute dna_attributes objects and combine them +#' atts <- dna_getAttributes(variableId = 2) +#' atts2 <- dna_getAttributes(variableId = 3) +#' atts <- rbind(atts, atts2) +#' # remove negative edge weights +#' nw[nw < 0] <- 0 +#' # convert dna_network to igraph object +#' graph <- igraph::graph_from_incidence_matrix(nw, +#' directed = FALSE, +#' weighted = TRUE, +#' add.names = NULL) +#' # compute communities using igraph cluster algorithms +#' # (here: fast and greedy as an illustration)) +#' com <- igraph::cluster_fast_greedy(graph) +#' # add node community membership as an attribute +#' atts$membership <- com$membership[match(atts$value, com$names)] +#' # use community membership as node color +#' autoplot(nw, atts = atts, node_colors = "membership") +#' # or plot ellipses using ggforce +#' library("ggforce") +#' autoplot(nw, atts = atts, node_colors = "color") + +#' geom_mark_ellipse(aes(x = x, +#' y = y, +#' group = com$membership, +#' fill = com$membership), +#' show.legend = FALSE) +#' } +#' +#' @author Tim Henrichsen +#' +#' @family networks +#' +#' @importFrom ggplot2 autoplot +#' @importFrom ggplot2 aes +#' @importFrom ggplot2 scale_color_identity +#' @importFrom rlang .data +#' @name autoplot.dna_network +NULL + +#' @rdname autoplot.dna_network +#' @export 
+autoplot.dna_network_onemode <- function(object,
+                                         ...,
+                                         atts = NULL,
+                                         layout = "auto",
+                                         edge_size_range = c(0.2, 2),
+                                         edge_color = NULL,
+                                         edge_alpha = 1,
+                                         node_size = 3,
+                                         node_colors = "black",
+                                         node_label = TRUE,
+                                         font_size = 6,
+                                         truncate = 50,
+                                         threshold = NULL,
+                                         giant_component = FALSE,
+                                         exclude_isolates = FALSE,
+                                         max_overlaps = 10,
+                                         seed = 12345) {
+  # Fix the RNG state so that stochastic ggraph layouts and label repulsion
+  # are reproducible across calls with the same arguments.
+  set.seed(seed)
+
+  # --- argument validation -------------------------------------------------
+  if (!grepl("dna_network", class(object)[1])) {
+    stop("Invalid data object. Please compute a dna_network object with the ",
+         "dna_network() function before plotting.")
+  }
+
+  if (!requireNamespace("igraph", quietly = TRUE)) {
+    stop("The autoplot function requires the 'igraph' package to be installed.\n",
+         "To do this, enter 'install.packages(\"igraph\")'.")
+  }
+
+  if (!requireNamespace("ggraph", quietly = TRUE)) {
+    stop("The autoplot function requires the 'ggraph' package to be installed.\n",
+         "To do this, enter 'install.packages(\"ggraph\")'.")
+  }
+
+  if (!is.null(atts) & !"dna_attributes" %in% class(atts)) {
+    stop("Object provided in 'atts' is not a dna_attributes object. Please ",
+         "provide a dna_attributes object using dna_getAttributes() or set atts ",
+         "to NULL if you do not want to use DNA attributes.")
+  }
+
+  # A non-numeric 'truncate' disables label truncation (Inf never exceeds nchar).
+  if (!is.numeric(truncate)) {
+    truncate <- Inf
+    warning("No numeric value provided for trimming of entities. Truncation ",
+            "will be ignored.")
+  }
+
+  # Convert network matrix to igraph network
+  if ("dna_network_onemode" %in% class(object)) {
+    graph <- igraph::graph_from_adjacency_matrix(object,
+                                                 mode = "undirected",
+                                                 weighted = TRUE,
+                                                 diag = FALSE,
+                                                 add.colnames = NULL,
+                                                 add.rownames = NA)
+    igraph::V(graph)$shape <- "circle"
+  } else if ("dna_network_twomode" %in% class(object)) {
+    graph <- igraph::graph_from_incidence_matrix(object,
+                                                 directed = FALSE,
+                                                 weighted = TRUE,
+                                                 add.names = NULL)
+    # Second-mode nodes (type == TRUE) are drawn as squares, first-mode as circles.
+    igraph::V(graph)$shape <- ifelse(igraph::V(graph)$type, "square", "circle")
+  }
+
+  # Check if all entities are included in attributes object (if provided)
+  if (!is.null(atts) & !(all(igraph::V(graph)$name %in% atts$value))) {
+    miss <- which(!igraph::V(graph)$name %in% atts$value)
+    stop("Some network entities are missing in the attributes object:\n",
+         paste(igraph::V(graph)$name[miss], collapse = "\n"))
+  }
+
+  # Remove tie weights below threshold
+  # Note: '!' binds lower than '>=' in R, so the expression reads as
+  # which(!(weight >= threshold)), i.e. edges with weight < threshold are dropped.
+  if (!is.null(threshold)) {
+    graph <- igraph::delete_edges(graph, which(!igraph::E(graph)$weight >= threshold))
+  }
+
+  # Add node colors
+  # Either a single attribute column name from 'atts', or a vector of colors
+  # (length 1 recycled, or one per node); non-character input falls back to black.
+  if (is.character(node_colors)) {
+    if (!is.null(atts) & length(node_colors) == 1 && node_colors %in% colnames(atts)) {
+      col_pos <- which(colnames(atts) == node_colors)
+      igraph::V(graph)$color <- atts[match(igraph::V(graph)$name, atts$value), col_pos]
+    } else if (length(node_colors) > 1 & length(node_colors) != igraph::vcount(graph)) {
+      stop("Number of custom colors does not equal number of nodes in the network.")
+    } else {
+      igraph::V(graph)$color <- node_colors
+    }
+  } else {
+    igraph::V(graph)$color <- "black"
+  }
+
+  # Add edge colors
+  # Default colors are derived from the qualifier aggregation recorded in the
+  # dna_network call attribute: combine (green/red/blue by weight 1/2/3),
+  # subtract (green positive, red negative), congruence (green), conflict (red).
+  if (is.null(edge_color)) {
+    if ("combine" %in% as.character(attributes(object)$call)) {
+      igraph::E(graph)$color <- "green"
+      igraph::E(graph)$color[igraph::E(graph)$weight == 2] <- "red"
+      igraph::E(graph)$color[igraph::E(graph)$weight == 3] <- "blue"
+      # Change edge weight for networks with combine aggregation
+      # (categorical weights 1/2/3 are encoded in color; width is made uniform)
+      igraph::E(graph)$weight[igraph::E(graph)$weight > 0] <- 1
+    } else if ("subtract" %in% as.character(attributes(object)$call)) {
+      igraph::E(graph)$color <- "green"
+      igraph::E(graph)$color[igraph::E(graph)$weight < 0] <- "red"
+    } else if ("congruence" %in% as.character(attributes(object)$call)) {
+      igraph::E(graph)$color <- "green"
+    } else if ("conflict" %in% as.character(attributes(object)$call)) {
+      igraph::E(graph)$color <- "red"
+    } else {
+      igraph::E(graph)$color <- "gray"
+    }
+  } else if (!all(is.na(edge_color))) {
+    if (length(edge_color) > 1 & length(edge_color) != igraph::ecount(graph)) {
+      igraph::E(graph)$color <- "gray"
+      warning("Number of custom edge_colors does not match number of edges ",
+              "in the network. Will set edge_color to default (gray).")
+    } else {
+      igraph::E(graph)$color <- edge_color
+    }
+  } else {
+    igraph::E(graph)$color <- "gray"
+  }
+
+  # Add node size(s)
+  # NOTE(review): if node_size is a character value not found in 'atts',
+  # none of these branches assigns V(graph)$size — confirm whether a
+  # fallback default is intended here.
+  if (length(node_size) > 1 & length(node_size) != igraph::vcount(graph)) {
+    igraph::V(graph)$size <- 7
+    warning("Number of provided node size values does not equal number of ",
+            "nodes in the network. node_size will be set to default value (7).")
+  } else if (is.character(node_size) & length(node_size) == 1 & !is.null(atts) && node_size %in% colnames(atts)) {
+    col_pos <- which(colnames(atts) == node_size)
+    igraph::V(graph)$size <- atts[match(igraph::V(graph)$name, atts$value), col_pos]
+  } else if (is.numeric(node_size)) {
+    igraph::V(graph)$size <- node_size
+  }
+
+  # Add labels
+  # A character node_label is either an attribute column name (labels looked up
+  # in 'atts') or a full vector of custom labels (one per node).
+  if (!is.logical(node_label)) {
+    if (is.character(node_label) & length(node_label) == 1 & !is.null(atts) && node_label %in% colnames(atts)) {
+      col_pos <- which(colnames(atts) == node_label)
+      igraph::V(graph)$name <- atts[match(igraph::V(graph)$name, atts$value), col_pos]
+    } else if (!is.null(node_label)) {
+      if (length(node_label) > 1 & length(node_label) != igraph::vcount(graph)) {
+        stop("Number of custom labels does not equal number of nodes in the network.")
+      }
+      igraph::V(graph)$name <- node_label
+    }
+  }
+
+  # Remove isolates
+  if (exclude_isolates) {
+    graph <- igraph::delete_vertices(graph, igraph::degree(graph) == 0)
+  }
+
+  # Only plot giant component of network. Useful for some plotting algorithms.
+  # NOTE(review): igraph::clusters() has been superseded by igraph::components()
+  # in recent igraph versions — confirm the package's minimum igraph version.
+  if (giant_component) {
+    # Get giant component
+    components <- igraph::clusters(graph)
+    biggest_cluster_id <- which.max(components$csize)
+
+    # Get members of giant component
+    vert_ids <- igraph::V(graph)[components$membership == biggest_cluster_id]
+
+    # Create subgraph
+    graph <- igraph::induced_subgraph(graph, vert_ids)
+  }
+
+
+  # Truncate labels of entities
+  # Labels longer than 'truncate' characters are cut and marked with "*".
+  igraph::V(graph)$name <- sapply(igraph::V(graph)$name, function(e) if (nchar(e) > truncate) paste0(substr(e, 1, truncate - 1), "*") else e)
+
+  # Use absolute edge weight values for plotting
+  igraph::E(graph)$weight <- abs(igraph::E(graph)$weight)
+
+  # Start network plot
+  g <- ggraph::ggraph(graph, layout = layout, ...) +
+    suppressWarnings(ggraph::geom_edge_link(ggplot2::aes(edge_width = igraph::E(graph)$weight, edge_colour = igraph::E(graph)$color),
+                                            alpha = edge_alpha,
+                                            show.legend = FALSE)) + # add edges
+    ggraph::scale_edge_width(range = edge_size_range) + # add edge scale
+    ggraph::geom_node_point(ggplot2::aes(colour = igraph::V(graph)$color), # add nodes
+                            size = igraph::V(graph)$size,
+                            shape = igraph::V(graph)$shape,
+                            show.legend = NA)
+
+  # Add labels
+  # Labels are drawn when node_label is TRUE or a character specification,
+  # and suppressed when it is FALSE, NULL, or NA.
+  if ((!is.null(node_label) && !all(is.na(node_label))) && (is.character(node_label) || node_label == TRUE)) {
+    g <- g +
+      ggraph::geom_node_text(ggplot2::aes(label = igraph::V(graph)$name),
+                             repel = TRUE,
+                             max.overlaps = max_overlaps,
+                             show.legend = FALSE)
+  }
+
+  # Add theme and set node colors and edges to identity
+  g <- g +
+    ggraph::theme_graph(base_family = "", base_size = font_size) +
+    ggplot2::scale_color_identity() +
+    ggraph::scale_edge_color_identity()
+
+  return(g)
+}
+
+#' @rdname autoplot.dna_network
+#' @export
+autoplot.dna_network_twomode <- autoplot.dna_network_onemode
+
+#' Convert a DNA network into a \code{tbl_graph} or \code{graph} object
+#'
+#' Convert a DNA network into a \code{tbl_graph} or \code{graph} object.
+#'
+#' Convert a \code{dna_network_onemode} or \code{dna_network_twomode} object
+#' into a \code{tbl_graph} object as defined in the tidygraph package. These
+#' objects can then be plotted using the ggraph package, which contains many
+#' network layouts.
+#'
+#' \code{tbl_graph} objects are an extension of \code{graph}
+#' objects defined in the igraph package. Functions for manipulating or plotting
+#' the resulting objects from either the tidygraph or igraph package or both
+#' can be used.
+#'
+#' The resulting objects can also be converted to \code{network} objects as
+#' defined in the network package (part of the statnet suite of packages) using
+#' the \code{asNetwork} function in the intergraph package.
+#' +#' @param network A \code{dna_network_onemode} or \code{dna_network_twomode} +#' object to be converted into a \code{tbl_graph} object. Can also be a matrix +#' with edge weights and row and column names for the node labels. +#' @param attributes A \code{dna_attributes} object created using the +#' \link{dna_getAttributes} function with attributes for the nodes in the +#' network. Can also be a data frame with a \code{values} column that contains +#' the node labels and further columns containing the attributes. The +#' attributes are saved as node attributes in the \code{tbl_graph} object. If +#' \code{NULL}, no attributes are included. +#' @param ... Further arguments. Currently not in use. +#' +#' @examples +#' \dontrun{ +#' # prepare toy data +#' dna_sample() +#' dna_openDatabase("sample.dna", coderPassword = "sample") +#' nw <- dna_network(networkType = "onemode", +#' qualifierAggregation = "congruence", +#' excludeValues = list(concept = +#' "There should be legislation to regulate emissions.")) +#' at <- dna_getAttributes(variableId = 2) +#' +#' # convert to tbl_graph object +#' g <- dna_tidygraph(nw, at) +#' +#' # basic visualization +#' ggraph::ggraph(g, layout = "fr") + +#' ggraph::geom_edge_link() + +#' ggraph::geom_node_point() +#' +#' # visualization with more bells and whistles +#' ggraph::ggraph(g, layout = "graphopt") + +#' ggraph::geom_edge_link(ggplot2::aes(color = weight, width = weight)) + +#' ggraph::geom_node_point(ggplot2::aes(color = color), size = 5) + +#' ggplot2::scale_color_identity() + +#' ggraph::scale_edge_color_gradient(low = "azure2", high = "azure4") + +#' ggraph::theme_graph(background = "white") + +#' ggraph::geom_node_text(ggplot2::aes(label = name), +#' repel = TRUE, +#' max.overlaps = 10, +#' show.legend = FALSE) +#' # for more layouts, see vignette("Layouts", package = "ggraph") +#' +#' # hive plot example +#' g <- g |> +#' tidygraph::activate(nodes) |> +#' tidygraph::mutate(centrality = 
tidygraph::centrality_betweenness()) +#' ggraph::ggraph(g, layout = "hive", axis = Type, sort.by = centrality) + +#' ggraph::geom_edge_hive(ggplot2::aes(colour = "gray", width = weight)) + +#' ggraph::geom_axis_hive(ggplot2::aes(colour = color), +#' size = 5, +#' label = TRUE) + +#' ggraph::scale_edge_color_identity() + +#' theme(legend.position = "none") +#' +#' # example with negative edge weights +#' nw <- dna_network(networkType = "onemode", +#' qualifierAggregation = "subtract", +#' excludeValues = list(concept = +#' "There should be legislation to regulate emissions.")) +#' g <- dna_tidygraph(nw, at) +#' ggraph::ggraph(g, layout = "linear", circular = TRUE) + +#' ggraph::geom_edge_arc(aes(color = color, width = abs)) + +#' ggraph::scale_edge_color_identity() + +#' ggraph::geom_node_point(ggplot2::aes(color = color), size = 5) + +#' ggplot2::scale_color_identity() + +#' ggraph::theme_graph(background = "white") + +#' theme(legend.position = "none") + +#' ggraph::geom_node_text(ggplot2::aes(label = name), +#' repel = TRUE, +#' max.overlaps = 10, +#' show.legend = FALSE) +#' +#' # example with a two-mode network +#' nw <- dna_network(networkType = "twomode", +#' qualifierAggregation = "combine") +#' at1 <- dna_getAttributes(statementTypeId = 1, variable = "organization") +#' at2 <- dna_getAttributes(statementTypeId = 1, variable = "concept") +#' at1$Notes <- "organization" +#' at2$Notes <- "concept" +#' at <- rbind(at1, at2) +#' g <- dna_tidygraph(nw, at) +#' ggraph::ggraph(g, layout = "graphopt") + +#' ggraph::geom_edge_link(ggplot2::aes(color = color), width = 1) + +#' ggraph::scale_edge_color_identity() + +#' ggraph::geom_node_point(ggplot2::aes(color = color, shape = Notes), +#' size = 5) + +#' ggplot2::scale_color_identity() + +#' ggraph::geom_node_text(ggplot2::aes(label = name), +#' repel = TRUE, +#' max.overlaps = 10, +#' show.legend = FALSE) + +#' ggraph::theme_graph(background = "white") + +#' theme(legend.position = "none") +#' +#' # manipulate and 
plot using the igraph package
+#' library("igraph")
+#' class(g) # resulting objects are both tbl_graph and igraph objects
+#' igraph::V(g) # get the nodes using igraph functions
+#' igraph::E(g) # get the edges using igraph functions
+#' igraph::plot(g) # plot network using igraph package
+#'
+#' # convert to network object (network package, statnet suite of packages)
+#' library("intergraph")
+#' intergraph::asNetwork(g)
+#' }
+#'
+#' @author Philip Leifeld
+#' @family networks
+#' @importFrom rlang .data
+#' @export
+dna_tidygraph <- function(network, attributes = NULL, ...) {
+  if (length(intersect(c("dna_network_onemode", "dna_network_twomode", "matrix"), class(network))) < 1) {
+    stop("The 'network' argument must provide an object created by the 'dna_network' function or a matrix.")
+  }
+  # Validate 'attributes' only when it is supplied: '&&' binds tighter than '||'
+  # in R, so the column check must be grouped inside the parentheses; otherwise
+  # the default attributes = NULL would trigger this error.
+  if (!is.null(attributes) && (length(intersect(c("dna_attributes", "data.frame"), class(attributes))) < 1 || !"value" %in% colnames(attributes))) {
+    stop("The 'attributes' argument must be NULL or created by the 'dna_getAttributes' function or a data frame with a 'value' column.")
+  }
+  if (!requireNamespace("tidygraph", quietly = TRUE) || utils::packageVersion("tidygraph") < "1.3.1") {
+    stop("The 'dna_tidygraph' function requires the 'tidygraph' package (>= 1.3.1) to be installed.\n",
+         "To do this, enter 'install.packages(\"tidygraph\")'.")
+  }
+
+  # Build the graph: two-mode networks are expanded into an explicit node/edge
+  # list (nodes carry a logical 'type' flag: TRUE = first mode / rows);
+  # one-mode networks are converted directly from the adjacency matrix.
+  if ("dna_network_twomode" %in% class(network)) {
+    nodes <- data.frame(name = c(rownames(network), colnames(network)), type = c(rep(TRUE, nrow(network)), rep(FALSE, ncol(network))), stringsAsFactors = FALSE)
+    edges <- data.frame(from = rep(rownames(network), times = ncol(network)), to = rep(colnames(network), each = nrow(network)), weight = as.vector(network))
+    edges <- edges[edges$weight != 0, ] # drop zero-weight cells (no tie)
+    edges$from <- match(edges$from, nodes$name)
+    edges$to <- match(edges$to, nodes$name)
+    g <- tidygraph::tbl_graph(nodes = nodes, edges = edges, directed = FALSE) # create tbl_graph object for ggraph
+  } else if ("dna_network_onemode" %in% class(network)) {
+    g <- tidygraph::as_tbl_graph(network, directed = FALSE) # create tbl_graph object for ggraph
+  } else {
+    stop("Argument supplied by argument 'network' not recognized.")
+  }
+
+  if (!is.null(attributes)) {
+    nodes <- tidygraph::as_tibble(g, active = "nodes")$name # extract nodes from graph for matching
+    at <- attributes[attributes$value %in% nodes, ] # retain only those attributes present in the network
+    at <- at[match(nodes, at$value), ] # sort attributes in the same order as the nodes in the graph
+    g <- tidygraph::mutate(g, at[, colnames(at) != "value"]) # embed node attributes in graph
+  }
+
+  edges <- tidygraph::as_tibble(g, active = "edges") # extract edges from graph
+  u <- unique(edges$weight) # unique edge weights
+  combined <- length(u) < 5 && any(grepl("combine", attributes(network)$call)) # combined qualifier aggregation?
+  edgecol <- sapply(edges$weight, function(weight) { # create edge colors
+    if (length(u) == 2 & all(sort(u) %in% 0:1) & weight > 0) { # binary: 1 = gray
+      "gray"
+    } else if (combined) { # "combined" qualifier aggregation
+      if (weight == 1) {
+        "green"
+      } else if (weight == 2) {
+        "red"
+      } else if (weight == 3) {
+        "blue"
+      } else {
+        "gray"
+      }
+    } else if (any(u < 0)) { # "subtract" (or something else that generates negative ties)
+      if (weight < 0) {
+        "red"
+      } else {
+        "green"
+      }
+    } else { # any other scale, for example "congruence" qualifier aggregation
+      "gray"
+    }
+  })
+  g <- g |> # assign absolute values, edge colors, and sign as edge attributes
+    tidygraph::activate(edges) |>
+    tidygraph::mutate(abs = abs(.data$weight),
+                      color = edgecol, # local vector, not an edge column: must not use the .data pronoun
+                      sign = ifelse(.data$weight < 0, "negative", "positive"))
+
+  return(g)
+}
\ No newline at end of file
diff --git a/rDNA/rDNA/R/dna_phaseTransitions.R b/rDNA/rDNA/R/dna_phaseTransitions.R
new file mode 100644
index 00000000..6984bc5d
--- /dev/null
+++ b/rDNA/rDNA/R/dna_phaseTransitions.R
@@ -0,0 +1,643 @@
+#' Detect phase transitions and states in a 
discourse network +#' +#' Detect phase transitions and states in a discourse network. +#' +#' This function applies the state dynamics methods of Masuda and Holme to a +#' time window discourse network. It computes temporally overlapping discourse +#' networks, computes the dissimilarity between all networks, and clusters them. +#' For the dissimilarity, the sum of absolute edge weight differences and the +#' Euclidean spectral distance are available. Several clustering techniques can +#' be applied to identify the different stages and phases from the resulting +#' distance matrix. +#' +#' The function offers kernel smoothing, which means the farther away from a +#' time point a statement is, the less important it becomes for the network that +#' is created around the time point. Several kernel smoothing functions are +#' available; see the \code{kernel} argument. +#' +#' @param distanceMethod The distance measure that expresses the dissimilarity +#' between any two network matrices. The following choices are available: +#' \itemize{ +#' \item \code{"absdiff"}: The sum of the cell-wise absolute differences +#' between the two matrices, i.e., the sum of differences in edge weights. +#' This is equivalent to the graph edit distance because the network +#' dimensions are kept constant across all networks by including all nodes +#' at all time points (i.e., by including isolates). +#' \item \code{"spectral"}: The Euclidean distance between the normalized +#' eigenvalues of the graph Laplacian matrices, also called the spectral +#' distance between two network matrices. Any negative values (e.g., from +#' the subtract method) are replaced by zero before computing the +#' distance. +#' } +#' @param clusterMethods The clustering techniques that are applied to the +#' distance matrix in the end. Hierarchical methods are repeatedly cut off at +#' different levels, and solutions are compared using network modularity to +#' pick the best-fitting cluster membership vector. 
Some of the methods are +#' slower than others, hence they are not included by default. It is possible +#' to include any number of methods in the argument. For each included method, +#' the cluster membership vector (i.e., the states over time) along with the +#' associated time stamps of the networks are returned, and the modularity of +#' each included method is computed for comparison. The following methods are +#' available: +#' \itemize{ +#' \item \code{"single"}: Hierarchical clustering with single linkage using +#' the \code{\link[stats]{hclust}} function from the \pkg{stats} package. +#' \item \code{"average"}: Hierarchical clustering with average linkage +#' using the \code{\link[stats]{hclust}} function from the \pkg{stats} +#' package. +#' \item \code{"complete"}: Hierarchical clustering with complete linkage +#' using the \code{\link[stats]{hclust}} function from the \pkg{stats} +#' package. +#' \item \code{"ward"}: Hierarchical clustering with Ward's method (D2) +#' using the \code{\link[stats]{hclust}} function from the \pkg{stats} +#' package. +#' \item \code{"kmeans"}: k-means clustering using the +#' \code{\link[stats]{kmeans}} function from the \pkg{stats} package. +#' \item \code{"pam"}: Partitioning around medoids using the +#' \code{\link[cluster]{pam}} function from the \pkg{cluster} package. +#' \item \code{"spectral"}: Spectral clustering. An affinity matrix using a +#' Gaussian (RBF) kernel is created. The Laplacian matrix of the affinity +#' matrix is computed and normalized. The first first k eigenvectors of +#' the normalized Laplacian matrix are clustered using k-means. +#' \item \code{"concor"}: CONvergence of iterative CORrelations (CONCOR) +#' with exactly \code{k = 2} clusters. (Not included by default because of +#' the limit to \code{k = 2}.) +#' \item \code{"fastgreedy"}: Fast & greedy community detection using the +#' \code{\link[igraph]{cluster_fast_greedy}} function in the \pkg{igraph} +#' package. 
+#' \item \code{"walktrap"}: Walktrap community detection using the +#' \code{\link[igraph]{cluster_walktrap}} function in the \pkg{igraph} +#' package. +#' \item \code{"leading_eigen"}: Leading eigenvector community detection +#' using the \code{\link[igraph]{cluster_leading_eigen}} function in the +#' \pkg{igraph} package. (Can be slow, hence not included by default.) +#' \item \code{"edge_betweenness"}: Girvan-Newman edge betweenness community +#' detection using the \code{\link[igraph]{cluster_edge_betweenness}} +#' function in the \pkg{igraph} package. (Can be slow, hence not included +#' by default.) +#' } +#' @param k.min For the hierarchical cluster methods, how many clusters or +#' states should at least be identified? Only the best solution between +#' \code{k.min} and \code{k.max} clusters is retained and compared to other +#' methods. +#' @param k.max For the hierarchical cluster methods, up to how many clusters or +#' states should be identified? Only the best solution between \code{k.min} +#' and \code{k.max} clusters is retained and compared to other methods. +#' @param cores The number of computing cores for parallel processing. If +#' \code{1} (the default), no parallel processing is used. If a larger number, +#' the \pkg{pbmcapply} package is used to parallelize the clustering. Note +#' that this method is based on forking and is only available on Unix +#' operating systems, including MacOS and Linux. Note also that the remaining +#' computations, including the computation of the distance matrix and the +#' time window network generation with kernel smoothing, are done in parallel +#' using threads in Java, irrespective of this setting, using as many parallel +#' threads as cores are available on the system. +#' @param kernel Use kernel smoothing for computing network time slices? Several +#' kernel smoothing functions are available, similar to kernel density +#' estimation. 
They down-weight statements the farther they are temporally +#' away from the temporal mid-point of the respective time slice. Valid +#' settings are: +#' \itemize{ +#' \item \code{"uniform"}: Weight all statements within a time window +#' equally with a value of \code{0.5}. +#' \item \code{"triangular"}: Use a triangular kernel function. +#' \item \code{"epanechnikov"}: Use an Epanechnikov kernel smoother. +#' \item \code{"gaussian"}: Use a standard normal distribution as a kernel +#' smoother. +#' \item \code{"no"}: Circumvent kernel smoothing and weight all statements +#' with a value of \code{1.0}. This is a legacy setting and is slow and +#' may not return the same results as \code{"uniform"} due to the way it +#' was written up. +#' } +#' @param normalizeToOne Divide all cells by the sum of all cells before +#' computing the dissimilarity between two network matrices? This +#' normalization scales all edge weights to a sum of \code{1.0}. Doing so can +#' make networks more comparable by boosting the edge weights of networks that +#' are relatively sparsely populated by concepts, for example at the beginning +#' or end of the debate. Note that this normalization should not make any +#' difference with Euclidean spectral distances of the graph Laplacian because +#' the eigenvalues are normalized to sum to one in this distance method. +#' @param indentTime If \code{TRUE}, the sequence of time slices under the time +#' window algorithm starts with the first network and ends with the last +#' network that are entirely covered within the timeline defined by the start +#' and stop dates and times. 
For example, if the start date is 1 February, the +#' stop date is 31 December, and the time window duration is 21 days, the +#' mid-point of the first time window will be 11 February (to ensure the first +#' network entirely fits into the timeline), and the last network will be +#' centered around 20 December (to ensure the last network entirely fits into +#' the timeline). If \code{FALSE}, the start and stop dates and times are used +#' as the first and last mid-points. In that case, the first and last few +#' networks may contain fewer statements than other time slices and may, +#' therefore, be more similar to each other. This can potentially be +#' counter-acted by setting the \code{normalizeToOne} argument. +#' @inheritParams dna_network +#' +#' @examples +#' \dontrun{ +#' library("ggplot2") +#' dna_init() +#' dna_sample() +#' dna_openDatabase("sample.dna", coderId = 1, coderPassword = "sample") +#' +#' # compute states and phases for sample dataset +#' results <- dna_phaseTransitions(distanceMethod = "spectral", +#' clusterMethods = c("ward", +#' "pam", +#' "concor", +#' "walktrap"), +#' k.min = 2, +#' k.max = 6, +#' networkType = "onemode", +#' variable1 = "organization", +#' variable2 = "concept", +#' timeWindow = "days", +#' windowSize = 15, +#' kernel = "gaussian", +#' indentTime = FALSE, +#' normalizeToOne = FALSE) +#' results +#' autoplot(results) +#' +#' # access individual plots +#' plots <- autoplot(results) +#' plots[[1]] # show heatmap +#' plots[[2]] # show cluster silhouettes +#' plots[[3]] # show temporal embedding +#' plots[[4]] # show state dynamics +#' +#' # save plots to combined PDF +#' library("ggplotify") # needed to convert heatmap to ggplot diagram +#' library("patchwork") # needed to merge plots into 4 x 4 diagram +#' p1 <- ggplotify::as.ggplot(plots[[1]]) +#' p <- p1 + plots[[2]] + plots[[3]] + plots[[4]] + plot_layout(ncol = 2) +#' ggsave(filename = "phase_transitions.pdf", p, width = 14, height = 12) +#' } +#' +#' @rdname 
dna_phaseTransitions +#' @author Philip Leifeld +#' @importFrom stats dist +#' @importFrom utils combn +#' @importFrom rJava .jarray .jcall .jnull J +#' @export +dna_phaseTransitions <- function(distanceMethod = "absdiff", + clusterMethods = c("single", + "average", + "complete", + "ward", + "kmeans", + "pam", + "spectral", + "fastgreedy", + "walktrap"), + k.min = 2, + k.max = 6, + cores = 1, + networkType = "twomode", + statementType = "DNA Statement", + variable1 = "organization", + variable1Document = FALSE, + variable2 = "concept", + variable2Document = FALSE, + qualifier = "agreement", + qualifierDocument = FALSE, + qualifierAggregation = "subtract", + normalization = "no", + duplicates = "document", + start.date = "01.01.1900", + stop.date = "31.12.2099", + start.time = "00:00:00", + stop.time = "23:59:59", + timeWindow = "days", + windowSize = 200, + kernel = "uniform", + normalizeToOne = TRUE, + indentTime = FALSE, + excludeValues = list(), + excludeAuthors = character(), + excludeSources = character(), + excludeSections = character(), + excludeTypes = character(), + invertValues = FALSE, + invertAuthors = FALSE, + invertSources = FALSE, + invertSections = FALSE, + invertTypes = FALSE) { + + # check arguments and packages + if (distanceMethod == "spectral" && networkType == "twomode") { + distanceMethod <- "absdiff" + warning("Spectral distances only work with one-mode networks. Using 'distanceMethod = \"absdiff\"' instead.") + } + if (cores > 1 && !requireNamespace("pbmcapply", quietly = TRUE)) { + pbmclapply <- FALSE + warning("Argument 'cores' requires the 'pbmcapply' package, which is not installed.\nSetting 'cores = 1'. 
Consider installing the 'pbmcapply' package if you use Linux or MacOS.") + } + igraphMethods <- c("louvain", "fastgreedy", "walktrap", "leading_eigen", "edge_betweenness", "infomap", "label_prop", "spinglass") + if (any(igraphMethods %in% clusterMethods) && !requireNamespace("igraph", quietly = TRUE)) { + clusterMethods <- clusterMethods[-igraphMethods] + warning("'igraph' package not installed. Dropping clustering methods from the 'igraph' package. Consider installing 'igraph'.") + } + if ("pam" %in% clusterMethods && !requireNamespace("cluster", quietly = TRUE)) { + clusterMethods <- clusterMethods[which(clusterMethods != "pam")] + warning("'cluster' package not installed. Dropping clustering methods from the 'cluster' package. Consider installing 'cluster'.") + } + if ("concor" %in% clusterMethods && k.min > 2) { + clusterMethods <- clusterMethods[which(clusterMethods != "concor")] + warning("Dropping 'concor' from clustering methods because the CONCOR implementation in rDNA can only find exactly two clusters, but the 'k.min' argument was larger than 2.") + } + clusterMethods <- rev(clusterMethods) # reverse order to save time during parallel computation by starting the computationally intensive methods first + mcall <- match.call() # save the arguments for storing them in the results later + + # generate the time window networks + if (is.null(timeWindow) || is.na(timeWindow) || !is.character(timeWindow) || length(timeWindow) != 1 || !timeWindow %in% c("events", "seconds", "minutes", "hours", "days", "weeks", "months", "years")) { + timeWindow <- "events" + warning("The 'timeWindow' argument was invalid. 
Proceeding with 'timeWindow = \"events\" instead.") + } + + # wrap the vectors of exclude values for document variables into Java arrays + excludeAuthors <- .jarray(excludeAuthors) + excludeSources <- .jarray(excludeSources) + excludeSections <- .jarray(excludeSections) + excludeTypes <- .jarray(excludeTypes) + + # compile exclude variables and values vectors + dat <- matrix("", nrow = length(unlist(excludeValues)), ncol = 2) + count <- 0 + if (length(excludeValues) > 0) { + for (i in 1:length(excludeValues)) { + if (length(excludeValues[[i]]) > 0) { + for (j in 1:length(excludeValues[[i]])) { + count <- count + 1 + dat[count, 1] <- names(excludeValues)[i] + dat[count, 2] <- excludeValues[[i]][j] + } + } + } + var <- dat[, 1] + val <- dat[, 2] + } else { + var <- character() + val <- character() + } + var <- .jarray(var) # array of variable names of each excluded value + val <- .jarray(val) # array of values to be excluded + + # encode R NULL as Java null value if necessary + if (is.null(qualifier) || is.na(qualifier)) { + qualifier <- .jnull(class = "java/lang/String") + } + + # call rNetwork function to compute results + .jcall(dna_getHeadlessDna(), + "V", + "rTimeWindow", + networkType, + statementType, + variable1, + variable1Document, + variable2, + variable2Document, + qualifier, + qualifierDocument, + qualifierAggregation, + normalization, + TRUE, + duplicates, + start.date, + stop.date, + start.time, + stop.time, + timeWindow, + as.integer(windowSize), + kernel, + normalizeToOne, + indentTime, + var, + val, + excludeAuthors, + excludeSources, + excludeSections, + excludeTypes, + invertValues, + invertAuthors, + invertSources, + invertSections, + invertTypes + ) + exporter <- dna_getHeadlessDna()$getExporter() # save Java object reference to exporter class + + # compute distance matrix + if (distanceMethod == "modularity") { + stop("Differences in modularity have not been implemented yet. 
Please use absolute differences or spectral Euclidean distance as a distance method.") + } else if (!distanceMethod %in% c("absdiff", "spectral")) { + stop("Distance method not recognized. Try \"absdiff\" or \"spectral\".") + } + distance_mat <- .jcall(exporter, + "[[D", + "computeDistanceMatrix", + distanceMethod, + simplify = TRUE) + distance_mat <- distance_mat / max(distance_mat) # rescale between 0 and 1 + + # retrieve mid-point dates (gamma) + m <- .jcall(exporter, "[Lexport/Matrix;", "getMatrixResultsArray") # get list of Matrix objects from Exporter object + dates <- sapply(m, function(x) .jcall(x, "J", "getDateTimeLong")) # long integers, still needs conversion to date + + # define clustering function + hclustMethods <- c("single", "average", "complete", "ward") + cl <- function(method, distmat) { + tryCatch({ + similarity_mat <- 1 - distmat + g <- igraph::graph_from_adjacency_matrix(similarity_mat, mode = "undirected", weighted = TRUE, diag = FALSE) # graph needs to be based on similarity, not distance + if (method %in% hclustMethods) { + if (method == "single") { + suppressWarnings(cl <- stats::hclust(as.dist(distmat), method = "single")) + } else if (method == "average") { + suppressWarnings(cl <- stats::hclust(as.dist(distmat), method = "average")) + } else if (method == "complete") { + suppressWarnings(cl <- stats::hclust(as.dist(distmat), method = "complete")) + } else if (method == "ward") { + suppressWarnings(cl <- stats::hclust(as.dist(distmat), method = "ward.D2")) + } + opt_k <- lapply(k.min:k.max, function(x) { + mem <- stats::cutree(cl, k = x) + mod <- igraph::modularity(x = g, weights = igraph::E(g)$weight, membership = mem) + return(list(mem = mem, mod = mod)) + }) + mod <- sapply(opt_k, function(x) x$mod) + kk <- which.max(mod) + mem <- opt_k[[kk]]$mem + } else if (method == "kmeans") { + opt_k <- lapply(k.min:k.max, function(x) { + suppressWarnings(cl <- stats::kmeans(distmat, centers = x)) + mem <- cl$cluster + mod <- igraph::modularity(x 
= g, weights = igraph::E(g)$weight, membership = mem) + return(list(cl = cl, mem = mem, mod = mod)) + }) + mod <- sapply(opt_k, function(x) x$mod) + kk <- which.max(mod) + mem <- opt_k[[kk]]$mem + } else if (method == "pam") { + opt_k <- lapply(k.min:k.max, function(x) { + suppressWarnings(cl <- cluster::pam(distmat, k = x)) + mem <- cl$cluster + mod <- igraph::modularity(x = g, weights = igraph::E(g)$weight, membership = mem) + return(list(cl = cl, mem = mem, mod = mod)) + }) + mod <- sapply(opt_k, function(x) x$mod) + kk <- which.max(mod) + mem <- opt_k[[kk]]$mem + } else if (method == "spectral") { + sigma <- 1.0 + affinity_matrix <- exp(-distmat^2 / (2 * sigma^2)) + L <- diag(rowSums(affinity_matrix)) - affinity_matrix + D.sqrt.inv <- diag(1 / sqrt(rowSums(affinity_matrix))) + L.norm <- D.sqrt.inv %*% L %*% D.sqrt.inv + eigenvalues <- eigen(L.norm) # eigenvalue decomposition + opt_k <- lapply(k.min:k.max, function(x) { + U <- eigenvalues$vectors[, 1:x] + mem <- kmeans(U, centers = x)$cluster # cluster the eigenvectors + mod <- igraph::modularity(x = g, weights = igraph::E(g)$weight, membership = mem) + return(list(mem = mem, mod = mod)) + }) + mod <- sapply(opt_k, function(x) x$mod) + kk <- which.max(mod) + mem <- opt_k[[kk]]$mem + } else if (method == "concor") { + suppressWarnings(mi <- stats::cor(similarity_mat)) + iter <- 1 + while (any(abs(mi) <= 0.999) & iter <= 50) { + mi[is.na(mi)] <- 0 + mi <- stats::cor(mi) + iter <- iter + 1 + } + mem <- ((mi[, 1] > 0) * 1) + 1 + } else if (method %in% igraphMethods) { + if (method == "fastgreedy") { + suppressWarnings(cl <- igraph::cluster_fast_greedy(g)) + } else if (method == "walktrap") { + suppressWarnings(cl <- igraph::cluster_walktrap(g)) + } else if (method == "leading_eigen") { + suppressWarnings(cl <- igraph::cluster_leading_eigen(g)) + } else if (method == "edge_betweenness") { + suppressWarnings(cl <- igraph::cluster_edge_betweenness(g)) + } else if (method == "spinglass") { + suppressWarnings(cl <- 
igraph::cluster_spinglass(g)) + } + opt_k <- lapply(k.min:k.max, function(x) { + mem <- igraph::cut_at(communities = cl, no = x) + mod <- igraph::modularity(x = g, weights = igraph::E(g)$weight, membership = mem) + return(list(mem = mem, mod = mod)) + }) + mod <- sapply(opt_k, function(x) x$mod) + kk <- which.max(mod) + mem <- opt_k[[kk]]$mem + } + list(method = method, + modularity = igraph::modularity(x = g, weights = igraph::E(g)$weight, membership = mem), + memberships = mem) + }, + error = function(e) { + warning("Cluster method '", method, "' could not be computed due to an error: ", e) + }, + warning = function(w) { + warning("Cluster method '", method, "' threw a warning: ", w) + }) + } + + # apply all clustering methods to distance matrix + if (cores > 1) { + cat(paste("Clustering distance matrix on", cores, "cores.\n")) + a <- Sys.time() + l <- pbmcapply::pbmclapply(clusterMethods, cl, distmat = distance_mat, mc.cores = cores) + b <- Sys.time() + } else { + cat("Clustering distance matrix... ") + a <- Sys.time() + l <- lapply(clusterMethods, cl, distmat = distance_mat) + b <- Sys.time() + cat(intToUtf8(0x2714), "\n") + } + print(b - a) + for (i in length(l):1) { + if (length(l[[i]]) == 1) { + l <- l[-i] + clusterMethods <- clusterMethods[-i] + } + } + results <- list() + mod <- sapply(l, function(x) x$modularity) + best <- which(mod == max(mod))[1] + results$modularity <- mod[best] + results$clusterMethod <- clusterMethods[best] + + # temporal embedding via MDS + if (!requireNamespace("MASS", quietly = TRUE)) { + mem <- data.frame("date" = as.POSIXct(dates, tz = "UTC", origin = "1970-01-01"), + "state" = l[[best]]$memberships) + results$states <- mem + warning("Skipping temporal embedding because the 'MASS' package is not installed. 
Consider installing it.") + } else { + cat("Temporal embedding...\n") + a <- Sys.time() + distmat <- distance_mat + 1e-12 + mds <- MASS::isoMDS(distmat) # MDS of distance matrix + points <- mds$points + mem <- data.frame("date" = as.POSIXct(dates, tz = "UTC", origin = "1970-01-01"), + "state" = l[[best]]$memberships, + "X1" = points[, 1], + "X2" = points[, 2]) + results$states <- mem + b <- Sys.time() + print(b - a) + } + + results$distmat <- distance_mat + class(results) <- "dna_phaseTransitions" + attributes(results)$stress <- ifelse(ncol(results$states) == 2, NA, mds$stress) + attributes(results)$call <- mcall + return(results) +} + +#' Print the summary of a \code{dna_phaseTransitions} object +#' +#' Show details of a \code{dna_phaseTransitions} object. +#' +#' Print a summary of a \code{dna_phaseTransitions} object, which can be created +#' using the \link{dna_phaseTransitions} function. +#' +#' @param x A \code{dna_phaseTransitions} object. +#' @param ... Further options (currently not used). +#' +#' @author Philip Leifeld +#' +#' @rdname dna_phaseTransitions +#' @importFrom utils head +#' @export +print.dna_phaseTransitions <- function(x, ...) { + cat(paste0("States: ", max(x$states$state), ". Cluster method: ", x$clusterMethod, ". Modularity: ", round(x$modularity, 3), ".\n\n")) + print(utils::head(x$states, 20)) + cat(paste0("...", nrow(x$states), " further rows\n")) +} + +#' @rdname dna_phaseTransitions +#' @param object A \code{"dna_phaseTransitions"} object. +#' @param ... Additional arguments. Currently not in use. +#' @param plots The plots to include in the output list. Can be one or more of +#' the following: \code{"heatmap"}, \code{"silhouette"}, \code{"mds"}, +#' \code{"states"}. 
+#' +#' @author Philip Leifeld, Kristijan Garic +#' @importFrom ggplot2 autoplot ggplot aes geom_line geom_point xlab ylab +#' labs ggtitle theme_bw theme arrow unit scale_shape_manual element_text +#' scale_x_datetime scale_colour_manual guides +#' @importFrom rlang .data +#' @export +autoplot.dna_phaseTransitions <- function(object, ..., plots = c("heatmap", "silhouette", "mds", "states")) { + # settings for all plots + k <- max(object$states$state) + shapes <- c(21:25, 0:14)[1:k] + l <- list() + + # heatmap + if ("heatmap" %in% plots) { + try({ + if (!requireNamespace("heatmaply", quietly = TRUE)) { + warning("Heatmap skipped because the 'heatmaply' package is not installed.") + } else { + l[[length(l) + 1]] <- heatmaply::ggheatmap(1 - object$distmat, + dendrogram = "both", + showticklabels = FALSE, # remove axis labels + show_dendrogram = TRUE, + hide_colorbar = TRUE) + } + }) + } + + # silhouette plot + if ("silhouette" %in% plots) { + try({ + if (!requireNamespace("cluster", quietly = TRUE)) { + warning("Silhouette plot skipped because the 'cluster' package is not installed.") + } else if (!requireNamespace("factoextra", quietly = TRUE)) { + warning("Silhouette plot skipped because the 'factoextra' package is not installed.") + } else { + sil <- cluster::silhouette(object$states$state, dist(object$distmat)) + l[[length(l) + 1]] <- factoextra::fviz_silhouette(sil, print.summary = FALSE) + + ggplot2::ggtitle(paste0("Cluster silhouettes (mean width: ", round(mean(sil[, 3]), 3), ")")) + + ggplot2::ylab("Silhouette width") + + ggplot2::labs(fill = "State", color = "State") + + ggplot2::theme_classic() + + ggplot2::theme(axis.text.x = element_blank(), axis.ticks.x = element_blank()) + } + }) + } + + # temporal embedding + if ("mds" %in% plots) { + try({ + if (is.na(attributes(object)$stress)) { + warning("No temporal embedding found. 
Skipping this plot.") + } else if (!requireNamespace("igraph", quietly = TRUE)) { + warning("Temporal embedding plot skipped because the 'igraph' package is not installed.") + } else if (!requireNamespace("ggraph", quietly = TRUE)) { + warning("Temporal embedding plot skipped because the 'ggraph' package is not installed.") + } else { + nodes <- object$states + nodes$date <- as.character(nodes$date) + nodes$State <- as.factor(nodes$state) + + # Extract state values + state_values <- nodes$State + + edges <- data.frame(sender = as.character(object$states$date), + receiver = c(as.character(object$states$date[2:(nrow(object$states))]), "NA")) + edges <- edges[-nrow(edges), ] + g <- igraph::graph_from_data_frame(edges, directed = TRUE, vertices = nodes) + l[[length(l) + 1]] <- ggraph::ggraph(g, layout = "manual", x = igraph::V(g)$X1, y = igraph::V(g)$X2) + + ggraph::geom_edge_link(arrow = ggplot2::arrow(type = "closed", length = ggplot2::unit(2, "mm")), + start_cap = ggraph::circle(1, "mm"), + end_cap = ggraph::circle(2, "mm")) + + ggraph::geom_node_point(ggplot2::aes(shape = state_values, fill = state_values), size = 2) + + ggplot2::scale_shape_manual(values = shapes) + + ggplot2::ggtitle("Temporal embedding (MDS)") + + ggplot2::xlab("Dimension 1") + + ggplot2::ylab("Dimension 2") + + ggplot2::theme_bw() + + ggplot2::guides(size = "none") + + ggplot2::labs(shape = "State", fill = "State") + } + }) + } + + # state dynamics + if ("states" %in% plots) { + try({ + d <- data.frame( + time = object$states$date, + id = cumsum(c(TRUE, diff(object$states$state) != 0)), + State = factor(object$states$state, levels = 1:k, labels = paste("State", 1:k)), + time1 = as.Date(object$states$date) + ) + + # Extracting values + time_values <- d$time + state_values <- d$State + id_values <- d$id + + l[[length(l) + 1]] <- ggplot2::ggplot(d, ggplot2::aes(x = time_values, y = state_values, colour = state_values)) + + ggplot2::geom_line(aes(group = 1), linewidth = 2, color = "black", lineend 
= "square") + + ggplot2::geom_line(aes(group = id_values), linewidth = 2, lineend = "square") + + ggplot2::scale_x_datetime(date_labels = "%b %Y", breaks = "4 months") + # format x-axis as month year + ggplot2::xlab("Time") + + ggplot2::ylab("") + + ggplot2::ggtitle("State dynamics") + + ggplot2::theme_bw() + + ggplot2::theme(axis.text.x = ggplot2::element_text(angle = 45, hjust = 1)) + + ggplot2::guides(linewidth = "none") + + ggplot2::labs(color = "State") + }) + } + + return(l) +} \ No newline at end of file diff --git a/rDNA/rDNA/R/rDNA.R b/rDNA/rDNA/R/rDNA.R index 7a93ee6a..288124d4 100644 --- a/rDNA/rDNA/R/rDNA.R +++ b/rDNA/rDNA/R/rDNA.R @@ -796,4312 +796,4 @@ dna_getAttributes <- function(statementType = NULL, colnames(dat) <- varNames class(dat) <- c("dna_attributes", class(dat)) return(dat) -} - - -# Networks --------------------------------------------------------------------- - -#' Compute and retrieve a network -#' -#' Compute and retrieve a network from DNA. -#' -#' This function serves to compute a one-mode or two-mode network or an event -#' list in DNA and retrieve it as a matrix or data frame, respectively. The -#' arguments resemble the export options in DNA. It is also possible to compute -#' a temporal sequence of networks using the moving time window approach, in -#' which case the networks are retrieved as a list of matrices. -#' -#' @param networkType The kind of network to be computed. Can be -#' \code{"twomode"}, \code{"onemode"}, or \code{"eventlist"}. -#' @param statementType The name of the statement type in which the variable -#' of interest is nested. For example, \code{"DNA Statement"}. -#' @param variable1 The first variable for network construction. In a one-mode -#' network, this is the variable for both the rows and columns. In a -#' two-mode network, this is the variable for the rows only. In an event -#' list, this variable is only used to check for duplicates (depending on -#' the setting of the \code{duplicates} argument). 
-#' @param variable1Document A boolean value indicating whether the first -#' variable is at the document level (i.e., \code{"author"}, -#' \code{"source"}, \code{"section"}, \code{"type"}, \code{"id"}, or -#' \code{"title"}). -#' @param variable2 The second variable for network construction. In a one-mode -#' network, this is the variable over which the ties are created. For -#' example, if an organization x organization network is created, and ties -#' in this network indicate co-reference to a concept, then the second -#' variable is the \code{"concept"}. In a two-mode network, this is the -#' variable used for the columns of the network matrix. In an event list, -#' this variable is only used to check for duplicates (depending on the -#' setting of the \code{duplicates} argument). -#' @param variable2Document A boolean value indicating whether the second -#' variable is at the document level (i.e., \code{"author"}, -#' \code{"source"}, \code{"section"}, \code{"type"}, \code{"id"}, or -#' \code{"title"} -#' @param qualifier The qualifier variable. In a one-mode network, this -#' variable can be used to count only congruence or conflict ties. For -#' example, in an organization x organization network via common concepts, -#' a binary \code{"agreement"} qualifier could be used to record only ties -#' where both organizations have a positive stance on the concept or where -#' both organizations have a negative stance on the concept. With an -#' integer qualifier, the tie weight between the organizations would be -#' proportional to the similarity or distance between the two organizations -#' on the scale of the integer variable. With a short text variable as a -#' qualifier, agreement on common categorical values of the qualifier is -#' required, for example a tie is established (or a tie weight increased) if -#' two actors both refer to the same value on the second variable AND match on -#' the categorical qualifier, for example the type of referral. 
-#' -#' In a two-mode network, the qualifier variable can be used to retain only -#' positive or only negative statements or subtract negative from positive -#' mentions. All of this depends on the setting of the -#' \code{qualifierAggregation} argument. For event lists, the qualifier -#' variable is only used for filtering out duplicates (depending on the -#' setting of the \code{duplicates} argument. -#' -#' The qualifier can also be \code{NULL}, in which case it is ignored, meaning -#' that values in \code{variable1} and \code{variable2} are unconditionally -#' associated with each other in the network when they co-occur. This is -#' identical to selecting a qualifier variable and setting -#' \code{qualifierAggregation = "ignore"}. -#' @param qualifierDocument A boolean value indicating whether the qualifier -#' variable is at the document level (i.e., \code{"author"}, -#' \code{"source"}, \code{"section"}, \code{"type"}, \code{"id"}, or -#' \code{"title"} -#' @param qualifierAggregation The aggregation rule for the \code{qualifier} -#' variable. In one-mode networks, this must be \code{"ignore"} (for -#' ignoring the qualifier variable), \code{"congruence"} (for recording a -#' network tie only if both nodes have the same qualifier value in the -#' binary case or for recording the similarity between the two nodes on the -#' qualifier variable in the integer case), \code{"conflict"} (for -#' recording a network tie only if both nodes have a different qualifier -#' value in the binary case or for recording the distance between the two -#' nodes on the qualifier variable in the integer case), or -#' \code{"subtract"} (for subtracting the conflict tie value from the -#' congruence tie value in each dyad). In two-mode networks, this must be -#' \code{"ignore"}, \code{"combine"} (for creating multiplex combinations, -#' e.g., 1 for positive, 2 for negative, and 3 for mixed), or -#' \code{subtract} (for subtracting negative from positive ties). 
In event -#' lists, this setting is ignored. -#' @param normalization Normalization of edge weights. Valid settings for -#' one-mode networks are \code{"no"} (for switching off normalization), -#' \code{"average"} (for average activity normalization), \code{"jaccard"} -#' (for Jaccard coefficient normalization), and \code{"cosine"} (for -#' cosine similarity normalization). Valid settings for two-mode networks -#' are \code{"no"}, \code{"activity"} (for activity normalization), and -#' \code{"prominence"} (for prominence normalization). -#' @param isolates Should all nodes of the respective variable be included in -#' the network matrix (\code{isolates = TRUE}), or should only those nodes -#' be included that are active in the current time period and are not -#' excluded (\code{isolates = FALSE})? -#' @param duplicates Setting for excluding duplicate statements before network -#' construction. Valid settings are \code{"include"} (for including all -#' statements in network construction), \code{"document"} (for counting -#' only one identical statement per document), \code{"week"} (for counting -#' only one identical statement per calendar week), \code{"month"} (for -#' counting only one identical statement per calendar month), \code{"year"} -#' (for counting only one identical statement per calendar year), and -#' \code{"acrossrange"} (for counting only one identical statement across -#' the whole time range). -#' @param start.date The start date for network construction in the format -#' \code{"dd.mm.yyyy"}. All statements before this date will be excluded. -#' @param start.time The start time for network construction on the specified -#' \code{start.date}. All statements before this time on the specified date -#' will be excluded. -#' @param stop.date The stop date for network construction in the format -#' \code{"dd.mm.yyyy"}. All statements after this date will be excluded. 
-#' @param stop.time The stop time for network construction on the specified -#' \code{stop.date}. All statements after this time on the specified date -#' will be excluded. -#' @param timeWindow Possible values are \code{"no"}, \code{"events"}, -#' \code{"seconds"}, \code{"minutes"}, \code{"hours"}, \code{"days"}, -#' \code{"weeks"}, \code{"months"}, and \code{"years"}. If \code{"no"} is -#' selected (= the default setting), no time window will be used. If any of -#' the time units is selected, a moving time window will be imposed, and -#' only the statements falling within the time period defined by the window -#' will be used to create the network. The time window will then be moved -#' forward by one time unit at a time, and a new network with the new time -#' boundaries will be created. This is repeated until the end of the overall -#' time span is reached. All time windows will be saved as separate -#' networks in a list. The duration of each time window is defined by the -#' \code{windowSize} argument. For example, this could be used to create a -#' time window of 6 months which moves forward by one month each time, thus -#' creating time windows that overlap by five months. If \code{"events"} is -#' used instead of a natural time unit, the time window will comprise -#' exactly as many statements as defined in the \code{windowSize} argument. -#' However, if the start or end statement falls on a date and time where -#' multiple events happen, those additional events that occur simultaneously -#' are included because there is no other way to decide which of the -#' statements should be selected. Therefore the window size is sometimes -#' extended when the start or end point of a time window is ambiguous in -#' event time. -#' @param windowSize The number of time units of which a moving time window is -#' comprised. This can be the number of statement events, the number of days -#' etc., as defined in the \code{"timeWindow"} argument. 
-#' @param kernel Use kernel smoothing for computing time windows? This option -#' only matters if the \code{timeWindow} argument has a value other than -#' \code{"no"} or \code{"event"}. The default value \code{kernel = "no"} -#' switches off kernel smoothing, which means all statements within a time -#' window are weighted equally. Other values down-weight statements the -#' farther they are temporally away from the mid-point of the time window. -#' Several kernel smoothing functions are available, similar to kernel density -#' estimation: \code{"uniform"} is similar to \code{"no"} and weights all -#' statements with a value of \code{0.5}. \code{"gaussian"} uses a standard -#' normal distribution as a kernel smoother. \code{"epanechnikov"} uses an -#' Epanechnikov kernel smoother. \code{"triangular"} uses a triangular kernel -#' function. If in doubt, do not use kernel smoothing. -#' @param excludeValues A list of named character vectors that contains entries -#' which should be excluded during network construction. For example, -#' \code{list(concept = c("A", "B"), organization = c("org A", "org B"))} -#' would exclude all statements containing concepts "A" or "B" or -#' organizations "org A" or "org B" when the network is constructed. This -#' is irrespective of whether these values appear in \code{variable1}, -#' \code{variable2}, or the \code{qualifier}. Note that only variables at -#' the statement level can be used here. There are separate arguments for -#' excluding statements nested in documents with certain meta-data. -#' @param excludeAuthors A character vector of authors. If a statement is -#' nested in a document where one of these authors is set in the "Author" -#' meta-data field, the statement is excluded from network construction. -#' @param excludeSources A character vector of sources. 
If a statement is -#' nested in a document where one of these sources is set in the "Source" -#' meta-data field, the statement is excluded from network construction. -#' @param excludeSections A character vector of sections. If a statement is -#' nested in a document where one of these sections is set in the "Section" -#' meta-data field, the statement is excluded from network construction. -#' @param excludeTypes A character vector of types. If a statement is -#' nested in a document where one of these types is set in the "Type" -#' meta-data field, the statement is excluded from network construction. -#' @param invertValues A boolean value indicating whether the entries provided -#' by the \code{excludeValues} argument should be excluded from network -#' construction (\code{invertValues = FALSE}) or if they should be the only -#' values that should be included during network construction -#' (\code{invertValues = TRUE}). -#' @param invertAuthors A boolean value indicating whether the entries provided -#' by the \code{excludeAuthors} argument should be excluded from network -#' construction (\code{invertAuthors = FALSE}) or if they should be the -#' only values that should be included during network construction -#' (\code{invertAuthors = TRUE}). -#' @param invertSources A boolean value indicating whether the entries provided -#' by the \code{excludeSources} argument should be excluded from network -#' construction (\code{invertSources = FALSE}) or if they should be the -#' only values that should be included during network construction -#' (\code{invertSources = TRUE}). -#' @param invertSections A boolean value indicating whether the entries -#' provided by the \code{excludeSections} argument should be excluded from -#' network construction (\code{invertSections = FALSE}) or if they should -#' be the only values that should be included during network construction -#' (\code{invertSections = TRUE}). 
-#' @param invertTypes A boolean value indicating whether the entries provided -#' by the \code{excludeTypes} argument should be excluded from network -#' construction (\code{invertTypes = FALSE}) or if they should be the -#' only values that should be included during network construction -#' (\code{invertTypes = TRUE}). -#' @param fileFormat An optional file format specification for saving the -#' resulting network(s) to a file instead of returning an object. Valid values -#' are \code{"csv"} (for network matrices or event lists), \code{"dl"} (for -#' UCINET DL full-matrix files), and \code{"graphml"} (for visone .graphml -#' files). -#' @param outfile An optional output file name for saving the resulting -#' network(s) to a file instead of returning an object. -#' -#' @examples -#' \dontrun{ -#' dna_init() -#' dna_sample() -#' dna_openDatabase("sample.dna", coderId = 1, coderPassword = "sample") -#' nw <- dna_network(networkType = "onemode", -#' variable1 = "organization", -#' variable2 = "concept", -#' qualifier = "agreement", -#' qualifierAggregation = "congruence", -#' normalization = "average", -#' excludeValues = list("concept" = -#' c("There should be legislation to regulate emissions."))) -#' } -#' -#' @author Philip Leifeld -#' -#' @family networks -#' -#' @importFrom rJava .jarray -#' @importFrom rJava .jcall -#' @importFrom rJava .jnull -#' @importFrom rJava J -#' @export -dna_network <- function(networkType = "twomode", - statementType = "DNA Statement", - variable1 = "organization", - variable1Document = FALSE, - variable2 = "concept", - variable2Document = FALSE, - qualifier = "agreement", - qualifierDocument = FALSE, - qualifierAggregation = "ignore", - normalization = "no", - isolates = FALSE, - duplicates = "include", - start.date = "01.01.1900", - stop.date = "31.12.2099", - start.time = "00:00:00", - stop.time = "23:59:59", - timeWindow = "no", - windowSize = 100, - kernel = "no", - excludeValues = list(), - excludeAuthors = character(), - 
excludeSources = character(), - excludeSections = character(), - excludeTypes = character(), - invertValues = FALSE, - invertAuthors = FALSE, - invertSources = FALSE, - invertSections = FALSE, - invertTypes = FALSE, - fileFormat = NULL, - outfile = NULL) { - - # wrap the vectors of exclude values for document variables into Java arrays - excludeAuthors <- .jarray(excludeAuthors) - excludeSources <- .jarray(excludeSources) - excludeSections <- .jarray(excludeSections) - excludeTypes <- .jarray(excludeTypes) - - # compile exclude variables and values vectors - dat <- matrix("", nrow = length(unlist(excludeValues)), ncol = 2) - count <- 0 - if (length(excludeValues) > 0) { - for (i in 1:length(excludeValues)) { - if (length(excludeValues[[i]]) > 0) { - for (j in 1:length(excludeValues[[i]])) { - count <- count + 1 - dat[count, 1] <- names(excludeValues)[i] - dat[count, 2] <- excludeValues[[i]][j] - } - } - } - var <- dat[, 1] - val <- dat[, 2] - } else { - var <- character() - val <- character() - } - var <- .jarray(var) # array of variable names of each excluded value - val <- .jarray(val) # array of values to be excluded - - # encode R NULL as Java null value if necessary - if (is.null(qualifier) || is.na(qualifier)) { - qualifier <- .jnull(class = "java/lang/String") - } - if (is.null(fileFormat)) { - fileFormat <- .jnull(class = "java/lang/String") - } - if (is.null(outfile)) { - outfile <- .jnull(class = "java/lang/String") - } - - # call rNetwork function to compute results - .jcall(dna_getHeadlessDna(), - "V", - "rNetwork", - networkType, - statementType, - variable1, - variable1Document, - variable2, - variable2Document, - qualifier, - qualifierDocument, - qualifierAggregation, - normalization, - isolates, - duplicates, - start.date, - stop.date, - start.time, - stop.time, - timeWindow, - as.integer(windowSize), - kernel, - var, - val, - excludeAuthors, - excludeSources, - excludeSections, - excludeTypes, - invertValues, - invertAuthors, - invertSources, - 
invertSections, - invertTypes, - outfile, - fileFormat - ) - - exporter <- .jcall(dna_getHeadlessDna(), "Lexport/Exporter;", "getExporter") # get a reference to the Exporter object, in which results are stored - - if (networkType == "eventlist") { # assemble an event list in the form of a data frame of filtered statements - f <- J(exporter, "getFilteredStatements", simplify = TRUE) # array list of filtered export statements; use J because array list return type not recognized using .jcall - l <- list() # create a list for filtered statements, later to be converted to data frame, with one row per statement - for (i in seq(.jcall(f, "I", "size")) - 1) { # loop through filtered statements, starting at 0 - fi <- f$get(as.integer(i)) # retrieve filtered statement i - row <- list() # each filtered export statement is represented by a list, with multiple slots for the variables etc. - row$statement_id <- .jcall(fi, "I", "getId") # store the statement ID - row$time <- .jcall(fi, "J", "getDateTimeLong") # store the date/time in seconds since 1 January 1970; will be converted to POSIXct later because the conversion to data frame otherwise converts it back to long anyway - values <- J(fi, "getValues") # array list of variables with values; use J instead of .jcall because array list return type not recognized using .jcall - for (j in seq(.jcall(values, "I", "size")) - 1) { # loop through the variables - vi <- values$get(as.integer(j)) # save variable/value j temporarily to access its contents - dataType <- .jcall(vi, "S", "getDataType") # the data type of value j - if (dataType == "long text") { - row[[.jcall(vi, "S", "getKey")]] <- .jcall(vi, "S", "getValue") # store as character object under variable name if long text - } else if (dataType == "short text") { - row[[.jcall(vi, "S", "getKey")]] <- vi$getValue()$getValue() # extract character object from Entity object and store under variable name if short text - } else { - row[[.jcall(vi, "S", "getKey")]] <- vi$getValue() # 
store as integer under variable name if boolean or integer data type - } - } - row$start_position <- .jcall(fi, "I", "getStart") # store start caret in document text - row$stop_position <- .jcall(fi, "I", "getStop") # store end caret in document text - row$text <- .jcall(fi, "S", "getText") # text of the statement between start and end caret - row$coder <- .jcall(fi, "I", "getCoderId") # store coder ID; the user can merge this with other coder details like name and color later if needed - row$document_id <- .jcall(fi, "I", "getDocumentId") # store the document ID of the document the statement is contained in - row$document_title <- .jcall(fi, "S", "getTitle") # store the document title - row$document_author <- .jcall(fi, "S", "getAuthor") # store the document author - row$document_source <- .jcall(fi, "S", "getSource") # store the document source - row$document_section <- .jcall(fi, "S", "getSection") # store the document section - row$document_type <- .jcall(fi, "S", "getType") # store the document type - l[[i + 1]] <- row # add the row to the list - } - d <- do.call(rbind.data.frame, l) # convert the list of lists to data frame - d$time <- as.POSIXct(d$time, origin = "1970-01-01 00:00:00") # convert long date/time to POSIXct - return(d) - } else { # assemble a one-mode or two-mode matrix with attributes or a list of matrices (if time window) - m <- .jcall(exporter, "[Lexport/Matrix;", "getMatrixResultsArray") # get list of Matrix objects from Exporter object - l <- list() # create a list in which each result is stored; can be of length 1 if no time window is used - for (t in 1:length(m)) { # loop through the matrices - mat <- .jcall(m[[t]], "[[D", "getMatrix", simplify = TRUE) # get the resulting matrix at step t as a double[][] object and save as matrix - rownames(mat) <- .jcall(m[[t]], "[S", "getRowNames", simplify = TRUE) # add the row names to the matrix - colnames(mat) <- .jcall(m[[t]], "[S", "getColumnNames", simplify = TRUE) # add the column names to the 
matrix - attributes(mat)$start <- as.POSIXct(.jcall(m[[t]], "J", "getStartLong"), origin = "1970-01-01") # add the start date/time of the result as an attribute to the matrix - attributes(mat)$stop <- as.POSIXct(.jcall(m[[t]], "J", "getStopLong"), origin = "1970-01-01") # add the end date/time of the result as an attribute to the matrix - if (length(m) > 1) { - attributes(mat)$middle <- as.POSIXct(.jcall(m[[t]], "J", "getDateTimeLong"), origin = "1970-01-01") # add the mid-point date/time around which the time window is centered if the time window algorithm was used - } - attributes(mat)$numStatements <- .jcall(m[[t]], "I", "getNumStatements") # add the number of filtered statements the matrix is based on as an attribute to the matrix - attributes(mat)$call <- match.call() # add the arguments of the call as an attribute to the matrix - class(mat) <- c(paste0("dna_network_", networkType), class(mat)) # add "dna_network_onemode" or "dna_network_twomode" as a class label in addition to "matrix" - l[[t]] <- mat # add the matrix to the list - } - if (length(m) == 1) { - return(l[[1]]) # return the first matrix in the list if no time window was used - } else { - attributes(l)$call <- match.call() # add arguments of the call as an attribute also to the list, not just each network matrix - class(l) <- c(paste0("dna_network_", networkType, "_timewindows"), class(l)) # add "dna_network_onemode_timewindows" or "dna_network_twomode_timewindows" to class label - return(l) # return the list of network matrices - } - } -} - -#' Convert a \code{dna_network_onemode} object to a matrix -#' -#' Convert a \code{dna_network_onemode} object to a matrix. -#' -#' Remove the attributes and \code{"dna_network_onemode"} class label from a -#' \code{dna_network_onemode} object and return it as a numeric matrix. -#' -#' @param x The \code{dna_network_onemode} object, as returned by the -#' \code{\link{dna_network}} function. -#' @param ... Additional arguments. Currently not in use. 
-#' -#' @author Philip Leifeld -#' -#' @family networks -#' -#' @export -as.matrix.dna_network_onemode <- function(x, ...) { - attr(x, "start") <- NULL - attr(x, "stop") <- NULL - attr(x, "numStatements") <- NULL - attr(x, "call") <- NULL - attr(x, "class") <- NULL - return(x) -} - -#' Convert a \code{dna_network_twomode} object to a matrix -#' -#' Convert a \code{dna_network_twomode} object to a matrix. -#' -#' Remove the attributes and \code{"dna_network_twomode"} class label from a -#' \code{dna_network_twomode} object and return it as a numeric matrix. -#' -#' @param x The \code{dna_network_twomode} object, as returned by the -#' \code{\link{dna_network}} function. -#' @param ... Additional arguments. Currently not in use. -#' -#' @author Philip Leifeld -#' -#' @family networks -#' -#' @export -as.matrix.dna_network_twomode <- as.matrix.dna_network_onemode - -#' Print a \code{dna_network_onemode} object -#' -#' Show details of a \code{dna_network_onemode} object. -#' -#' Print a one-mode network matrix and its attributes. -#' -#' @param x A \code{dna_network_onemode} object, as returned by the -#' \code{\link{dna_network}} function. -#' @param trim Number of maximum characters to display in row and column labels -#' of the matrix. Labels with more characters are truncated, and the last -#' character is replaced by an asterisk (\code{*}). -#' @param attr Display attributes, such as the start and stop date and time, the -#' number of statements on which the matrix is based, the function call and -#' arguments on which the network matrix is based, and the full labels without -#' truncation. -#' @param ... Additional arguments. Currently not in use. -#' -#' @author Philip Leifeld -#' -#' @family networks -#' -#' @export -print.dna_network_onemode <- function(x, trim = 5, attr = TRUE, ...) 
{ - rn <- rownames(x) - cn <- colnames(x) - rownames(x) <- sapply(rownames(x), function(r) if (nchar(r) > trim) paste0(substr(r, 1, trim - 1), "*") else r) - colnames(x) <- sapply(colnames(x), function(r) if (nchar(r) > trim) paste0(substr(r, 1, trim - 1), "*") else r) - x <- round(x, 2) - if ("dna_network_onemode" %in% class(x)) { - onemode <- TRUE - class(x) <- class(x)[class(x) != "dna_network_onemode"] - } else { - onemode <- FALSE - class(x) <- class(x)[class(x) != "dna_network_twomode"] - } - start <- attr(x, "start") - attr(x, "start") <- NULL - stop <- attr(x, "stop") - attr(x, "stop") <- NULL - ns <- attr(x, "numStatements") - attr(x, "numStatements") <- NULL - cl <- deparse(attr(x, "call")) - attr(x, "call") <- NULL - attr(x, "class") <- NULL - print(x) - if (attr) { - cat("\nStart:", as.character(start)) - cat("\nStop: ", as.character(stop)) - cat("\nStatements:", ns) - cat("\nCall:", trimws(cl)) - if (onemode) { - cat("\n\nLabels:\n") - cat(paste(1:length(rn), rn), sep = "\n") - } else { - cat("\n\nRow labels:\n") - cat(paste(1:length(rn), rn), sep = "\n") - cat("\nColumn labels:\n") - cat(paste(1:length(cn), cn), sep = "\n") - } - } -} - -#' Print a \code{dna_network_twomode} object -#' -#' Show details of a \code{dna_network_twomode} object. -#' -#' Print a two-mode network matrix and its attributes. -#' -#' @inheritParams print.dna_network_onemode -#' -#' @author Philip Leifeld -#' -#' @family networks -#' -#' @export -print.dna_network_twomode <- print.dna_network_onemode - -#' Plot networks created using rDNA. -#' -#' Plot a network generated using \code{\link{dna_network}}. -#' -#' These functions plot \code{dna_network_onemode} and -#' \code{dna_network_onemode} objects generated by the \code{\link{dna_network}} -#' function. In order to use this function, please install the \code{igraph} and -#' \code{ggraph} packages. Different layouts for one- and two-mode networks are -#' available. -#' -#' @param object A \code{dna_network} object. 
-#' @param ... Additional arguments; currently not in use. -#' @param atts A \code{dna_attributes} object generated by -#' \code{\link{dna_getAttributes}}. Provide this object and matching -#' attributes when plotting custom node colors, node labels and/or node sizes. -#' @param layout The type of node layout to use. The following layouts are -#' available from the \code{igraph} and \code{ggraph} packages at the time of -#' writing: -#' \itemize{ -#' \item \code{"stress"} (the default layout) -#' \item \code{"bipartite"} (only for two-mode networks) -#' \item \code{"backbone"} -#' \item \code{"circle"} -#' \item \code{"dh"} -#' \item \code{"drl"} -#' \item \code{"fr"} -#' \item \code{"gem"} -#' \item \code{"graphopt"} -#' \item \code{"kk"} -#' \item \code{"lgl"} -#' \item \code{"mds"} -#' \item \code{"nicely"} -#' \item \code{"randomly"} -#' \item \code{"star"} -#' } -#' See \link[ggraph]{layout_tbl_graph_igraph} for the current list of layouts. -#' @param edge_size_range Two values indicating the minimum and maximum value -#' to scale edge widths. -#' @param edge_color Provide the name of a color for edge colors. The default -#' \code{"NULL"} colors edges in line with the specified -#' \code{qualifierAggregation} in \code{\link{dna_network}}. -#' @param edge_alpha Takes numeric values to control the alpha-transparency of -#' edges. Possible values range from \code{0} (fully transparent) to \code{1} -#' (fully visible). -#' @param node_size Takes positive numeric values to control the size of nodes. -#' Also accepts numeric values matching an attribute of the \code{atts} object -#' (see examples). -#' @param node_colors Provide the name of a color or use an attribute from the -#' \code{atts} object for node colors (see examples). Defaults to -#' \code{"black"}. -#' @param node_label If \code{TRUE}, the row names (in a one-mode network) or -#' the row and column names (in a two-mode network) of the network matrix are -#' used for node labels. 
Also accepts character objects matching one of the -#' attribute variables of the \code{atts} object (see examples). \code{FALSE} -#' turns off node labels. -#' @param font_size Controls the font size of the node labels. -#' @param truncate Sets the number of characters to which node labels should be -#' truncated. -#' @param threshold Minimum threshold for which edges should be plotted. -#' @param giant_component Only plot the giant component (the biggest connected -#' cluster) of the network. Defaults to \code{FALSE}. -#' @param exclude_isolates Exclude isolates (nodes with no connection to other -#' nodes) from the plot. Defaults to \code{FALSE}. -#' @param max_overlaps Value to exclude node labels that overlap with too many -#' other node labels (see \code{\link[ggrepel]{geom_label_repel}}. Defaults -#' to \code{10}. -#' @param seed Numeric value passed to \link{set.seed}. Ensures that plots are -#' reproducible. -#' -#' @examples -#' \dontrun{ -#' dna_init() -#' dna_sample() -#' dna_openDatabase("sample.dna", coderId = 1, coderPassword = "sample") -#' -#' ## one-mode network examples -#' -#' # compute network matrix (subtract + normalization) -#' nw <- dna_network(networkType = "onemode", -#' qualifierAggregation = "subtract", -#' normalization = "average") -#' -#' # plot network -#' library("ggplot2") -#' autoplot(nw) -#' -#' # plot only positively weighted edges -#' autoplot(nw, threshold = 0) -#' -#' # congruence network -#' nw <- dna_network(networkType = "onemode", -#' qualifierAggregation = "congruence", -#' excludeValues = list("concept" = -#' c("There should be legislation to regulate emissions."))) -#' autoplot(nw) -#' -#' # use entity colors (here: colors of organizations) from attributes -#' atts <- dna_getAttributes(variableId = 2) -#' autoplot(nw, atts = atts, node_colors = "color", layout = "fr") -#' -#' # use colors from attributes (after editing some of them) -#' atts$color[atts$Type == "NGO"] <- "red" # change NGO color to red -#' 
atts$color[atts$Type == "Government"] <- "blue" # change government to blue -#' autoplot(nw, atts = atts, node_colors = "color") # plot with custom colors -#' -#' # use an attribute, such as type, to plot node labels -#' autoplot(nw, atts = atts, node_label = "Type") -#' -#' # plot node sizes according to the number of statements of entities; -#' # first, compute additional matrix to calculate the number of statements -#' nw_freq <- dna_network(networkType = "twomode", -#' qualifierAggregation = "ignore", -#' normalization = "no") -#' # then add frequency of statements as an attribute -#' atts$freq <- rowSums(nw_freq)[match(atts$value, rownames(nw_freq))] -#' # plot network with node sizes matching statement frequencies -#' autoplot(nw, atts = atts, node_size = "freq", node_colors = "color") -#' -#' # use igraph community detection for identification of network clusters; -#' # remove negative edge weights -#' nw[nw < 0] <- 0 -#' # convert dna_network to igraph object -#' graph <- igraph::graph_from_adjacency_matrix(nw, -#' mode = "undirected", -#' weighted = TRUE, -#' diag = FALSE, -#' add.colnames = NULL, -#' add.rownames = NA) -#' # compute communities using igraph cluster algorithms -#' # (here: fast and greedy as an illustration)) -#' com <- igraph::cluster_fast_greedy(graph) -#' # add node community membership as an attribute -#' atts$membership <- com$membership[match(atts$value, com$names)] -#' # use community membership as node color -#' autoplot(nw, atts = atts, node_colors = "membership") -#' # or plot ellipses using ggforce package -#' library("ggforce") -#' autoplot(nw, atts = atts, node_colors = "color") + -#' geom_mark_ellipse(aes(x = x, -#' y = y, -#' group = com$membership, -#' fill = com$membership), -#' show.legend = FALSE) -#' -#' # add legend to the network plot (here: colors mapped to type attribute) -#' autoplot(nw, atts = atts, node_colors = "color") + -#' scale_color_identity(name = "", -#' labels = c("Government", "NGO", "Business"), -#' 
guide = "legend") + -#' theme(legend.position = "bottom", # change legend position -#' legend.text = element_text(size = 10)) # change legend font size -#' -#' ## two-mode network examples -#' -#' # compute two-mode network and plot it -#' nw <- dna_network(networkType = "twomode", -#' qualifierAggregation = "combine") -#' library("ggplot2") -#' autoplot(nw) -#' -#' # use entity colours (here: colors of organizations); -#' # first, retrieve attributes for first-mode entities (organizations) -#' atts <- dna_getAttributes(variableId = 2) -#' # then, retrieve attributes for second-mode entities (concepts) -#' atts2 <- dna_getAttributes(variableId = 3) -#' # combine both attribute objects -#' atts <- rbind(atts, atts2) -#' # plot the network using the attributes of both variables -#' autoplot(nw, -#' atts = atts, -#' node_colors = "color", -#' layout = "bipartite", -#' max_overlaps = 20) -#' # edit the colors before plotting -#' atts$color[atts$Type == "NGO"] <- "red" # change NGO color to red -#' atts$color[atts$Type == "Government"] <- "blue" # government actors in blue -#' # plot the network with custom colors -#' autoplot(nw, atts = atts, node_colors = "color") -#' -#' # use an attribute, such as type, to plot node labels -#' nw <- dna_network(networkType = "twomode", -#' qualifierAggregation = "subtract", -#' normalization = "activity") -#' autoplot(nw, atts = atts, node_label = "Type") -#' -#' # plot node sizes according the number of statements of entities; -#' # first, compute network matrix for plotting -#' nw <- dna_network(networkType = "twomode", -#' qualifierAggregation = "subtract", -#' normalization = "activity") -#' # compute dna_attributes objects -#' atts <- dna_getAttributes(variableId = 2) -#' atts2 <- dna_getAttributes(variableId = 3) -#' # compute additional matrix to calculate the number of statements -#' nw_freq <- dna_network(networkType = "twomode", -#' qualifierAggregation = "ignore", -#' normalization = "no") -#' # add frequency of 
statements as attribute -#' # compute statement frequencies of first-mode entities -#' atts$freq <- rowSums(nw_freq)[match(atts$value, rownames(nw_freq))] -#' # compute statement frequencies of second-mode entities -#' atts2$freq <- colSums(nw_freq)[match(atts2$value, colnames(nw_freq))] -#' # combine both attribute objects -#' atts <- rbind(atts, atts2) -#' # plot network with node sizes matching statement frequencies -#' autoplot(nw, atts = atts, node_size = "freq", node_colors = "color") -#' -#' # use igraph community detection for identification of network clusters -#' nw <- dna_network(networkType = "twomode", -#' qualifierAggregation = "subtract", -#' normalization = "activity") -#' # compute dna_attributes objects and combine them -#' atts <- dna_getAttributes(variableId = 2) -#' atts2 <- dna_getAttributes(variableId = 3) -#' atts <- rbind(atts, atts2) -#' # remove negative edge weights -#' nw[nw < 0] <- 0 -#' # convert dna_network to igraph object -#' graph <- igraph::graph_from_incidence_matrix(nw, -#' directed = FALSE, -#' weighted = TRUE, -#' add.names = NULL) -#' # compute communities using igraph cluster algorithms -#' # (here: fast and greedy as an illustration)) -#' com <- igraph::cluster_fast_greedy(graph) -#' # add node community membership as an attribute -#' atts$membership <- com$membership[match(atts$value, com$names)] -#' # use community membership as node color -#' autoplot(nw, atts = atts, node_colors = "membership") -#' # or plot ellipses using ggforce -#' library("ggforce") -#' autoplot(nw, atts = atts, node_colors = "color") + -#' geom_mark_ellipse(aes(x = x, -#' y = y, -#' group = com$membership, -#' fill = com$membership), -#' show.legend = FALSE) -#' } -#' -#' @author Tim Henrichsen -#' -#' @family networks -#' -#' @importFrom ggplot2 autoplot -#' @importFrom ggplot2 aes -#' @importFrom ggplot2 scale_color_identity -#' @importFrom rlang .data -#' @name autoplot.dna_network -NULL - -#' @rdname autoplot.dna_network -#' @export 
-autoplot.dna_network_onemode <- function(object, - ..., - atts = NULL, - layout = "auto", - edge_size_range = c(0.2, 2), - edge_color = NULL, - edge_alpha = 1, - node_size = 3, - node_colors = "black", - node_label = TRUE, - font_size = 6, - truncate = 50, - threshold = NULL, - giant_component = FALSE, - exclude_isolates = FALSE, - max_overlaps = 10, - seed = 12345) { - set.seed(seed) - - if (!grepl("dna_network", class(object)[1])) { - stop("Invalid data object. Please compute a dna_network object with the ", - "dna_network() function before plotting.") - } - - if (!requireNamespace("igraph", quietly = TRUE)) { - stop("The autoplot function requires the 'igraph' package to be installed.\n", - "To do this, enter 'install.packages(\"igraph\")'.") - } - - if (!requireNamespace("ggraph", quietly = TRUE)) { - stop("The autoplot function requires the 'ggraph' package to be installed.\n", - "To do this, enter 'install.packages(\"ggraph\")'.") - } - - if (!is.null(atts) & !"dna_attributes" %in% class(atts)) { - stop("Object provided in 'atts' is not a dna_attributes object. Please ", - "provide a dna_attributes object using dna_getAttributes() or set atts ", - "to NULL if you do not want to use DNA attributes.") - } - - if (!is.numeric(truncate)) { - truncate <- Inf - warning("No numeric value provided for trimming of entities. 
Truncation ", - "will be ignored.") - } - - # Convert network matrix to igraph network - if ("dna_network_onemode" %in% class(object)) { - graph <- igraph::graph_from_adjacency_matrix(object, - mode = "undirected", - weighted = TRUE, - diag = FALSE, - add.colnames = NULL, - add.rownames = NA) - igraph::V(graph)$shape <- "circle" - } else if ("dna_network_twomode" %in% class(object)) { - graph <- igraph::graph_from_incidence_matrix(object, - directed = FALSE, - weighted = TRUE, - add.names = NULL) - igraph::V(graph)$shape <- ifelse(igraph::V(graph)$type, "square", "circle") - } - - # Check if all entities are included in attributes object (if provided) - if (!is.null(atts) & !(all(igraph::V(graph)$name %in% atts$value))) { - miss <- which(!igraph::V(graph)$name %in% atts$value) - stop("Some network entities are missing in the attributes object:\n", - paste(igraph::V(graph)$name[miss], collapse = "\n")) - } - - # Remove tie weights below threshold - if (!is.null(threshold)) { - graph <- igraph::delete_edges(graph, which(!igraph::E(graph)$weight >= threshold)) - } - - # Add node colors - if (is.character(node_colors)) { - if (!is.null(atts) & length(node_colors) == 1 && node_colors %in% colnames(atts)) { - col_pos <- which(colnames(atts) == node_colors) - igraph::V(graph)$color <- atts[match(igraph::V(graph)$name, atts$value), col_pos] - } else if (length(node_colors) > 1 & length(node_colors) != igraph::vcount(graph)) { - stop("Number of custom colors does not equal number of nodes in the network.") - } else { - igraph::V(graph)$color <- node_colors - } - } else { - igraph::V(graph)$color <- "black" - } - - # Add edge colors - if (is.null(edge_color)) { - if ("combine" %in% as.character(attributes(object)$call)) { - igraph::E(graph)$color <- "green" - igraph::E(graph)$color[igraph::E(graph)$weight == 2] <- "red" - igraph::E(graph)$color[igraph::E(graph)$weight == 3] <- "blue" - # Change edge weight for networks with combine aggregation - 
igraph::E(graph)$weight[igraph::E(graph)$weight > 0] <- 1 - } else if ("subtract" %in% as.character(attributes(object)$call)) { - igraph::E(graph)$color <- "green" - igraph::E(graph)$color[igraph::E(graph)$weight < 0] <- "red" - } else if ("congruence" %in% as.character(attributes(object)$call)) { - igraph::E(graph)$color <- "green" - } else if ("conflict" %in% as.character(attributes(object)$call)) { - igraph::E(graph)$color <- "red" - } else { - igraph::E(graph)$color <- "gray" - } - } else if (!all(is.na(edge_color))) { - if (length(edge_color) > 1 & length(edge_color) != igraph::ecount(graph)) { - igraph::E(graph)$color <- "gray" - warning("Number of custom edge_colors does not match number of edges ", - "in the network. Will set edge_color to default (gray).") - } else { - igraph::E(graph)$color <- edge_color - } - } else { - igraph::E(graph)$color <- "gray" - } - - # Add node size(s) - if (length(node_size) > 1 & length(node_size) != igraph::vcount(graph)) { - igraph::V(graph)$size <- 7 - warning("Number of provided node size values does not equal number of ", - "nodes in the network. 
node_size will be set to default value (7).") - } else if (is.character(node_size) & length(node_size) == 1 & !is.null(atts) && node_size %in% colnames(atts)) { - col_pos <- which(colnames(atts) == node_size) - igraph::V(graph)$size <- atts[match(igraph::V(graph)$name, atts$value), col_pos] - } else if (is.numeric(node_size)) { - igraph::V(graph)$size <- node_size - } - - # Add labels - if (!is.logical(node_label)) { - if (is.character(node_label) & length(node_label) == 1 & !is.null(atts) && node_label %in% colnames(atts)) { - col_pos <- which(colnames(atts) == node_label) - igraph::V(graph)$name <- atts[match(igraph::V(graph)$name, atts$value), col_pos] - } else if (!is.null(node_label)) { - if (length(node_label) > 1 & length(node_label) != igraph::vcount(graph)) { - stop("Number of custom labels does not equal number of nodes in the network.") - } - igraph::V(graph)$name <- node_label - } - } - - # Remove isolates - if (exclude_isolates) { - graph <- igraph::delete_vertices(graph, igraph::degree(graph) == 0) - } - - # Only plot giant component of network. Useful for some plotting algorithms. - if (giant_component) { - # Get giant component - components <- igraph::clusters(graph) - biggest_cluster_id <- which.max(components$csize) - - # Get members of giant component - vert_ids <- igraph::V(graph)[components$membership == biggest_cluster_id] - - # Create subgraph - graph <- igraph::induced_subgraph(graph, vert_ids) - } - - - # Truncate labels of entities - igraph::V(graph)$name <- sapply(igraph::V(graph)$name, function(e) if (nchar(e) > truncate) paste0(substr(e, 1, truncate - 1), "*") else e) - - # Use absolute edge weight values for plotting - igraph::E(graph)$weight <- abs(igraph::E(graph)$weight) - - # Start network plot - g <- ggraph::ggraph(graph, layout = layout, ...) 
+ - suppressWarnings(ggraph::geom_edge_link(ggplot2::aes(edge_width = igraph::E(graph)$weight, edge_colour = igraph::E(graph)$color), - alpha = edge_alpha, - show.legend = FALSE)) + # add edges - ggraph::scale_edge_width(range = edge_size_range) + # add edge scale - ggraph::geom_node_point(ggplot2::aes(colour = igraph::V(graph)$color), # add nodes - size = igraph::V(graph)$size, - shape = igraph::V(graph)$shape, - show.legend = NA) - # Add labels - if ((!is.null(node_label) && !all(is.na(node_label))) && (is.character(node_label) || node_label == TRUE)) { - g <- g + - ggraph::geom_node_text(ggplot2::aes(label = igraph::V(graph)$name), - repel = TRUE, - max.overlaps = max_overlaps, - show.legend = FALSE) - } - - # Add theme and set node colors and edges to identity - g <- g + - ggraph::theme_graph(base_family = "", base_size = font_size) + - ggplot2::scale_color_identity() + - ggraph::scale_edge_color_identity() - - return(g) -} - -#' @rdname autoplot.dna_network -#' @export -autoplot.dna_network_twomode <- autoplot.dna_network_onemode - -#' Convert a DNA network into a \code{tbl_graph} or \code{graph} object -#' -#' Convert a DNA network into a \code{tbl_graph} or \code{graph} object. -#' -#' Convert a \code{dna_network_onemode} or \code{dna_network_twomode} object -#' into a \code{tbl_graph} object as defined in the tidygraph package. These -#' objects can then be plotted using the ggraph package, which contains many -#' network layouts. -#' -#' \code{tbl_graph} objects are an extension of \code{graph} -#' objects defined in the igraph package. Functions for manipulating or plotting -#' the resulting objects from either the tidygraph or igraph package or both -#' can be used. -#' -#' The resulting objects can also be converted to \code{network} objects as -#' defined in the network package (part of the statnet suite of packages) using -#' the \code{asNetwork} function in the intergraph package. 
-#' -#' @param network A \code{dna_network_onemode} or \code{dna_network_twomode} -#' object to be converted into a \code{tbl_graph} object. Can also be a matrix -#' with edge weights and row and column names for the node labels. -#' @param attributes A \code{dna_attributes} object created using the -#' \link{dna_getAttributes} function with attributes for the nodes in the -#' network. Can also be a data frame with a \code{values} column that contains -#' the node labels and further columns containing the attributes. The -#' attributes are saved as node attributes in the \code{tbl_graph} object. If -#' \code{NULL}, no attributes are included. -#' @param ... Further arguments. Currently not in use. -#' -#' @examples -#' \dontrun{ -#' # prepare toy data -#' dna_sample() -#' dna_openDatabase("sample.dna", coderPassword = "sample") -#' nw <- dna_network(networkType = "onemode", -#' qualifierAggregation = "congruence", -#' excludeValues = list(concept = -#' "There should be legislation to regulate emissions.")) -#' at <- dna_getAttributes(variableId = 2) -#' -#' # convert to tbl_graph object -#' g <- dna_tidygraph(nw, at) -#' -#' # basic visualization -#' ggraph::ggraph(g, layout = "fr") + -#' ggraph::geom_edge_link() + -#' ggraph::geom_node_point() -#' -#' # visualization with more bells and whistles -#' ggraph::ggraph(g, layout = "graphopt") + -#' ggraph::geom_edge_link(ggplot2::aes(color = weight, width = weight)) + -#' ggraph::geom_node_point(ggplot2::aes(color = color), size = 5) + -#' ggplot2::scale_color_identity() + -#' ggraph::scale_edge_color_gradient(low = "azure2", high = "azure4") + -#' ggraph::theme_graph(background = "white") + -#' ggraph::geom_node_text(ggplot2::aes(label = name), -#' repel = TRUE, -#' max.overlaps = 10, -#' show.legend = FALSE) -#' # for more layouts, see vignette("Layouts", package = "ggraph") -#' -#' # hive plot example -#' g <- g |> -#' tidygraph::activate(nodes) |> -#' tidygraph::mutate(centrality = 
tidygraph::centrality_betweenness()) -#' ggraph::ggraph(g, layout = "hive", axis = Type, sort.by = centrality) + -#' ggraph::geom_edge_hive(ggplot2::aes(colour = "gray", width = weight)) + -#' ggraph::geom_axis_hive(ggplot2::aes(colour = color), -#' size = 5, -#' label = TRUE) + -#' ggraph::scale_edge_color_identity() + -#' theme(legend.position = "none") -#' -#' # example with negative edge weights -#' nw <- dna_network(networkType = "onemode", -#' qualifierAggregation = "subtract", -#' excludeValues = list(concept = -#' "There should be legislation to regulate emissions.")) -#' g <- dna_tidygraph(nw, at) -#' ggraph::ggraph(g, layout = "linear", circular = TRUE) + -#' ggraph::geom_edge_arc(aes(color = color, width = abs)) + -#' ggraph::scale_edge_color_identity() + -#' ggraph::geom_node_point(ggplot2::aes(color = color), size = 5) + -#' ggplot2::scale_color_identity() + -#' ggraph::theme_graph(background = "white") + -#' theme(legend.position = "none") + -#' ggraph::geom_node_text(ggplot2::aes(label = name), -#' repel = TRUE, -#' max.overlaps = 10, -#' show.legend = FALSE) -#' -#' # example with a two-mode network -#' nw <- dna_network(networkType = "twomode", -#' qualifierAggregation = "combine") -#' at1 <- dna_getAttributes(statementTypeId = 1, variable = "organization") -#' at2 <- dna_getAttributes(statementTypeId = 1, variable = "concept") -#' at1$Notes <- "organization" -#' at2$Notes <- "concept" -#' at <- rbind(at1, at2) -#' g <- dna_tidygraph(nw, at) -#' ggraph::ggraph(g, layout = "graphopt") + -#' ggraph::geom_edge_link(ggplot2::aes(color = color), width = 1) + -#' ggraph::scale_edge_color_identity() + -#' ggraph::geom_node_point(ggplot2::aes(color = color, shape = Notes), -#' size = 5) + -#' ggplot2::scale_color_identity() + -#' ggraph::geom_node_text(ggplot2::aes(label = name), -#' repel = TRUE, -#' max.overlaps = 10, -#' show.legend = FALSE) + -#' ggraph::theme_graph(background = "white") + -#' theme(legend.position = "none") -#' -#' # manipulate and 
plot using the igraph package -#' library("igraph") -#' class(g) # resulting objects are both tbl_graph and igraph objects -#' igraph::V(g) # get the nodes using igraph functions -#' igraph::E(g) # get the edges using igraph functions -#' igraph::plot(g) # plot network using igraph package -#' -#' # convert to network object (network package, statnet suite of packages) -#' library("intergraph") -#' intergraph::asNetwork(g) -#' } -#' -#' @author Philip Leifeld -#' @family networks -#' @importFrom rlang .data -#' @export -dna_tidygraph <- function(network, attributes = NULL, ...) { - if (length(intersect(c("dna_network_onemode", "dna_network_twomode", "matrix"), class(network))) < 1) { - stop("The 'network' argument must provide an object created by the 'dna_network' function or a matrix.") - } - if (!is.null(attributes) && (length(intersect(c("dna_attributes", "data.frame"), class(attributes))) < 1) || !"value" %in% colnames(attributes)) { - stop("The 'attributes' argument must be NULL or created by the 'dna_getAttributes' function or a data frame with a 'values' column.") - } - if (!requireNamespace("tidygraph", quietly = TRUE) || packageVersion("tidygraph") < "1.3.1") { - stop("The 'dna_tidygraph' function requires the 'tidygraph' package (>= 1.3.1) to be installed.\n", - "To do this, enter 'install.packages(\"tidygraph\")'.") - } - - if ("dna_network_twomode" %in% class(network)) { - nodes <- data.frame(name = c(rownames(network), colnames(network)), type = c(rep(TRUE, nrow(network)), rep(FALSE, ncol(network))), stringsAsFactors = FALSE) - edges <- data.frame(from = rep(rownames(network), times = ncol(network)), to = rep(colnames(network), each = nrow(network)), weight = as.vector(network)) - edges <- edges[edges$weight != 0, ] - edges$from <- match(edges$from, nodes$name) - edges$to <- match(edges$to, nodes$name) - g <- tidygraph::tbl_graph(nodes = nodes, edges = edges, directed = FALSE) # create tbl_graph object for ggraph - } else if ("dna_network_onemode" 
%in% class(network)) { - g <- tidygraph::as_tbl_graph(network, directed = FALSE) # create tbl_graph object for ggraph - } else { - stop("Argument supplied by argument 'network' not recognized.") - } - - if (!is.null(attributes)) { - nodes <- tidygraph::as_tibble(g, active = "nodes")$name # extract nodes from graph for matching - at <- attributes[attributes$value %in% nodes, ] # retain only those attributes present in the network - at <- at[match(nodes, at$value), ] # sort attributes in the same order as the nodes in the graph - g <- tidygraph::mutate(g, at[, colnames(at) != "value"]) # embed node attributes in graph - } - - edges <- tidygraph::as_tibble(g, active = "edges") # extract edges from graph - u <- unique(edges$weight) # unique edge weights - combined <- length(u) < 5 && any(grepl("combine", attributes(network)$call)) # combined qualifier aggregation? - edgecol <- sapply(edges$weight, function(weight) { # create edge colors - if (length(u) == 2 & all(sort(u) %in% 0:1) & weight > 0) { # binary: 1 = gray - "gray" - } else if (combined) { # "combined" qualifier aggregation - if (weight == 1) { - "green" - } else if (weight == 2) { - "red" - } else if (weight == 3) { - "blue" - } else { - "gray" - } - } else if (any(u < 0)) { # "subtract" (or something else that generates negative ties) - if (weight < 0) { - "red" - } else { - "green" - } - } else { # any other scale, for example "congruence" qualifier aggregation - "gray" - } - }) - g <- g |> # assign absolute values, edge colors, and sign as edge attributes - tidygraph::activate(edges) |> - tidygraph::mutate(abs = abs(.data$weight), - color = .data$edgecol, - sign = ifelse(.data$weight < 0, "negative", "positive")) - - return(g) -} - - -# Barplots --------------------------------------------------------------------- - -#' Generate the data necessary for creating a barplot for a variable -#' -#' Generate the data necessary for creating a barplot for a variable. 
-#' -#' Create a \code{dna_barplot} object, which contains a data frame with -#' entity value frequencies grouped by the levels of a qualifier variable. -#' The qualifier variable is optional. -#' -#' @param variable The variable for which the barplot will be generated. There -#' will be one bar per entity label of this variable. -#' @param qualifier A boolean (binary) or integer variable to group the value -#' frequencies by. Can be \code{NULL} to skip the grouping. -#' @inheritParams dna_network -#' -#' @examples -#' \dontrun{ -#' dna_init() -#' dna_sample() -#' dna_openDatabase("sample.dna", coderId = 1, coderPassword = "sample") -#' -#' # compute barplot data -#' b <- dna_barplot(statementType = "DNA Statement", -#' variable = "concept", -#' qualifier = "agreement") -#' b -#' } -#' -#' @author Philip Leifeld -#' -#' @rdname dna_barplot -#' @importFrom rJava .jarray -#' @importFrom rJava .jcall -#' @importFrom rJava .jevalArray -#' @importFrom rJava .jnull -#' @importFrom rJava is.jnull -#' @export -dna_barplot <- function(statementType = "DNA Statement", - variable = "concept", - qualifier = "agreement", - duplicates = "document", - start.date = "01.01.1900", - stop.date = "31.12.2099", - start.time = "00:00:00", - stop.time = "23:59:59", - excludeValues = list(), - excludeAuthors = character(), - excludeSources = character(), - excludeSections = character(), - excludeTypes = character(), - invertValues = FALSE, - invertAuthors = FALSE, - invertSources = FALSE, - invertSections = FALSE, - invertTypes = FALSE) { - - # wrap the vectors of exclude values for document variables into Java arrays - excludeAuthors <- .jarray(excludeAuthors) - excludeSources <- .jarray(excludeSources) - excludeSections <- .jarray(excludeSections) - excludeTypes <- .jarray(excludeTypes) - - # compile exclude variables and values vectors - dat <- matrix("", nrow = length(unlist(excludeValues)), ncol = 2) - count <- 0 - if (length(excludeValues) > 0) { - for (i in 1:length(excludeValues)) 
{ - if (length(excludeValues[[i]]) > 0) { - for (j in 1:length(excludeValues[[i]])) { - count <- count + 1 - dat[count, 1] <- names(excludeValues)[i] - dat[count, 2] <- excludeValues[[i]][j] - } - } - } - var <- dat[, 1] - val <- dat[, 2] - } else { - var <- character() - val <- character() - } - var <- .jarray(var) # array of variable names of each excluded value - val <- .jarray(val) # array of values to be excluded - - # encode R NULL as Java null value if necessary - if (is.null(qualifier) || is.na(qualifier)) { - qualifier <- .jnull(class = "java/lang/String") - } - - # call rBarplotData function to compute results - b <- .jcall(dnaEnvironment[["dna"]]$headlessDna, - "Lexport/BarplotResult;", - "rBarplotData", - statementType, - variable, - qualifier, - duplicates, - start.date, - stop.date, - start.time, - stop.time, - var, - val, - excludeAuthors, - excludeSources, - excludeSections, - excludeTypes, - invertValues, - invertAuthors, - invertSources, - invertSections, - invertTypes, - simplify = TRUE) - - at <- .jcall(b, "[[Ljava/lang/String;", "getAttributes") - at <- t(sapply(at, FUN = .jevalArray)) - - counts <- .jcall(b, "[[I", "getCounts") - counts <- t(sapply(counts, FUN = .jevalArray)) - if (nrow(counts) < nrow(at)) { - counts <- t(counts) - } - - results <- data.frame(.jcall(b, "[S", "getValues"), - counts, - at) - - intValues <- .jcall(b, "[I", "getIntValues") - intColNames <- intValues - if (is.jnull(qualifier)) { - intValues <- integer(0) - intColNames <- "Frequency" - } - - atVar <- .jcall(b, "[S", "getAttributeVariables") - - colnames(results) <- c("Entity", intColNames, atVar) - - attributes(results)$variable <- .jcall(b, "S", "getVariable") - attributes(results)$intValues <- intValues - attributes(results)$attributeVariables <- atVar - - class(results) <- c("dna_barplot", class(results)) - - return(results) -} - -#' Print a \code{dna_barplot} object -#' -#' Show details of a \code{dna_barplot} object. 
-#' -#' Print the data frame returned by the \code{\link{dna_barplot}} function. -#' -#' @param x A \code{dna_barplot} object, as returned by the -#' \code{\link{dna_barplot}} function. -#' @param trim Number of maximum characters to display in entity labels. -#' Entities with more characters are truncated, and the last character is -#' replaced by an asterisk (\code{*}). -#' @param attr Display attributes, such as the name of the variable and the -#' levels of the qualifier variable if available. -#' @param ... Additional arguments. Currently not in use. -#' -#' @author Philip Leifeld -#' -#' @rdname dna_barplot -#' @export -print.dna_barplot <- function(x, trim = 30, attr = TRUE, ...) { - x2 <- x - if (isTRUE(attr)) { - cat("Variable:", attr(x2, "variable")) - intVal <- attr(x2, "intValues") - if (length(intVal) > 0) { - cat(".\nQualifier levels:", paste(intVal, collapse = ", ")) - } else { - cat(".\nNo qualifier variable") - } - cat(".\n") - } - x2$Entity <- sapply(x2$Entity, function(e) if (nchar(e) > trim) paste0(substr(e, 1, trim - 1), "*") else e) - class(x2) <- "data.frame" - print(x2) -} - -#' Plot \code{dna_barplot} object. -#' -#' Plot a barplot generated from \code{\link{dna_barplot}}. -#' -#' This function plots \code{dna_barplot} objects generated by the -#' \code{\link{dna_barplot}} function. It plots agreement and disagreement with -#' DNA statements for different entities such as \code{"concept"}, -#' \code{"organization"}, or \code{"person"}. Colors can be modified before -#' plotting (see examples). -#' -#' @param object A \code{dna_barplot} object. -#' @param ... Additional arguments; currently not in use. -#' @param lab.pos,lab.neg Names for (dis-)agreement labels. -#' @param lab Should (dis-)agreement labels and title be displayed? -#' @param colors If \code{TRUE}, the \code{Colors} column in the -#' \code{dna_barplot} object will be used to fill the bars. 
Also accepts -#' character objects matching one of the attribute variables of the -#' \code{dna_barplot} object. -#' @param fontSize Text size in pt. -#' @param barWidth Thickness of the bars. Bars will touch when set to \code{1}. -#' When set to \code{0.5}, space between two bars is the same as thickness of -#' bars. -#' @param axisWidth Thickness of the x-axis which separates agreement from -#' disagreement. -#' @param truncate Sets the number of characters to which axis labels should be -#' truncated. -#' @param exclude.min Reduces the plot to entities with a minimum frequency of -#' statements. -#' -#' @examples -#' \dontrun{ -#' dna_init() -#' dna_sample() -#' -#' dna_openDatabase("sample.dna", coderId = 1, coderPassword = "sample") -#' -#' # compute barplot data -#' b <- dna_barplot(statementType = "DNA Statement", -#' variable = "concept", -#' qualifier = "agreement") -#' -#' # plot barplot with ggplot2 -#' library("ggplot2") -#' autoplot(b) -#' -#' # use entity colours (here: colors of organizations as an illustration) -#' b <- dna_barplot(statementType = "DNA Statement", -#' variable = "organization", -#' qualifier = "agreement") -#' autoplot(b, colors = TRUE) -#' -#' # edit the colors before plotting -#' b$Color[b$Type == "NGO"] <- "red" # change NGO color to red -#' b$Color[b$Type == "Government"] <- "blue" # change government color to blue -#' autoplot(b, colors = TRUE) -#' -#' # use an attribute, such as type, to color the bars -#' autoplot(b, colors = "Type") + -#' scale_colour_manual(values = "black") -#' -#' # replace colors for the three possible actor types with custom colors -#' autoplot(b, colors = "Type") + -#' scale_fill_manual(values = c("red", "blue", "green")) + -#' scale_colour_manual(values = "black") -#' } -#' -#' @author Johannes B. 
Gruber, Tim Henrichsen -#' -#' @rdname dna_barplot -#' @importFrom ggplot2 autoplot -#' @importFrom ggplot2 ggplot -#' @importFrom ggplot2 aes -#' @importFrom ggplot2 geom_line -#' @importFrom ggplot2 theme_minimal -#' @importFrom ggplot2 theme -#' @importFrom ggplot2 geom_bar -#' @importFrom ggplot2 position_stack -#' @importFrom ggplot2 coord_flip -#' @importFrom ggplot2 element_blank -#' @importFrom ggplot2 element_text -#' @importFrom ggplot2 scale_color_identity -#' @importFrom ggplot2 scale_fill_identity -#' @importFrom ggplot2 geom_text -#' @importFrom ggplot2 .pt -#' @importFrom ggplot2 annotate -#' @importFrom ggplot2 scale_x_discrete -#' @importFrom utils stack -#' @importFrom grDevices col2rgb -#' @importFrom rlang .data -#' @export -autoplot.dna_barplot <- function(object, - ..., - lab.pos = "Agreement", - lab.neg = "Disagreement", - lab = TRUE, - colors = FALSE, - fontSize = 12, - barWidth = 0.6, - axisWidth = 1.5, - truncate = 40, - exclude.min = NULL) { - - - if (!("dna_barplot" %in% class(object))) { - stop("Invalid data object. Please compute a dna_barplot object via the ", - "dna_barplot function before plotting.") - } - - if (!("Entity" %in% colnames(object))) { - stop("dna_barplot object does not have a \'Entity\' variable. Please ", - "compute a new dna_barplot object via the dna_barplot function before", - " plotting.") - } - - if (isTRUE(colors) & !("Color" %in% colnames(object)) | - is.character(colors) & !(colors %in% colnames(object))) { - colors <- FALSE - warning("No color variable found in dna_barplot object. Colors will be", - " ignored.") - } - - if (!is.numeric(truncate)) { - truncate <- Inf - warning("No numeric value provided for trimming of entities. Truncation ", - "will be ignored.") - } - - # Get qualifier values - w <- attr(object, "intValues") - - if (!all(w %in% colnames(object))) { - stop("dna_barplot object does not include all qualifier values of the ", - "statement type. 
Please compute a new dna_barplot object via the ", - "dna_barplot function.") - } - - # Check if qualifier is binary - binary <- all(w %in% c(0, 1)) - - # Compute total values per entity - object$sum <- rowSums(object[, colnames(object) %in% w]) - - # Exclude minimum number of statements per entity - if (is.numeric(exclude.min)) { - if (exclude.min > max(object$sum)) { - exclude.min <- NULL - warning("Value provided in exclude.min is higher than maximum frequency ", - "of entity (", max(object$sum), "). Will ignore exclude.min.") - } else { - object <- object[object$sum >= exclude.min, ] - } - } - - # Stack agreement and disagreement - object2 <- cbind(object$Entity, utils::stack(object, select = colnames(object) %in% w)) - colnames(object2) <- c("entity", "frequency", "agreement") - - object <- object[order(object$sum, decreasing = TRUE), ] - - object2$entity <- factor(object2$entity, levels = rev(object$Entity)) - - # Get colors - if (isTRUE(colors)) { - object2$color <- object$Color[match(object2$entity, object$Entity)] - object2$text_color <- "black" - # Change text color to white in case of dark bar colors - object2$text_color[sum(grDevices::col2rgb(object2$color) * c(299, 587, 114)) / 1000 < 123] <- "white" - } else if (is.character(colors)) { - object2$color <- object[, colors][match(object2$entity, object$Entity)] - object2$text_color <- "black" - } else { - object2$color <- "white" - object2$text_color <- "black" - } - - - if (binary) { - # setting disagreement as -1 instead 0 - object2$agreement <- ifelse(object2$agreement == 0, -1, 1) - # recode frequency in positive and negative - object2$frequency <- object2$frequency * as.integer(object2$agreement) - - # generate position of bar labels - offset <- (max(object2$frequency) + abs(min(object2$frequency))) * 0.05 - offset <- ifelse(offset < 0.5, 0.5, offset) # offset should be at least 0.5 - if (offset > abs(min(object2$frequency))) { - offset <- abs(min(object2$frequency)) - } - if (offset > 
max(object2$frequency)) { - offset <- abs(min(object2$frequency)) - } - object2$pos <- ifelse(object2$frequency > 0, - object2$frequency + offset, - object2$frequency - offset) - - # move 0 labels where necessary - object2$pos[object2$frequency == 0] <- ifelse(object2$agreement[object2$frequency == 0] == 1, - object2$pos[object2$frequency == 0] * -1, - object2$pos[object2$frequency == 0]) - object2$label <- as.factor(abs(object2$frequency)) - } else { - object2$count <- object2$frequency - # set frequency of negative qualifiers to negative values - object2$frequency <- ifelse(as.numeric(as.character(object2$agreement)) >= 0, object2$frequency, - object2$frequency * -1) - # remove zero frequencies - object2 <- object2[object2$frequency != 0, ] - # generate position of bar labels - object2$pos <- ifelse(object2$frequency > 0, - 1.1, - -0.1) - # Add labels - object2$label <- paste(object2$count, object2$agreement, sep = " x ") - } - - offset <- (max(object2$frequency) + abs(min(object2$frequency))) * 0.05 - offset <- ifelse(offset < 0.5, 0.5, offset) - yintercepts <- data.frame(x = c(0.5, length(unique(object2$entity)) + 0.5), - y = c(0, 0)) - high <- yintercepts$x[2] + 0.25 - - object2 <- object2[order(as.numeric(as.character(object2$agreement)), - decreasing = FALSE), ] - object2$agreement <- factor(object2$agreement, levels = w) - - # Plot - g <- ggplot2::ggplot(object2, - ggplot2::aes(x = .data[["entity"]], - y = .data[["frequency"]], - fill = .data[["agreement"]], - group = .data[["agreement"]], - label = .data[["label"]])) - if (binary) { # Bars for the binary case - g <- g + ggplot2::geom_bar(ggplot2::aes(fill = .data[["color"]], - color = .data[["text_color"]]), - stat = "identity", - width = barWidth, - show.legend = FALSE) - # For the integer case with positive and negative values - } else if (max(w) > 0 & min(w) < 0) { - g <- g + ggplot2::geom_bar(ggplot2::aes(fill = .data[["color"]], - color = .data[["text_color"]]), - stat = "identity", - width = 
barWidth, - show.legend = FALSE, - data = object2[as.numeric(as.character(object2$agreement)) >= 0, ], - position = ggplot2::position_stack(reverse = TRUE)) + - ggplot2::geom_bar(ggplot2::aes(fill = .data[["color"]], - color = .data[["text_color"]]), - stat = "identity", - width = barWidth, - show.legend = FALSE, - data = object2[as.numeric(as.character(object2$agreement)) < 0, ]) - # For the integer case with positive values only - } else if (min(w) >= 0) { - g <- g + ggplot2::geom_bar(ggplot2::aes(fill = .data[["color"]], - color = .data[["text_color"]]), - stat = "identity", - width = barWidth, - show.legend = FALSE, - position = ggplot2::position_stack(reverse = TRUE)) - # For the integer case with negative values only - } else { - g <- g + ggplot2::geom_bar(ggplot2::aes(fill = .data[["color"]], - color = .data[["text_color"]]), - stat = "identity", - width = barWidth, - show.legend = FALSE) - } - g <- g + ggplot2::coord_flip() + - ggplot2::theme_minimal() + - # Add intercept line - ggplot2::geom_line(ggplot2::aes(x = .data[["x"]], y = .data[["y"]]), - data = yintercepts, - linewidth = axisWidth, - inherit.aes = FALSE) + - # Remove all panel grids, axis titles and axis ticks and text for x-axis - ggplot2::theme(panel.grid.major = ggplot2::element_blank(), - panel.grid.minor = ggplot2::element_blank(), - axis.title = ggplot2::element_blank(), - axis.ticks.y = ggplot2::element_blank(), - axis.text.x = ggplot2::element_blank(), - axis.text.y = ggplot2::element_text(size = fontSize)) #+ - if (is.logical(colors)) { - g <- g + ggplot2::scale_fill_identity() + - ggplot2::scale_color_identity() - } - if (binary) { # Add entity labels for binary case - g <- g + - ggplot2::geom_text(ggplot2::aes(x = .data[["entity"]], - y = .data[["pos"]], - label = .data[["label"]]), - size = (fontSize / ggplot2::.pt), - inherit.aes = FALSE, - data = object2) - # Add entity labels for integer case with positive and negative values - } else if (max(w) > 0 & min(w) < 0) { - g <- g + - 
ggplot2::geom_text(ggplot2::aes(color = .data[["text_color"]]), - size = (fontSize / ggplot2::.pt), - position = ggplot2::position_stack(vjust = 0.5, reverse = TRUE), - inherit.aes = TRUE, - data = object2[object2$frequency >= 0, ]) + - ggplot2::geom_text(ggplot2::aes(color = .data[["text_color"]]), - size = (fontSize / ggplot2::.pt), - position = ggplot2::position_stack(vjust = 0.5), - inherit.aes = TRUE, - data = object2[object2$frequency < 0, ]) - # Add entity labels for integer case with positive values only - } else if (min(w) >= 0) { - g <- g + - ggplot2::geom_text(ggplot2::aes(color = .data[["text_color"]]), - size = (fontSize / ggplot2::.pt), - position = ggplot2::position_stack(vjust = 0.5, reverse = TRUE), - inherit.aes = TRUE) - } else { - g <- g + - ggplot2::geom_text(ggplot2::aes(color = .data[["text_color"]]), - size = (fontSize / ggplot2::.pt), - position = ggplot2::position_stack(vjust = 0.5), - inherit.aes = TRUE) - } - if (lab) { # Add (dis-)agreement labels - g <- g + - ggplot2::annotate("text", - x = high, - y = offset * 2, - hjust = 0, - label = lab.pos, - size = (fontSize / ggplot2::.pt)) + - ggplot2::annotate("text", - x = high, - y = 0 - offset * 2, - hjust = 1, - label = lab.neg, - size = (fontSize / ggplot2::.pt)) + - # Truncate labels of entities - ggplot2::scale_x_discrete(labels = sapply(as.character(object2$entity), function(e) if (nchar(e) > truncate) paste0(substr(e, 1, truncate - 1), "*") else e), - expand = c(0, 2, 0, 2), - limits = levels(object2$entity)) - } else { - g <- g + - # Truncate labels of entities - ggplot2::scale_x_discrete(labels = sapply(as.character(object2$entity), function(e) if (nchar(e) > truncate) paste0(substr(e, 1, truncate - 1), "*") else e), - limits = levels(object2$entity)) - } - return(g) -} - - -# Backbones -------------------------------------------------------------------- - -#' Compute and retrieve the backbone and redundant set -#' -#' Compute and retrieve the backbone and redundant set of a 
discourse network. -#' -#' The dna_backbone function applies a simulated annealing algorithm to the -#' discourse network to partition the set of second-mode entities (e.g., -#' concepts) into a backbone set and a complementary redundant set. Three -#' methods are available: -#' \itemize{ -#' \item A simulated annealing algorithm with a penalty. You can play with -#' different penalties and see how they affect the size of your backbone -#' set. -#' \item A modified simulated annealing algorithm for a fixed number of -#' backbone entities to retain. This is computationally simpler, but you -#' have to know how large the set should be. -#' \item A fast and greedy nested algorithm, which evaluates all possible -#' fixed backbone solutions, i.e., for all sizes, and provides a nested -#' hierarchy of entities on the second mode. This algorithm may stay below -#' the optimum and is only an approximation but provides insights into the -#' hierarchy of concepts and their relative importance. -#' } -#' -#' The \code{autoplot} function requires the ggplot2 package and can plot -#' algorithm diagnostics and the hierarchy of entities as a dendrogram, -#' depending on the method that was chosen. The \code{plot} function can do the -#' same thing, just using base plots, not ggplot2. -#' -#' The \code{dna_evaluateBackboneSolution} function computes the spectral loss -#' for an arbitrary backbone and its complement, the redundant set, specified by -#' the user. For example, the user can evaluate how much structure would be lost -#' if the second mode was composed only of the concepts provided to this -#' function. This can be used to compare how useful different codebook models -#' are. The penalty parameter \code{p} applies a penalty factor to the spectral -#' loss. The default value of \code{0} switches off the penalty as it is usually -#' not needed to evaluate a specific solution. The backbone set can be supplied -#' as a vector of character objects, for example concepts. 
-#' -#' @param method The backbone algorithm used to compute the results. Several -#' methods are available: -#' \itemize{ -#' \item \code{"nested"}: A relatively fast, deterministic algorithm that -#' produces the full hierarchy of entities. It starts with a complete -#' backbone set resembling the full network. There are as many iterations -#' as entities on the second mode. In each iteration, the entity whose -#' removal would yield the smallest backbone loss is moved from the -#' backbone set into the redundant set, and the (unpenalized) spectral -#' loss is recorded. This creates a solution for all backbone sizes, where -#' each backbone set is fully nested in the next larger backbone set. The -#' solution usually resembles an unconstrained solution where nesting is -#' not required, but in some cases the loss of a non-nested solution may be -#' larger at a given level or number of elements in the backbone set. -#' \item \code{"fixed"}: Simulated annealing with a fixed number of elements -#' in the backbone set (i.e., only lateral changes are possible) and -#' without penalty. This method may yield more optimal solutions than the -#' nested algorithm because it does not require a strict hierarchy. -#' However, it produces an approximation of the global optimum and is -#' slower than the nested method. With this method, you can specify that -#' backbone set should have, for example, exactly 10 concepts. Then fewer -#' iterations are necessary than with the penalty method because the search -#' space is smaller. The backbone set size is defined in the -#' \code{"backboneSize"} argument. -#' \item \code{"penalty"}: Simulated annealing with a variable number of -#' elements in the backbone set. The solution is stabilized by a penalty -#' parameter (see \code{"penalty"} argument). 
This algorithm takes longest -#' to compute for a single solution, and it is only an approximation, but -#' it considers slightly larger or smaller backbone sets if the solution is -#' better, thus this algorithm adds some flexibility. It requires more -#' iterations than the fixed method for achieving the same quality. -#' } -#' @param backboneSize The number of elements in the backbone set, as a fixed -#' parameter. Only used when \code{method = "fixed"}. -#' @param penalty The penalty parameter for large backbone sets. The larger the -#' value, the more strongly larger backbone sets are punished and the smaller -#' the resulting backbone is. Try out different values to find the right size -#' of the backbone set. Reasonable values could be \code{2.5}, \code{5}, -#' \code{7.5}, or \code{12}, for example. The minimum is \code{0.0}, which -#' imposes no penalty on the size of the backbone set and produces a redundant -#' set with only one element. Start with \code{0.0} if you want to weed out a -#' single concept and subsequently increase the penalty to include more items -#' in the redundant set and shrink the backbone further. Only used when -#' \code{method = "penalty"}. -#' @param iterations The number of iterations of the simulated annealing -#' algorithm. More iterations take more time but may lead to better -#' optimization results. Only used when \code{method = "penalty"} or -#' \code{method = "fixed"}. -#' @param qualifierAggregation The aggregation rule for the \code{qualifier} -#' variable. 
This must be \code{"ignore"} (for ignoring the qualifier -#' variable), \code{"congruence"} (for recording a network tie only if both -#' nodes have the same qualifier value in the binary case or for recording the -#' similarity between the two nodes on the qualifier variable in the integer -#' case), \code{"conflict"} (for recording a network tie only if both nodes -#' have a different qualifier value in the binary case or for recording the -#' distance between the two nodes on the qualifier variable in the integer -#' case), or \code{"subtract"} (for subtracting the conflict tie value from -#' the congruence tie value in each dyad; note that negative values will be -#' replaced by \code{0} in the backbone calculation). -#' @param normalization Normalization of edge weights. Valid settings are -#' \code{"no"} (for switching off normalization), \code{"average"} (for -#' average activity normalization), \code{"jaccard"} (for Jaccard coefficient -#' normalization), and \code{"cosine"} (for cosine similarity normalization). -#' @param fileFormat An optional file format specification for saving the -#' backbone results to a file instead of returning an object. Valid values -#' are \code{"json"}, \code{"xml"}, and \code{NULL} (for returning the results -#' instead of writing them to a file). 
-#' @inheritParams dna_network -#' -#' @examples -#' \dontrun{ -#' dna_init() -#' dna_sample() -#' dna_openDatabase("sample.dna", coderId = 1, coderPassword = "sample") -#' -#' # compute backbone and redundant set using penalised spectral loss -#' b <- dna_backbone(method = "penalty", -#' penalty = 3.5, -#' iterations = 10000, -#' variable1 = "organization", -#' variable2 = "concept", -#' qualifier = "agreement", -#' qualifierAggregation = "subtract", -#' normalization = "average") -#' -#' b # display main results -#' -#' # extract results from the object -#' b$backbone # show the set of backbone concepts -#' b$redundant # show the set of redundant concepts -#' b$unpenalized_backbone_loss # spectral loss between full and backbone network -#' b$unpenalized_redundant_loss # spectral loss of redundant network -#' b$backbone_network # show the backbone network -#' b$redundant_network # show the redundant network -#' b$full_network # show the full network -#' -#' # plot diagnostics with base R -#' plot(b, ma = 500) -#' -#' # arrange plots in a 2 x 2 view -#' par(mfrow = c(2, 2)) -#' plot(b) -#' -#' # plot diagnostics with ggplot2 -#' library("ggplot2") -#' p <- autoplot(b) -#' p -#' -#' # pick a specific diagnostic -#' p[[3]] -#' -#' # use the patchwork package to arrange the diagnostics in a single plot -#' library("patchwork") -#' new_plot <- p[[1]] + p[[2]] + p[[3]] + p[[4]] -#' new_plot & theme_grey() + theme(legend.position = "bottom") -#' -#' # use the gridExtra package to arrange the diagnostics in a single plot -#' library("gridExtra") -#' grid.arrange(p[[1]], p[[2]], p[[3]], p[[4]]) -#' -#' # compute backbone with fixed size (here: 4 concepts) -#' b <- dna_backbone(method = "fixed", -#' backboneSize = 4, -#' iterations = 2000, -#' variable1 = "organization", -#' variable2 = "concept", -#' qualifier = "agreement", -#' qualifierAggregation = "subtract", -#' normalization = "average") -#' b -#' -#' # compute backbone with a nested structure and plot dendrogram -#' 
b <- dna_backbone(method = "nested", -#' variable1 = "organization", -#' variable2 = "concept", -#' qualifier = "agreement", -#' qualifierAggregation = "subtract", -#' normalization = "average") -#' b -#' plot(b) -#' autoplot(b) -#' } -#' -#' @author Philip Leifeld, Tim Henrichsen -#' -#' @rdname dna_backbone -#' @importFrom rJava .jarray -#' @importFrom rJava .jcall -#' @importFrom rJava .jnull -#' @importFrom rJava J -#' @export -dna_backbone <- function(method = "nested", - backboneSize = 1, - penalty = 3.5, - iterations = 10000, - statementType = "DNA Statement", - variable1 = "organization", - variable1Document = FALSE, - variable2 = "concept", - variable2Document = FALSE, - qualifier = "agreement", - qualifierDocument = FALSE, - qualifierAggregation = "subtract", - normalization = "average", - duplicates = "document", - start.date = "01.01.1900", - stop.date = "31.12.2099", - start.time = "00:00:00", - stop.time = "23:59:59", - excludeValues = list(), - excludeAuthors = character(), - excludeSources = character(), - excludeSections = character(), - excludeTypes = character(), - invertValues = FALSE, - invertAuthors = FALSE, - invertSources = FALSE, - invertSections = FALSE, - invertTypes = FALSE, - fileFormat = NULL, - outfile = NULL) { - - # wrap the vectors of exclude values for document variables into Java arrays - excludeAuthors <- .jarray(excludeAuthors) - excludeSources <- .jarray(excludeSources) - excludeSections <- .jarray(excludeSections) - excludeTypes <- .jarray(excludeTypes) - - # compile exclude variables and values vectors - dat <- matrix("", nrow = length(unlist(excludeValues)), ncol = 2) - count <- 0 - if (length(excludeValues) > 0) { - for (i in 1:length(excludeValues)) { - if (length(excludeValues[[i]]) > 0) { - for (j in 1:length(excludeValues[[i]])) { - count <- count + 1 - dat[count, 1] <- names(excludeValues)[i] - dat[count, 2] <- excludeValues[[i]][j] - } - } - } - var <- dat[, 1] - val <- dat[, 2] - } else { - var <- character() - val 
<- character() - } - var <- .jarray(var) # array of variable names of each excluded value - val <- .jarray(val) # array of values to be excluded - - # encode R NULL as Java null value if necessary - if (is.null(qualifier) || is.na(qualifier)) { - qualifier <- .jnull(class = "java/lang/String") - } - if (is.null(fileFormat)) { - fileFormat <- .jnull(class = "java/lang/String") - } - if (is.null(outfile)) { - outfile <- .jnull(class = "java/lang/String") - } - - # call rBackbone function to compute results - .jcall(dnaEnvironment[["dna"]]$headlessDna, - "V", - "rBackbone", - method, - as.integer(backboneSize), - as.double(penalty), - as.integer(iterations), - statementType, - variable1, - variable1Document, - variable2, - variable2Document, - qualifier, - qualifierDocument, - qualifierAggregation, - normalization, - duplicates, - start.date, - stop.date, - start.time, - stop.time, - var, - val, - excludeAuthors, - excludeSources, - excludeSections, - excludeTypes, - invertValues, - invertAuthors, - invertSources, - invertSections, - invertTypes, - outfile, - fileFormat - ) - - exporter <- .jcall(dnaEnvironment[["dna"]]$headlessDna, "Lexport/Exporter;", "getExporter") # get a reference to the Exporter object, in which results are stored - if (!is.null(outfile) && !is.null(fileFormat) && is.character(outfile) && is.character(fileFormat) && fileFormat %in% c("json", "xml")) { - message("File exported.") - } else if (method[1] %in% c("penalty", "fixed")) { - result <- .jcall(exporter, "Lexport/SimulatedAnnealingBackboneResult;", "getSimulatedAnnealingBackboneResult", simplify = TRUE) - # create a list with various results - l <- list() - l$penalty <- .jcall(result, "D", "getPenalty") - if (method[1] == "fixed") { - l$backbone_size <- as.integer(backboneSize) - } else { - l$backbone_size <- as.integer(NA) - } - l$iterations <- .jcall(result, "I", "getIterations") - l$backbone <- .jcall(result, "[S", "getBackboneEntities") - l$redundant <- .jcall(result, "[S", 
"getRedundantEntities") - l$unpenalized_backbone_loss <- .jcall(result, "D", "getUnpenalizedBackboneLoss") - l$unpenalized_redundant_loss <- .jcall(result, "D", "getUnpenalizedRedundantLoss") - rn <- .jcall(result, "[S", "getLabels") - - # store the three matrices in the result list - fullmat <- .jcall(result, "[[D", "getFullNetwork", simplify = TRUE) - rownames(fullmat) <- rn - colnames(fullmat) <- rn - l$full_network <- fullmat - backbonemat <- .jcall(result, "[[D", "getBackboneNetwork", simplify = TRUE) - rownames(backbonemat) <- rn - colnames(backbonemat) <- rn - l$backbone_network <- backbonemat - redundantmat <- .jcall(result, "[[D", "getRedundantNetwork", simplify = TRUE) - rownames(redundantmat) <- rn - colnames(redundantmat) <- rn - l$redundant_network <- redundantmat - - # store diagnostics per iteration as a data frame - d <- data.frame(iteration = 1:.jcall(result, "I", "getIterations"), - temperature = .jcall(result, "[D", "getTemperature"), - acceptance_prob = .jcall(result, "[D", "getAcceptanceProbability"), - acceptance = .jcall(result, "[I", "getAcceptance"), - penalized_backbone_loss = .jcall(result, "[D", "getPenalizedBackboneLoss"), - proposed_backbone_size = .jcall(result, "[I", "getProposedBackboneSize"), - current_backbone_size = .jcall(result, "[I", "getCurrentBackboneSize"), - optimal_backbone_size = .jcall(result, "[I", "getOptimalBackboneSize"), - acceptance_ratio_ma = .jcall(result, "[D", "getAcceptanceRatioMovingAverage")) - - l$diagnostics <- d - - # store start date/time, end date/time, number of statements, call, and class label in each network matrix - start <- as.POSIXct(.jcall(result, "J", "getStart"), origin = "1970-01-01") # add the start date/time of the result as an attribute to the matrices - attributes(l$full_network)$start <- start - attributes(l$backbone_network)$start <- start - attributes(l$redundant_network)$start <- start - stop <- as.POSIXct(.jcall(result, "J", "getStop"), origin = "1970-01-01") # add the end date/time 
of the result as an attribute to the matrices - attributes(l$full_network)$stop <- stop - attributes(l$backbone_network)$stop <- stop - attributes(l$redundant_network)$stop <- stop - attributes(l$full_network)$numStatements <- .jcall(result, "I", "getNumStatements") # add the number of filtered statements the matrix is based on as an attribute to the matrix - attributes(l$full_network)$call <- match.call() - attributes(l$backbone_network)$call <- match.call() - attributes(l$redundant_network)$call <- match.call() - attributes(l)$method <- method[1] - class(l$full_network) <- c("dna_network_onemode", class(l$full_network)) - class(l$backbone_network) <- c("dna_network_onemode", class(l$backbone_network)) - class(l$redundant_network) <- c("dna_network_onemode", class(l$redundant_network)) - class(l) <- c("dna_backbone", class(l)) - return(l) - } else if (method[1] == "nested") { - result <- .jcall(exporter, "Lexport/NestedBackboneResult;", "getNestedBackboneResult", simplify = TRUE) - d <- data.frame(i = .jcall(result, "[I", "getIteration"), - entity = .jcall(result, "[S", "getEntities"), - backboneLoss = .jcall(result, "[D", "getBackboneLoss"), - redundantLoss = .jcall(result, "[D", "getRedundantLoss"), - statements = .jcall(result, "[I", "getNumStatements")) - rownames(d) <- NULL - attributes(d)$numStatementsFull <- .jcall(result, "I", "getNumStatementsFull") - attributes(d)$start <- as.POSIXct(.jcall(result, "J", "getStart"), origin = "1970-01-01") # add the start date/time of the result as an attribute - attributes(d)$stop <- as.POSIXct(.jcall(result, "J", "getStop"), origin = "1970-01-01") # add the end date/time of the result as an attribute - attributes(d)$method <- "nested" - class(d) <- c("dna_backbone", class(d)) - return(d) - } -} - -#' @rdname dna_backbone -#' @param x A \code{"dna_backbone"} object. -#' @param trim Number of maximum characters to display in entity labels. 
#' Labels
#' with more characters are truncated, and the last character is replaced by
#' an asterisk (\code{*}).
#' @export
print.dna_backbone <- function(x, trim = 50, ...) {
  method <- attributes(x)$method
  cat(paste0("Backbone method: ", method, ".\n\n"))
  if (method %in% c("penalty", "fixed")) {
    if (method == "penalty") {
      cat(paste0("Penalty: ", x$penalty, ". Iterations: ", x$iterations, ".\n\n"))
    } else {
      cat(paste0("Backbone size: ", x$backbone_size, ". Iterations: ", x$iterations, ".\n\n"))
    }
    cat(paste0("Backbone set (loss: ", round(x$unpenalized_backbone_loss, 4), "):\n"))
    cat(paste(1:length(x$backbone), x$backbone), sep = "\n")
    cat(paste0("\nRedundant set (loss: ", round(x$unpenalized_redundant_loss, 4), "):\n"))
    cat(paste(1:length(x$redundant), x$redundant), sep = "\n")
  } else if (method == "nested") {
    x2 <- x
    # Truncate entity labels longer than 'trim' characters and mark the
    # truncation by replacing the last kept character with "*".
    x2$entity <- sapply(x2$entity, function(r) if (nchar(r) > trim) paste0(substr(r, 1, trim - 1), "*") else r)
    print(as.data.frame(x2), row.names = FALSE)
  }
}

#' @param ma Number of iterations to compute moving average.
#' @rdname dna_backbone
#' @importFrom graphics lines
#' @importFrom stats filter
#' @importFrom rlang .data
#' @export
plot.dna_backbone <- function(x, ma = 500, ...) {
  if (attr(x, "method") != "nested") {
    # temperature and acceptance probability
    plot(x = x$diagnostics$iteration,
         y = x$diagnostics$temperature,
         col = "red",
         type = "l",
         lwd = 3,
         xlab = "Iteration",
         ylab = "Acceptance probability",
         main = "Temperature and acceptance probability")
    # note that better solutions are coded as -1 and need to be skipped:
    lines(x = x$diagnostics$iteration[x$diagnostics$acceptance_prob >= 0],
          y = x$diagnostics$acceptance_prob[x$diagnostics$acceptance_prob >= 0])

    # spectral distance between full network and backbone network per iteration
    bb_loss <- stats::filter(x$diagnostics$penalized_backbone_loss,
                             rep(1 / ma, ma),
                             sides = 1)
    if (attributes(x)$method == "penalty") {
      yl <- "Penalized backbone loss"
      ti <- "Penalized spectral backbone distance"
    } else {
      yl <- "Backbone loss"
      ti <- "Spectral backbone distance"
    }
    plot(x = x$diagnostics$iteration,
         y = bb_loss,
         type = "l",
         xlab = "Iteration",
         ylab = yl,
         main = ti)

    # number of concepts in the backbone solution per iteration
    current_size_ma <- stats::filter(x$diagnostics$current_backbone_size,
                                     rep(1 / ma, ma),
                                     sides = 1)
    optimal_size_ma <- stats::filter(x$diagnostics$optimal_backbone_size,
                                     rep(1 / ma, ma),
                                     sides = 1)
    plot(x = x$diagnostics$iteration,
         y = current_size_ma,
         ylim = c(min(c(current_size_ma, optimal_size_ma), na.rm = TRUE),
                  max(c(current_size_ma, optimal_size_ma), na.rm = TRUE)),
         type = "l",
         xlab = "Iteration",
         ylab = paste0("Number of elements (MA, last ", ma, ")"),
         main = "Backbone size (red = best)")
    lines(x = x$diagnostics$iteration, y = optimal_size_ma, col = "red")

    # ratio of recent acceptances
    accept_ratio <- stats::filter(x$diagnostics$acceptance,
                                  rep(1 / ma, ma),
                                  sides = 1)
    plot(x = x$diagnostics$iteration,
         y = accept_ratio,
         type = "l",
         xlab = "Iteration",
         ylab = paste("Acceptance ratio in the last", ma, "iterations"),
         main = "Acceptance ratio")
  } else { # create hclust object
    # define merging pattern: negative numbers are leaves, positive are merged clusters
    merges_clust <- matrix(nrow = nrow(x) - 1, ncol = 2)

    merges_clust[1, 1] <- -nrow(x)
    merges_clust[1, 2] <- -(nrow(x) - 1)

    for (i in 2:(nrow(x) - 1)) {
      merges_clust[i, 1] <- -(nrow(x) - i)
      merges_clust[i, 2] <- i - 1
    }

    # Initialize empty object
    a <- list()

    # Add merges
    a$merge <- merges_clust

    # Define merge heights; written as 1:(nrow(x) - 1) — the previous
    # 1:nrow(x) - 1 parsed as (1:nrow(x)) - 1 and only produced the same
    # subset because R drops the zero index.
    a$height <- x$backboneLoss[1:(nrow(x) - 1)]

    # Order of leaves
    a$order <- 1:nrow(x)

    # Labels of leaves
    a$labels <- rev(x$entity)

    # Define hclust class
    class(a) <- "hclust"

    plot(a, ylab = "")
  }
}

#' @rdname dna_backbone
#' @param object A \code{"dna_backbone"} object.
#' @param ... Additional arguments.
#' @importFrom ggplot2 autoplot
#' @importFrom ggplot2 ggplot
#' @importFrom ggplot2 aes
#' @importFrom ggplot2 geom_line
#' @importFrom ggplot2 ylab
#' @importFrom ggplot2 xlab
#' @importFrom ggplot2 ggtitle
#' @importFrom ggplot2 theme_bw
#' @importFrom ggplot2 theme
#' @importFrom ggplot2 coord_flip
#' @importFrom ggplot2 scale_x_continuous
#' @importFrom ggplot2 scale_y_continuous
#' @importFrom rlang .data
#' @export
autoplot.dna_backbone <- function(object, ..., ma = 500) {
  if (attr(object, "method") != "nested") {
    bd <- object$diagnostics
    bd$bb_loss <- stats::filter(bd$penalized_backbone_loss, rep(1 / ma, ma), sides = 1)
    bd$current_size_ma <- stats::filter(bd$current_backbone_size, rep(1 / ma, ma), sides = 1)
    bd$optimal_size_ma <- stats::filter(bd$optimal_backbone_size, rep(1 / ma, ma), sides = 1)
    bd$accept_ratio <- stats::filter(bd$acceptance, rep(1 / ma, ma), sides = 1)

    # temperature and acceptance probability
    g_accept <- ggplot2::ggplot(bd, ggplot2::aes(y = .data[["temperature"]], x = .data[["iteration"]])) +
      ggplot2::geom_line(color = "#a50f15") +
      ggplot2::geom_line(data = bd[bd$acceptance_prob >= 0, ],
                         ggplot2::aes(y = .data[["acceptance_prob"]], x = .data[["iteration"]])) +
      ggplot2::ylab("Acceptance probability") +
      ggplot2::xlab("Iteration") +
      ggplot2::ggtitle("Temperature and acceptance probability") +
      ggplot2::theme_bw()

    # spectral distance between full network and backbone network per iteration
    if (attributes(object)$method == "penalty") {
      yl <- "Penalized backbone loss"
      ti <- "Penalized spectral backbone distance"
    } else {
      yl <- "Backbone loss"
      ti <- "Spectral backbone distance"
    }
    g_loss <- ggplot2::ggplot(bd, ggplot2::aes(y = .data[["bb_loss"]], x = .data[["iteration"]])) +
      ggplot2::geom_line() +
      ggplot2::ylab(yl) +
      ggplot2::xlab("Iteration") +
      ggplot2::ggtitle(ti) +
      ggplot2::theme_bw()

    # number of concepts in the backbone solution per iteration
    d <- data.frame(iteration = rep(bd$iteration, 2),
                    size = c(bd$current_size_ma, bd$optimal_size_ma),
                    Criterion = c(rep("Current iteration", nrow(bd)),
                                  rep("Best solution", nrow(bd))))
    g_size <- ggplot2::ggplot(d, ggplot2::aes(y = .data[["size"]], x = .data[["iteration"]], color = .data[["Criterion"]])) +
      ggplot2::geom_line() +
      ggplot2::ylab(paste0("Number of elements (MA, last ", ma, ")")) +
      ggplot2::xlab("Iteration") +
      ggplot2::ggtitle("Backbone size") +
      ggplot2::theme_bw() +
      ggplot2::theme(legend.position = "bottom")

    # ratio of recent acceptances
    g_ar <- ggplot2::ggplot(bd, ggplot2::aes(y = .data[["accept_ratio"]], x = .data[["iteration"]])) +
      ggplot2::geom_line() +
      ggplot2::ylab(paste("Acceptance ratio in the last", ma, "iterations")) +
      ggplot2::xlab("Iteration") +
      ggplot2::ggtitle("Acceptance ratio") +
      ggplot2::theme_bw()

    # wrap in list
    plots <- list(g_accept, g_loss, g_size, g_ar)
    return(plots)
  } else { # create hclust object
    # define merging pattern: negative numbers are leaves, positive are merged clusters
    merges_clust <- matrix(nrow = nrow(object) - 1, ncol = 2)

    merges_clust[1, 1] <- -nrow(object)
    merges_clust[1, 2] <- -(nrow(object) - 1)

    for (i in 2:(nrow(object) - 1)) {
      merges_clust[i, 1] <- -(nrow(object) - i)
      merges_clust[i, 2] <- i - 1
    }

    # Initialize empty object
    a <- list()

    # Add merges
    a$merge <- merges_clust

    # Define merge heights; written as 1:(nrow(object) - 1) — the previous
    # 1:nrow(object) - 1 parsed as (1:nrow(object)) - 1 and only produced the
    # same subset because R drops the zero index.
    a$height <- object$backboneLoss[1:(nrow(object) - 1)]
    height <- a$height

    # Order of leaves
    a$order <- 1:nrow(object)

    # Labels of leaves
    a$labels <- rev(object$entity)

    # Define hclust class
    class(a) <- "hclust"

    # ensure ggraph is installed, otherwise throw error (better than importing it to avoid hard dependency)
    if (!requireNamespace("ggraph", quietly = TRUE)) {
      stop("The 'ggraph' package is required for plotting nested backbone dendrograms with 'ggplot2' but was not found. Consider installing it.")
    }

    # theme elements are namespaced with ggplot2:: because element_blank,
    # element_text, and aes are otherwise unresolved in the package namespace
    # (only aes is declared via @importFrom above).
    g_clust <- ggraph::ggraph(graph = a,
                              layout = "dendrogram",
                              circular = FALSE,
                              height = height) + # TODO @Tim: "height" does not seem to exist
      ggraph::geom_edge_elbow() +
      ggraph::geom_node_point(ggplot2::aes(filter = .data[["leaf"]])) +
      ggplot2::theme_bw() +
      ggplot2::theme(panel.border = ggplot2::element_blank(),
                     axis.title = ggplot2::element_blank(),
                     panel.grid.major = ggplot2::element_blank(),
                     panel.grid.minor = ggplot2::element_blank(),
                     axis.line = ggplot2::element_blank(),
                     axis.text.y = ggplot2::element_text(size = 6),
                     axis.ticks.y = ggplot2::element_blank()) +
      ggplot2::scale_x_continuous(breaks = seq(0, nrow(object) - 1, by = 1),
                                  labels = rev(object$entity)) +
      ggplot2::scale_y_continuous(expand = c(0, 0.01)) +
      ggplot2::coord_flip()

    return(g_clust)
  }
}

#' @param backboneEntities A vector of character values to be included in the
#'   backbone. The function will compute the spectral loss between the full
#'   network and the network composed only of those entities on the second mode
#'   that are contained in this vector.
#' @param p The penalty parameter. The default value of \code{0} means no
#'   penalty for backbone size is applied.
#' @inheritParams dna_backbone
#' @return A vector with two numeric values: the backbone and redundant loss.
#'
#' @examples
#' \dontrun{
#' dna_init()
#' dna_sample()
#' dna_openDatabase("sample.dna", coderId = 1, coderPassword = "sample")
#'
#' dna_evaluateBackboneSolution(
#'   c("There should be legislation to regulate emissions.",
#'     "Emissions legislation should regulate CO2.")
#' )
#' }
#'
#' @rdname dna_backbone
#' @importFrom rJava .jarray
#' @importFrom rJava .jcall
#' @importFrom rJava .jnull
#' @export
dna_evaluateBackboneSolution <- function(backboneEntities,
                                         p = 0,
                                         statementType = "DNA Statement",
                                         variable1 = "organization",
                                         variable1Document = FALSE,
                                         variable2 = "concept",
                                         variable2Document = FALSE,
                                         qualifier = "agreement",
                                         qualifierDocument = FALSE,
                                         qualifierAggregation = "subtract",
                                         normalization = "average",
                                         duplicates = "document",
                                         start.date = "01.01.1900",
                                         stop.date = "31.12.2099",
                                         start.time = "00:00:00",
                                         stop.time = "23:59:59",
                                         excludeValues = list(),
                                         excludeAuthors = character(),
                                         excludeSources = character(),
                                         excludeSections = character(),
                                         excludeTypes = character(),
                                         invertValues = FALSE,
                                         invertAuthors = FALSE,
                                         invertSources = FALSE,
                                         invertSections = FALSE,
                                         invertTypes = FALSE) {

  # the document-level exclusion vectors are handed to Java as string arrays
  excludeAuthors <- .jarray(excludeAuthors)
  excludeSources <- .jarray(excludeSources)
  excludeSections <- .jarray(excludeSections)
  excludeTypes <- .jarray(excludeTypes)

  # flatten the named excludeValues list into two parallel character vectors:
  # the variable name each excluded value belongs to, and the value itself
  if (length(excludeValues) > 0) {
    var <- rep(names(excludeValues), lengths(excludeValues))
    val <- as.character(unlist(excludeValues, use.names = FALSE))
  } else {
    var <- character()
    val <- character()
  }
  var <- .jarray(var) # array of variable names of each excluded value
  val <- .jarray(val) # array of values to be excluded

  # a missing qualifier is represented on the Java side by a null String
  if (is.null(qualifier) || is.na(qualifier)) {
    qualifier <- .jnull(class = "java/lang/String")
  }

  # call rBackbone function to compute results
  result <- .jcall(dnaEnvironment[["dna"]]$headlessDna,
                   "[D",
                   "rEvaluateBackboneSolution",
                   .jarray(backboneEntities),
                   as.integer(p),
                   statementType,
                   variable1,
                   variable1Document,
                   variable2,
                   variable2Document,
                   qualifier,
                   qualifierDocument,
                   qualifierAggregation,
                   normalization,
                   duplicates,
                   start.date,
                   stop.date,
                   start.time,
                   stop.time,
                   var,
                   val,
                   excludeAuthors,
                   excludeSources,
                   excludeSections,
                   excludeTypes,
                   invertValues,
                   invertAuthors,
                   invertSources,
                   invertSections,
                   invertTypes
  )
  names(result) <- c("backbone loss", "redundant loss")
  return(result)
}


# Clustering -------------------------------------------------------------------

#' Compute multiple cluster solutions for a discourse network
#'
#' Compute multiple cluster solutions for a discourse network.
#'
#' This function applies a number of different graph clustering techniques to
#' a discourse network dataset. The user provides many of the same arguments as
#' in the \code{\link{dna_network}} function and a few additional arguments that
#' determine which kinds of clustering methods should be used and how. In
#' particular, the \code{k} argument can be \code{0} (for arbitrary numbers of
#' clusters) or any positive integer value (e.g., \code{2}, for constraining the
#' number of clusters to exactly \code{k} groups). This is useful for assessing
#' the polarization of a discourse network.
-#' -#' In particular, the function can be used to compute the maximal modularity of -#' a smoothed time series of discourse networks using the \code{timeWindow} and -#' \code{windowSize} arguments for a given \code{k} across a number of -#' clustering methods. -#' -#' It is also possible to switch off all but one clustering method using the -#' respective arguments and carry out a simple cluster analysis with the method -#' of choice for a certain time span of the discourse network, without any time -#' window options. -#' -#' @param saveObjects Store the original output of the respective clustering -#' method in the \code{cl} slot of the return object? If \code{TRUE}, one -#' cluster object per time point will be saved, for all time points for which -#' network data are available. At each time point, only the cluster object -#' with the highest modularity score will be saved, all others discarded. The -#' \code{max_mod} slot of the object contains additional information on which -#' measure was saved at each time point and what the corresponding modularity -#' score is. -#' @param k The number of clusters to compute. This constrains the choice of -#' clustering methods because some methods require a predefined \code{k} while -#' other methods do not. To permit arbitrary numbers of clusters, depending on -#' the respective algorithm (or the value of modularity in some cases), choose -#' \code{k = 0}. This corresponds to the theoretical notion of -#' "multipolarization". For "bipolarization", choose \code{k = 2} in order to -#' constrain the cluster solutions to exactly two groups. -#' @param k.max If \code{k = 0}, there can be arbitrary numbers of clusters. In -#' this case, \code{k.max} sets the maximal number of clusters that can be -#' identified. -#' @param single Include hierarchical clustering with single linkage in the pool -#' of clustering methods? 
The \code{\link[stats]{hclust}} function from -#' the \pkg{stats} package is applied to Jaccard distances in the affiliation -#' network for this purpose. Only valid if \code{k > 1}. -#' @param average Include hierarchical clustering with average linkage in the -#' pool of clustering methods? The \code{\link[stats]{hclust}} function from -#' the \pkg{stats} package is applied to Jaccard distances in the affiliation -#' network for this purpose. Only valid if \code{k > 1}. -#' @param complete Include hierarchical clustering with complete linkage in the -#' pool of clustering methods? The \code{\link[stats]{hclust}} function from -#' the \pkg{stats} package is applied to Jaccard distances in the affiliation -#' network for this purpose. Only valid if \code{k > 1}. -#' @param ward Include hierarchical clustering with Ward's algorithm in the -#' pool of clustering methods? The \code{\link[stats]{hclust}} function from -#' the \pkg{stats} package is applied to Jaccard distances in the affiliation -#' network for this purpose. If \code{k = 0} is selected, different solutions -#' with varying \code{k} are attempted, and the solution with the highest -#' modularity is retained. -#' @param kmeans Include k-means clustering in the pool of clustering methods? -#' The \code{\link[stats]{kmeans}} function from the \pkg{stats} package is -#' applied to Jaccard distances in the affiliation network for this purpose. -#' If \code{k = 0} is selected, different solutions with varying \code{k} are -#' attempted, and the solution with the highest modularity is retained. -#' @param pam Include partitioning around medoids in the pool of clustering -#' methods? The \code{\link[cluster]{pam}} function from the \pkg{cluster} -#' package is applied to Jaccard distances in the affiliation network for this -#' purpose. If \code{k = 0} is selected, different solutions with varying -#' \code{k} are attempted, and the solution with the highest modularity is -#' retained. 
-#' @param equivalence Include equivalence clustering (as implemented in the -#' \code{\link[sna]{equiv.clust}} function in the \pkg{sna} package), based on -#' shortest path distances between nodes (as implemented in the -#' \code{\link[sna]{sedist}} function in the \pkg{sna} package) in the -#' positive subtract network? If \code{k = 0} is selected, different solutions -#' with varying \code{k} are attempted, and the solution with the highest -#' modularity is retained. -#' @param concor_one Include CONvergence of iterative CORrelations (CONCOR) in -#' the pool of clustering methods? The algorithm is applied to the positive -#' subtract network to identify \code{k = 2} clusters. The method is omitted -#' if \code{k != 2}. -#' @param concor_two Include CONvergence of iterative CORrelations (CONCOR) in -#' the pool of clustering methods? The algorithm is applied to the affiliation -#' network to identify \code{k = 2} clusters. The method is omitted -#' if \code{k != 2}. -#' @param louvain Include the Louvain community detection algorithm in the pool -#' of clustering methods? The \code{\link[igraph]{cluster_louvain}} function -#' in the \pkg{igraph} package is applied to the positive subtract network for -#' this purpose. -#' @param fastgreedy Include the fast and greedy community detection algorithm -#' in the pool of clustering methods? The -#' \code{\link[igraph]{cluster_fast_greedy}} function in the \pkg{igraph} -#' package is applied to the positive subtract network for this purpose. -#' @param walktrap Include the Walktrap community detection algorithm -#' in the pool of clustering methods? The -#' \code{\link[igraph]{cluster_walktrap}} function in the \pkg{igraph} -#' package is applied to the positive subtract network for this purpose. -#' @param leading_eigen Include the leading eigenvector community detection -#' algorithm in the pool of clustering methods? 
The -#' \code{\link[igraph]{cluster_leading_eigen}} function in the \pkg{igraph} -#' package is applied to the positive subtract network for this purpose. -#' @param edge_betweenness Include the edge betweenness community detection -#' algorithm by Girvan and Newman in the pool of clustering methods? The -#' \code{\link[igraph]{cluster_edge_betweenness}} function in the \pkg{igraph} -#' package is applied to the positive subtract network for this purpose. -#' @param infomap Include the infomap community detection algorithm -#' in the pool of clustering methods? The -#' \code{\link[igraph]{cluster_infomap}} function in the \pkg{igraph} -#' package is applied to the positive subtract network for this purpose. -#' @param label_prop Include the label propagation community detection algorithm -#' in the pool of clustering methods? The -#' \code{\link[igraph]{cluster_label_prop}} function in the \pkg{igraph} -#' package is applied to the positive subtract network for this purpose. -#' @param spinglass Include the spinglass community detection algorithm -#' in the pool of clustering methods? The -#' \code{\link[igraph]{cluster_spinglass}} function in the \pkg{igraph} -#' package is applied to the positive subtract network for this purpose. Note -#' that this method is disabled by default because it is relatively slow. -#' @inheritParams dna_network -#' -#' @return The function creates a \code{dna_multiclust} object, which contains -#' the following items: -#' \describe{ -#' \item{k}{The number of clusters determined by the user.} -#' \item{cl}{Cluster objects returned by the respective cluster function. 
If -#' multiple methods are used, this returns the object with the highest -#' modularity.} -#' \item{max_mod}{A data frame with one row per time point (that is, only one -#' row in the default case and multiple rows if time windows are used) and -#' the maximal modularity for the given time point across all cluster -#' methods.} -#' \item{modularity}{A data frame with the modularity values for all separate -#' cluster methods and all time points.} -#' \item{membership}{A large data frame with all nodes' membership information -#' for each time point and each clustering method.} -#' } -#' -#' @author Philip Leifeld -#' -#' @examples -#' \dontrun{ -#' library("rDNA") -#' dna_init() -#' samp <- dna_sample() -#' dna_openDatabase(samp, coderId = 1, coderPassword = "sample") -#' -#' # example 1: compute 12 cluster solutions for one time point -#' mc1 <- dna_multiclust(variable1 = "organization", -#' variable2 = "concept", -#' qualifier = "agreement", -#' duplicates = "document", -#' k = 0, # flexible numbers of clusters -#' saveObjects = TRUE) # retain hclust object -#' -#' mc1$modularity # return modularity scores for 12 clustering methods -#' mc1$max_mod # return the maximal value of the 12, along with dates -#' mc1$memberships # return cluster memberships for all 12 cluster methods -#' plot(mc1$cl[[1]]) # plot hclust dendrogram -#' -#' # example 2: compute only Girvan-Newman edge betweenness with two clusters -#' set.seed(12345) -#' mc2 <- dna_multiclust(k = 2, -#' single = FALSE, -#' average = FALSE, -#' complete = FALSE, -#' ward = FALSE, -#' kmeans = FALSE, -#' pam = FALSE, -#' equivalence = FALSE, -#' concor_one = FALSE, -#' concor_two = FALSE, -#' louvain = FALSE, -#' fastgreedy = FALSE, -#' walktrap = FALSE, -#' leading_eigen = FALSE, -#' edge_betweenness = TRUE, -#' infomap = FALSE, -#' label_prop = FALSE, -#' spinglass = FALSE) -#' mc2$memberships # return membership in two clusters -#' mc2$modularity # return modularity of the cluster solution -#' -#' # 
example 3: smoothed modularity using time window algorithm -#' mc3 <- dna_multiclust(k = 2, -#' timeWindow = "events", -#' windowSize = 28) -#' mc3$max_mod # maximal modularity and method per time point -#' } -#' -#' @rdname dna_multiclust -#' @importFrom stats as.dist cor hclust cutree kmeans -#' @export -dna_multiclust <- function(statementType = "DNA Statement", - variable1 = "organization", - variable1Document = FALSE, - variable2 = "concept", - variable2Document = FALSE, - qualifier = "agreement", - duplicates = "include", - start.date = "01.01.1900", - stop.date = "31.12.2099", - start.time = "00:00:00", - stop.time = "23:59:59", - timeWindow = "no", - windowSize = 100, - excludeValues = list(), - excludeAuthors = character(), - excludeSources = character(), - excludeSections = character(), - excludeTypes = character(), - invertValues = FALSE, - invertAuthors = FALSE, - invertSources = FALSE, - invertSections = FALSE, - invertTypes = FALSE, - saveObjects = FALSE, - k = 0, - k.max = 5, - single = TRUE, - average = TRUE, - complete = TRUE, - ward = TRUE, - kmeans = TRUE, - pam = TRUE, - equivalence = TRUE, - concor_one = TRUE, - concor_two = TRUE, - louvain = TRUE, - fastgreedy = TRUE, - walktrap = TRUE, - leading_eigen = TRUE, - edge_betweenness = TRUE, - infomap = TRUE, - label_prop = TRUE, - spinglass = FALSE) { - - # check dependencies - if (!requireNamespace("igraph", quietly = TRUE)) { # version 0.8.1 required for edge betweenness to work fine. - stop("The 'dna_multiclust' function requires the 'igraph' package to be installed.\n", - "To do this, enter 'install.packages(\"igraph\")'.") - } else if (packageVersion("igraph") < "0.8.1" && edge_betweenness) { - warning("Package version of 'igraph' < 0.8.1. If edge betweenness algorithm encounters an empty network matrix, this will let R crash. See here: https://github.com/igraph/rigraph/issues/336. 
Consider updating 'igraph' to the latest version.") - } - if (pam && !requireNamespace("cluster", quietly = TRUE)) { - pam <- FALSE - warning("Argument 'pam = TRUE' requires the 'cluster' package, which is not installed.\nSetting 'pam = FALSE'. Consider installing the 'cluster' package.") - } - if (equivalence && !requireNamespace("sna", quietly = TRUE)) { - equivalence <- FALSE - warning("Argument 'equivalence = TRUE' requires the 'sna' package, which is not installed.\nSetting 'equivalence = FALSE'. Consider installing the 'sna' package.") - } - - # check argument validity - if (is.null(k) || is.na(k) || !is.numeric(k) || length(k) > 1 || is.infinite(k) || k < 0) { - stop("'k' must be a non-negative integer number. Can be 0 for flexible numbers of clusters.") - } - if (is.null(k.max) || is.na(k.max) || !is.numeric(k.max) || length(k.max) > 1 || is.infinite(k.max) || k.max < 1) { - stop("'k.max' must be a positive integer number.") - } - if (k == 1) { - k <- 0 - warning("'k' must be 0 (for arbitrary numbers of clusters) or larger than 1 (to constrain number of clusters). 
Using 'k = 0'.") - } - - # determine what kind of two-mode network to create - if (is.null(qualifier) || is.na(qualifier) || !is.character(qualifier)) { - qualifierAggregation <- "ignore" - } else { - v <- dna_getVariables(statementType = statementType) - if (v$type[v$label == qualifier] == "boolean") { - qualifierAggregation <- "combine" - } else { - qualifierAggregation <- "subtract" - } - } - - nw_aff <- dna_network(networkType = "twomode", - statementType = statementType, - variable1 = variable1, - variable1Document = variable1Document, - variable2 = variable2, - variable2Document = variable2Document, - qualifier = qualifier, - qualifierAggregation = qualifierAggregation, - normalization = "no", - duplicates = duplicates, - start.date = start.date, - stop.date = stop.date, - start.time = start.time, - stop.time = stop.time, - timeWindow = timeWindow, - windowSize = windowSize, - excludeValues = excludeValues, - excludeAuthors = excludeAuthors, - excludeSources = excludeSources, - excludeSections = excludeSections, - excludeTypes = excludeTypes, - invertValues = invertValues, - invertAuthors = invertAuthors, - invertSources = invertSources, - invertSections = invertSections, - invertTypes = invertTypes) - nw_sub <- dna_network(networkType = "onemode", - statementType = statementType, - variable1 = variable1, - variable1Document = variable1Document, - variable2 = variable2, - variable2Document = variable2Document, - qualifier = qualifier, - qualifierAggregation = "subtract", - normalization = "average", - duplicates = duplicates, - start.date = start.date, - stop.date = stop.date, - start.time = start.time, - stop.time = stop.time, - timeWindow = timeWindow, - windowSize = windowSize, - excludeValues = excludeValues, - excludeAuthors = excludeAuthors, - excludeSources = excludeSources, - excludeSections = excludeSections, - excludeTypes = excludeTypes, - invertValues = invertValues, - invertAuthors = invertAuthors, - invertSources = invertSources, - 
invertSections = invertSections, - invertTypes = invertTypes) - - if (timeWindow == "no") { - dta <- list() - dta$networks <- list(nw_sub) - nw_sub <- dta - dta <- list() - dta$networks <- list(nw_aff) - nw_aff <- dta - } - - obj <- list() - if (isTRUE(saveObjects)) { - obj$cl <- list() - } - dta_dat <- list() - dta_mem <- list() - dta_mod <- list() - counter <- 1 - if ("dna_network_onemode_timewindows" %in% class(nw_sub)) { - num_networks <- length(nw_sub) - } else { - num_networks <- 1 - } - for (i in 1:num_networks) { - - # prepare dates - if (timeWindow == "no") { - dta_dat[[i]] <- data.frame(i = i, - start = attributes(nw_sub$networks[[i]])$start, - stop = attributes(nw_sub$networks[[i]])$stop) - } else { - dta_dat[[i]] <- data.frame(i = i, - start.date = attributes(nw_sub[[i]])$start, - middle.date = attributes(nw_sub[[i]])$middle, - stop.date = attributes(nw_sub[[i]])$stop) - } - - # prepare two-mode network - if ("dna_network_onemode_timewindows" %in% class(nw_sub)) { - x <- nw_aff[[i]] - } else { - x <- nw_aff$networks[[i]] - } - if (qualifierAggregation == "combine") { - combined <- cbind(apply(x, 1:2, function(x) ifelse(x %in% c(1, 3), 1, 0)), - apply(x, 1:2, function(x) ifelse(x %in% c(2, 3), 1, 0))) - } else { - combined <- x - } - combined <- combined[rowSums(combined) > 0, , drop = FALSE] - rn <- rownames(combined) - - # Jaccard distances for two-mode network (could be done using vegdist function in vegan package, but saving the dependency) - combined <- matrix(as.integer(combined > 0), nrow = nrow(combined)) # probably not necessary, but ensure it's an integer matrix - intersections <- tcrossprod(combined) # compute intersections using cross-product - row_sums <- rowSums(combined) # compute row sums - unions <- matrix(outer(row_sums, row_sums, `+`), ncol = length(row_sums)) - intersections # compute unions - jaccard_similarities <- intersections / unions # calculate Jaccard similarities - jaccard_similarities[is.nan(jaccard_similarities)] <- 0 # 
avoid division by zero - jaccard_distances <- 1 - jaccard_similarities # convert to Jaccard distances - rownames(jaccard_distances) <- rn # re-attach the row names - jac <- stats::as.dist(jaccard_distances) # convert to dist object - - # prepare one-mode network - if ("dna_network_onemode_timewindows" %in% class(nw_sub)) { - y <- nw_sub[[i]] - } else { - y <- nw_sub$networks[[i]] - } - y[y < 0] <- 0 - class(y) <- "matrix" - g <- igraph::graph_from_adjacency_matrix(y, mode = "undirected", weighted = TRUE) - - if (nrow(combined) > 1) { - counter_current <- 1 - current_cl <- list() - current_mod <- numeric() - - # Hierarchical clustering with single linkage - if (isTRUE(single) && k > 1) { - try({ - suppressWarnings(cl <- stats::hclust(jac, method = "single")) - mem <- stats::cutree(cl, k = k) - dta_mem[[counter]] <- data.frame(i = rep(i, length(mem)), - method = rep("Hierarchical (Single)", length(mem)), - node = rownames(x), - cluster = mem, - stringsAsFactors = FALSE) - dta_mod[[counter]] <- data.frame(i = i, - method = "Hierarchical (Single)", - k = k, - modularity = igraph::modularity(x = g, membership = mem), - stringsAsFactors = FALSE) - if (isTRUE(saveObjects)) { - current_cl[[counter_current]] <- cl - current_mod[counter_current] <- dta_mod[[counter]]$modularity[nrow(dta_mod[[counter]])] - counter_current <- counter_current + 1 - } - counter <- counter + 1 - }, silent = TRUE) - } - - # Hierarchical clustering with single linkage with optimal k - if (isTRUE(single) && k < 2) { - try({ - suppressWarnings(cl <- stats::hclust(jac, method = "single")) - opt_k <- lapply(2:k.max, function(x) { - mem <- stats::cutree(cl, k = x) - mod <- igraph::modularity(x = g, membership = mem) - return(list(mem = mem, mod = mod)) - }) - mod <- sapply(opt_k, function(x) x$mod) - kk <- which.max(mod) - mod <- max(mod) - mem <- opt_k[[kk]]$mem - dta_mem[[counter]] <- data.frame(i = rep(i, length(mem)), - method = rep("Hierarchical (Single)", length(mem)), - node = rownames(x), - 
cluster = mem, - stringsAsFactors = FALSE) - dta_mod[[counter]] <- data.frame(i = i, - method = "Hierarchical (Single)", - k = kk + 1, # add one because the series started with k = 2 - modularity = mod, - stringsAsFactors = FALSE) - if (isTRUE(saveObjects)) { - current_cl[[counter_current]] <- cl - current_mod[counter_current] <- dta_mod[[counter]]$modularity[nrow(dta_mod[[counter]])] - counter_current <- counter_current + 1 - } - counter <- counter + 1 - }, silent = TRUE) - } - - # Hierarchical clustering with average linkage - if (isTRUE(average) && k > 1) { - try({ - suppressWarnings(cl <- stats::hclust(jac, method = "average")) - mem <- stats::cutree(cl, k = k) - dta_mem[[counter]] <- data.frame(i = rep(i, length(mem)), - method = rep("Hierarchical (Average)", length(mem)), - node = rownames(x), - cluster = mem, - stringsAsFactors = FALSE) - dta_mod[[counter]] <- data.frame(i = i, - method = "Hierarchical (Average)", - k = k, - modularity = igraph::modularity(x = g, membership = mem), - stringsAsFactors = FALSE) - if (isTRUE(saveObjects)) { - current_cl[[counter_current]] <- cl - current_mod[counter_current] <- dta_mod[[counter]]$modularity[nrow(dta_mod[[counter]])] - counter_current <- counter_current + 1 - } - counter <- counter + 1 - }, silent = TRUE) - } - - # Hierarchical clustering with average linkage with optimal k - if (isTRUE(average) && k < 2) { - try({ - suppressWarnings(cl <- stats::hclust(jac, method = "average")) - opt_k <- lapply(2:k.max, function(x) { - mem <- stats::cutree(cl, k = x) - mod <- igraph::modularity(x = g, membership = mem) - return(list(mem = mem, mod = mod)) - }) - mod <- sapply(opt_k, function(x) x$mod) - kk <- which.max(mod) - mod <- max(mod) - mem <- opt_k[[kk]]$mem - dta_mem[[counter]] <- data.frame(i = rep(i, length(mem)), - method = rep("Hierarchical (Average)", length(mem)), - node = rownames(x), - cluster = mem, - stringsAsFactors = FALSE) - dta_mod[[counter]] <- data.frame(i = i, - method = "Hierarchical (Average)", - k 
= kk + 1, # add one because the series started with k = 2 - modularity = mod, - stringsAsFactors = FALSE) - if (isTRUE(saveObjects)) { - current_cl[[counter_current]] <- cl - current_mod[counter_current] <- dta_mod[[counter]]$modularity[nrow(dta_mod[[counter]])] - counter_current <- counter_current + 1 - } - counter <- counter + 1 - }, silent = TRUE) - } - - # Hierarchical clustering with complete linkage - if (isTRUE(complete) && k > 1) { - try({ - suppressWarnings(cl <- stats::hclust(jac, method = "complete")) - mem <- stats::cutree(cl, k = k) - dta_mem[[counter]] <- data.frame(i = rep(i, length(mem)), - method = rep("Hierarchical (Complete)", length(mem)), - node = rownames(x), - cluster = mem, - stringsAsFactors = FALSE) - dta_mod[[counter]] <- data.frame(i = i, - method = "Hierarchical (Complete)", - k = k, - modularity = igraph::modularity(x = g, membership = mem), - stringsAsFactors = FALSE) - if (isTRUE(saveObjects)) { - current_cl[[counter_current]] <- cl - current_mod[counter_current] <- dta_mod[[counter]]$modularity[nrow(dta_mod[[counter]])] - counter_current <- counter_current + 1 - } - counter <- counter + 1 - }, silent = TRUE) - } - - # Hierarchical clustering with complete linkage with optimal k - if (isTRUE(complete) && k < 2) { - try({ - suppressWarnings(cl <- stats::hclust(jac, method = "complete")) - opt_k <- lapply(2:k.max, function(x) { - mem <- stats::cutree(cl, k = x) - mod <- igraph::modularity(x = g, membership = mem) - return(list(mem = mem, mod = mod)) - }) - mod <- sapply(opt_k, function(x) x$mod) - kk <- which.max(mod) - mod <- max(mod) - mem <- opt_k[[kk]]$mem - dta_mem[[counter]] <- data.frame(i = rep(i, length(mem)), - method = rep("Hierarchical (Complete)", length(mem)), - node = rownames(x), - cluster = mem, - stringsAsFactors = FALSE) - dta_mod[[counter]] <- data.frame(i = i, - method = "Hierarchical (Complete)", - k = kk + 1, # add one because the series started with k = 2 - modularity = mod, - stringsAsFactors = FALSE) - if 
(isTRUE(saveObjects)) { - current_cl[[counter_current]] <- cl - current_mod[counter_current] <- dta_mod[[counter]]$modularity[nrow(dta_mod[[counter]])] - counter_current <- counter_current + 1 - } - counter <- counter + 1 - }, silent = TRUE) - } - - # Hierarchical clustering with the Ward algorithm - if (isTRUE(ward) && k > 1) { - try({ - suppressWarnings(cl <- stats::hclust(jac, method = "ward.D2")) - mem <- stats::cutree(cl, k = k) - dta_mem[[counter]] <- data.frame(i = rep(i, length(mem)), - method = rep("Hierarchical (Ward)", length(mem)), - node = rownames(x), - cluster = mem, - stringsAsFactors = FALSE) - dta_mod[[counter]] <- data.frame(i = i, - method = "Hierarchical (Ward)", - k = k, - modularity = igraph::modularity(x = g, membership = mem), - stringsAsFactors = FALSE) - if (isTRUE(saveObjects)) { - current_cl[[counter_current]] <- cl - current_mod[counter_current] <- dta_mod[[counter]]$modularity[nrow(dta_mod[[counter]])] - counter_current <- counter_current + 1 - } - counter <- counter + 1 - }, silent = TRUE) - } - - # Hierarchical clustering with the Ward algorithm with optimal k - if (isTRUE(ward) && k < 2) { - try({ - suppressWarnings(cl <- stats::hclust(jac, method = "ward.D2")) - opt_k <- lapply(2:k.max, function(x) { - mem <- stats::cutree(cl, k = x) - mod <- igraph::modularity(x = g, membership = mem) - return(list(mem = mem, mod = mod)) - }) - mod <- sapply(opt_k, function(x) x$mod) - kk <- which.max(mod) - mod <- max(mod) - mem <- opt_k[[kk]]$mem - dta_mem[[counter]] <- data.frame(i = rep(i, length(mem)), - method = rep("Hierarchical (Ward)", length(mem)), - node = rownames(x), - cluster = mem, - stringsAsFactors = FALSE) - dta_mod[[counter]] <- data.frame(i = i, - method = "Hierarchical (Ward)", - k = kk + 1, # add one because the series started with k = 2 - modularity = mod, - stringsAsFactors = FALSE) - if (isTRUE(saveObjects)) { - current_cl[[counter_current]] <- cl - current_mod[counter_current] <- 
dta_mod[[counter]]$modularity[nrow(dta_mod[[counter]])] - counter_current <- counter_current + 1 - } - counter <- counter + 1 - }, silent = TRUE) - } - - # k-means - if (isTRUE(kmeans) && k > 1) { - try({ - suppressWarnings(cl <- stats::kmeans(jac, centers = k)) - mem <- cl$cluster - dta_mem[[counter]] <- data.frame(i = rep(i, length(mem)), - method = rep("k-Means", length(mem)), - node = rownames(x), - cluster = mem, - stringsAsFactors = FALSE) - dta_mod[[counter]] <- data.frame(i = i, - method = "k-Means", - k = k, - modularity = igraph::modularity(x = g, membership = mem), - stringsAsFactors = FALSE) - if (isTRUE(saveObjects)) { - current_cl[[counter_current]] <- cl - current_mod[counter_current] <- dta_mod[[counter]]$modularity[nrow(dta_mod[[counter]])] - counter_current <- counter_current + 1 - } - counter <- counter + 1 - }, silent = TRUE) - } - - # k-means with optimal k - if (isTRUE(kmeans) && k < 2) { - try({ - opt_k <- lapply(2:k.max, function(x) { - suppressWarnings(cl <- stats::kmeans(jac, centers = x)) - mem <- cl$cluster - mod <- igraph::modularity(x = g, membership = mem) - return(list(cl = cl, mem = mem, mod = mod)) - }) - mod <- sapply(opt_k, function(x) x$mod) - kk <- which.max(mod) - mod <- max(mod) - mem <- opt_k[[kk]]$mem - dta_mem[[counter]] <- data.frame(i = rep(i, length(mem)), - method = rep("k-Means", length(mem)), - node = rownames(x), - cluster = mem, - stringsAsFactors = FALSE) - dta_mod[[counter]] <- data.frame(i = i, - method = "k-Means", - k = kk + 1, # add one because the series started with k = 2 - modularity = mod, - stringsAsFactors = FALSE) - if (isTRUE(saveObjects)) { - cl <- opt_k[[kk]]$cl - current_cl[[counter_current]] <- cl - current_mod[counter_current] <- dta_mod[[counter]]$modularity[nrow(dta_mod[[counter]])] - counter_current <- counter_current + 1 - } - counter <- counter + 1 - }, silent = TRUE) - } - - # pam - if (isTRUE(pam) && k > 1) { - try({ - suppressWarnings(cl <- cluster::pam(jac, k = k)) - mem <- cl$cluster - 
dta_mem[[counter]] <- data.frame(i = rep(i, length(mem)), - method = rep("Partitioning around Medoids", length(mem)), - node = rownames(x), - cluster = mem, - stringsAsFactors = FALSE) - dta_mod[[counter]] <- data.frame(i = i, - method = "Partitioning around Medoids", - k = k, - modularity = igraph::modularity(x = g, membership = mem), - stringsAsFactors = FALSE) - if (isTRUE(saveObjects)) { - current_cl[[counter_current]] <- cl - current_mod[counter_current] <- dta_mod[[counter]]$modularity[nrow(dta_mod[[counter]])] - counter_current <- counter_current + 1 - } - counter <- counter + 1 - }, silent = TRUE) - } - - # pam with optimal k - if (isTRUE(pam) && k < 2) { - try({ - opt_k <- lapply(2:k.max, function(x) { - suppressWarnings(cl <- cluster::pam(jac, k = x)) - mem <- cl$cluster - mod <- igraph::modularity(x = g, membership = mem) - return(list(cl = cl, mem = mem, mod = mod)) - }) - mod <- sapply(opt_k, function(x) x$mod) - kk <- which.max(mod) - mod <- max(mod) - mem <- opt_k[[kk]]$mem - dta_mem[[counter]] <- data.frame(i = rep(i, length(mem)), - method = rep("Partitioning around Medoids", length(mem)), - node = rownames(x), - cluster = mem, - stringsAsFactors = FALSE) - dta_mod[[counter]] <- data.frame(i = i, - method = "Partitioning around Medoids", - k = kk + 1, # add one because the series started with k = 2 - modularity = mod, - stringsAsFactors = FALSE) - if (isTRUE(saveObjects)) { - cl <- opt_k[[kk]]$cl - current_cl[[counter_current]] <- cl - current_mod[counter_current] <- dta_mod[[counter]]$modularity[nrow(dta_mod[[counter]])] - counter_current <- counter_current + 1 - } - counter <- counter + 1 - }, silent = TRUE) - } - - # Equivalence clustering - if (isTRUE(equivalence) && k > 1) { - try({ - suppressWarnings(cl <- sna::equiv.clust(y, equiv.dist = sna::sedist(y, method = "euclidean"))) - mem <- stats::cutree(cl$cluster, k = k) - dta_mem[[counter]] <- data.frame(i = rep(i, length(mem)), - method = rep("Equivalence", length(mem)), - node = rownames(x), 
- cluster = mem, - stringsAsFactors = FALSE) - dta_mod[[counter]] <- data.frame(i = i, - method = "Equivalence", - k = k, - modularity = igraph::modularity(x = g, membership = mem), - stringsAsFactors = FALSE) - if (isTRUE(saveObjects)) { - current_cl[[counter_current]] <- cl - current_mod[counter_current] <- dta_mod[[counter]]$modularity[nrow(dta_mod[[counter]])] - counter_current <- counter_current + 1 - } - counter <- counter + 1 - }, silent = TRUE) - } - - # Equivalence clustering with optimal k - if (isTRUE(equivalence) && k < 2) { - try({ - suppressWarnings(cl <- sna::equiv.clust(y, equiv.dist = sna::sedist(y, method = "euclidean"))) - opt_k <- lapply(2:k.max, function(x) { - mem <- stats::cutree(cl$cluster, k = x) - mod <- igraph::modularity(x = g, membership = mem) - return(list(mem = mem, mod = mod)) - }) - mod <- sapply(opt_k, function(x) x$mod) - kk <- which.max(mod) - mod <- max(mod) - mem <- opt_k[[kk]]$mem - dta_mem[[counter]] <- data.frame(i = rep(i, length(mem)), - method = rep("Equivalence", length(mem)), - node = rownames(x), - cluster = mem, - stringsAsFactors = FALSE) - dta_mod[[counter]] <- data.frame(i = i, - method = "Equivalence", - k = kk + 1, # add one because the series started with k = 2 - modularity = mod, - stringsAsFactors = FALSE) - if (isTRUE(saveObjects)) { - current_cl[[counter_current]] <- cl - current_mod[counter_current] <- dta_mod[[counter]]$modularity[nrow(dta_mod[[counter]])] - counter_current <- counter_current + 1 - } - counter <- counter + 1 - }, silent = TRUE) - } - - # CONCOR based on the positive subtract network - if (isTRUE(concor_one) && k %in% c(0, 2)) { - try({ - suppressWarnings(mi <- stats::cor(y)) - iter <- 1 - while (any(abs(mi) <= 0.999) & iter <= 50) { - mi[is.na(mi)] <- 0 - mi <- stats::cor(mi) - iter <- iter + 1 - } - mem <- ((mi[, 1] > 0) * 1) + 1 - dta_mem[[counter]] <- data.frame(i = rep(i, length(mem)), - method = rep("CONCOR (One-Mode)", length(mem)), - node = rownames(x), - cluster = mem, - 
stringsAsFactors = FALSE) - dta_mod[[counter]] <- data.frame(i = i, - method = "CONCOR (One-Mode)", - k = 2, - modularity = igraph::modularity(x = g, membership = mem), - stringsAsFactors = FALSE) - if (isTRUE(saveObjects)) { - current_cl[[counter_current]] <- mem - current_mod[counter_current] <- dta_mod[[counter]]$modularity[nrow(dta_mod[[counter]])] - counter_current <- counter_current + 1 - } - counter <- counter + 1 - }, silent = TRUE) - } - - # CONCOR based on the combined affiliation network - if (isTRUE(concor_two) && k %in% c(0, 2)) { - try({ - suppressWarnings(mi <- stats::cor(t(combined))) - iter <- 1 - while (any(abs(mi) <= 0.999) & iter <= 50) { - mi[is.na(mi)] <- 0 - mi <- stats::cor(mi) - iter <- iter + 1 - } - mem <- ((mi[, 1] > 0) * 1) + 1 - dta_mem[[counter]] <- data.frame(i = rep(i, length(mem)), - method = rep("CONCOR (Two-Mode)", length(mem)), - node = rownames(x), - cluster = mem, - stringsAsFactors = FALSE) - dta_mod[[counter]] <- data.frame(i = i, - method = "CONCOR (Two-Mode)", - k = 2, - modularity = igraph::modularity(x = g, membership = mem), - stringsAsFactors = FALSE) - if (isTRUE(saveObjects)) { - current_cl[[counter_current]] <- mem - current_mod[counter_current] <- dta_mod[[counter]]$modularity[nrow(dta_mod[[counter]])] - counter_current <- counter_current + 1 - } - counter <- counter + 1 - }, silent = TRUE) - } - - # Louvain clustering - if (isTRUE(louvain) && k < 2) { - try({ - suppressWarnings(cl <- igraph::cluster_louvain(g)) - mem <- igraph::membership(cl) - dta_mem[[counter]] <- data.frame(i = rep(i, length(mem)), - method = rep("Louvain", length(mem)), - node = rownames(x), - cluster = as.numeric(mem), - stringsAsFactors = FALSE) - dta_mod[[counter]] <- data.frame(i = i, - method = "Louvain", - k = max(as.numeric(mem)), - modularity = igraph::modularity(x = g, membership = mem), - stringsAsFactors = FALSE) - if (isTRUE(saveObjects)) { - current_cl[[counter_current]] <- cl - current_mod[counter_current] <- 
dta_mod[[counter]]$modularity[nrow(dta_mod[[counter]])] - counter_current <- counter_current + 1 - } - counter <- counter + 1 - }, silent = TRUE) - } - - # Fast & Greedy community detection (with or without cut) - if (isTRUE(fastgreedy)) { - try({ - suppressWarnings(cl <- igraph::cluster_fast_greedy(g, merges = TRUE)) - if (k == 0) { - mem <- igraph::membership(cl) - } else { - mem <- suppressWarnings(igraph::cut_at(cl, no = k)) - if ((k + 1) %in% as.numeric(mem)) { - stop() - } - } - dta_mem[[counter]] <- data.frame(i = rep(i, length(mem)), - method = rep("Fast & Greedy", length(mem)), - node = rownames(x), - cluster = as.numeric(mem), - stringsAsFactors = FALSE) - dta_mod[[counter]] <- data.frame(i = i, - method = "Fast & Greedy", - k = ifelse(k == 0, max(as.numeric(mem)), k), - modularity = igraph::modularity(x = g, membership = mem), - stringsAsFactors = FALSE) - if (isTRUE(saveObjects)) { - current_cl[[counter_current]] <- cl - current_mod[counter_current] <- dta_mod[[counter]]$modularity[nrow(dta_mod[[counter]])] - counter_current <- counter_current + 1 - } - counter <- counter + 1 - }, silent = TRUE) - } - - # Walktrap community detection (with or without cut) - if (isTRUE(walktrap)) { - try({ - suppressWarnings(cl <- igraph::cluster_walktrap(g, merges = TRUE)) - if (k == 0) { - mem <- igraph::membership(cl) - } else { - mem <- suppressWarnings(igraph::cut_at(cl, no = k)) - if ((k + 1) %in% as.numeric(mem)) { - stop() - } - } - dta_mem[[counter]] <- data.frame(i = rep(i, length(mem)), - method = rep("Walktrap", length(mem)), - node = rownames(x), - cluster = as.numeric(mem), - stringsAsFactors = FALSE) - dta_mod[[counter]] <- data.frame(i = i, - method = "Walktrap", - k = ifelse(k == 0, max(as.numeric(mem)), k), - modularity = igraph::modularity(x = g, membership = mem), - stringsAsFactors = FALSE) - if (isTRUE(saveObjects)) { - current_cl[[counter_current]] <- cl - current_mod[counter_current] <- dta_mod[[counter]]$modularity[nrow(dta_mod[[counter]])] - 
counter_current <- counter_current + 1 - } - counter <- counter + 1 - }, silent = TRUE) - } - - # Leading Eigenvector community detection (only without cut) - if (isTRUE(leading_eigen) && k < 2) { # it *should* work with cut_at because is.hierarchical(cl) returns TRUE, but it never works... - try({ - suppressWarnings(cl <- igraph::cluster_leading_eigen(g)) - mem <- igraph::membership(cl) - dta_mem[[counter]] <- data.frame(i = rep(i, length(mem)), - method = rep("Leading Eigenvector", length(mem)), - node = rownames(x), - cluster = as.numeric(mem), - stringsAsFactors = FALSE) - dta_mod[[counter]] <- data.frame(i = i, - method = "Leading Eigenvector", - k = max(as.numeric(mem)), - modularity = igraph::modularity(x = g, membership = mem), - stringsAsFactors = FALSE) - if (isTRUE(saveObjects)) { - current_cl[[counter_current]] <- cl - current_mod[counter_current] <- dta_mod[[counter]]$modularity[nrow(dta_mod[[counter]])] - counter_current <- counter_current + 1 - } - counter <- counter + 1 - }, silent = TRUE) - } - - # Edge Betweenness community detection (with or without cut) - if (isTRUE(edge_betweenness)) { - try({ - suppressWarnings(cl <- igraph::cluster_edge_betweenness(g, merges = TRUE)) - if (k == 0) { - mem <- igraph::membership(cl) - } else { - mem <- suppressWarnings(igraph::cut_at(cl, no = k)) - if ((k + 1) %in% as.numeric(mem)) { - stop() - } - } - dta_mem[[counter]] <- data.frame(i = rep(i, length(mem)), - method = rep("Edge Betweenness", length(mem)), - node = rownames(x), - cluster = as.numeric(mem), - stringsAsFactors = FALSE) - dta_mod[[counter]] <- data.frame(i = i, - method = "Edge Betweenness", - k = ifelse(k == 0, max(as.numeric(mem)), k), - modularity = igraph::modularity(x = g, membership = mem), - stringsAsFactors = FALSE) - if (isTRUE(saveObjects)) { - current_cl[[counter_current]] <- cl - current_mod[counter_current] <- dta_mod[[counter]]$modularity[nrow(dta_mod[[counter]])] - counter_current <- counter_current + 1 - } - counter <- counter + 1 
- }, silent = TRUE) - } - - # Infomap community detection - if (isTRUE(infomap) && k < 2) { - try({ - suppressWarnings(cl <- igraph::cluster_infomap(g)) - mem <- igraph::membership(cl) - dta_mem[[counter]] <- data.frame(i = rep(i, length(mem)), - method = rep("Infomap", length(mem)), - node = rownames(x), - cluster = as.numeric(mem), - stringsAsFactors = FALSE) - dta_mod[[counter]] <- data.frame(i = i, - method = "Infomap", - k = max(as.numeric(mem)), - modularity = igraph::modularity(x = g, membership = mem), - stringsAsFactors = FALSE) - if (isTRUE(saveObjects)) { - current_cl[[counter_current]] <- cl - current_mod[counter_current] <- dta_mod[[counter]]$modularity[nrow(dta_mod[[counter]])] - counter_current <- counter_current + 1 - } - counter <- counter + 1 - }, silent = TRUE) - } - - # Label Propagation community detection - if (isTRUE(label_prop) && k < 2) { - try({ - suppressWarnings(cl <- igraph::cluster_label_prop(g)) - mem <- igraph::membership(cl) - dta_mem[[counter]] <- data.frame(i = rep(i, length(mem)), - method = rep("Label Propagation", length(mem)), - node = rownames(x), - cluster = as.numeric(mem), - stringsAsFactors = FALSE) - dta_mod[[counter]] <- data.frame(i = i, - method = "Label Propagation", - k = max(as.numeric(mem)), - modularity = igraph::modularity(x = g, membership = mem), - stringsAsFactors = FALSE) - if (isTRUE(saveObjects)) { - current_cl[[counter_current]] <- cl - current_mod[counter_current] <- dta_mod[[counter]]$modularity[nrow(dta_mod[[counter]])] - counter_current <- counter_current + 1 - } - counter <- counter + 1 - }, silent = TRUE) - } - - # Spinglass community detection - if (isTRUE(spinglass) && k < 2) { - try({ - suppressWarnings(cl <- igraph::cluster_spinglass(g)) - mem <- igraph::membership(cl) - dta_mem[[counter]] <- data.frame(i = rep(i, length(mem)), - method = rep("Spinglass", length(mem)), - node = rownames(x), - cluster = as.numeric(mem), - stringsAsFactors = FALSE) - dta_mod[[counter]] <- data.frame(i = i, - 
method = "Spinglass", - k = max(as.numeric(mem)), - modularity = igraph::modularity(x = g, membership = mem), - stringsAsFactors = FALSE) - if (isTRUE(saveObjects)) { - current_cl[[counter_current]] <- cl - current_mod[counter_current] <- dta_mod[[counter]]$modularity[nrow(dta_mod[[counter]])] - counter_current <- counter_current + 1 - } - counter <- counter + 1 - }, silent = TRUE) - } - - # retain cluster object where modularity was maximal - if (isTRUE(saveObjects) && length(current_cl) > 0) { - obj$cl[[i]] <- current_cl[[which.max(current_mod)]] - } - } - } - obj$cl <- obj$cl[!sapply(obj$cl, is.null)] # remove NULL objects that may occur when the network is empty - obj$k <- k - obj$max_mod <- do.call(rbind, dta_dat) - memberships <- do.call(rbind, dta_mem) - rownames(memberships) <- NULL - obj$memberships <- memberships - obj$modularity <- do.call(rbind, dta_mod) - if (nrow(obj$modularity) == 0) { - stop("No output rows. Either you switched all clustering methods off, or all methods you used produced errors.") - } - obj$max_mod <- obj$max_mod[obj$max_mod$i %in% obj$modularity$i, ] # remove date entries where the network is empty - obj$max_mod$max_mod <- sapply(obj$max_mod$i, function(x) max(obj$modularity$modularity[obj$modularity$i == x], na.rm = TRUE)) # attach max_mod to $max_mod - # attach max_method to $max_mod - obj$max_mod$max_method <- sapply(obj$max_mod$i, - function(x) obj$modularity$method[obj$modularity$i == x & obj$modularity$modularity == max(obj$modularity$modularity[obj$modularity$i == x], na.rm = TRUE)][1]) - # attach k to max_mod - obj$max_mod$k <- sapply(obj$max_mod$i, function(x) max(obj$modularity$k[obj$modularity$i == x], na.rm = TRUE)) - - # diagnostics - if (isTRUE(single) && !"Hierarchical (Single)" %in% obj$modularity$method && k > 1) { - warning("'single' omitted due to an unknown problem.") - } - if (isTRUE(average) && !"Hierarchical (Average)" %in% obj$modularity$method && k > 1) { - warning("'average' omitted due to an unknown 
problem.") - } - if (isTRUE(complete) && !"Hierarchical (Complete)" %in% obj$modularity$method && k > 1) { - warning("'complete' omitted due to an unknown problem.") - } - if (isTRUE(ward) && !"Hierarchical (Ward)" %in% obj$modularity$method) { - warning("'ward' omitted due to an unknown problem.") - } - if (isTRUE(kmeans) && !"k-Means" %in% obj$modularity$method) { - warning("'kmeans' omitted due to an unknown problem.") - } - if (isTRUE(pam) && !"Partitioning around Medoids" %in% obj$modularity$method) { - warning("'pam' omitted due to an unknown problem.") - } - if (isTRUE(equivalence) && !"Equivalence" %in% obj$modularity$method) { - warning("'equivalence' omitted due to an unknown problem.") - } - if (isTRUE(concor_one) && !"CONCOR (One-Mode)" %in% obj$modularity$method && k %in% c(0, 2)) { - warning("'concor_one' omitted due to an unknown problem.") - } - if (isTRUE(concor_two) && !"CONCOR (Two-Mode)" %in% obj$modularity$method && k %in% c(0, 2)) { - warning("'concor_two' omitted due to an unknown problem.") - } - if (isTRUE(louvain) && !"Louvain" %in% obj$modularity$method && k < 2) { - warning("'louvain' omitted due to an unknown problem.") - } - if (isTRUE(fastgreedy) && !"Fast & Greedy" %in% obj$modularity$method) { - warning("'fastgreedy' omitted due to an unknown problem.") - } - if (isTRUE(walktrap) && !"Walktrap" %in% obj$modularity$method) { - warning("'walktrap' omitted due to an unknown problem.") - } - if (isTRUE(leading_eigen) && !"Leading Eigenvector" %in% obj$modularity$method && k < 2) { - warning("'leading_eigen' omitted due to an unknown problem.") - } - if (isTRUE(edge_betweenness) && !"Edge Betweenness" %in% obj$modularity$method) { - warning("'edge_betweenness' omitted due to an unknown problem.") - } - if (isTRUE(infomap) && !"Infomap" %in% obj$modularity$method && k < 2) { - warning("'infomap' omitted due to an unknown problem.") - } - if (isTRUE(label_prop) && !"Label Propagation" %in% obj$modularity$method && k < 2) { - 
warning("'label_prop' omitted due to an unknown problem.") - } - if (isTRUE(spinglass) && !"Spinglass" %in% obj$modularity$method && k < 2) { - warning("'spinglass' omitted due to an unknown problem.") - } - - class(obj) <- "dna_multiclust" - return(obj) -} - -#' Print the summary of a \code{dna_multiclust} object -#' -#' Show details of a \code{dna_multiclust} object. -#' -#' Print abbreviated contents for the slots of a \code{dna_multiclust} object, -#' which can be created using the \link{dna_multiclust} function. -#' -#' @param x A \code{dna_multiclust} object. -#' @param ... Further options (currently not used). -#' -#' @author Philip Leifeld -#' -#' @rdname dna_multiclust -#' @importFrom utils head -#' @export -print.dna_multiclust <- function(x, ...) { - cat(paste0("$k\n", x$k, "\n")) - if ("cl" %in% names(x)) { - cat(paste0("\n$cl\n", length(x$cl), " cluster object(s) embedded.\n")) - } - cat("\n$max_mod\n") - print(utils::head(x$max_mod)) - if (nrow(x$max_mod) > 6) { - cat(paste0("[... ", nrow(x$max_mod), " rows]\n")) - } - cat("\n$modularity\n") - print(utils::head(x$modularity)) - if (nrow(x$modularity) > 6) { - cat(paste0("[... ", nrow(x$modularity), " rows]\n")) - } - cat("\n$memberships\n") - print(utils::head(x$memberships)) - if (nrow(x$memberships) > 6) { - cat(paste0("[... ", nrow(x$memberships), " rows]\n")) - } -} - - -# Phase transitions ------------------------------------------------------------ - -#' Detect phase transitions and states in a discourse network -#' -#' Detect phase transitions and states in a discourse network. -#' -#' This function applies the state dynamics methods of Masuda and Holme to a -#' time window discourse network. It computes temporally overlapping discourse -#' networks, computes the dissimilarity between all networks, and clusters them. -#' For the dissimilarity, the sum of absolute edge weight differences and the -#' Euclidean spectral distance are available. 
Several clustering techniques can -#' be applied to identify the different stages and phases from the resulting -#' distance matrix. -#' -#' The function offers kernel smoothing, which means the farther away from a -#' time point a statement is, the less important it becomes for the network that -#' is created around the time point. Several kernel smoothing functions are -#' available; see the \code{kernel} argument. -#' -#' @param distanceMethod The distance measure that expresses the dissimilarity -#' between any two network matrices. The following choices are available: -#' \itemize{ -#' \item \code{"absdiff"}: The sum of the cell-wise absolute differences -#' between the two matrices, i.e., the sum of differences in edge weights. -#' This is equivalent to the graph edit distance because the network -#' dimensions are kept constant across all networks by including all nodes -#' at all time points (i.e., by including isolates). -#' \item \code{"spectral"}: The Euclidean distance between the normalized -#' eigenvalues of the graph Laplacian matrices, also called the spectral -#' distance between two network matrices. Any negative values (e.g., from -#' the subtract method) are replaced by zero before computing the -#' distance. -#' } -#' @param clusterMethods The clustering techniques that are applied to the -#' distance matrix in the end. Hierarchical methods are repeatedly cut off at -#' different levels, and solutions are compared using network modularity to -#' pick the best-fitting cluster membership vector. Some of the methods are -#' slower than others, hence they are not included by default. It is possible -#' to include any number of methods in the argument. For each included method, -#' the cluster membership vector (i.e., the states over time) along with the -#' associated time stamps of the networks are returned, and the modularity of -#' each included method is computed for comparison. 
The following methods are -#' available: -#' \itemize{ -#' \item \code{"single"}: Hierarchical clustering with single linkage using -#' the \code{\link[stats]{hclust}} function from the \pkg{stats} package. -#' \item \code{"average"}: Hierarchical clustering with average linkage -#' using the \code{\link[stats]{hclust}} function from the \pkg{stats} -#' package. -#' \item \code{"complete"}: Hierarchical clustering with complete linkage -#' using the \code{\link[stats]{hclust}} function from the \pkg{stats} -#' package. -#' \item \code{"ward"}: Hierarchical clustering with Ward's method (D2) -#' using the \code{\link[stats]{hclust}} function from the \pkg{stats} -#' package. -#' \item \code{"kmeans"}: k-means clustering using the -#' \code{\link[stats]{kmeans}} function from the \pkg{stats} package. -#' \item \code{"pam"}: Partitioning around medoids using the -#' \code{\link[cluster]{pam}} function from the \pkg{cluster} package. -#' \item \code{"spectral"}: Spectral clustering. An affinity matrix using a -#' Gaussian (RBF) kernel is created. The Laplacian matrix of the affinity -#' matrix is computed and normalized. The first k eigenvectors of -#' the normalized Laplacian matrix are clustered using k-means. -#' \item \code{"concor"}: CONvergence of iterative CORrelations (CONCOR) -#' with exactly \code{k = 2} clusters. (Not included by default because of -#' the limit to \code{k = 2}.) -#' \item \code{"fastgreedy"}: Fast & greedy community detection using the -#' \code{\link[igraph]{cluster_fast_greedy}} function in the \pkg{igraph} -#' package. -#' \item \code{"walktrap"}: Walktrap community detection using the -#' \code{\link[igraph]{cluster_walktrap}} function in the \pkg{igraph} -#' package. -#' \item \code{"leading_eigen"}: Leading eigenvector community detection -#' using the \code{\link[igraph]{cluster_leading_eigen}} function in the -#' \pkg{igraph} package. (Can be slow, hence not included by default.) 
-#' \item \code{"edge_betweenness"}: Girvan-Newman edge betweenness community -#' detection using the \code{\link[igraph]{cluster_edge_betweenness}} -#' function in the \pkg{igraph} package. (Can be slow, hence not included -#' by default.) -#' } -#' @param k.min For the hierarchical cluster methods, how many clusters or -#' states should at least be identified? Only the best solution between -#' \code{k.min} and \code{k.max} clusters is retained and compared to other -#' methods. -#' @param k.max For the hierarchical cluster methods, up to how many clusters or -#' states should be identified? Only the best solution between \code{k.min} -#' and \code{k.max} clusters is retained and compared to other methods. -#' @param cores The number of computing cores for parallel processing. If -#' \code{1} (the default), no parallel processing is used. If a larger number, -#' the \pkg{pbmcapply} package is used to parallelize the clustering. Note -#' that this method is based on forking and is only available on Unix -#' operating systems, including MacOS and Linux. Note also that the remaining -#' computations, including the computation of the distance matrix and the -#' time window network generation with kernel smoothing, are done in parallel -#' using threads in Java, irrespective of this setting, using as many parallel -#' threads as cores are available on the system. -#' @param kernel Use kernel smoothing for computing network time slices? Several -#' kernel smoothing functions are available, similar to kernel density -#' estimation. They down-weight statements the farther they are temporally -#' away from the temporal mid-point of the respective time slice. Valid -#' settings are: -#' \itemize{ -#' \item \code{"uniform"}: Weight all statements within a time window -#' equally with a value of \code{0.5}. -#' \item \code{"triangular"}: Use a triangular kernel function. -#' \item \code{"epanechnikov"}: Use an Epanechnikov kernel smoother. 
-#' \item \code{"gaussian"}: Use a standard normal distribution as a kernel -#' smoother. -#' \item \code{"no"}: Circumvent kernel smoothing and weight all statements -#' with a value of \code{1.0}. This is a legacy setting and is slow and -#' may not return the same results as \code{"uniform"} due to the way it -#' was written up. -#' } -#' @param normalizeToOne Divide all cells by the sum of all cells before -#' computing the dissimilarity between two network matrices? This -#' normalization scales all edge weights to a sum of \code{1.0}. Doing so can -#' make networks more comparable by boosting the edge weights of networks that -#' are relatively sparsely populated by concepts, for example at the beginning -#' or end of the debate. Note that this normalization should not make any -#' difference with Euclidean spectral distances of the graph Laplacian because -#' the eigenvalues are normalized to sum to one in this distance method. -#' @param indentTime If \code{TRUE}, the sequence of time slices under the time -#' window algorithm starts with the first network and ends with the last -#' network that are entirely covered within the timeline defined by the start -#' and stop dates and times. For example, if the start date is 1 February, the -#' stop date is 31 December, and the time window duration is 21 days, the -#' mid-point of the first time window will be 11 February (to ensure the first -#' network entirely fits into the timeline), and the last network will be -#' centered around 20 December (to ensure the last network entirely fits into -#' the timeline). If \code{FALSE}, the start and stop dates and times are used -#' as the first and last mid-points. In that case, the first and last few -#' networks may contain fewer statements than other time slices and may, -#' therefore, be more similar to each other. This can potentially be -#' counter-acted by setting the \code{normalizeToOne} argument. 
-#' @inheritParams dna_network -#' -#' @examples -#' \dontrun{ -#' library("ggplot2") -#' dna_init() -#' dna_sample() -#' dna_openDatabase("sample.dna", coderId = 1, coderPassword = "sample") -#' -#' # compute states and phases for sample dataset -#' results <- dna_phaseTransitions(distanceMethod = "spectral", -#' clusterMethods = c("ward", -#' "pam", -#' "concor", -#' "walktrap"), -#' k.min = 2, -#' k.max = 6, -#' networkType = "onemode", -#' variable1 = "organization", -#' variable2 = "concept", -#' timeWindow = "days", -#' windowSize = 15, -#' kernel = "gaussian", -#' indentTime = FALSE, -#' normalizeToOne = FALSE) -#' results -#' autoplot(results) -#' -#' # access individual plots -#' plots <- autoplot(results) -#' plots[[1]] # show heatmap -#' plots[[2]] # show cluster silhouettes -#' plots[[3]] # show temporal embedding -#' plots[[4]] # show state dynamics -#' -#' # save plots to combined PDF -#' library("ggplotify") # needed to convert heatmap to ggplot diagram -#' library("patchwork") # needed to merge plots into 4 x 4 diagram -#' p1 <- ggplotify::as.ggplot(plots[[1]]) -#' p <- p1 + plots[[2]] + plots[[3]] + plots[[4]] + plot_layout(ncol = 2) -#' ggsave(filename = "phase_transitions.pdf", p, width = 14, height = 12) -#' } -#' -#' @rdname dna_phaseTransitions -#' @author Philip Leifeld -#' @importFrom stats dist -#' @importFrom utils combn -#' @importFrom rJava .jarray .jcall .jnull J -#' @export -dna_phaseTransitions <- function(distanceMethod = "absdiff", - clusterMethods = c("single", - "average", - "complete", - "ward", - "kmeans", - "pam", - "spectral", - "fastgreedy", - "walktrap"), - k.min = 2, - k.max = 6, - cores = 1, - networkType = "twomode", - statementType = "DNA Statement", - variable1 = "organization", - variable1Document = FALSE, - variable2 = "concept", - variable2Document = FALSE, - qualifier = "agreement", - qualifierDocument = FALSE, - qualifierAggregation = "subtract", - normalization = "no", - duplicates = "document", - start.date = 
"01.01.1900", - stop.date = "31.12.2099", - start.time = "00:00:00", - stop.time = "23:59:59", - timeWindow = "days", - windowSize = 200, - kernel = "uniform", - normalizeToOne = TRUE, - indentTime = FALSE, - excludeValues = list(), - excludeAuthors = character(), - excludeSources = character(), - excludeSections = character(), - excludeTypes = character(), - invertValues = FALSE, - invertAuthors = FALSE, - invertSources = FALSE, - invertSections = FALSE, - invertTypes = FALSE) { - - # check arguments and packages - if (distanceMethod == "spectral" && networkType == "twomode") { - distanceMethod <- "absdiff" - warning("Spectral distances only work with one-mode networks. Using 'distanceMethod = \"absdiff\"' instead.") - } - if (cores > 1 && !requireNamespace("pbmcapply", quietly = TRUE)) { - pbmclapply <- FALSE - warning("Argument 'cores' requires the 'pbmcapply' package, which is not installed.\nSetting 'cores = 1'. Consider installing the 'pbmcapply' package if you use Linux or MacOS.") - } - igraphMethods <- c("louvain", "fastgreedy", "walktrap", "leading_eigen", "edge_betweenness", "infomap", "label_prop", "spinglass") - if (any(igraphMethods %in% clusterMethods) && !requireNamespace("igraph", quietly = TRUE)) { - clusterMethods <- clusterMethods[-igraphMethods] - warning("'igraph' package not installed. Dropping clustering methods from the 'igraph' package. Consider installing 'igraph'.") - } - if ("pam" %in% clusterMethods && !requireNamespace("cluster", quietly = TRUE)) { - clusterMethods <- clusterMethods[which(clusterMethods != "pam")] - warning("'cluster' package not installed. Dropping clustering methods from the 'cluster' package. 
Consider installing 'cluster'.") - } - if ("concor" %in% clusterMethods && k.min > 2) { - clusterMethods <- clusterMethods[which(clusterMethods != "concor")] - warning("Dropping 'concor' from clustering methods because the CONCOR implementation in rDNA can only find exactly two clusters, but the 'k.min' argument was larger than 2.") - } - clusterMethods <- rev(clusterMethods) # reverse order to save time during parallel computation by starting the computationally intensive methods first - mcall <- match.call() # save the arguments for storing them in the results later - - # generate the time window networks - if (is.null(timeWindow) || is.na(timeWindow) || !is.character(timeWindow) || length(timeWindow) != 1 || !timeWindow %in% c("events", "seconds", "minutes", "hours", "days", "weeks", "months", "years")) { - timeWindow <- "events" - warning("The 'timeWindow' argument was invalid. Proceeding with 'timeWindow = \"events\" instead.") - } - - # wrap the vectors of exclude values for document variables into Java arrays - excludeAuthors <- .jarray(excludeAuthors) - excludeSources <- .jarray(excludeSources) - excludeSections <- .jarray(excludeSections) - excludeTypes <- .jarray(excludeTypes) - - # compile exclude variables and values vectors - dat <- matrix("", nrow = length(unlist(excludeValues)), ncol = 2) - count <- 0 - if (length(excludeValues) > 0) { - for (i in 1:length(excludeValues)) { - if (length(excludeValues[[i]]) > 0) { - for (j in 1:length(excludeValues[[i]])) { - count <- count + 1 - dat[count, 1] <- names(excludeValues)[i] - dat[count, 2] <- excludeValues[[i]][j] - } - } - } - var <- dat[, 1] - val <- dat[, 2] - } else { - var <- character() - val <- character() - } - var <- .jarray(var) # array of variable names of each excluded value - val <- .jarray(val) # array of values to be excluded - - # encode R NULL as Java null value if necessary - if (is.null(qualifier) || is.na(qualifier)) { - qualifier <- .jnull(class = "java/lang/String") - } - - # call 
rNetwork function to compute results - .jcall(dna_getHeadlessDna(), - "V", - "rTimeWindow", - networkType, - statementType, - variable1, - variable1Document, - variable2, - variable2Document, - qualifier, - qualifierDocument, - qualifierAggregation, - normalization, - TRUE, - duplicates, - start.date, - stop.date, - start.time, - stop.time, - timeWindow, - as.integer(windowSize), - kernel, - normalizeToOne, - indentTime, - var, - val, - excludeAuthors, - excludeSources, - excludeSections, - excludeTypes, - invertValues, - invertAuthors, - invertSources, - invertSections, - invertTypes - ) - exporter <- dna_getHeadlessDna()$getExporter() # save Java object reference to exporter class - - # compute distance matrix - if (distanceMethod == "modularity") { - stop("Differences in modularity have not been implemented yet. Please use absolute differences or spectral Euclidean distance as a distance method.") - } else if (!distanceMethod %in% c("absdiff", "spectral")) { - stop("Distance method not recognized. 
Try \"absdiff\" or \"spectral\".") - } - distance_mat <- .jcall(exporter, - "[[D", - "computeDistanceMatrix", - distanceMethod, - simplify = TRUE) - distance_mat <- distance_mat / max(distance_mat) # rescale between 0 and 1 - - # retrieve mid-point dates (gamma) - m <- .jcall(exporter, "[Lexport/Matrix;", "getMatrixResultsArray") # get list of Matrix objects from Exporter object - dates <- sapply(m, function(x) .jcall(x, "J", "getDateTimeLong")) # long integers, still needs conversion to date - - # define clustering function - hclustMethods <- c("single", "average", "complete", "ward") - cl <- function(method, distmat) { - tryCatch({ - similarity_mat <- 1 - distmat - g <- igraph::graph_from_adjacency_matrix(similarity_mat, mode = "undirected", weighted = TRUE, diag = FALSE) # graph needs to be based on similarity, not distance - if (method %in% hclustMethods) { - if (method == "single") { - suppressWarnings(cl <- stats::hclust(as.dist(distmat), method = "single")) - } else if (method == "average") { - suppressWarnings(cl <- stats::hclust(as.dist(distmat), method = "average")) - } else if (method == "complete") { - suppressWarnings(cl <- stats::hclust(as.dist(distmat), method = "complete")) - } else if (method == "ward") { - suppressWarnings(cl <- stats::hclust(as.dist(distmat), method = "ward.D2")) - } - opt_k <- lapply(k.min:k.max, function(x) { - mem <- stats::cutree(cl, k = x) - mod <- igraph::modularity(x = g, weights = igraph::E(g)$weight, membership = mem) - return(list(mem = mem, mod = mod)) - }) - mod <- sapply(opt_k, function(x) x$mod) - kk <- which.max(mod) - mem <- opt_k[[kk]]$mem - } else if (method == "kmeans") { - opt_k <- lapply(k.min:k.max, function(x) { - suppressWarnings(cl <- stats::kmeans(distmat, centers = x)) - mem <- cl$cluster - mod <- igraph::modularity(x = g, weights = igraph::E(g)$weight, membership = mem) - return(list(cl = cl, mem = mem, mod = mod)) - }) - mod <- sapply(opt_k, function(x) x$mod) - kk <- which.max(mod) - mem <- 
opt_k[[kk]]$mem - } else if (method == "pam") { - opt_k <- lapply(k.min:k.max, function(x) { - suppressWarnings(cl <- cluster::pam(distmat, k = x)) - mem <- cl$cluster - mod <- igraph::modularity(x = g, weights = igraph::E(g)$weight, membership = mem) - return(list(cl = cl, mem = mem, mod = mod)) - }) - mod <- sapply(opt_k, function(x) x$mod) - kk <- which.max(mod) - mem <- opt_k[[kk]]$mem - } else if (method == "spectral") { - sigma <- 1.0 - affinity_matrix <- exp(-distmat^2 / (2 * sigma^2)) - L <- diag(rowSums(affinity_matrix)) - affinity_matrix - D.sqrt.inv <- diag(1 / sqrt(rowSums(affinity_matrix))) - L.norm <- D.sqrt.inv %*% L %*% D.sqrt.inv - eigenvalues <- eigen(L.norm) # eigenvalue decomposition - opt_k <- lapply(k.min:k.max, function(x) { - U <- eigenvalues$vectors[, 1:x] - mem <- kmeans(U, centers = x)$cluster # cluster the eigenvectors - mod <- igraph::modularity(x = g, weights = igraph::E(g)$weight, membership = mem) - return(list(mem = mem, mod = mod)) - }) - mod <- sapply(opt_k, function(x) x$mod) - kk <- which.max(mod) - mem <- opt_k[[kk]]$mem - } else if (method == "concor") { - suppressWarnings(mi <- stats::cor(similarity_mat)) - iter <- 1 - while (any(abs(mi) <= 0.999) & iter <= 50) { - mi[is.na(mi)] <- 0 - mi <- stats::cor(mi) - iter <- iter + 1 - } - mem <- ((mi[, 1] > 0) * 1) + 1 - } else if (method %in% igraphMethods) { - if (method == "fastgreedy") { - suppressWarnings(cl <- igraph::cluster_fast_greedy(g)) - } else if (method == "walktrap") { - suppressWarnings(cl <- igraph::cluster_walktrap(g)) - } else if (method == "leading_eigen") { - suppressWarnings(cl <- igraph::cluster_leading_eigen(g)) - } else if (method == "edge_betweenness") { - suppressWarnings(cl <- igraph::cluster_edge_betweenness(g)) - } else if (method == "spinglass") { - suppressWarnings(cl <- igraph::cluster_spinglass(g)) - } - opt_k <- lapply(k.min:k.max, function(x) { - mem <- igraph::cut_at(communities = cl, no = x) - mod <- igraph::modularity(x = g, weights = 
igraph::E(g)$weight, membership = mem) - return(list(mem = mem, mod = mod)) - }) - mod <- sapply(opt_k, function(x) x$mod) - kk <- which.max(mod) - mem <- opt_k[[kk]]$mem - } - list(method = method, - modularity = igraph::modularity(x = g, weights = igraph::E(g)$weight, membership = mem), - memberships = mem) - }, - error = function(e) { - warning("Cluster method '", method, "' could not be computed due to an error: ", e) - }, - warning = function(w) { - warning("Cluster method '", method, "' threw a warning: ", w) - }) - } - - # apply all clustering methods to distance matrix - if (cores > 1) { - cat(paste("Clustering distance matrix on", cores, "cores.\n")) - a <- Sys.time() - l <- pbmcapply::pbmclapply(clusterMethods, cl, distmat = distance_mat, mc.cores = cores) - b <- Sys.time() - } else { - cat("Clustering distance matrix... ") - a <- Sys.time() - l <- lapply(clusterMethods, cl, distmat = distance_mat) - b <- Sys.time() - cat(intToUtf8(0x2714), "\n") - } - print(b - a) - for (i in length(l):1) { - if (length(l[[i]]) == 1) { - l <- l[-i] - clusterMethods <- clusterMethods[-i] - } - } - results <- list() - mod <- sapply(l, function(x) x$modularity) - best <- which(mod == max(mod))[1] - results$modularity <- mod[best] - results$clusterMethod <- clusterMethods[best] - - # temporal embedding via MDS - if (!requireNamespace("MASS", quietly = TRUE)) { - mem <- data.frame("date" = as.POSIXct(dates, tz = "UTC", origin = "1970-01-01"), - "state" = l[[best]]$memberships) - results$states <- mem - warning("Skipping temporal embedding because the 'MASS' package is not installed. 
Consider installing it.") - } else { - cat("Temporal embedding...\n") - a <- Sys.time() - distmat <- distance_mat + 1e-12 - mds <- MASS::isoMDS(distmat) # MDS of distance matrix - points <- mds$points - mem <- data.frame("date" = as.POSIXct(dates, tz = "UTC", origin = "1970-01-01"), - "state" = l[[best]]$memberships, - "X1" = points[, 1], - "X2" = points[, 2]) - results$states <- mem - b <- Sys.time() - print(b - a) - } - - results$distmat <- distance_mat - class(results) <- "dna_phaseTransitions" - attributes(results)$stress <- ifelse(ncol(results$states) == 2, NA, mds$stress) - attributes(results)$call <- mcall - return(results) -} - -#' Print the summary of a \code{dna_phaseTransitions} object -#' -#' Show details of a \code{dna_phaseTransitions} object. -#' -#' Print a summary of a \code{dna_phaseTransitions} object, which can be created -#' using the \link{dna_phaseTransitions} function. -#' -#' @param x A \code{dna_phaseTransitions} object. -#' @param ... Further options (currently not used). -#' -#' @author Philip Leifeld -#' -#' @rdname dna_phaseTransitions -#' @importFrom utils head -#' @export -print.dna_phaseTransitions <- function(x, ...) { - cat(paste0("States: ", max(x$states$state), ". Cluster method: ", x$clusterMethod, ". Modularity: ", round(x$modularity, 3), ".\n\n")) - print(utils::head(x$states, 20)) - cat(paste0("...", nrow(x$states), " further rows\n")) -} - -#' @rdname dna_phaseTransitions -#' @param object A \code{"dna_phaseTransitions"} object. -#' @param ... Additional arguments. Currently not in use. -#' @param plots The plots to include in the output list. Can be one or more of -#' the following: \code{"heatmap"}, \code{"silhouette"}, \code{"mds"}, -#' \code{"states"}. 
-#' -#' @author Philip Leifeld, Kristijan Garic -#' @importFrom ggplot2 autoplot ggplot aes geom_line geom_point xlab ylab -#' labs ggtitle theme_bw theme arrow unit scale_shape_manual element_text -#' scale_x_datetime scale_colour_manual guides -#' @importFrom rlang .data -#' @export -autoplot.dna_phaseTransitions <- function(object, ..., plots = c("heatmap", "silhouette", "mds", "states")) { - # settings for all plots - k <- max(object$states$state) - shapes <- c(21:25, 0:14)[1:k] - l <- list() - - # heatmap - if ("heatmap" %in% plots) { - try({ - if (!requireNamespace("heatmaply", quietly = TRUE)) { - warning("Heatmap skipped because the 'heatmaply' package is not installed.") - } else { - l[[length(l) + 1]] <- heatmaply::ggheatmap(1 - object$distmat, - dendrogram = "both", - showticklabels = FALSE, # remove axis labels - show_dendrogram = TRUE, - hide_colorbar = TRUE) - } - }) - } - - # silhouette plot - if ("silhouette" %in% plots) { - try({ - if (!requireNamespace("cluster", quietly = TRUE)) { - warning("Silhouette plot skipped because the 'cluster' package is not installed.") - } else if (!requireNamespace("factoextra", quietly = TRUE)) { - warning("Silhouette plot skipped because the 'factoextra' package is not installed.") - } else { - sil <- cluster::silhouette(object$states$state, dist(object$distmat)) - l[[length(l) + 1]] <- factoextra::fviz_silhouette(sil, print.summary = FALSE) + - ggplot2::ggtitle(paste0("Cluster silhouettes (mean width: ", round(mean(sil[, 3]), 3), ")")) + - ggplot2::ylab("Silhouette width") + - ggplot2::labs(fill = "State", color = "State") + - ggplot2::theme_classic() + - ggplot2::theme(axis.text.x = element_blank(), axis.ticks.x = element_blank()) - } - }) - } - - # temporal embedding - if ("mds" %in% plots) { - try({ - if (is.na(attributes(object)$stress)) { - warning("No temporal embedding found. 
Skipping this plot.") - } else if (!requireNamespace("igraph", quietly = TRUE)) { - warning("Temporal embedding plot skipped because the 'igraph' package is not installed.") - } else if (!requireNamespace("ggraph", quietly = TRUE)) { - warning("Temporal embedding plot skipped because the 'ggraph' package is not installed.") - } else { - nodes <- object$states - nodes$date <- as.character(nodes$date) - nodes$State <- as.factor(nodes$state) - - # Extract state values - state_values <- nodes$State - - edges <- data.frame(sender = as.character(object$states$date), - receiver = c(as.character(object$states$date[2:(nrow(object$states))]), "NA")) - edges <- edges[-nrow(edges), ] - g <- igraph::graph_from_data_frame(edges, directed = TRUE, vertices = nodes) - l[[length(l) + 1]] <- ggraph::ggraph(g, layout = "manual", x = igraph::V(g)$X1, y = igraph::V(g)$X2) + - ggraph::geom_edge_link(arrow = ggplot2::arrow(type = "closed", length = ggplot2::unit(2, "mm")), - start_cap = ggraph::circle(1, "mm"), - end_cap = ggraph::circle(2, "mm")) + - ggraph::geom_node_point(ggplot2::aes(shape = state_values, fill = state_values), size = 2) + - ggplot2::scale_shape_manual(values = shapes) + - ggplot2::ggtitle("Temporal embedding (MDS)") + - ggplot2::xlab("Dimension 1") + - ggplot2::ylab("Dimension 2") + - ggplot2::theme_bw() + - ggplot2::guides(size = "none") + - ggplot2::labs(shape = "State", fill = "State") - } - }) - } - - # state dynamics - if ("states" %in% plots) { - try({ - d <- data.frame( - time = object$states$date, - id = cumsum(c(TRUE, diff(object$states$state) != 0)), - State = factor(object$states$state, levels = 1:k, labels = paste("State", 1:k)), - time1 = as.Date(object$states$date) - ) - - # Extracting values - time_values <- d$time - state_values <- d$State - id_values <- d$id - - l[[length(l) + 1]] <- ggplot2::ggplot(d, ggplot2::aes(x = time_values, y = state_values, colour = state_values)) + - ggplot2::geom_line(aes(group = 1), linewidth = 2, color = "black", lineend 
= "square") + - ggplot2::geom_line(aes(group = id_values), linewidth = 2, lineend = "square") + - ggplot2::scale_x_datetime(date_labels = "%b %Y", breaks = "4 months") + # format x-axis as month year - ggplot2::xlab("Time") + - ggplot2::ylab("") + - ggplot2::ggtitle("State dynamics") + - ggplot2::theme_bw() + - ggplot2::theme(axis.text.x = ggplot2::element_text(angle = 45, hjust = 1)) + - ggplot2::guides(linewidth = "none") + - ggplot2::labs(color = "State") - }) - } - - return(l) } \ No newline at end of file From 5bbfb95dea4a65b8f98e1c81b7ab7fc361d701b0 Mon Sep 17 00:00:00 2001 From: leifeld Date: Tue, 20 Aug 2024 01:06:50 +0200 Subject: [PATCH 10/11] Adjusted release date in DNA and rDNA --- dna/src/main/java/dna/Dna.java | 2 +- rDNA/rDNA/DESCRIPTION | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/dna/src/main/java/dna/Dna.java b/dna/src/main/java/dna/Dna.java index ac7b2078..20202d8b 100644 --- a/dna/src/main/java/dna/Dna.java +++ b/dna/src/main/java/dna/Dna.java @@ -17,7 +17,7 @@ public class Dna { public static Dna dna; public static Logger logger; public static Sql sql; - public static final String date = "2024-07-22"; + public static final String date = "2024-08-20"; public static final String version = "3.0.11"; public static final String operatingSystem = System.getProperty("os.name"); public static File workingDirectory = null; diff --git a/rDNA/rDNA/DESCRIPTION b/rDNA/rDNA/DESCRIPTION index 30d9889d..103e06eb 100755 --- a/rDNA/rDNA/DESCRIPTION +++ b/rDNA/rDNA/DESCRIPTION @@ -1,6 +1,6 @@ Package: rDNA Version: 3.0.11 -Date: 2024-08-19 +Date: 2024-08-20 Title: Discourse Network Analysis in R Authors@R: c(person(given = "Philip", From 8da39b8721f2bcd4e8809d0e4182e055f31612d0 Mon Sep 17 00:00:00 2001 From: leifeld Date: Tue, 20 Aug 2024 01:46:37 +0200 Subject: [PATCH 11/11] Updated gradle build tasks --- rDNA/build.gradle | 40 ++++++++++++++++++++-------------------- 1 file changed, 20 insertions(+), 20 deletions(-) diff --git 
a/rDNA/build.gradle b/rDNA/build.gradle index 513400bb..a780e156 100644 --- a/rDNA/build.gradle +++ b/rDNA/build.gradle @@ -16,20 +16,15 @@ task rDNADocument { } } -// Task to find the most recent JAR file in the build directory -def findLatestJarFile() { - def jarDir = file("$rootDir/build") - def jarFiles = jarDir.listFiles({ file -> file.name.endsWith('.jar') } as FileFilter) - - if (jarFiles && jarFiles.size() > 0) { - return jarFiles.sort { -it.lastModified() }[0] - } else { - throw new GradleException("No jar files found in the build directory.") - } +// Task to copy R package sources to a temporary build directory +task copyRPackageSourcesToBuildDir(type: Copy, dependsOn: rDNADocument) { + from "$rootDir/rDNA/rDNA" + into "$rootDir/build/temp-rDNA" + exclude 'inst/java/**' } // Task to ensure the inst/java directory exists in the temporary build directory -task createJavaDirInTempBuildDir { +task createJavaDirInTempBuildDir (dependsOn: copyRPackageSourcesToBuildDir) { doLast { def javaDir = file("$rootDir/build/temp-rDNA/inst/java") if (!javaDir.exists()) { @@ -41,8 +36,20 @@ task createJavaDirInTempBuildDir { } } +// Task to find the most recent JAR file in the build directory +def findLatestJarFile() { + def jarDir = file("$rootDir/build") + def jarFiles = jarDir.listFiles({ file -> file.name.endsWith('.jar') } as FileFilter) + + if (jarFiles && jarFiles.size() > 0) { + return jarFiles.sort { -it.lastModified() }[0] + } else { + throw new GradleException("No jar files found in the build directory.") + } +} + // Task to copy the JAR file into the inst/java directory -task copyJarIntoTempBuildDir { +task copyJarIntoTempBuildDir (dependsOn: createJavaDirInTempBuildDir) { dependsOn ':dna:build', createJavaDirInTempBuildDir doLast { def latestJar = findLatestJarFile() @@ -57,15 +64,8 @@ task copyJarIntoTempBuildDir { } } -// Task to copy R package sources to a temporary build directory -task copyRPackageSourcesToBuildDir(type: Copy) { - from 
"$rootDir/rDNA/rDNA" - into "$rootDir/build/temp-rDNA" - exclude 'inst/java/**' -} - // Task to build the R package (create a .tar.gz file) and clean up after -task rDNABuild(dependsOn: [rDNADocument, copyRPackageSourcesToBuildDir, copyJarIntoTempBuildDir]) { +task rDNABuild(dependsOn: copyJarIntoTempBuildDir) { doLast { // Delete old .tar.gz files in the build directory def buildDir = file("$rootDir/build")