From 346a88d0e0ada9b434606dd12988f51dc8c7bd72 Mon Sep 17 00:00:00 2001 From: gagolews Date: Tue, 5 Jan 2021 09:39:06 +1100 Subject: [PATCH] v0.9.6 - Use RcppMLPACK directly instead of via a wrapper, emstreeR. --- .github/workflows/py.yml | 2 +- .github/workflows/r.yml | 2 +- DESCRIPTION | 7 ++-- NEWS | 4 +- R/RcppExports.R | 4 ++ R/gclust.R | 4 +- R/mst.R | 42 ++++++++------------ devel/sphinx/conf.py | 2 +- devel/sphinx/rapi/emst_mlpack.rst | 9 +---- devel/sphinx/rapi/gclust.rst | 2 +- devel/tinytest/test-gclust.R | 6 +-- devel/tinytest/test-mst.R | 13 +++--- docs/_sources/rapi/emst_mlpack.rst.txt | 9 +---- docs/_sources/rapi/gclust.rst.txt | 2 +- docs/_static/documentation_options.js | 2 +- docs/genieclust.html | 6 +-- docs/genieclust_compare_partitions.html | 6 +-- docs/genieclust_genie.html | 6 +-- docs/genieclust_inequity.html | 6 +-- docs/genieclust_internal.html | 6 +-- docs/genieclust_plots-1.pdf | Bin 8288 -> 8288 bytes docs/genieclust_plots-2.pdf | Bin 12135 -> 12135 bytes docs/genieclust_plots-3.pdf | Bin 7168 -> 7168 bytes docs/genieclust_plots-4.pdf | Bin 8830 -> 8830 bytes docs/genieclust_plots.html | 6 +-- docs/genieclust_tools.html | 6 +-- docs/genindex.html | 6 +-- docs/index.html | 6 +-- docs/objects.inv | Bin 1561 -> 1556 bytes docs/py-modindex.html | 6 +-- docs/rapi.html | 6 +-- docs/rapi/comparing_partitions.html | 6 +-- docs/rapi/emst_mlpack.html | 14 ++----- docs/rapi/gclust.html | 8 ++-- docs/rapi/genieclust-package.html | 6 +-- docs/rapi/inequity.html | 6 +-- docs/rapi/mst.html | 6 +-- docs/search.html | 6 +-- docs/searchindex.js | 2 +- docs/weave/basics.html | 6 +-- docs/weave/benchmarks_approx.html | 6 +-- docs/weave/benchmarks_ar.html | 6 +-- docs/weave/benchmarks_details.html | 6 +-- docs/weave/noise.html | 6 +-- docs/weave/r.html | 6 +-- docs/weave/sklearn_toy_example.html | 6 +-- docs/weave/sparse.html | 6 +-- docs/weave/string.html | 6 +-- docs/weave/timings.html | 6 +-- docs/z_bibliography.html | 6 +-- genieclust/__init__.py | 2 +- man/emst_mlpack.Rd | 12 ++---- man/gclust.Rd | 2 +- setup.py | 2 +- src/RcppExports.cpp | 14 +++++++ src/c_common.h | 2 +- src/r_compare_partitions.cpp | 2 +- src/r_emst.cpp | 50 ++++++++++++++++++++++++ src/r_gclust.cpp | 33 +--------------- src/r_inequity.cpp | 2 +- 60 files changed, 207 insertions(+), 210 deletions(-) create mode 100644 src/r_emst.cpp diff --git a/.github/workflows/py.yml b/.github/workflows/py.yml index 7c7ac5d1..479223c9 100644 --- a/.github/workflows/py.yml +++ b/.github/workflows/py.yml @@ -25,7 +25,7 @@ jobs: sudo apt-get update sudo apt-get -y upgrade sudo apt-get -y install libcurl4-openssl-dev python3-rpy2 libmlpack-dev r-base-dev python3-dev pandoc - sudo Rscript -e "install.packages(c('genie', 'Rcpp', 'tinytest', 'emstreeR', 'knitr', 'roxygen2'))" + sudo Rscript -e "install.packages(c('genie', 'Rcpp', 'tinytest', 'RcppArmadillo', 'RcppMLPACK', 'knitr', 'roxygen2'))" #sudo Rscript -e "devtools::install_github('gagolews/Rd2rst')" python -m pip install --upgrade pip if [ -f requirements.txt ]; then pip install -r requirements.txt --upgrade; fi diff --git a/.github/workflows/r.yml b/.github/workflows/r.yml index 248e3b8c..88be8026 100644 --- a/.github/workflows/r.yml +++ b/.github/workflows/r.yml @@ -16,7 +16,7 @@ jobs: sudo apt-get update sudo apt-get -y upgrade sudo apt-get -y install libcurl4-openssl-dev python3-rpy2 libmlpack-dev r-base-dev - sudo Rscript -e "install.packages(c('genie', 'Rcpp', 'tinytest', 'emstreeR', 'roxygen2'))" + sudo Rscript -e "install.packages(c('genie', 'Rcpp', 'tinytest', 'RcppArmadillo', 'RcppMLPACK', 'roxygen2'))" - name: Test and check R run: | sudo make r-test diff --git a/DESCRIPTION b/DESCRIPTION index 8e34bb09..ff72463d 100644 --- a/DESCRIPTION +++ b/DESCRIPTION @@ -2,7 +2,7 @@ Package: genieclust Type: Package Title: The Genie++ Hierarchical Clustering Algorithm with Noise Points Detection Version: 0.9.6 -Date: 2021-01-04 +Date: 2021-01-05 Authors@R: c( person("Marek", "Gagolewski", role = c("aut", "cre", "cph"), @@ -37,9 +37,8 @@ Imports: stats, utils Suggests: - datasets, - emstreeR -LinkingTo: Rcpp + datasets +LinkingTo: Rcpp, RcppArmadillo, RcppMLPACK Encoding: UTF-8 SystemRequirements: OpenMP, C++11 RoxygenNote: 7.1.1 diff --git a/NEWS b/NEWS index 788c3761..87fb3ba7 100644 --- a/NEWS +++ b/NEWS @@ -1,11 +1,11 @@ # `genieclust` Package NEWS -## genieclust 0.9.6 (under development) +## genieclust 0.9.6 (2021-01-05) - [Python] Python >= 3.7 is now required (implied by `numpy`). -- ... (nothing yet) ... +- [R] Use `RcppMLPACK` directly instead of via a wrapper, `emstreeR`. ## genieclust 0.9.5 (2021-01-04) diff --git a/R/RcppExports.R b/R/RcppExports.R index 3a770e94..d1ca23ce 100644 --- a/R/RcppExports.R +++ b/R/RcppExports.R @@ -149,6 +149,10 @@ pair_sets_index <- function(x, y = NULL) { .Call(`_genieclust_pair_sets_index`, x, y) } +.emst_mlpack <- function(X) { + .Call(`_genieclust___emst_mlpack`, X) +} + .gclust <- function(mst, gini_threshold, verbose) { .Call(`_genieclust___gclust`, mst, gini_threshold, verbose) } diff --git a/R/gclust.R b/R/gclust.R index c9368afb..db890cd0 100644 --- a/R/gclust.R +++ b/R/gclust.R @@ -2,7 +2,7 @@ # ############################################################################ # # # -# Copyleft (C) 2020, Marek Gagolewski # +# Copyleft (C) 2020-2021, Marek Gagolewski # # # # # # This program is free software: you can redistribute it and/or modify # @@ -165,7 +165,7 @@ #' pair_sets_index(y_test, y_pred) #' #' # Fast for low-dimensional Euclidean spaces: -#' if (require("emstreeR")) h <- gclust(emst_mlpack(X)) +#' h <- gclust(emst_mlpack(X)) #' #' @rdname gclust #' @export diff --git a/R/mst.R b/R/mst.R index f7986584..d04d4950 100644 --- a/R/mst.R +++ b/R/mst.R @@ -2,7 +2,7 @@ # ############################################################################ # # # -# Copyleft (C) 2020, Marek Gagolewski # +# Copyleft (C) 2020-2021, Marek Gagolewski # # # # # # This program is free software: you can redistribute it and/or modify # @@ -177,18 +177,12 @@ registerS3method("mst", "dist", "mst.dist") #' #' @description #' Provides access to an implementation of the Dual-Tree Borůvka -#' algorithm based on kd-trees. It is fast for (very) low-dimensional +#' algorithm based on kd-trees from MLPACK. It is fast for (very) low-dimensional #' Euclidean spaces. For higher dimensional spaces (say, over 5 features) -#' or other metrics, -#' use the parallelised Prim-like algorithm implemented in \code{\link{mst}()}. +#' or other metrics, use the parallelised Prim-like algorithm implemented +#' in \code{\link{mst}()}. #' #' -#' @details -#' Calls \code{emstreeR::mlpack_mst()} and converts the result -#' so that it is compatible with the output of \code{\link{mst}()}. -#' -#' If the \code{emstreeR} package is not available, an error is generated. -#' #' @param X a numeric matrix (or an object coercible to one, #' e.g., a data frame with numeric-like columns) #' @param verbose logical; whether to print diagnostic messages @@ -209,20 +203,16 @@ registerS3method("mst", "dist", "mst.dist") emst_mlpack <- function(X, verbose=FALSE) { X <- as.matrix(X) - if (requireNamespace("emstreeR", quietly=TRUE)) { - - if (!verbose) - capture.output({mst <- emstreeR:::mlpack_mst(X)}) - else - mst <- emstreeR:::mlpack_mst(X) - - structure(t(mst), - class="mst", - method="euclidean", - Labels=dimnames(X)[[1]] - ) - - } else { - stop("emstreeR` package is not installed.") - } + + if (!verbose) + capture.output({mst <- .emst_mlpack(X)}) + else + mst <- .emst_mlpack(X) + + structure( + mst, + class="mst", + method="euclidean", + Labels=dimnames(X)[[1]] + ) } diff --git a/devel/sphinx/conf.py b/devel/sphinx/conf.py index 2f7c0cff..e2f85905 100644 --- a/devel/sphinx/conf.py +++ b/devel/sphinx/conf.py @@ -25,7 +25,7 @@ # -- Project information ----------------------------------------------------- project = 'genieclust' -copyright = '2020, Marek Gagolewski' +copyright = '2021, Marek Gagolewski' author = 'Marek Gagolewski' # The full version, including alpha/beta/rc tags diff --git a/devel/sphinx/rapi/emst_mlpack.rst b/devel/sphinx/rapi/emst_mlpack.rst index a9287151..22d69ce0 100644 --- a/devel/sphinx/rapi/emst_mlpack.rst +++ b/devel/sphinx/rapi/emst_mlpack.rst @@ -4,7 +4,7 @@ emst_mlpack: Euclidean Minimum Spanning Tree Description ~~~~~~~~~~~ -Provides access to an implementation of the Dual-Tree Borůvka algorithm based on kd-trees. It is fast for (very) low-dimensional Euclidean spaces. For higher dimensional spaces (say, over 5 features) or other metrics, use the parallelised Prim-like algorithm implemented in `mst() `__. +Provides access to an implementation of the Dual-Tree Borůvka algorithm based on kd-trees from MLPACK. It is fast for (very) low-dimensional Euclidean spaces. For higher dimensional spaces (say, over 5 features) or other metrics, use the parallelised Prim-like algorithm implemented in `mst() `__. Usage ~~~~~ @@ -22,13 +22,6 @@ Arguments | ``verbose`` | logical; whether to print diagnostic messages | +-------------+------------------------------------------------------------------------------------------------+ -Details -~~~~~~~ - -Calls ``emstreeR::mlpack_mst()`` and converts the result so that it is compatible with the output of `mst() `__. - -If the ``emstreeR`` package is not available, an error is generated. - Value ~~~~~ diff --git a/devel/sphinx/rapi/gclust.rst b/devel/sphinx/rapi/gclust.rst index 62ca7561..ce7f7290 100644 --- a/devel/sphinx/rapi/gclust.rst +++ b/devel/sphinx/rapi/gclust.rst @@ -146,4 +146,4 @@ Examples pair_sets_index(y_test, y_pred) # Fast for low-dimensional Euclidean spaces: - if (require("emstreeR")) h <- gclust(emst_mlpack(X)) + h <- gclust(emst_mlpack(X)) diff --git a/devel/tinytest/test-gclust.R b/devel/tinytest/test-gclust.R index 7c9e0ec9..023e1cdf 100644 --- a/devel/tinytest/test-gclust.R +++ b/devel/tinytest/test-gclust.R @@ -19,10 +19,8 @@ if (require("genie")) { #for (k in 2:20) expect_equal(adjusted_rand_score(cutree(h1, k), cutree(h2, k)), 1.0) } -if (suppressMessages(require("emstreeR"))) { - print(system.time(h2 <- gclust(emst_mlpack(X, verbose=verbose), verbose=verbose))) - #for (k in 2:20) expect_equal(adjusted_rand_score(cutree(h1, k), cutree(h2, k)), 1.0) -} +print(system.time(h2 <- gclust(emst_mlpack(X, verbose=verbose), verbose=verbose))) +#for (k in 2:20) expect_equal(adjusted_rand_score(cutree(h1, k), cutree(h2, k)), 1.0) # 2020-06-21 diff --git a/devel/tinytest/test-mst.R b/devel/tinytest/test-mst.R index 45abad1c..cb6e86ed 100644 --- a/devel/tinytest/test-mst.R +++ b/devel/tinytest/test-mst.R @@ -23,14 +23,11 @@ expect_true(all(t2[,1] < t2[,2])) expect_true(all(diff(t2[,3])>=0)) - -if (require("emstreeR")) { - print(system.time(t2 <- emst_mlpack(X))) - expect_equal(t1[,1], t2[,1]) - expect_equal(t1[,2], t2[,2]) +print(system.time(t2 <- emst_mlpack(X))) +expect_equal(t1[,1], t2[,1]) +expect_equal(t1[,2], t2[,2]) # print(abs(sum(t1[,3])-sum(t2[,3]))) - expect_true(abs(sum(t1[,3])-sum(t2[,3]))<1e-12) -} +expect_true(abs(sum(t1[,3])-sum(t2[,3]))<1e-12) @@ -50,7 +47,7 @@ for (M in c(1, 5, 10)) { # print(abs(sum(t1[,3])-sum(t2[,3]))) expect_true(abs(sum(t1[,3])-sum(t2[,3]))<1e-12) - if (distance == "euclidean" && M == 1 && require("emstreeR")) { + if (distance == "euclidean" && M == 1) { t2 <- emst_mlpack(X) expect_equal(t1[,1], t2[,1]) expect_equal(t1[,2], t2[,2]) diff --git a/docs/_sources/rapi/emst_mlpack.rst.txt b/docs/_sources/rapi/emst_mlpack.rst.txt index a9287151..22d69ce0 100644 --- a/docs/_sources/rapi/emst_mlpack.rst.txt +++ b/docs/_sources/rapi/emst_mlpack.rst.txt @@ -4,7 +4,7 @@ emst_mlpack: Euclidean Minimum Spanning Tree Description ~~~~~~~~~~~ -Provides access to an implementation of the Dual-Tree Borůvka algorithm based on kd-trees. It is fast for (very) low-dimensional Euclidean spaces. For higher dimensional spaces (say, over 5 features) or other metrics, use the parallelised Prim-like algorithm implemented in `mst() `__. +Provides access to an implementation of the Dual-Tree Borůvka algorithm based on kd-trees from MLPACK. It is fast for (very) low-dimensional Euclidean spaces. For higher dimensional spaces (say, over 5 features) or other metrics, use the parallelised Prim-like algorithm implemented in `mst() `__. Usage ~~~~~ @@ -22,13 +22,6 @@ Arguments | ``verbose`` | logical; whether to print diagnostic messages | +-------------+------------------------------------------------------------------------------------------------+ -Details -~~~~~~~ - -Calls ``emstreeR::mlpack_mst()`` and converts the result so that it is compatible with the output of `mst() `__. - -If the ``emstreeR`` package is not available, an error is generated. - Value ~~~~~ diff --git a/docs/_sources/rapi/gclust.rst.txt b/docs/_sources/rapi/gclust.rst.txt index 62ca7561..ce7f7290 100644 --- a/docs/_sources/rapi/gclust.rst.txt +++ b/docs/_sources/rapi/gclust.rst.txt @@ -146,4 +146,4 @@ Examples pair_sets_index(y_test, y_pred) # Fast for low-dimensional Euclidean spaces: - if (require("emstreeR")) h <- gclust(emst_mlpack(X)) + h <- gclust(emst_mlpack(X)) diff --git a/docs/_static/documentation_options.js b/docs/_static/documentation_options.js index 3f4bd8b0..c84f1f77 100644 --- a/docs/_static/documentation_options.js +++ b/docs/_static/documentation_options.js @@ -1,6 +1,6 @@ var DOCUMENTATION_OPTIONS = { URL_ROOT: document.getElementById("documentation_options").getAttribute('data-url_root'), - VERSION: '0.9.6.dev0', + VERSION: '0.9.6', LANGUAGE: 'None', COLLAPSE_INDEX: false, BUILDER: 'html', diff --git a/docs/genieclust.html b/docs/genieclust.html index a00a0639..758595e7 100644 --- a/docs/genieclust.html +++ b/docs/genieclust.html @@ -7,7 +7,7 @@ - Python Package genieclust Reference — genieclust 0.9.6.dev0 documentation + Python Package genieclust Reference — genieclust 0.9.6 documentation @@ -66,7 +66,7 @@
- 0.9.6.dev0 + 0.9.6
@@ -261,7 +261,7 @@

Python Package genieclust Reference

- © Copyright 2020, Marek Gagolewski + © Copyright 2021, Marek Gagolewski

diff --git a/docs/genieclust_compare_partitions.html b/docs/genieclust_compare_partitions.html index 02a7b8c7..bdec505f 100644 --- a/docs/genieclust_compare_partitions.html +++ b/docs/genieclust_compare_partitions.html @@ -7,7 +7,7 @@ - genieclust.compare_partitions — genieclust 0.9.6.dev0 documentation + genieclust.compare_partitions — genieclust 0.9.6 documentation @@ -66,7 +66,7 @@
- 0.9.6.dev0 + 0.9.6
@@ -822,7 +822,7 @@

- © Copyright 2020, Marek Gagolewski + © Copyright 2021, Marek Gagolewski

diff --git a/docs/genieclust_genie.html b/docs/genieclust_genie.html index 42e3664f..09867276 100644 --- a/docs/genieclust_genie.html +++ b/docs/genieclust_genie.html @@ -7,7 +7,7 @@ - genieclust.Genie — genieclust 0.9.6.dev0 documentation + genieclust.Genie — genieclust 0.9.6 documentation @@ -66,7 +66,7 @@
- 0.9.6.dev0 + 0.9.6
@@ -610,7 +610,7 @@

genieclust.Genie

- © Copyright 2020, Marek Gagolewski + © Copyright 2021, Marek Gagolewski

diff --git a/docs/genieclust_inequity.html b/docs/genieclust_inequity.html index 7f841369..ff398d37 100644 --- a/docs/genieclust_inequity.html +++ b/docs/genieclust_inequity.html @@ -7,7 +7,7 @@ - genieclust.inequity — genieclust 0.9.6.dev0 documentation + genieclust.inequity — genieclust 0.9.6 documentation @@ -66,7 +66,7 @@
- 0.9.6.dev0 + 0.9.6
@@ -379,7 +379,7 @@

- © Copyright 2020, Marek Gagolewski + © Copyright 2021, Marek Gagolewski

diff --git a/docs/genieclust_internal.html b/docs/genieclust_internal.html index 283e4291..7b9ff1ef 100644 --- a/docs/genieclust_internal.html +++ b/docs/genieclust_internal.html @@ -7,7 +7,7 @@ - genieclust.internal — genieclust 0.9.6.dev0 documentation + genieclust.internal — genieclust 0.9.6 documentation @@ -66,7 +66,7 @@
- 0.9.6.dev0 + 0.9.6
@@ -540,7 +540,7 @@

- © Copyright 2020, Marek Gagolewski + © Copyright 2021, Marek Gagolewski

diff --git a/docs/genieclust_plots-1.pdf b/docs/genieclust_plots-1.pdf index 34c6f4da552bfebcc50948686d93980a0c06406b..7f0d4ce1493ec093eb624a52bc3288bae469ba7f 100644 GIT binary patch delta 23 fcmaFh@W5fiVp%Rj149E-150Bwqs?n&H!}eMXub#N delta 23 fcmaFh@W5fiVp%Q&Ln9+|LjzMw!_8}DH!}eMXwV1g diff --git a/docs/genieclust_plots-2.pdf b/docs/genieclust_plots-2.pdf index 9146a5d0b620ad8abbea99a4e7e201464682db9f..00887d132f842dccbbab68f5ce005cfa18e7ba7e 100644 GIT binary patch delta 24 fcmaDJ_dITcq&ByqfuVt^fu*sTk?Cd?ZD$q$Y7++o delta 24 fcmaDJ_dITcq&ByKp^=ffp@FHTq1k2?ZD$q$YAgo@ diff --git a/docs/genieclust_plots-3.pdf b/docs/genieclust_plots-3.pdf index 978a56d63aa06007c5ec5a9ad60aa3fb0a4cc43f..34897eed916eeb12238d151b035880cfd2f671fc 100644 GIT binary patch delta 23 ecmZp$Xt3CjEy-nQU}#`!U}eg=2| delta 23 ecmZp$Xt3CjEy-nIXk=t=Xkcn-xVcoan+X6>kOp}G diff --git a/docs/genieclust_plots-4.pdf b/docs/genieclust_plots-4.pdf index 192c62d47b7d8e40dd6536125279446f0b29956f..3a1e69195bc42f9eb698953f7b9f9877958fa5fc 100644 GIT binary patch delta 23 fcmez8^3P?%Re3H$149E-150Bwqs{l_=Q9BSa@q)h delta 23 fcmez8^3P?%Re3H0Ln9+|LjzMw!_D{Q=Q9BSa_k6! diff --git a/docs/genieclust_plots.html b/docs/genieclust_plots.html index 6394f7ce..cbfa409b 100644 --- a/docs/genieclust_plots.html +++ b/docs/genieclust_plots.html @@ -7,7 +7,7 @@ - genieclust.plots — genieclust 0.9.6.dev0 documentation + genieclust.plots — genieclust 0.9.6 documentation @@ -66,7 +66,7 @@
- 0.9.6.dev0 + 0.9.6
@@ -356,7 +356,7 @@

- © Copyright 2020, Marek Gagolewski + © Copyright 2021, Marek Gagolewski

diff --git a/docs/genieclust_tools.html b/docs/genieclust_tools.html index fbc8f69e..78387583 100644 --- a/docs/genieclust_tools.html +++ b/docs/genieclust_tools.html @@ -7,7 +7,7 @@ - genieclust.tools — genieclust 0.9.6.dev0 documentation + genieclust.tools — genieclust 0.9.6 documentation @@ -66,7 +66,7 @@
- 0.9.6.dev0 + 0.9.6
@@ -392,7 +392,7 @@

- © Copyright 2020, Marek Gagolewski + © Copyright 2021, Marek Gagolewski

diff --git a/docs/genindex.html b/docs/genindex.html index c12a8396..1f7581ab 100644 --- a/docs/genindex.html +++ b/docs/genindex.html @@ -7,7 +7,7 @@ - Index — genieclust 0.9.6.dev0 documentation + Index — genieclust 0.9.6 documentation @@ -64,7 +64,7 @@
- 0.9.6.dev0 + 0.9.6
@@ -447,7 +447,7 @@

U

- © Copyright 2020, Marek Gagolewski + © Copyright 2021, Marek Gagolewski

diff --git a/docs/index.html b/docs/index.html index cea13d4f..00654a8c 100644 --- a/docs/index.html +++ b/docs/index.html @@ -7,7 +7,7 @@ - genieclust: Fast and Robust Hierarchical Clustering with Noise Point Detection — genieclust 0.9.6.dev0 documentation + genieclust: Fast and Robust Hierarchical Clustering with Noise Point Detection — genieclust 0.9.6 documentation @@ -65,7 +65,7 @@
- 0.9.6.dev0 + 0.9.6
@@ -356,7 +356,7 @@

Indices and Tables

- © Copyright 2020, Marek Gagolewski + © Copyright 2021, Marek Gagolewski

diff --git a/docs/objects.inv b/docs/objects.inv index 5e43960b8c603044ce294b7deaec2061b4b58248..72cbdb6d1a1ca87634b9a7d6492a9402657fe8de 100644 GIT binary patch delta 10 RcmbQqGlge@^G1)0tN;~O1Lyz% delta 16 XcmbQjGm~e6Gpk-oYMH@C=ZmZWEjk5- diff --git a/docs/py-modindex.html b/docs/py-modindex.html index 6b921017..9104c2ab 100644 --- a/docs/py-modindex.html +++ b/docs/py-modindex.html @@ -7,7 +7,7 @@ - Python Module Index — genieclust 0.9.6.dev0 documentation + Python Module Index — genieclust 0.9.6 documentation @@ -67,7 +67,7 @@
- 0.9.6.dev0 + 0.9.6
@@ -237,7 +237,7 @@

Python Module Index

- © Copyright 2020, Marek Gagolewski + © Copyright 2021, Marek Gagolewski

diff --git a/docs/rapi.html b/docs/rapi.html index 4b5d4a05..3436a404 100644 --- a/docs/rapi.html +++ b/docs/rapi.html @@ -7,7 +7,7 @@ - R Package genieclust Reference — genieclust 0.9.6.dev0 documentation + R Package genieclust Reference — genieclust 0.9.6 documentation @@ -66,7 +66,7 @@
- 0.9.6.dev0 + 0.9.6
@@ -234,7 +234,7 @@

R Package genieclust Reference

- © Copyright 2020, Marek Gagolewski + © Copyright 2021, Marek Gagolewski

diff --git a/docs/rapi/comparing_partitions.html b/docs/rapi/comparing_partitions.html index 0eff4f47..828eb4e3 100644 --- a/docs/rapi/comparing_partitions.html +++ b/docs/rapi/comparing_partitions.html @@ -7,7 +7,7 @@ - comparing_partitions: Pairwise Partition Similarity Scores — genieclust 0.9.6.dev0 documentation + comparing_partitions: Pairwise Partition Similarity Scores — genieclust 0.9.6 documentation @@ -66,7 +66,7 @@
- 0.9.6.dev0 + 0.9.6
@@ -315,7 +315,7 @@

Examples

- © Copyright 2020, Marek Gagolewski + © Copyright 2021, Marek Gagolewski

diff --git a/docs/rapi/emst_mlpack.html b/docs/rapi/emst_mlpack.html index 637286c1..aeb29ad0 100644 --- a/docs/rapi/emst_mlpack.html +++ b/docs/rapi/emst_mlpack.html @@ -7,7 +7,7 @@ - emst_mlpack: Euclidean Minimum Spanning Tree — genieclust 0.9.6.dev0 documentation + emst_mlpack: Euclidean Minimum Spanning Tree — genieclust 0.9.6 documentation @@ -66,7 +66,7 @@
- 0.9.6.dev0 + 0.9.6
@@ -111,7 +111,6 @@
  • Description
  • Usage
  • Arguments
  • -
  • Details
  • Value
  • References
  • @@ -213,7 +212,7 @@

    emst_mlpack: Euclidean Minimum Spanning Tree

    Description

    -

    Provides access to an implementation of the Dual-Tree Borůvka algorithm based on kd-trees. It is fast for (very) low-dimensional Euclidean spaces. For higher dimensional spaces (say, over 5 features) or other metrics, use the parallelised Prim-like algorithm implemented in mst().

    +

    Provides access to an implementation of the Dual-Tree Borůvka algorithm based on kd-trees from MLPACK. It is fast for (very) low-dimensional Euclidean spaces. For higher dimensional spaces (say, over 5 features) or other metrics, use the parallelised Prim-like algorithm implemented in mst().

    Usage

    @@ -238,11 +237,6 @@

    Arguments -

    Details

    -

    Calls emstreeR::mlpack_mst() and converts the result so that it is compatible with the output of mst().

    -

    If the emstreeR package is not available, an error is generated.

    -

    Value

    An object of class mst, see mst() for details.

    @@ -275,7 +269,7 @@

    References

    - © Copyright 2020, Marek Gagolewski + © Copyright 2021, Marek Gagolewski

    diff --git a/docs/rapi/gclust.html b/docs/rapi/gclust.html index 5e33e643..64f2acc5 100644 --- a/docs/rapi/gclust.html +++ b/docs/rapi/gclust.html @@ -7,7 +7,7 @@ - gclust: The Genie++ Hierarchical Clustering Algorithm — genieclust 0.9.6.dev0 documentation + gclust: The Genie++ Hierarchical Clustering Algorithm — genieclust 0.9.6 documentation @@ -66,7 +66,7 @@
    - 0.9.6.dev0 + 0.9.6
    @@ -357,7 +357,7 @@

    Examplespair_sets_index(y_test, y_pred) # Fast for low-dimensional Euclidean spaces: -if (require("emstreeR")) h <- gclust(emst_mlpack(X)) +h <- gclust(emst_mlpack(X)) @@ -384,7 +384,7 @@

    Examples

    - © Copyright 2020, Marek Gagolewski + © Copyright 2021, Marek Gagolewski

    diff --git a/docs/rapi/genieclust-package.html b/docs/rapi/genieclust-package.html index 1c3304c8..9d49ab34 100644 --- a/docs/rapi/genieclust-package.html +++ b/docs/rapi/genieclust-package.html @@ -7,7 +7,7 @@ - genieclust-package: The Genie++ Hierarchical Clustering Algorithm (with Extras) — genieclust 0.9.6.dev0 documentation + genieclust-package: The Genie++ Hierarchical Clustering Algorithm (with Extras) — genieclust 0.9.6 documentation @@ -66,7 +66,7 @@
    - 0.9.6.dev0 + 0.9.6
    @@ -238,7 +238,7 @@

    Author(s)

    - © Copyright 2020, Marek Gagolewski + © Copyright 2021, Marek Gagolewski

    diff --git a/docs/rapi/inequity.html b/docs/rapi/inequity.html index 1e934bbb..a741ac77 100644 --- a/docs/rapi/inequity.html +++ b/docs/rapi/inequity.html @@ -7,7 +7,7 @@ - inequity: Inequity (Inequality) Measures — genieclust 0.9.6.dev0 documentation + inequity: Inequity (Inequality) Measures — genieclust 0.9.6 documentation @@ -66,7 +66,7 @@
    - 0.9.6.dev0 + 0.9.6
    @@ -297,7 +297,7 @@

    Examples

    - © Copyright 2020, Marek Gagolewski + © Copyright 2021, Marek Gagolewski

    diff --git a/docs/rapi/mst.html b/docs/rapi/mst.html index 72e9e2b0..591f1c55 100644 --- a/docs/rapi/mst.html +++ b/docs/rapi/mst.html @@ -7,7 +7,7 @@ - mst: Minimum Spanning Tree of the Pairwise Distance Graph — genieclust 0.9.6.dev0 documentation + mst: Minimum Spanning Tree of the Pairwise Distance Graph — genieclust 0.9.6 documentation @@ -66,7 +66,7 @@
    - 0.9.6.dev0 + 0.9.6
    @@ -323,7 +323,7 @@

    Examples

    - © Copyright 2020, Marek Gagolewski + © Copyright 2021, Marek Gagolewski

    diff --git a/docs/search.html b/docs/search.html index ae2416f1..562fa304 100644 --- a/docs/search.html +++ b/docs/search.html @@ -7,7 +7,7 @@ - Search — genieclust 0.9.6.dev0 documentation + Search — genieclust 0.9.6 documentation @@ -66,7 +66,7 @@
    - 0.9.6.dev0 + 0.9.6
    @@ -206,7 +206,7 @@

    - © Copyright 2020, Marek Gagolewski + © Copyright 2021, Marek Gagolewski

    diff --git a/docs/searchindex.js b/docs/searchindex.js index cf6f65a8..286ae921 100644 --- a/docs/searchindex.js +++ b/docs/searchindex.js @@ -1 +1 @@ -Search.setIndex({docnames:["genieclust","genieclust_compare_partitions","genieclust_genie","genieclust_inequity","genieclust_internal","genieclust_plots","genieclust_tools","index","rapi","rapi/comparing_partitions","rapi/emst_mlpack","rapi/gclust","rapi/genieclust-package","rapi/inequity","rapi/mst","weave/basics","weave/benchmarks_approx","weave/benchmarks_ar","weave/benchmarks_details","weave/noise","weave/r","weave/sklearn_toy_example","weave/sparse","weave/string","weave/timings","z_bibliography"],envversion:{"sphinx.domains.c":2,"sphinx.domains.changeset":1,"sphinx.domains.citation":1,"sphinx.domains.cpp":3,"sphinx.domains.index":1,"sphinx.domains.javascript":2,"sphinx.domains.math":2,"sphinx.domains.python":2,"sphinx.domains.rst":2,"sphinx.domains.std":1,"sphinx.ext.todo":2,"sphinxcontrib.bibtex":4,sphinx:56},filenames:["genieclust.rst","genieclust_compare_partitions.rst","genieclust_genie.rst","genieclust_inequity.rst","genieclust_internal.rst","genieclust_plots.rst","genieclust_tools.rst","index.rst","rapi.rst","rapi/comparing_partitions.rst","rapi/emst_mlpack.rst","rapi/gclust.rst","rapi/genieclust-package.rst","rapi/inequity.rst","rapi/mst.rst","weave/basics.rst","weave/benchmarks_approx.rst","weave/benchmarks_ar.rst","weave/benchmarks_details.rst","weave/noise.rst","weave/r.rst","weave/sklearn_toy_example.rst","weave/sparse.rst","weave/string.rst","weave/timings.rst","z_bibliography.rst"],objects:{"genieclust.Genie":{fit:[2,1,1,""]},"genieclust.compare_partitions":{adjusted_fm_score:[1,3,1,""],adjusted_mi_score:[1,3,1,""],adjusted_rand_score:[1,3,1,""],compare_partitions2:[1,3,1,""],compare_partitions:[1,3,1,""],confusion_matrix:[1,3,1,""],fm_score:[1,3,1,""],mi_score:[1,3,1,""],normalize_confusion_matrix:[1,3,1,""],normalized_accuracy:[1,3,1,""],normalized_confusion_matrix:[1,3,1,""],normalized_mi_score:[1,3,1,""],pair_sets_index:[1,3,1,""],rand_score:[1,3,1,""]},"genieclust.inequity":{bonferroni_index:[3,4,1,""],gini_index:[3,4,1,""]},"genieclust.internal":{DisjointSets:[4,0,1,""],GiniDisjointSets:[4,0,1,""]},"genieclust.internal.DisjointSets":{find:[4,1,1,""],get_k:[4,1,1,""],get_n:[4,1,1,""],to_list:[4,1,1,""],to_list_normalized:[4,1,1,""],to_lists:[4,1,1,""],union:[4,1,1,""]},"genieclust.internal.GiniDisjointSets":{find:[4,1,1,""],get_count:[4,1,1,""],get_counts:[4,1,1,""],get_gini:[4,1,1,""],get_k:[4,1,1,""],get_n:[4,1,1,""],get_smallest_count:[4,1,1,""],to_list:[4,1,1,""],to_list_normalized:[4,1,1,""],to_lists:[4,1,1,""],union:[4,1,1,""]},"genieclust.plots":{plot_scatter:[5,3,1,""],plot_segments:[5,3,1,""]},"genieclust.tools":{argkmin:[6,4,1,""],cummax:[6,4,1,""],cummin:[6,4,1,""]},genieclust:{Genie:[2,0,1,""],compare_partitions:[1,2,0,"-"],inequity:[3,2,0,"-"],internal:[4,2,0,"-"],plots:[5,2,0,"-"],tools:[6,2,0,"-"]}},objnames:{"0":["py","class","Python class"],"1":["py","method","Python method"],"2":["py","module","Python module"],"3":["py","function","Python function"],"4":["py","attribute","Python attribute"]},objtypes:{"0":"py:class","1":"py:method","2":"py:module","3":"py:function","4":"py:attribute"},terms:{"000":[17,24],"000000":20,"00017":[2,25],"001":21,"003":[2,4,13,25],"004013":20,"005":17,"007":6,"00726":[2,25],"0167":[2,25],"021185":20,"025":17,"031":24,"056494":20,"060":6,"061":6,"067901":20,"072":6,"073":6,"074134":20,"074894":20,"075":6,"081801":20,"084":24,"0_approx":16,"100":[5,6,17,24],"1000":24,"10000":[21,24],"100000":24,"1000000":24,"100000000":6,"10029":25,"1007":25,"100836":22,"100d":16,"1016":[2,4,13,25],"102542":20,"10475":22,"105":[17,24],"105000":24,"105539":20,"105600":24,"1058":22,"108":25,"1109":[1,25],"111":24,"1113":22,"1125":22,"113":24,"11346":24,"1145":[2,25],"1197":22,"1211":22,"122":25,"1232":22,"1234":21,"1250":22,"12m":24,"130701":20,"1313":[2,14,25],"132":24,"13239":22,"1325":[2,14,25],"13327":22,"13328":22,"1389":14,"1394":22,"1401":14,"140138":20,"144":22,"148":16,"1486":22,"1487":22,"1500":21,"154":20,"154272":20,"158":24,"159":25,"16021":24,"161":25,"1627":24,"164":25,"1657":24,"168":6,"1691":24,"16th":25,"170":21,"174":16,"1745":24,"1796":22,"1835804":25,"1835882":25,"1912":[3,13],"1914":22,"193":[1,9,25],"1930":[3,13,14],"1933":22,"1957":14,"1960":22,"1964":22,"1965":22,"1967":22,"1968":22,"197":15,"1973":[22,25],"1974":22,"1975":22,"1977":22,"1979":22,"1980":22,"1982":22,"1983":[22,25],"1984":22,"1985":[1,9,22,25],"1986":22,"1987":22,"1988":22,"1989":22,"1990":22,"1991":22,"1992":22,"1993":22,"1995":[2,14,22,25],"1996":[22,25],"1997":22,"1998":22,"1999":[22,25],"1_approx":16,"1st":20,"200":22,"2000":22,"2005":25,"2009":25,"2010":[1,2,9,10,25],"2011":[1,9,25],"2012":25,"2013":25,"2014":24,"2015":[2,11,14,25],"2016":[1,2,4,9,11,13,25],"2017":25,"2018":[2,10,22,25],"2019":[2,25],"202":24,"2020":[22,25],"2036":22,"203906":20,"205":25,"207":25,"2084":22,"2094":22,"2097":22,"21105":[2,25],"212197":20,"217":[24,25],"2173":[1,9,25],"2174":22,"2175":24,"218":[1,9,25],"2186":[1,9,25],"2190":22,"2216":22,"224":22,"225":24,"2259":22,"226":25,"231":25,"2382":22,"23rd":25,"242":24,"2443":22,"255":25,"2551240":[1,25],"2605":22,"264":[16,25],"266":24,"267":24,"268879":20,"2703":22,"27284":22,"2733381":[2,25],"274155":20,"27448":22,"276":15,"277173":20,"2772":22,"27753444":22,"2778":22,"2792":22,"2825":25,"2830":25,"2837":[1,9,25],"2854":[1,9,24,25],"2861":22,"2888":22,"2891":22,"2892":22,"289224":20,"2907":22,"2916":22,"292":16,"2963":22,"299":6,"299537":20,"2997":24,"2fs":21,"2nd":6,"300326":20,"3010":22,"3016":22,"307":16,"3097983":25,"3098079":25,"319":25,"3241080446115835":15,"326":16,"329":6,"332":16,"3341":22,"336496":20,"340152":20,"340636":20,"341":25,"350592":20,"357":24,"363":[2,4,11,13,25],"374348":20,"376":16,"3776":25,"377eb8":21,"3815066":25,"383":25,"388":6,"389867":20,"390":6,"3927":24,"3_approx":[16,24],"3_mlpack":24,"3_nomlpack":24,"403":6,"409":16,"4114":24,"412":24,"414":6,"415":16,"4170":24,"420523":20,"421":24,"434233":20,"436303":20,"4384":24,"4388":24,"4408":24,"445":24,"446943":20,"447":[6,16],"4486":24,"453451":20,"4581":22,"4716":22,"4743":25,"4757":24,"4759":25,"49055":25,"4945":24,"4daf4a":21,"500":22,"50000":24,"500000":24,"505":6,"508130":20,"512709":20,"516":16,"522":25,"5281":25,"531":16,"53889x283228":22,"539498":20,"541081":20,"543":25,"553":25,"555":16,"568":16,"569":25,"590927":20,"593052":20,"594718":20,"5_approx":16,"600":[17,24],"6006":22,"6027":22,"603":[2,10,25],"605769":20,"60ghz":24,"611":[2,10],"612":25,"621681":20,"624":16,"624147":20,"627805":20,"630009":20,"634251":20,"639":6,"662674":20,"663252":20,"6698":22,"673":6,"692808":20,"70000":24,"708":22,"715":24,"719":[16,24],"726":[2,10,25],"728":16,"731":16,"732":22,"734":16,"753476":20,"755":16,"759396":20,"7708":24,"778":24,"781637":25,"784":24,"794":24,"7_19":25,"7_approx":16,"817850":20,"819":22,"8191":[2,25],"820":22,"827154":20,"829620":20,"831955":20,"836":22,"839":22,"844":16,"850":22,"854317":20,"863":22,"868176":20,"886885":20,"895167":20,"898":22,"898812":20,"899":22,"911":22,"921":22,"931156":20,"934":22,"9352814722212013":23,"955":22,"959609":20,"964":22,"964981247":22,"964982224":22,"964982703":22,"964982931":22,"964983815":22,"969":22,"9724x610":22,"972848":20,"9750h":24,"977":22,"978":25,"984ea3":21,"987":22,"992649":20,"999999":21,"\u03c3":13,"bor\u016fvka":10,"break":[7,24],"c_\u03c3":9,"case":[2,4,5,11,14,16,18,24],"catch":21,"char":20,"class":[0,2,4,10,11,14,15,22],"default":[2,11,14,15,17,19,20,24],"final":20,"float":[2,6,11,14],"fr\u00e4nti":25,"function":[1,4,5,6,7,9,15],"import":[5,7,15,19,21,22,23,24],"int":[2,5,6,21,22],"jarn\u00edk":[2,14,24],"jist\u00e9m":14,"m\u00fcller":25,"m\u00fcllner":25,"minim\u00e1ln\u00edm":14,"moravsk\u00e9":14,"new":[2,4,7,11,13,19,20,22,25],"null":9,"p\u0159\u00edrodov\u011bdeck\u00e9":14,"pr\u00e1ce":14,"probl\u00e9mu":14,"return":[1,2,3,4,6,11,19,22],"spole\u010dnosti":14,"switch":19,"true":[2,11,14,15,19,23,24],"try":[2,11,17],And:22,Being:22,Eqs:[1,9],Eyes:22,For:[2,3,4,10,13,15,16,17,19,20,24],IDs:[4,22],Ice:7,Its:[2,7,11,15],One:[2,3],Sys:14,The:[1,2,3,4,5,6,7,8,13,14,15,16,17,19,20,21,22,23,24,25],Then:[7,18,21,22],There:21,These:[3,9,13],Use:11,a65628:21,aardman:22,abil:14,abl:[2,7,11,15],about:24,abov:[2,11,15,18,22],abridg:22,abundez:[1,9],accept:[1,2,14],access:10,accord:[2,11],accuraci:[1,9,18],achin:25,acm:[2,10,11,14,25],across:16,act:[2,7,11],actg1:23,actual:[1,2],adapt:7,added:[16,18,24],adding:2,addition:2,adjac:[2,11],adjust:[1,9,15,16,17,18,20,23],adjusted_fm_scor:[1,9],adjusted_mi_scor:[1,9],adjusted_rand_scor:[1,9,11,15,23],affect:[2,15,17],affin:[2,17,22,23],afm:1,after:[2,7],again:[16,19],against:[15,17,24],agglom:[15,17,24,25],agglomerativeclust:21,aggreg:[17,18,20],agpl:7,agreement:[1,9,17,18],aim:1,airplan:22,albania:20,albeit:[2,24],alert:16,algeria:20,algo_param:21,algorithm:[1,2,3,4,7,8,10,13,14,15,16,17,18,19,22,24,25],all:[2,3,4,5,11,13,14,16,17,24],alloc:20,allow:[4,7,17,19,23,24],almost:[6,22,24],alongsid:17,alpha:19,alreadi:3,also:[1,7,9,15,17,19,20,21,22,23,24],altern:[2,11,14,24],although:16,altogeth:16,alwai:[1,4,5,9],american:25,ami:1,ami_:9,amongst:[2,3,11,13,15,24],amuel:25,analysi:[2,10,14,25],analyz:22,angola:20,angulardist:2,angulardist_spars:2,ani:[2,5,7,19,24],animatio:22,aniso:21,anisotrop:21,anoth:[7,15],anywai:2,api:[7,15,18,25],appeal:[2,7,11],appendix:[7,17],appli:[1,2,11,15,17,19,24,25],applic:[2,3,10,13,18,25],approach:[2,7,11,25],approxim:[2,7,22,24],arabi:[1,9,25],arbitrari:[2,11],archiv:25,argentina:20,argkmin:6,argmin:6,argsort:6,argu:2,argument:[2,5],ariant:25,arithmet:[11,14],arizmendi:[1,9],armenia:20,around:1,arrai:[1,2,4,6,15,21],array_lik:[1,5],art:[22,25],ascend:6,ascii:2,ask:19,asp:11,assign:[1,3,5,9,13,15,23],associ:25,assum:2,assumpt:4,assur:2,ast:25,astel:25,astyp:21,atgtctccaaagcgtgaccttctagacccgagacgacatatggaggcttggagccgtacctgtgtgaggaaactgtagtacccaaagctattca:23,atom:18,attribut:[2,14],augment:4,australia:20,austria:20,auto:[2,24],automat:24,avail:[2,7,10,17,20,24],averag:[7,17,18,20,21],avoid:21,awai:[2,3,11,13,14],axi:[2,5,15,19],back:[15,22],bailei:[1,9,25],ball:22,bartoszuk:[2,4,11,13,25],base:[1,2,9,10,11,17,18,20,22,23,24,25],basic:[7,20],basicne:20,basket:22,batteri:[16,17],becom:[2,24],been:[18,24],behav:16,behind:7,being:[2,4,11,14],belgium:20,bell:14,belong:15,below:[1,2,9,17,20,21],benchmark:[1,2,7,11,15,20,23,24,25],best:[2,11,17,18,22],better:[16,17,20],between:[1,2,6,9,11,14,15,16,17,18,19,22,23],beyond:15,bf01908075:25,biject:[1,9],birch1:18,birch2:[16,18],birch:[7,17],birch_0:[17,18],bit:[2,11,14,16,18,24],bit_ham:2,bit_jaccard:2,black:5,blackadd:22,blob:[2,21,24,25],blue:[5,22],boi:22,bolivia:20,bologna:[3,13],bonferroni:[3,13],bonferroni_index:[3,13],book:20,bool:[2,3],both:[1,2,3,9,13],bottl:22,bottom:21,bound:[1,9],boundari:[2,11,14],bowfing:22,bowl:22,box:21,boxplot:17,boytsov:[2,25],branching_factor:17,brian:22,bride:22,brother:22,buitinck:25,c_contigu:1,cach:24,call:[1,2,4,5,10,11,20,22,24],campello:[2,11,14,25],can:[1,2,3,5,7,9,11,13,14,15,19,20,23,24],canada:20,cannot:15,cardin:[2,4,24],care:2,carol:22,cast:2,cast_float32:[2,11,14,20,23],catch_warn:21,categor:20,categori:[20,21],catmethod:20,ceil:5,cel:[24,25],cell:22,cena:[2,4,11,13,25],center:5,centr:[2,16,18,24],centroid:[17,18,24],chainlink:18,chameleon:25,chameleon_t4_8k:18,chameleon_t5_8k:18,chameleon_t7_10k:18,chameleon_t8_8k:18,chanc:[1,9,25],chang:[1,2,17,24],charact:23,characterist:21,check:20,children_:[2,15],chile:20,choic:24,choos:[2,11],chose:16,chosen:[2,11,14],christma:22,circl:18,cityblock:[2,11,14],classic:[2,11],classif:[1,9,25],classifi:19,clearli:24,climateandenergi:20,close:22,closer:19,closest:[7,15],cluster:[1,2,3,4,8,9,13,14,15,16,17,18,20,21,22,23,24,25],cluster_std:21,clustering_algorithm:21,clustering_benchmarks_v1:[1,11,25],clusteringtheori:25,cmzs15:[7,15,19,25],coarser:[2,19],coarsest:2,code:7,coercibl:[2,9,10,11,14],coffe:[7,24],col:[5,11],collect:5,colombia:20,color:[5,20,21],colourpalett:20,column:[1,2,5,9,10,11,14,18,20],column_stack:15,com:[1,2,11,15,20,23,25],come:[1,15,23],comfort:22,comment:20,commun:[1,9],compar:[1,7,9,15,24,25],compare_partit:[0,7,15,18,23],compare_partitions2:1,comparing_partit:[7,8],comparis:7,comparison:[1,7,9,25],compat:[7,10,11,15,20,24],complet:[7,14,16,17,18,21,24],completel:22,complex:[2,3,13,14,24],compon:[2,21],compound:18,compress:[4,22],comput:[1,2,3,4,9,11,14,15,16,20,24,25],compute_all_cut:2,compute_full_tre:[2,15],conduct:2,confer:25,confus:[1,9,15],confusion_matrix:1,connect:[2,14,21],consecut:[22,24],consid:[16,17,20,22,24],constant:[3,13],constitut:2,construct:2,consum:[2,11],contain:4,conting:1,contrari:[2,19],contrib:25,contribut:7,control:[2,11,14,19],convers:22,convert:[10,23],convex:[3,5,13,15],convexhul:5,coordin:[2,5,24],copi:21,core:[2,7,11,24],correct:[1,2,9,11,25],correspond:[1,2,5,11,14,15,16,19],cosin:[2,11,14,22],cosinesimil:2,cosinesimil_spars:[2,22],cost:[2,4],cote:20,count:[15,16,17,18],countri:20,counts_:[2,15],cours:[15,19,24],cpu:24,cran:[7,20],creat:[2,21],createindex:2,creatur:22,cross:18,crucial:24,cry:22,csr:22,csr_matrix:2,csv:[20,22],cummax:6,cummin:[2,6,11],cumprod:6,cumsum:6,cumul:6,cuppini:[3,13],current:4,curs:[22,24],curtin:[2,10,25],cut:2,cutre:[7,11,20],cycl:21,czech:20,d31:18,d_m:19,dai:22,dalton:[3,13],danifold:25,dasgupta:25,data:[1,2,3,6,7,9,10,11,13,14,15,19,20,21,24,25],data_typ:2,databas:[22,25],dataset:[1,2,7,9,11,14,15,16,19,20,22,23,25],datatyp:2,dbscan:[2,7,11,15],ddof:2,decim:[2,17],decreas:[2,3,13],dede00:21,default_bas:21,defin:[1,5,9,14,17],definit:[1,9,11,15,22],degrad:24,degre:23,demand:15,demonstr:[16,24],dendrogram:[2,7,11,20],denmark:20,denot:[2,4,11,15,17,18,19],dens:[1,2,18,22],densiti:[2,11,14,25],departur:11,depend:[2,7,11,24],depict:20,descend:6,describ:2,descript:[2,16,17],design:[4,25],desir:[11,17,20],detail:[1,2,7,12,15,17,20],detect:[2,11,14,20,24,25],detect_nois:11,detector:[2,7,11],determin:[1,2,7,14,22,24],devel:[15,20,23],dg19:[17,25],diagnost:[2,10,11,14],diagon:1,diagram:15,dict:[1,2,23],dictionari:[1,2],did:19,differ:[11,16,17,19,21,24],difficult:7,digit:[2,16,17,18,24],dijkstra:[2,14,24],dilemma:25,dimension:[2,10,11,14,16,24],dimnam:20,directli:20,disabl:[2,11,19],disconnect:2,discov:[15,25],discoveri:[2,11,14,25],discrep:16,discuss:[17,24],disjoint:[1,4,5,9],disjointset:4,dispers:[3,13],dissimilar:2,dist:[11,14,20],distanc:[2,7,8,11,16,18,19,20,23,24],distances_:[2,15],distinct:5,distinguish:2,distribut:[2,4,7,11,17,21],dn09:[17,25],dna:7,document:[7,15,18,20],doe:[2,11,16,24],doesn:7,doi:[1,2,4,13,25],dok_matrix:22,domain:23,don:[20,22],done:24,dot:[3,4,21],doubl:[1,3,6],down:2,download:7,draw:5,drawn:5,dtype:[2,15,19,22,23],dua:25,dual:10,duck:22,due:[1,9],dure:[2,4,24],dynam:25,e41a1c:21,each:[1,2,4,5,7,11,14,16,17,18,19,20,24],eagerli:19,earli:21,easier:21,easili:[7,15,19,24],ecml:25,ecoli:18,econom:[3,13,15,20],economi:20,edel:[2,10,25],edg:[2,11,14],edit:23,edu:25,effect:[2,11,19,24],effici:[20,24],either:[2,5,14],eksx96:[15,25],elaps:24,elect:22,element:[1,2,3,4,6,9,11,13,22],elementi:[3,13],els:21,empir:[17,22],emst:[2,10,24],emst_mlpack:[7,8,11,14],emstreer:[10,11],enabl:2,engin:25,engytim:18,enough:15,enumer:21,environ:[2,7,11,14],environment:20,episod:22,epp:[1,9,25],eps:[2,7,11,15],equal:[3,5,6,13,15,17,19],equip:15,equiti:[3,13],equival:[2,5],error:10,esp:9,especi:1,ester:25,estim:[2,11,14,25],estonia:20,etc:20,ethiopia:20,euclidean:[2,5,7,8,11,14,16,18,19,20,24,25],evalu:17,even:[2,3,7,19,24],everi:[1,9,18],everyth:20,evidenc:24,exact:[2,16,22,23,24],exactli:2,exampl:[1,3,5,6,7,15,19,21],excel:19,except:[1,4,9,16,20,24],exercis:22,exhal:22,expect:[1,5,9,17],experiment:25,expert:[15,19,23],explicitli:[11,17,19],extern:[1,7,9,11,20,23,25],extra:[7,8,22],extract:[20,22,24],extrem:[7,24,25],f781bf:21,factor:[2,7,11,14,21],fail:[2,17],fals:[2,3,10,11,14,15,16,22,23,24],familiar:7,famou:22,far:15,fashion:[18,24],fast:[2,4,5,6,10,11,13,14,16,19,25],fastclust:[17,24,25],fastcluster_centroid:24,fastcluster_median:24,fastcluster_ward:24,faster:[2,7,11,14,16,20,23,24],fastest:[21,24],father:22,fcp:18,fear:22,featur:[2,10,11,14,15,16,18,19,20,22,24],feed:20,feel:[7,19],few:[1,2,15,17,20,22],ff7f00:21,fidel:22,figsiz:21,figur:21,file:[14,22],film:22,filterwarn:21,find:[4,6,7,19],fine:2,finer:19,finland:20,fire:16,firenz:[3,13],first:[4,5,7,11,15,19,21,22,24],fish:22,fit:[2,7,15,17,21,22,24],fit_predict:[7,15,19,22,23],fit_transform:21,fix:5,flame:18,flexibl:[2,10,25],float32:[2,22],fly:14,flynt:22,fm83:[18,25],fm_score:[1,9],fmiz16:[17,25],follow:[1,3,13,15],forc:[2,11],forest:[2,24],forget:20,form:[2,7,22],formal:2,format:[2,7,11,22],former:17,forth:22,forthcom:20,fortun:15,found:[2,19],fowlk:[1,9,18,25],frac:[3,4,13],frame:[10,11,14,20,22],franc:20,frankenstein:22,franti:[1,9],friendli:15,from:[1,2,3,5,7,9,11,13,14,15,16,17,18,19,21,22,24,25],fs18:[17,25],full:22,further:[5,7,11,14,24],furthermor:2,futur:22,fuzzi:25,fuzzyx:18,g2mg:[16,17],gacaattatcgcggctttcgccatgcagagtctcgtacaatttgtttcacgcccaatattttccgtgcttcgcgagctaggcagccagggcatttttgga:23,gagolew:[1,11,15,20,23,25],gagolewski:[2,4,7,11,12,13,25],gain:14,game:[21,22],gamma:17,gaussian:[2,16,17,18,24],gbc16:[7,15,17,19,23,25],gca:21,gcaattgaagtccagatctaggtatcgtccaagcatattgcctttaagaaatatatttgaccctgtctcttcgtggaggtacacgtcacggaatcgtaagatttccttgg:23,gclust:[7,8,14,20],gener:[1,2,4,6,10,11,15,16,17,21,24],general:[3,13],generalis:14,geni:[0,3,4,7,8,13,14,15,16,17,19,20,21,22,23,24,25],genie_0:[16,17,18,24],genie_1:16,genieclust:[15,16,17,18,19,20,21,22,23,24],geq:3,german:25,germani:20,get:[4,15,17,19,22],get_count:4,get_gini:4,get_k:4,get_n:4,get_smallest_count:4,ghaisa:[2,10,25],ghana:20,gini:[2,3,4,11,13,15],gini_index:[3,11,13],gini_threshold:[2,11,15,16,17,19,20,24],ginidisjointset:4,github:[1,2,7,11,15,20,23,25],give:[1,2,3,5,9,11,13,14,15,17,20,23,24],given:[1,2,3,4,9,11,13,14,15,22,24],glanc:15,glass:18,glust:20,gnu:[7,24],goal:19,goe:[2,7,11],good:[2,7,16,19,24],gp10:[17,25],graff:25,grai:[2,10,15,25],grail:22,grain:2,grand:22,granular:[15,19],graph:[2,7,8,11,18,24,25],graphic:[5,15],grave:[18,25],greater:[2,20,24],greec:20,green:5,grei:19,grid:17,gromit:22,ground:[1,9,17],groundhog:22,group:[2,7,11,15,18,20],grumpier:22,guarante:2,guess:15,guffman:22,gun:22,h2mg:[16,17],h_oecd:20,ha85:[17,18,25],han:25,hand:[2,7,11,15,24],handi:1,handl:22,happen:15,hard:[15,22],has:[2,3,7,13,18,20,24],hasattr:21,have:[3,4,13,16,17,18,19,24],hclust:[7,11,20],hdbscan:[2,7,11,18,25],head:[20,22],header:7,heali:25,heat:18,height:11,help:22,henc:[1,2,7,9,11,17,24],hepta:18,here:[5,15,16,17,19,22,24],hierarch:[2,4,8,13,14,15,17,19,20,21,24,25],hierarchi:[2,7,11,15,22,24],high:[16,22,23,24],higher:[10,24],highest:17,highli:[2,7,11,24],hire:5,hnsw:2,hold:[2,3,6,11,13,14],holi:22,hollywood:22,hood:19,hope:22,horizontalalign:[5,21],how:[7,15,19,20,22],howev:[2,7,11,17,19,24],hspace:21,html:25,http:[1,2,4,10,11,15,20,23,25],hubert:[1,9,25],hull:5,human:20,hungari:20,hunt:22,i_dataset:21,iceland:20,ics:25,idea:[2,7,19],ident:[1,9,24],identif:19,identifi:[2,11,14,19,20],ieee:[1,9,25],ierarch:25,ignor:[2,21],iii:22,illustr:[21,22],iloc:22,imbalanc:[2,7,11],implement:[1,2,4,7,10,13,14,15,17,18,19,22,23,24],importantli:24,includ:[2,17],increas:[2,11,15,24],increasingli:[2,3,6,13],independ:[1,2,9],index:[1,2,3,4,6,7,9,11,13,15,16,17,18,20,23],indexthreadqti:2,indic:[1,3,5,13,14,15,16,18,20,23],individu:7,inequ:[0,2,7,8,15],inform:[1,2,4,9,11,13,14,17,18,25],init:2,input:[1,2,7,9,11,13,14,15,20,22,24],ins:[2,4,13,25],insert:6,inspect:17,inspir:5,instal:[2,20],instanc:[2,24],instead:[2,11,14,15],integ:[1,2,4,5,6,9,11,22],intel:24,intellig:25,interact:[15,20],interest:20,interestingli:[16,17],interfac:[7,15],intern:[0,1,5,7,9],intp:[15,19,23],invari:2,ionospher:18,ireland:20,iri:[9,11,14,18],iris5:18,irrespect:24,is_sort:3,ish:15,isin:22,islic:21,isol:18,israel:20,issu:7,istodor:25,itali:20,item:[1,18],iter:2,itertool:21,itm:[17,18,25],its:[1,2,4,5,7,9,11,15,24],itself:[2,4,24],ivoir:20,jaccard_spars:2,jain:[15,18,25],japan:20,jedi:22,jl05:[15,25],jmlr:25,john:22,join:15,joincod:20,joincountrydata2map:20,joss:[2,25],journal:[1,2,9,10,25],jumanji:22,just:[2,11,24],karypi:25,kdd:25,keep:[7,19],kei:1,kernel:[24,25],khk99:[17,25],king:22,kingdom:20,kmean:[9,15,24],kmkm17:[24,25],kneighbors_graph:21,knowledg:[1,2,9,11,14,25],known:[15,17,19],kobren:25,korea:20,kriegel:25,krishnamurthi:25,kruskal:[2,24],kumar:25,kwarg:5,l1_spars:2,l2_spars:2,label:[1,2,5,7,9,14,15,17,19,23],labels0:[15,19,23],labels_:[2,21],labels_geni:[15,19],labels_hdbscan:[15,19],labels_kmean:15,labels_nois:19,labels_pr:23,labels_tru:[15,19,23],labirynth:18,lampert:25,languag:[7,25],lao:20,laplacian:17,laptop:16,larg:[7,16,25],larger:[2,17,21,24],largest:1,larri:22,las:11,lastp:15,latex:[2,25],latter:[2,5,17],latvia:20,law:25,lead:17,leaf:2,learn:[1,2,7,9,10,15,17,21,24,25],least:[2,16,17,19,24],leav:[2,11],lebanon:20,lectur:25,left:[2,3,15,21],len:[5,15,19,21,23],length:[1,2,4,5,6,9],leq:1,less:[2,16,24],lesser:17,let:[1,4,9,15,16,19,20,22,23,24],level:[2,11,24],leven:[2,23],levenshtein:23,lgorithm:25,librari:[2,7,10,11,14,15,20,25],libreria:[3,13],libya:20,licens:7,lie:15,life:22,light:19,like:[2,6,7,10,11,14,15,24],limit:[17,24],lin73:[15,25],line:[5,18],linear:[1,9],linf:2,linf_spars:2,ling:25,link:[7,11,15],linkag:[2,7,11,14,16,17,18,21,24],linkage_matrix:15,linux:24,list:[4,11,15,16,20,21,23,24],lithuania:20,littl:20,live:22,load:[15,19,22],loadtxt:[15,19,23,24],loaf:22,loc:22,locat:[2,6],logic:[10,11,14],lola:22,look:[7,19],low:[2,10,11,14,24],lower:17,lozhnikov:[2,10,25],lstrip:21,lsun:18,luxembourg:20,machin:[1,2,9,10,25],magic:[2,11,15],magnolia:22,mai:[1,2],main:1,make:[2,7,11,14,15],make_blob:21,make_circl:21,make_moon:21,malkov:[2,25],malkovich:22,mallow:[1,9,18,25],manhattan:[2,11,14],mani:[2,15,19],manual:[2,15,20,25],map:[18,22,25],mapcountrydata:20,mapdata:20,maptitl:20,march:[2,10,25],marek:[7,12,20],mariescu:25,mark:[2,11],marker:[5,19],markers:5,master:[2,15,20,23,25],match:[1,7,9,15,25],mathrm:1,matplotlib:[5,15,19,21],matrix:[1,2,5,9,10,11,14,15,20,21,22,23],matter:[1,5,22],mauritania:20,mauritiu:20,max:[1,2,5,6,11,14,16,17,18,21,22],maxim:[1,9,17],maximis:17,maximum:6,mccallum:25,mcinn:25,mcs:15,mcss:19,mean:[1,2,7,16,17,18,19,20,22,24,25],meaning:[7,16,21],measur:[1,3,7,8,9,11,15,18,20,25],median:[16,17,18,24],member:[4,7,20,22],membership:4,memori:[2,6,7,14,24],men:22,menac:22,mentekidi:[2,10,25],mention:[19,23],merg:[2,4,7,11,15],messag:[2,10,11,14,21],meta:22,method:[2,7,11,14,15,17,20,21,24,25],metric:[2,10,11,14,15,23,24,25],mexico:20,mha17:[19,25],mi_scor:[1,9],might:[1,2,6,7,9,11,14,15,17,19,24],million:[7,15,16],min:[1,6,16,17,18],min_cluster_s:[2,11,15,19],min_sampl:19,mind:[15,24],mine:[1,9,25],minimum:[2,5,6,7,8,11,17,19,24,25],minut:16,miss:11,missingcountrycol:20,mixtur:[17,18],mk1:18,mk2:18,mk3:18,mk4:18,mlpack:[2,10,24,25],mlpack_en:[2,24],mlpack_leaf_s:2,mlpack_mst:10,mnist:[18,24],model:25,modul:[0,7,25],monath:25,monti:22,more:[1,2,3,6,7,12,15,17,18,19,20,24],moreov:[1,2,14,17,19,24],most:[11,15,21,24],moulavi:[2,11,14,25],movi:7,movieid:22,movielen:22,mrg10:[24,25],mrk:5,mrk_recycl:5,msnowozinl12:[17,25],mss:19,mst:[2,5,7,8,10,11,20,24,25],mst_from_dist:5,much:[2,15,16,17,24],mul13:[17,24,25],multipl:[1,14,17,25],must:[2,4,5],mutabilita:[3,13],mutual:[1,2,7,9,11,14,18,19],n_cluster:[2,7,15,17,19,21,22,23,24],n_clusters_:2,n_featur:2,n_features_:2,n_init:[17,24],n_neighbor:21,n_sampl:[2,21],n_samples_:2,nacc:1,naidan:[2,25],naiv:4,nake:22,name:[2,14,20,21,22],namecolumntoplot:20,namejoincolumn:20,namibia:20,nan:18,natur:19,naturalresourc:20,nbmn19:[7,24,25],ncl:15,ncol:5,ncs:19,ndarrai:[1,2,3,4,6],ndmin:[15,19,24],nearest:[2,7,11,14,15,16],neat:19,necessarili:[6,16],need:[2,4,24],neg:[1,3,9,13],negdotprod:2,negdotprod_spars:2,neighbour:[2,7,11,14,15,16,22,23,24],neither:4,nest:15,net:25,netherland:20,network:14,nicaragua:20,nice:[15,21,24],night:22,nip:25,nmi:1,nmi_:9,nmrk:5,nmslib:[2,7,16,22,23,24,25],nmslib_n_neighbor:2,nmslib_params_index:[2,23],nmslib_params_init:2,nmslib_params_queri:2,no_label:15,no_structur:21,nois:[2,11,14,15,16,18,20,21,24,25],noisy_circl:21,noisy_moon:21,non:[2,3,13,19,22,25],non_nois:19,nondecreasingli:[4,14],none:[2,5,11,21],nonempti:[1,9],nor:4,normal:[1,9,21,25],normalis:[1,3,4,13,18],normalize_confusion_matrix:1,normalized_accuraci:[1,9],normalized_confusion_matrix:[1,15],normalized_mi_scor:[1,9],normleven:2,north:20,norwai:20,note:[1,2,3,4,5,6,7,9,11,14,15,16,20,21,24,25],noteworthi:16,notion:[2,11,15],novak:[2,25],now:[2,11,19,22,24],nowozin:25,number:[2,3,4,7,11,13,14,15,17,19,20,21],numer:[2,3,10,11,13,14],numpi:[2,6,15,19,21,22,23,24],object:[2,9,10,11,14,15,20,21,22],observ:[1,2,9,14,16,17,22,24],obtain:[2,11,15,19,20,23],occur:11,octob:22,oecd:20,off:5,often:[2,7,11,15],old:[19,22],old_movieid_map:22,oliv:22,ols95:[24,25],olson:[2,14,25],olymp:18,omit:17,omp_num_thread:[2,11,14],onc:[2,5,11,19,24],one:[2,3,5,7,10,11,13,14,15,16,18,19,22,23,24],ones:[2,16,19],onli:[2,5,7,11,15,16,17,20,21,22,24],onto:1,open:[2,7,10,25],oper:4,option:2,order:[2,3,4,6,11,13,20,24],org:[4,10,20,25],organ:25,orient:15,origin:[1,2,7,11,14,15,16,19,21,24],other:[2,3,4,7,10,11,13,14,15,17,18,22,24,25],otherwis:[2,4,11,13,14],our:[2,16,19,22,24],ourselv:[17,20],out:[2,15,20,21,22,24],outcom:[16,17],outlier:[2,4,7,11,13,14,25],outperform:[2,7,11,15,17],output:[1,2,9,10,15,16,17,21],over:[4,10,17],overal:[17,24],own:7,packag:[2,4,5,7,10,15,17,18,19,20,22,23,24],page:[7,25],pair:[1,5,7,9,18,20],pair_sets_index:[1,9,11],pairwis:[1,2,7,8,11,24],palett:20,panama:20,panda:[15,19,22],paolo:[3,13],paper:[10,25],parabol:18,parallel:[2,14,25],parallelis:[2,10,11,14,24],param:21,paramet:[1,2,3,4,5,6,7,11,15,16,17,19,21,24],parameteris:19,parametr:17,parent:4,part:[2,17,22,24],partial:20,particular:[5,13,15,16],partit:[1,2,4,7,8,11,15,17,18,19,20,21,24,25],pass:[2,11,14],path:4,pathbas:18,patriot:22,pattern:25,pch:11,pdf:[2,5,10,25],pdist:2,pedregosa:25,pedrycz:25,penalis:[2,11],peopl:22,perceiv:[3,13],perfect:[3,13,15,17,18],perfectli:7,perform:[2,11,16,18,22,23,24],perhap:17,permut:[1,3,9,13],person:6,personaldevelopmentandhealth:20,pessimist:4,phantom:22,physic:24,pictur:15,pigou:[3,13],pivot:[1,15],pkdd:25,plai:19,plausibl:17,plot:[0,2,7,11,15,19,20,21],plot_num:21,plot_scatt:[5,15,19],plot_seg:5,plt:[5,15,19,21],png:5,point:[2,5,11,14,15,16,17,20,24],poland:20,poli:17,polic:22,policeman:22,pool:24,poor:[3,13],popul:17,popular:15,portug:20,posit:6,possibl:[1,9,15,20],post:[2,23],postprocess:[2,11],power:7,practic:[6,15],precis:[2,11,14,16],precomput:2,predecessor:2,predefin:[2,7,11],predict:[15,16,17,19,21],prefer:[1,6,9],preprocess:[2,18,21],presenc:9,present:18,pretti:5,prevent:[2,7,11],preview:[20,23],previou:[16,24],prim:[2,10,14,24],princess:22,principl:[3,13,25],print:[2,10,11,14,20,22,23,24],probabl:[1,9,25],problem:[1,9,24],proc:[2,10,25],procedur:[2,19,21],process:2,produc:22,product:6,progress:[2,11,14],project:[19,20,22,25],properti:[1,2,5,9,11,25],provid:[2,10,11,17,19,24],psi:[1,9],publish:[2,7],pull:[2,11,14],puriti:[1,9,18],pypi:7,pyplot:[5,15,19,21],python:[7,15,20,22,24,25],python_bind:25,quadrophenia:22,qualiti:[15,17,24],quantifi:[1,2,3,9,13,16,17],question:24,quickli:24,quiroz:[1,9],quit:17,r15:18,rabb:22,rais:[2,11],ram:[2,10,22,25],rand:[1,9,15,16,17,18,20,21,23],rand_scor:[1,9],randn:5,random:[5,6,21],random_st:21,randomli:6,rang:[5,15,16,19],rank:[4,17,18],rate:22,rather:2,raw:[2,11,14,18],rbf:17,reachabl:[2,7,11,14,19],read:[7,18,20,22],read_csv:22,readabl:20,real:[2,9],realli:4,reason:[17,20],recal:[16,24],recognit:25,recommend:[7,15,16,17,24],recomput:[4,24],record:2,recurs:4,red:[5,22],refer:[1,2,3,7,15,16,17,18,19,20,23,24],regard:20,region:15,reimplement:11,rel:7,relat:21,reli:[2,4,15,16,19,22,23],reloc:1,remap:1,remov:[16,18,19,24],rendon:[1,9],rennt:22,repeat:5,replac:19,report:17,repositori:[20,25],repr:22,repres:[1,4,9,14],republ:20,request:[2,14,24],requir:[2,11],research:[1,9,25],resist:[2,4,7,11,13,25],resourc:24,respect:[1,2,5,7,9,11,14,16,18,19,22,24],restart:24,restrict:[17,20],result:[1,2,4,7,9,10,11,15,16,17,19,21,24],rev:11,reveal:19,review:22,rezaei:[1,9,25],rf16:[18,25],rich:[3,13,17],right:[3,21],ring:18,ring_noisi:18,ring_outli:18,rmd:23,robinhood:3,robust:[2,11],robustifi:[2,7,11,15],rocket:22,romania:20,round:[1,3,17],routin:[11,22,23,25],row:[1,2,9,14,18,20,22],run:[2,4,6,11,16,21,22,24],rushmor:22,russia:20,rworldmap:20,safe:24,sai:[2,10,20],sake:15,same:[1,4,5,9,15,17,22,24],sampl:[3,13,17,20,21],sander:[2,11,14,25],scale:[2,16,17,18,20,24],scatter:[5,15,19,21],scheme:6,schur:[3,13],scienc:[2,4,11,13,25],scikit:[7,15,17,21,24,25],scipi:[2,5,15,22],score:[1,3,7,8,11,13,15,17,18,20],script:21,search:[7,16,22,23,24],searchsort:22,seber:[3,13],sec:22,second:[4,24],secret:22,section:[15,16,17,18,24],see:[1,2,4,5,7,9,10,12,15,16,17,18,20,23,24],seed:21,seem:15,seen:16,segment:5,select:[11,14,21],self:[2,25],sens:17,separ:14,sequenc:15,seri:[1,24],set:[1,2,3,4,5,7,9,11,13,14,15,17,18,19,20,21,23,24,25],set_data_structur:4,set_param:24,setenv:14,setquerytimeparam:2,shape:[1,2,4,5,15,19],shave:22,shortest:14,should:[2,11,15,17],shouldn:15,show:[5,15,19,21,22],show_leaf_count:15,shut:22,side:15,sieranoja:25,sight:22,sigkdd:[2,10,25],sigma:[1,3],sigmoid:17,signific:17,sim:15,similar:[1,7,8,11,15,16,17,18,20,22,23],similarli:[1,9],simpl:[7,22],simplic:[2,5,7,11],singl:[2,9,11,16,17,18,21,24,25],sipu:[16,18,24],site:19,six:25,size:[2,3,4,7,11,13,14,15,21,24],sklearn:[15,21,24],sklearn_kmean:24,slightli:24,slovak:20,slovenia:20,slow:[4,14,24],slower:24,small:[1,2,6,7,11,16,22,24],smaller:[4,17,20],smallest:[2,4,6,7,11,15],smell:22,smile:18,smooth:[2,7,11,14],smp:24,societi:20,softwar:[2,10,25],solut:[1,2,9,17],solv:[7,24],som:25,some:[1,2,4,7,9,14,17,18,24],somehow:[2,7,11],someth:22,sometim:[1,2,7,9,17],somewhat:15,somewher:15,sonar:18,sort:[2,3,6,13,14,24],sort_valu:22,soup:22,sourc:[2,7,10,17,25],south:20,space:[2,10,11,14,15,16,24,25],spain:20,span:[2,5,7,8,11,17,19,24,25],spars:[2,7],spatial:[2,5,25],specif:[20,21],spectral:17,spectral_rbf_5:[17,18],speed:15,sphinx:[15,20,23],spinal:22,spiral:18,splendid:7,split:15,spoiler:16,sqrt:[2,4,24],squad:22,squar:[2,18],squareform:2,ssfindex:20,ssi:20,ssi_2016_categori:20,ssize_t:4,stabl:[2,15,17,25],stage:[2,18],standardis:[2,11],standardscal:21,star:22,stat:20,state:20,statist:[6,16,17,18,25],statistica:[3,13],statlog:18,std:[2,16,17,18],stderr:2,step:19,still:[19,24],sting:22,stop:21,store:[2,22,24],stori:22,str:[2,23],strang:15,strike:22,string:[2,7],stripe:18,structur:[2,24],studi:[17,24,25],style:5,subgroup:15,subject:17,submarin:22,suboptim:14,subplot:[15,19,21],subplots_adjust:21,subset:[1,4,9],subtract:15,suggest:[2,17],suit:[1,7,16,17,18,24,25],suitabl:[2,24],sum:[1,6,9],sum_:[3,4],summari:7,summaris:[1,15,18],support:[2,7,22],surpris:15,sustain:20,sweden:20,switzerland:20,symbol:15,synonym:[2,11,14],synthet:24,syst:14,system:[24,25],tabl:[1,9,22],take:[2,3,11,13,16,22,24],taken:2,tap:22,target:18,task:[2,7,14,24],tataacaaccctgattacatcaagctacgctccggtgcgttgcctcggacgagtgctaatccctccccactgactgtattcatcttgacaata:23,tech:14,temporarili:19,tend:[2,17,19],term:15,terrestri:22,test:[11,17],tetra:18,text:[5,21],thailand:20,than:[2,4,16,20,24],thank:[7,24],thei:[2,3,9,13,16,17,22,24],them:[15,19],themself:2,theoret:[1,9,17,25],theori:25,therefor:[2,5,7,11,24],therein:1,thi:[1,2,4,5,11,14,15,16,17,18,19,20,21,22,23,24],thou:22,thousand:15,thread:[2,7,11,14],three:22,threshold:[2,11,15,17],thrown:4,tile:5,time:[2,3,4,6,7,11,13,14,17,20,21],timestamp:22,tini:[2,16,18,24],tipografia:[3,13],titl:[5,15,19,21,22],tkde:[1,25],to_list:4,to_list_norm:4,tocsr:22,todens:22,togeth:[2,11,15],toi:[7,22],tolist:23,tommi:22,too:[2,14,15],tool:[0,2,7],top:[2,21,22,24],total:[2,3,16,18,24],toward:25,tracker:7,traffic:22,trajectori:[16,18],transact:[1,2,9,11,14,25],transax:21,transform:[1,9,21,22],transit:20,translat:[2,24],trapped_lov:18,treat:2,treatment:2,tree:[2,5,7,8,11,15,17,19,20,21,23,24,25],trouser:22,truncate_mod:15,truth:[1,9,17],ttagagcgcttaaccccacaggaaccgagttcccctcatgtggcaaggttctcccgcctcaggtatcacagaaacaaggtatgtagccctaggctacgagc:23,tune:[15,19],tunisia:20,turkei:20,turn:[2,15,21,24],tutori:7,twist:22,two:[1,2,5,9,15,22,24,25],twodiamond:18,twosplash:18,type:[2,6,22],typic:[2,17],ubuntu:24,uci:[18,25],ukrain:20,ult05:[17,25],ultrametr:[2,11],ultsch:25,unadjust:[1,9],unbal:18,under:[7,19],underli:1,undirect:14,unfortun:15,union:4,uniqu:[2,15,19,22,23],unit:20,unless:[2,24],unlik:5,updat:[4,21],url:25,usabl:[2,7,11],use:[2,4,7,10,11,23,24],used:[1,2,3,6,9,11,13,14,15,17,20,23,24],useful:[6,17,19],usefulness:17,user:[2,15,19,22,25],userid:22,userwarn:21,uses:[3,13,24],using:[2,11,14,25],usual:2,v11:25,valid:[1,9,11,17,20,23,25],valu:[1,2,3,4,6,15,21],vari:21,variabilita:[3,13],variabl:[2,11,14,17],varianc:[2,16,18,21,24],variant:[1,9,15,24],variou:[5,17],veb10:[18,25],vector:[1,2,3,4,5,6,9,11,13,17],verbos:[2,10,11,14,20],veri:[2,6,7,10,11,14,23,24],version:[1,2,7,9,11,15,16,17,18,22,24,25],versu:[1,9],vertex:[2,11],vertic:14,via:7,vietnam:20,vinh10a:25,vinh:[1,9,25],violat:[2,11],visibl:24,visual:[2,11,14,25],voronoi:15,wai:[2,5,17,19,22],wait:22,wallac:22,wanda:22,want:11,war:22,ward:[7,17,18,21,24],warn:[2,21],wdbc:18,weav:[15,20],web:20,websit:[21,22],weight:[2,11,14],welcom:7,well:[2,5,14,15,17],wellb:20,wellbalancedsocieti:20,were:[16,18,19,22,24],what:[2,19],whatev:19,when:[2,19],whenev:1,where:[1,2,3,4,5,6,9,11,13,14,16,22],wherea:15,wherev:18,whether:[2,10,11,14],which:[1,2,9,11,14,15,16,17,19,22,24],which_clust:22,whichev:4,white:20,whole:[2,7,11,22],whose:[2,4,6,11],wide:22,wiki:4,wikipedia:4,window:18,wine:18,wingnut:18,wise:18,within:[7,17],won:22,word:15,work:[2,6],workhors:20,workshop:25,worms_2:[18,24],worms_64:[16,18,24],wors:[16,24],worth:[2,11,15,17],would:[15,22],wrapper:1,wrong:22,wspace:21,wut:[16,18],www:[20,25],x86_64:24,x_1:[3,4,13],x_aniso:21,x_i:[3,4,13],x_j:[3,4,13],x_k:4,x_n:[3,13],x_oecd:20,xlim:21,xnn:25,xperienc:25,xtick:21,y_pred:[9,11,20,21],y_test:11,y_true:9,yeast:18,yellow:22,yemen:20,yet:20,yield:[2,3,13,16,22],ylim:[5,21],you:[4,5,11,14],young:22,your:14,ython:25,ytick:21,zealand:20,zenodo:25,zero:22,zhang:[2,10,25],zhong:25,zigzag:18,zigzag_noisi:18,zigzag_outli:18,zimbabw:20,zimek:[2,11,14,25]},titles:["Python Package genieclust Reference","genieclust.compare_partitions","genieclust.Genie","genieclust.inequity","genieclust.internal","genieclust.plots","genieclust.tools","genieclust: Fast and Robust Hierarchical Clustering with Noise Point Detection","R Package genieclust Reference","comparing_partitions: Pairwise Partition Similarity Scores","emst_mlpack: Euclidean Minimum Spanning Tree","gclust: The Genie++ Hierarchical Clustering Algorithm","genieclust-package: The Genie++ Hierarchical Clustering Algorithm (with Extras)","inequity: Inequity (Inequality) Measures","mst: Minimum Spanning Tree of the Pairwise Distance Graph","Basics","Benchmarks \u2014 Approximate Method","Benchmarks (How Good Is It?)","Benchmarks \u2014 Detailed Results","Clustering with Noise Points Detection","R Interface Examples","Comparing Algorithms on Toy Datasets","Example: Sparse Data and Movie Recommendation","Example: String Data and Grouping of DNA","Timings (How Fast Is It?)","References"],titleterms:{"break":15,"function":24,Ice:15,The:[11,12],algorithm:[11,12,21],also:[11,14,25],ami:18,approxim:16,argument:[9,10,11,13,14],author:12,basic:15,benchmark:[16,17,18],cluster:[7,11,12,19],compar:21,compare_partit:1,comparing_partit:9,comparis:19,comparison:15,data:[22,23],dataset:[17,18,21,24],dendrogram:15,descript:[9,10,11,12,13,14],detail:[9,10,11,13,14,18],detect:[7,19],distanc:14,dna:23,emst_mlpack:10,euclidean:10,exampl:[9,11,13,14,20,22,23],extra:12,factor:19,fast:[7,24],further:15,gclust:11,geni:[2,11,12],genieclust:[0,1,2,3,4,5,6,7,8,12],good:17,graph:14,group:23,hdbscan:[15,19],hierarch:[7,11,12],how:[17,24],indic:7,inequ:[3,13],interfac:20,intern:4,larg:[17,18,24],mean:15,measur:13,method:16,minimum:[10,14],movi:22,mst:14,nacc:18,nmi:18,nois:[7,19],number:24,packag:[0,8,12],pairwis:[9,14],partit:9,plot:5,point:[7,19],psi:18,python:0,read:15,recommend:22,refer:[0,8,9,10,11,13,14,25],result:18,robust:7,score:9,see:[11,14,25],similar:9,small:[17,18],smooth:19,span:[10,14],spars:22,string:23,summari:[17,18,24],tabl:7,thread:24,time:24,toi:21,tool:6,tree:[10,14],usag:[9,10,11,13,14],valu:[9,10,11,13,14]}}) \ No newline at end of file +Search.setIndex({docnames:["genieclust","genieclust_compare_partitions","genieclust_genie","genieclust_inequity","genieclust_internal","genieclust_plots","genieclust_tools","index","rapi","rapi/comparing_partitions","rapi/emst_mlpack","rapi/gclust","rapi/genieclust-package","rapi/inequity","rapi/mst","weave/basics","weave/benchmarks_approx","weave/benchmarks_ar","weave/benchmarks_details","weave/noise","weave/r","weave/sklearn_toy_example","weave/sparse","weave/string","weave/timings","z_bibliography"],envversion:{"sphinx.domains.c":2,"sphinx.domains.changeset":1,"sphinx.domains.citation":1,"sphinx.domains.cpp":3,"sphinx.domains.index":1,"sphinx.domains.javascript":2,"sphinx.domains.math":2,"sphinx.domains.python":2,"sphinx.domains.rst":2,"sphinx.domains.std":1,"sphinx.ext.todo":2,"sphinxcontrib.bibtex":4,sphinx:56},filenames:["genieclust.rst","genieclust_compare_partitions.rst","genieclust_genie.rst","genieclust_inequity.rst","genieclust_internal.rst","genieclust_plots.rst","genieclust_tools.rst","index.rst","rapi.rst","rapi/comparing_partitions.rst","rapi/emst_mlpack.rst","rapi/gclust.rst","rapi/genieclust-package.rst","rapi/inequity.rst","rapi/mst.rst","weave/basics.rst","weave/benchmarks_approx.rst","weave/benchmarks_ar.rst","weave/benchmarks_details.rst","weave/noise.rst","weave/r.rst","weave/sklearn_toy_example.rst","weave/sparse.rst","weave/string.rst","weave/timings.rst","z_bibliography.rst"],objects:{"genieclust.Genie":{fit:[2,1,1,""]},"genieclust.compare_partitions":{adjusted_fm_score:[1,3,1,""],adjusted_mi_score:[1,3,1,""],adjusted_rand_score:[1,3,1,""],compare_partitions2:[1,3,1,""],compare_partitions:[1,3,1,""],confusion_matrix:[1,3,1,""],fm_score:[1,3,1,""],mi_score:[1,3,1,""],normalize_confusion_matrix:[1,3,1,""],normalized_accuracy:[1,3,1,""],normalized_confusion_matrix:[1,3,1,""],normalized_mi_score:[1,3,1,""],pair_sets_index:[1,3,1,""],rand_score:[1,3,1,""]},"genieclust.inequity":{bonferroni_index:[3,4,1,""],gini_index:[3,4,1,""]},"genieclust.internal":{DisjointSets:[4,0,1,""],GiniDisjointSets:[4,0,1,""]},"genieclust.internal.DisjointSets":{find:[4,1,1,""],get_k:[4,1,1,""],get_n:[4,1,1,""],to_list:[4,1,1,""],to_list_normalized:[4,1,1,""],to_lists:[4,1,1,""],union:[4,1,1,""]},"genieclust.internal.GiniDisjointSets":{find:[4,1,1,""],get_count:[4,1,1,""],get_counts:[4,1,1,""],get_gini:[4,1,1,""],get_k:[4,1,1,""],get_n:[4,1,1,""],get_smallest_count:[4,1,1,""],to_list:[4,1,1,""],to_list_normalized:[4,1,1,""],to_lists:[4,1,1,""],union:[4,1,1,""]},"genieclust.plots":{plot_scatter:[5,3,1,""],plot_segments:[5,3,1,""]},"genieclust.tools":{argkmin:[6,4,1,""],cummax:[6,4,1,""],cummin:[6,4,1,""]},genieclust:{Genie:[2,0,1,""],compare_partitions:[1,2,0,"-"],inequity:[3,2,0,"-"],internal:[4,2,0,"-"],plots:[5,2,0,"-"],tools:[6,2,0,"-"]}},objnames:{"0":["py","class","Python class"],"1":["py","method","Python method"],"2":["py","module","Python module"],"3":["py","function","Python function"],"4":["py","attribute","Python attribute"]},objtypes:{"0":"py:class","1":"py:method","2":"py:module","3":"py:function","4":"py:attribute"},terms:{"000":[17,24],"000000":20,"00017":[2,25],"001":21,"003":[2,4,13,25],"004013":20,"005":17,"007":6,"00726":[2,25],"0167":[2,25],"021185":20,"025":17,"031":24,"056494":20,"060":6,"061":6,"067901":20,"072":6,"073":6,"074134":20,"074894":20,"075":6,"081801":20,"084":24,"0_approx":16,"100":[5,6,17,24],"1000":24,"10000":[21,24],"100000":24,"1000000":24,"100000000":6,"10029":25,"1007":25,"100836":22,"100d":16,"1016":[2,4,13,25],"102542":20,"10475":22,"105":[17,24],"105000":24,"105539":20,"105600":24,"1058":22,"108":25,"1109":[1,25],"111":24,"1113":22,"1125":22,"113":24,"11346":24,"1145":[2,25],"1197":22,"1211":22,"122":25,"1232":22,"1234":21,"1250":22,"12m":24,"130701":20,"1313":[2,14,25],"132":24,"13239":22,"1325":[2,14,25],"13327":22,"13328":22,"1389":14,"1394":22,"1401":14,"140138":20,"144":22,"148":16,"1486":22,"1487":22,"1500":21,"154":20,"154272":20,"158":24,"159":25,"16021":24,"161":25,"1627":24,"164":25,"1657":24,"168":6,"1691":24,"16th":25,"170":21,"174":16,"1745":24,"1796":22,"1835804":25,"1835882":25,"1912":[3,13],"1914":22,"193":[1,9,25],"1930":[3,13,14],"1933":22,"1957":14,"1960":22,"1964":22,"1965":22,"1967":22,"1968":22,"197":15,"1973":[22,25],"1974":22,"1975":22,"1977":22,"1979":22,"1980":22,"1982":22,"1983":[22,25],"1984":22,"1985":[1,9,22,25],"1986":22,"1987":22,"1988":22,"1989":22,"1990":22,"1991":22,"1992":22,"1993":22,"1995":[2,14,22,25],"1996":[22,25],"1997":22,"1998":22,"1999":[22,25],"1_approx":16,"1st":20,"200":22,"2000":22,"2005":25,"2009":25,"2010":[1,2,9,10,25],"2011":[1,9,25],"2012":25,"2013":25,"2014":24,"2015":[2,11,14,25],"2016":[1,2,4,9,11,13,25],"2017":25,"2018":[2,10,22,25],"2019":[2,25],"202":24,"2020":[22,25],"2036":22,"203906":20,"205":25,"207":25,"2084":22,"2094":22,"2097":22,"21105":[2,25],"212197":20,"217":[24,25],"2173":[1,9,25],"2174":22,"2175":24,"218":[1,9,25],"2186":[1,9,25],"2190":22,"2216":22,"224":22,"225":24,"2259":22,"226":25,"231":25,"2382":22,"23rd":25,"242":24,"2443":22,"255":25,"2551240":[1,25],"2605":22,"264":[16,25],"266":24,"267":24,"268879":20,"2703":22,"27284":22,"2733381":[2,25],"274155":20,"27448":22,"276":15,"277173":20,"2772":22,"27753444":22,"2778":22,"2792":22,"2825":25,"2830":25,"2837":[1,9,25],"2854":[1,9,24,25],"2861":22,"2888":22,"2891":22,"2892":22,"289224":20,"2907":22,"2916":22,"292":16,"2963":22,"299":6,"299537":20,"2997":24,"2fs":21,"2nd":6,"300326":20,"3010":22,"3016":22,"307":16,"3097983":25,"3098079":25,"319":25,"3241080446115835":15,"326":16,"329":6,"332":16,"3341":22,"336496":20,"340152":20,"340636":20,"341":25,"350592":20,"357":24,"363":[2,4,11,13,25],"374348":20,"376":16,"3776":25,"377eb8":21,"3815066":25,"383":25,"388":6,"389867":20,"390":6,"3927":24,"3_approx":[16,24],"3_mlpack":24,"3_nomlpack":24,"403":6,"409":16,"4114":24,"412":24,"414":6,"415":16,"4170":24,"420523":20,"421":24,"434233":20,"436303":20,"4384":24,"4388":24,"4408":24,"445":24,"446943":20,"447":[6,16],"4486":24,"453451":20,"4581":22,"4716":22,"4743":25,"4757":24,"4759":25,"49055":25,"4945":24,"4daf4a":21,"500":22,"50000":24,"500000":24,"505":6,"508130":20,"512709":20,"516":16,"522":25,"5281":25,"531":16,"53889x283228":22,"539498":20,"541081":20,"543":25,"553":25,"555":16,"568":16,"569":25,"590927":20,"593052":20,"594718":20,"5_approx":16,"600":[17,24],"6006":22,"6027":22,"603":[2,10,25],"605769":20,"60ghz":24,"611":[2,10],"612":25,"621681":20,"624":16,"624147":20,"627805":20,"630009":20,"634251":20,"639":6,"662674":20,"663252":20,"6698":22,"673":6,"692808":20,"70000":24,"708":22,"715":24,"719":[16,24],"726":[2,10,25],"728":16,"731":16,"732":22,"734":16,"753476":20,"755":16,"759396":20,"7708":24,"778":24,"781637":25,"784":24,"794":24,"7_19":25,"7_approx":16,"817850":20,"819":22,"8191":[2,25],"820":22,"827154":20,"829620":20,"831955":20,"836":22,"839":22,"844":16,"850":22,"854317":20,"863":22,"868176":20,"886885":20,"895167":20,"898":22,"898812":20,"899":22,"911":22,"921":22,"931156":20,"934":22,"9352814722212013":23,"955":22,"959609":20,"964":22,"964981247":22,"964982224":22,"964982703":22,"964982931":22,"964983815":22,"969":22,"9724x610":22,"972848":20,"9750h":24,"977":22,"978":25,"984ea3":21,"987":22,"992649":20,"999999":21,"\u03c3":13,"bor\u016fvka":10,"break":[7,24],"c_\u03c3":9,"case":[2,4,5,11,14,16,18,24],"catch":21,"char":20,"class":[0,2,4,10,11,14,15,22],"default":[2,11,14,15,17,19,20,24],"final":20,"float":[2,6,11,14],"fr\u00e4nti":25,"function":[1,4,5,6,7,9,15],"import":[5,7,15,19,21,22,23,24],"int":[2,5,6,21,22],"jarn\u00edk":[2,14,24],"jist\u00e9m":14,"m\u00fcller":25,"m\u00fcllner":25,"minim\u00e1ln\u00edm":14,"moravsk\u00e9":14,"new":[2,4,7,11,13,19,20,22,25],"null":9,"p\u0159\u00edrodov\u011bdeck\u00e9":14,"pr\u00e1ce":14,"probl\u00e9mu":14,"return":[1,2,3,4,6,11,19,22],"spole\u010dnosti":14,"switch":19,"true":[2,11,14,15,19,23,24],"try":[2,11,17],And:22,Being:22,Eqs:[1,9],Eyes:22,For:[2,3,4,10,13,15,16,17,19,20,24],IDs:[4,22],Ice:7,Its:[2,7,11,15],One:[2,3],Sys:14,The:[1,2,3,4,5,6,7,8,13,14,15,16,17,19,20,21,22,23,24,25],Then:[7,18,21,22],There:21,These:[3,9,13],Use:11,a65628:21,aardman:22,abil:14,abl:[2,7,11,15],about:24,abov:[2,11,15,18,22],abridg:22,abundez:[1,9],accept:[1,2,14],access:10,accord:[2,11],accuraci:[1,9,18],achin:25,acm:[2,10,11,14,25],across:16,act:[2,7,11],actg1:23,actual:[1,2],adapt:7,added:[16,18,24],adding:2,addition:2,adjac:[2,11],adjust:[1,9,15,16,17,18,20,23],adjusted_fm_scor:[1,9],adjusted_mi_scor:[1,9],adjusted_rand_scor:[1,9,11,15,23],affect:[2,15,17],affin:[2,17,22,23],afm:1,after:[2,7],again:[16,19],against:[15,17,24],agglom:[15,17,24,25],agglomerativeclust:21,aggreg:[17,18,20],agpl:7,agreement:[1,9,17,18],aim:1,airplan:22,albania:20,albeit:[2,24],alert:16,algeria:20,algo_param:21,algorithm:[1,2,3,4,7,8,10,13,14,15,16,17,18,19,22,24,25],all:[2,3,4,5,11,13,14,16,17,24],alloc:20,allow:[4,7,17,19,23,24],almost:[6,22,24],alongsid:17,alpha:19,alreadi:3,also:[1,7,9,15,17,19,20,21,22,23,24],altern:[2,11,14,24],although:16,altogeth:16,alwai:[1,4,5,9],american:25,ami:1,ami_:9,amongst:[2,3,11,13,15,24],amuel:25,analysi:[2,10,14,25],analyz:22,angola:20,angulardist:2,angulardist_spars:2,ani:[2,5,7,19,24],animatio:22,aniso:21,anisotrop:21,anoth:[7,15],anywai:2,api:[7,15,18,25],appeal:[2,7,11],appendix:[7,17],appli:[1,2,11,15,17,19,24,25],applic:[2,3,10,13,18,25],approach:[2,7,11,25],approxim:[2,7,22,24],arabi:[1,9,25],arbitrari:[2,11],archiv:25,argentina:20,argkmin:6,argmin:6,argsort:6,argu:2,argument:[2,5],ariant:25,arithmet:[11,14],arizmendi:[1,9],armenia:20,around:1,arrai:[1,2,4,6,15,21],array_lik:[1,5],art:[22,25],ascend:6,ascii:2,ask:19,asp:11,assign:[1,3,5,9,13,15,23],associ:25,assum:2,assumpt:4,assur:2,ast:25,astel:25,astyp:21,atgtctccaaagcgtgaccttctagacccgagacgacatatggaggcttggagccgtacctgtgtgaggaaactgtagtacccaaagctattca:23,atom:18,attribut:[2,14],augment:4,australia:20,austria:20,auto:[2,24],automat:24,avail:[2,7,17,20,24],averag:[7,17,18,20,21],avoid:21,awai:[2,3,11,13,14],axi:[2,5,15,19],back:[15,22],bailei:[1,9,25],ball:22,bartoszuk:[2,4,11,13,25],base:[1,2,9,10,11,17,18,20,22,23,24,25],basic:[7,20],basicne:20,basket:22,batteri:[16,17],becom:[2,24],been:[18,24],behav:16,behind:7,being:[2,4,11,14],belgium:20,bell:14,belong:15,below:[1,2,9,17,20,21],benchmark:[1,2,7,11,15,20,23,24,25],best:[2,11,17,18,22],better:[16,17,20],between:[1,2,6,9,11,14,15,16,17,18,19,22,23],beyond:15,bf01908075:25,biject:[1,9],birch1:18,birch2:[16,18],birch:[7,17],birch_0:[17,18],bit:[2,11,14,16,18,24],bit_ham:2,bit_jaccard:2,black:5,blackadd:22,blob:[2,21,24,25],blue:[5,22],boi:22,bolivia:20,bologna:[3,13],bonferroni:[3,13],bonferroni_index:[3,13],book:20,bool:[2,3],both:[1,2,3,9,13],bottl:22,bottom:21,bound:[1,9],boundari:[2,11,14],bowfing:22,bowl:22,box:21,boxplot:17,boytsov:[2,25],branching_factor:17,brian:22,bride:22,brother:22,buitinck:25,c_contigu:1,cach:24,call:[1,2,4,5,11,20,22,24],campello:[2,11,14,25],can:[1,2,3,5,7,9,11,13,14,15,19,20,23,24],canada:20,cannot:15,cardin:[2,4,24],care:2,carol:22,cast:2,cast_float32:[2,11,14,20,23],catch_warn:21,categor:20,categori:[20,21],catmethod:20,ceil:5,cel:[24,25],cell:22,cena:[2,4,11,13,25],center:5,centr:[2,16,18,24],centroid:[17,18,24],chainlink:18,chameleon:25,chameleon_t4_8k:18,chameleon_t5_8k:18,chameleon_t7_10k:18,chameleon_t8_8k:18,chanc:[1,9,25],chang:[1,2,17,24],charact:23,characterist:21,check:20,children_:[2,15],chile:20,choic:24,choos:[2,11],chose:16,chosen:[2,11,14],christma:22,circl:18,cityblock:[2,11,14],classic:[2,11],classif:[1,9,25],classifi:19,clearli:24,climateandenergi:20,close:22,closer:19,closest:[7,15],cluster:[1,2,3,4,8,9,13,14,15,16,17,18,20,21,22,23,24,25],cluster_std:21,clustering_algorithm:21,clustering_benchmarks_v1:[1,11,25],clusteringtheori:25,cmzs15:[7,15,19,25],coarser:[2,19],coarsest:2,code:7,coercibl:[2,9,10,11,14],coffe:[7,24],col:[5,11],collect:5,colombia:20,color:[5,20,21],colourpalett:20,column:[1,2,5,9,10,11,14,18,20],column_stack:15,com:[1,2,11,15,20,23,25],come:[1,15,23],comfort:22,comment:20,commun:[1,9],compar:[1,7,9,15,24,25],compare_partit:[0,7,15,18,23],compare_partitions2:1,comparing_partit:[7,8],comparis:7,comparison:[1,7,9,25],compat:[7,11,15,20,24],complet:[7,14,16,17,18,21,24],completel:22,complex:[2,3,13,14,24],compon:[2,21],compound:18,compress:[4,22],comput:[1,2,3,4,9,11,14,15,16,20,24,25],compute_all_cut:2,compute_full_tre:[2,15],conduct:2,confer:25,confus:[1,9,15],confusion_matrix:1,connect:[2,14,21],consecut:[22,24],consid:[16,17,20,22,24],constant:[3,13],constitut:2,construct:2,consum:[2,11],contain:4,conting:1,contrari:[2,19],contrib:25,contribut:7,control:[2,11,14,19],convers:22,convert:23,convex:[3,5,13,15],convexhul:5,coordin:[2,5,24],copi:21,core:[2,7,11,24],correct:[1,2,9,11,25],correspond:[1,2,5,11,14,15,16,19],cosin:[2,11,14,22],cosinesimil:2,cosinesimil_spars:[2,22],cost:[2,4],cote:20,count:[15,16,17,18],countri:20,counts_:[2,15],cours:[15,19,24],cpu:24,cran:[7,20],creat:[2,21],createindex:2,creatur:22,cross:18,crucial:24,cry:22,csr:22,csr_matrix:2,csv:[20,22],cummax:6,cummin:[2,6,11],cumprod:6,cumsum:6,cumul:6,cuppini:[3,13],current:4,curs:[22,24],curtin:[2,10,25],cut:2,cutre:[7,11,20],cycl:21,czech:20,d31:18,d_m:19,dai:22,dalton:[3,13],danifold:25,dasgupta:25,data:[1,2,3,6,7,9,10,11,13,14,15,19,20,21,24,25],data_typ:2,databas:[22,25],dataset:[1,2,7,9,11,14,15,16,19,20,22,23,25],datatyp:2,dbscan:[2,7,11,15],ddof:2,decim:[2,17],decreas:[2,3,13],dede00:21,default_bas:21,defin:[1,5,9,14,17],definit:[1,9,11,15,22],degrad:24,degre:23,demand:15,demonstr:[16,24],dendrogram:[2,7,11,20],denmark:20,denot:[2,4,11,15,17,18,19],dens:[1,2,18,22],densiti:[2,11,14,25],departur:11,depend:[2,7,11,24],depict:20,descend:6,describ:2,descript:[2,16,17],design:[4,25],desir:[11,17,20],detail:[1,2,7,10,12,15,17,20],detect:[2,11,14,20,24,25],detect_nois:11,detector:[2,7,11],determin:[1,2,7,14,22,24],devel:[15,20,23],dg19:[17,25],diagnost:[2,10,11,14],diagon:1,diagram:15,dict:[1,2,23],dictionari:[1,2],did:19,differ:[11,16,17,19,21,24],difficult:7,digit:[2,16,17,18,24],dijkstra:[2,14,24],dilemma:25,dimension:[2,10,11,14,16,24],dimnam:20,directli:20,disabl:[2,11,19],disconnect:2,discov:[15,25],discoveri:[2,11,14,25],discrep:16,discuss:[17,24],disjoint:[1,4,5,9],disjointset:4,dispers:[3,13],dissimilar:2,dist:[11,14,20],distanc:[2,7,8,11,16,18,19,20,23,24],distances_:[2,15],distinct:5,distinguish:2,distribut:[2,4,7,11,17,21],dn09:[17,25],dna:7,document:[7,15,18,20],doe:[2,11,16,24],doesn:7,doi:[1,2,4,13,25],dok_matrix:22,domain:23,don:[20,22],done:24,dot:[3,4,21],doubl:[1,3,6],down:2,download:7,draw:5,drawn:5,dtype:[2,15,19,22,23],dua:25,dual:10,duck:22,due:[1,9],dure:[2,4,24],dynam:25,e41a1c:21,each:[1,2,4,5,7,11,14,16,17,18,19,20,24],eagerli:19,earli:21,easier:21,easili:[7,15,19,24],ecml:25,ecoli:18,econom:[3,13,15,20],economi:20,edel:[2,10,25],edg:[2,11,14],edit:23,edu:25,effect:[2,11,19,24],effici:[20,24],either:[2,5,14],eksx96:[15,25],elaps:24,elect:22,element:[1,2,3,4,6,9,11,13,22],elementi:[3,13],els:21,empir:[17,22],emst:[2,10,24],emst_mlpack:[7,8,11,14],enabl:2,engin:25,engytim:18,enough:15,enumer:21,environ:[2,7,11,14],environment:20,episod:22,epp:[1,9,25],eps:[2,7,11,15],equal:[3,5,6,13,15,17,19],equip:15,equiti:[3,13],equival:[2,5],esp:9,especi:1,ester:25,estim:[2,11,14,25],estonia:20,etc:20,ethiopia:20,euclidean:[2,5,7,8,11,14,16,18,19,20,24,25],evalu:17,even:[2,3,7,19,24],everi:[1,9,18],everyth:20,evidenc:24,exact:[2,16,22,23,24],exactli:2,exampl:[1,3,5,6,7,15,19,21],excel:19,except:[1,4,9,16,20,24],exercis:22,exhal:22,expect:[1,5,9,17],experiment:25,expert:[15,19,23],explicitli:[11,17,19],extern:[1,7,9,11,20,23,25],extra:[7,8,22],extract:[20,22,24],extrem:[7,24,25],f781bf:21,factor:[2,7,11,14,21],fail:[2,17],fals:[2,3,10,11,14,15,16,22,23,24],familiar:7,famou:22,far:15,fashion:[18,24],fast:[2,4,5,6,10,11,13,14,16,19,25],fastclust:[17,24,25],fastcluster_centroid:24,fastcluster_median:24,fastcluster_ward:24,faster:[2,7,11,14,16,20,23,24],fastest:[21,24],father:22,fcp:18,fear:22,featur:[2,10,11,14,15,16,18,19,20,22,24],feed:20,feel:[7,19],few:[1,2,15,17,20,22],ff7f00:21,fidel:22,figsiz:21,figur:21,file:[14,22],film:22,filterwarn:21,find:[4,6,7,19],fine:2,finer:19,finland:20,fire:16,firenz:[3,13],first:[4,5,7,11,15,19,21,22,24],fish:22,fit:[2,7,15,17,21,22,24],fit_predict:[7,15,19,22,23],fit_transform:21,fix:5,flame:18,flexibl:[2,10,25],float32:[2,22],fly:14,flynt:22,fm83:[18,25],fm_score:[1,9],fmiz16:[17,25],follow:[1,3,13,15],forc:[2,11],forest:[2,24],forget:20,form:[2,7,22],formal:2,format:[2,7,11,22],former:17,forth:22,forthcom:20,fortun:15,found:[2,19],fowlk:[1,9,18,25],frac:[3,4,13],frame:[10,11,14,20,22],franc:20,frankenstein:22,franti:[1,9],friendli:15,from:[1,2,3,5,7,9,10,11,13,14,15,16,17,18,19,21,22,24,25],fs18:[17,25],full:22,further:[5,7,11,14,24],furthermor:2,futur:22,fuzzi:25,fuzzyx:18,g2mg:[16,17],gacaattatcgcggctttcgccatgcagagtctcgtacaatttgtttcacgcccaatattttccgtgcttcgcgagctaggcagccagggcatttttgga:23,gagolew:[1,11,15,20,23,25],gagolewski:[2,4,7,11,12,13,25],gain:14,game:[21,22],gamma:17,gaussian:[2,16,17,18,24],gbc16:[7,15,17,19,23,25],gca:21,gcaattgaagtccagatctaggtatcgtccaagcatattgcctttaagaaatatatttgaccctgtctcttcgtggaggtacacgtcacggaatcgtaagatttccttgg:23,gclust:[7,8,14,20],gener:[1,2,4,6,11,15,16,17,21,24],general:[3,13],generalis:14,geni:[0,3,4,7,8,13,14,15,16,17,19,20,21,22,23,24,25],genie_0:[16,17,18,24],genie_1:16,genieclust:[15,16,17,18,19,20,21,22,23,24],geq:3,german:25,germani:20,get:[4,15,17,19,22],get_count:4,get_gini:4,get_k:4,get_n:4,get_smallest_count:4,ghaisa:[2,10,25],ghana:20,gini:[2,3,4,11,13,15],gini_index:[3,11,13],gini_threshold:[2,11,15,16,17,19,20,24],ginidisjointset:4,github:[1,2,7,11,15,20,23,25],give:[1,2,3,5,9,11,13,14,15,17,20,23,24],given:[1,2,3,4,9,11,13,14,15,22,24],glanc:15,glass:18,glust:20,gnu:[7,24],goal:19,goe:[2,7,11],good:[2,7,16,19,24],gp10:[17,25],graff:25,grai:[2,10,15,25],grail:22,grain:2,grand:22,granular:[15,19],graph:[2,7,8,11,18,24,25],graphic:[5,15],grave:[18,25],greater:[2,20,24],greec:20,green:5,grei:19,grid:17,gromit:22,ground:[1,9,17],groundhog:22,group:[2,7,11,15,18,20],grumpier:22,guarante:2,guess:15,guffman:22,gun:22,h2mg:[16,17],h_oecd:20,ha85:[17,18,25],han:25,hand:[2,7,11,15,24],handi:1,handl:22,happen:15,hard:[15,22],has:[2,3,7,13,18,20,24],hasattr:21,have:[3,4,13,16,17,18,19,24],hclust:[7,11,20],hdbscan:[2,7,11,18,25],head:[20,22],header:7,heali:25,heat:18,height:11,help:22,henc:[1,2,7,9,11,17,24],hepta:18,here:[5,15,16,17,19,22,24],hierarch:[2,4,8,13,14,15,17,19,20,21,24,25],hierarchi:[2,7,11,15,22,24],high:[16,22,23,24],higher:[10,24],highest:17,highli:[2,7,11,24],hire:5,hnsw:2,hold:[2,3,6,11,13,14],holi:22,hollywood:22,hood:19,hope:22,horizontalalign:[5,21],how:[7,15,19,20,22],howev:[2,7,11,17,19,24],hspace:21,html:25,http:[1,2,4,10,11,15,20,23,25],hubert:[1,9,25],hull:5,human:20,hungari:20,hunt:22,i_dataset:21,iceland:20,ics:25,idea:[2,7,19],ident:[1,9,24],identif:19,identifi:[2,11,14,19,20],ieee:[1,9,25],ierarch:25,ignor:[2,21],iii:22,illustr:[21,22],iloc:22,imbalanc:[2,7,11],implement:[1,2,4,7,10,13,14,15,17,18,19,22,23,24],importantli:24,includ:[2,17],increas:[2,11,15,24],increasingli:[2,3,6,13],independ:[1,2,9],index:[1,2,3,4,6,7,9,11,13,15,16,17,18,20,23],indexthreadqti:2,indic:[1,3,5,13,14,15,16,18,20,23],individu:7,inequ:[0,2,7,8,15],inform:[1,2,4,9,11,13,14,17,18,25],init:2,input:[1,2,7,9,11,13,14,15,20,22,24],ins:[2,4,13,25],insert:6,inspect:17,inspir:5,instal:[2,20],instanc:[2,24],instead:[2,11,14,15],integ:[1,2,4,5,6,9,11,22],intel:24,intellig:25,interact:[15,20],interest:20,interestingli:[16,17],interfac:[7,15],intern:[0,1,5,7,9],intp:[15,19,23],invari:2,ionospher:18,ireland:20,iri:[9,11,14,18],iris5:18,irrespect:24,is_sort:3,ish:15,isin:22,islic:21,isol:18,israel:20,issu:7,istodor:25,itali:20,item:[1,18],iter:2,itertool:21,itm:[17,18,25],its:[1,2,4,5,7,9,11,15,24],itself:[2,4,24],ivoir:20,jaccard_spars:2,jain:[15,18,25],japan:20,jedi:22,jl05:[15,25],jmlr:25,john:22,join:15,joincod:20,joincountrydata2map:20,joss:[2,25],journal:[1,2,9,10,25],jumanji:22,just:[2,11,24],karypi:25,kdd:25,keep:[7,19],kei:1,kernel:[24,25],khk99:[17,25],king:22,kingdom:20,kmean:[9,15,24],kmkm17:[24,25],kneighbors_graph:21,knowledg:[1,2,9,11,14,25],known:[15,17,19],kobren:25,korea:20,kriegel:25,krishnamurthi:25,kruskal:[2,24],kumar:25,kwarg:5,l1_spars:2,l2_spars:2,label:[1,2,5,7,9,14,15,17,19,23],labels0:[15,19,23],labels_:[2,21],labels_geni:[15,19],labels_hdbscan:[15,19],labels_kmean:15,labels_nois:19,labels_pr:23,labels_tru:[15,19,23],labirynth:18,lampert:25,languag:[7,25],lao:20,laplacian:17,laptop:16,larg:[7,16,25],larger:[2,17,21,24],largest:1,larri:22,las:11,lastp:15,latex:[2,25],latter:[2,5,17],latvia:20,law:25,lead:17,leaf:2,learn:[1,2,7,9,10,15,17,21,24,25],least:[2,16,17,19,24],leav:[2,11],lebanon:20,lectur:25,left:[2,3,15,21],len:[5,15,19,21,23],length:[1,2,4,5,6,9],leq:1,less:[2,16,24],lesser:17,let:[1,4,9,15,16,19,20,22,23,24],level:[2,11,24],leven:[2,23],levenshtein:23,lgorithm:25,librari:[2,7,10,11,14,15,20,25],libreria:[3,13],libya:20,licens:7,lie:15,life:22,light:19,like:[2,6,7,10,11,14,15,24],limit:[17,24],lin73:[15,25],line:[5,18],linear:[1,9],linf:2,linf_spars:2,ling:25,link:[7,11,15],linkag:[2,7,11,14,16,17,18,21,24],linkage_matrix:15,linux:24,list:[4,11,15,16,20,21,23,24],lithuania:20,littl:20,live:22,load:[15,19,22],loadtxt:[15,19,23,24],loaf:22,loc:22,locat:[2,6],logic:[10,11,14],lola:22,look:[7,19],low:[2,10,11,14,24],lower:17,lozhnikov:[2,10,25],lstrip:21,lsun:18,luxembourg:20,machin:[1,2,9,10,25],magic:[2,11,15],magnolia:22,mai:[1,2],main:1,make:[2,7,11,14,15],make_blob:21,make_circl:21,make_moon:21,malkov:[2,25],malkovich:22,mallow:[1,9,18,25],manhattan:[2,11,14],mani:[2,15,19],manual:[2,15,20,25],map:[18,22,25],mapcountrydata:20,mapdata:20,maptitl:20,march:[2,10,25],marek:[7,12,20],mariescu:25,mark:[2,11],marker:[5,19],markers:5,master:[2,15,20,23,25],match:[1,7,9,15,25],mathrm:1,matplotlib:[5,15,19,21],matrix:[1,2,5,9,10,11,14,15,20,21,22,23],matter:[1,5,22],mauritania:20,mauritiu:20,max:[1,2,5,6,11,14,16,17,18,21,22],maxim:[1,9,17],maximis:17,maximum:6,mccallum:25,mcinn:25,mcs:15,mcss:19,mean:[1,2,7,16,17,18,19,20,22,24,25],meaning:[7,16,21],measur:[1,3,7,8,9,11,15,18,20,25],median:[16,17,18,24],member:[4,7,20,22],membership:4,memori:[2,6,7,14,24],men:22,menac:22,mentekidi:[2,10,25],mention:[19,23],merg:[2,4,7,11,15],messag:[2,10,11,14,21],meta:22,method:[2,7,11,14,15,17,20,21,24,25],metric:[2,10,11,14,15,23,24,25],mexico:20,mha17:[19,25],mi_scor:[1,9],might:[1,2,6,7,9,11,14,15,17,19,24],million:[7,15,16],min:[1,6,16,17,18],min_cluster_s:[2,11,15,19],min_sampl:19,mind:[15,24],mine:[1,9,25],minimum:[2,5,6,7,8,11,17,19,24,25],minut:16,miss:11,missingcountrycol:20,mixtur:[17,18],mk1:18,mk2:18,mk3:18,mk4:18,mlpack:[2,10,24,25],mlpack_en:[2,24],mlpack_leaf_s:2,mnist:[18,24],model:25,modul:[0,7,25],monath:25,monti:22,more:[1,2,3,6,7,12,15,17,18,19,20,24],moreov:[1,2,14,17,19,24],most:[11,15,21,24],moulavi:[2,11,14,25],movi:7,movieid:22,movielen:22,mrg10:[24,25],mrk:5,mrk_recycl:5,msnowozinl12:[17,25],mss:19,mst:[2,5,7,8,10,11,20,24,25],mst_from_dist:5,much:[2,15,16,17,24],mul13:[17,24,25],multipl:[1,14,17,25],must:[2,4,5],mutabilita:[3,13],mutual:[1,2,7,9,11,14,18,19],n_cluster:[2,7,15,17,19,21,22,23,24],n_clusters_:2,n_featur:2,n_features_:2,n_init:[17,24],n_neighbor:21,n_sampl:[2,21],n_samples_:2,nacc:1,naidan:[2,25],naiv:4,nake:22,name:[2,14,20,21,22],namecolumntoplot:20,namejoincolumn:20,namibia:20,nan:18,natur:19,naturalresourc:20,nbmn19:[7,24,25],ncl:15,ncol:5,ncs:19,ndarrai:[1,2,3,4,6],ndmin:[15,19,24],nearest:[2,7,11,14,15,16],neat:19,necessarili:[6,16],need:[2,4,24],neg:[1,3,9,13],negdotprod:2,negdotprod_spars:2,neighbour:[2,7,11,14,15,16,22,23,24],neither:4,nest:15,net:25,netherland:20,network:14,nicaragua:20,nice:[15,21,24],night:22,nip:25,nmi:1,nmi_:9,nmrk:5,nmslib:[2,7,16,22,23,24,25],nmslib_n_neighbor:2,nmslib_params_index:[2,23],nmslib_params_init:2,nmslib_params_queri:2,no_label:15,no_structur:21,nois:[2,11,14,15,16,18,20,21,24,25],noisy_circl:21,noisy_moon:21,non:[2,3,13,19,22,25],non_nois:19,nondecreasingli:[4,14],none:[2,5,11,21],nonempti:[1,9],nor:4,normal:[1,9,21,25],normalis:[1,3,4,13,18],normalize_confusion_matrix:1,normalized_accuraci:[1,9],normalized_confusion_matrix:[1,15],normalized_mi_scor:[1,9],normleven:2,north:20,norwai:20,note:[1,2,3,4,5,6,7,9,11,14,15,16,20,21,24,25],noteworthi:16,notion:[2,11,15],novak:[2,25],now:[2,11,19,22,24],nowozin:25,number:[2,3,4,7,11,13,14,15,17,19,20,21],numer:[2,3,10,11,13,14],numpi:[2,6,15,19,21,22,23,24],object:[2,9,10,11,14,15,20,21,22],observ:[1,2,9,14,16,17,22,24],obtain:[2,11,15,19,20,23],occur:11,octob:22,oecd:20,off:5,often:[2,7,11,15],old:[19,22],old_movieid_map:22,oliv:22,ols95:[24,25],olson:[2,14,25],olymp:18,omit:17,omp_num_thread:[2,11,14],onc:[2,5,11,19,24],one:[2,3,5,7,10,11,13,14,15,16,18,19,22,23,24],ones:[2,16,19],onli:[2,5,7,11,15,16,17,20,21,22,24],onto:1,open:[2,7,10,25],oper:4,option:2,order:[2,3,4,6,11,13,20,24],org:[4,10,20,25],organ:25,orient:15,origin:[1,2,7,11,14,15,16,19,21,24],other:[2,3,4,7,10,11,13,14,15,17,18,22,24,25],otherwis:[2,4,11,13,14],our:[2,16,19,22,24],ourselv:[17,20],out:[2,15,20,21,22,24],outcom:[16,17],outlier:[2,4,7,11,13,14,25],outperform:[2,7,11,15,17],output:[1,2,9,15,16,17,21],over:[4,10,17],overal:[17,24],own:7,packag:[2,4,5,7,15,17,18,19,20,22,23,24],page:[7,25],pair:[1,5,7,9,18,20],pair_sets_index:[1,9,11],pairwis:[1,2,7,8,11,24],palett:20,panama:20,panda:[15,19,22],paolo:[3,13],paper:[10,25],parabol:18,parallel:[2,14,25],parallelis:[2,10,11,14,24],param:21,paramet:[1,2,3,4,5,6,7,11,15,16,17,19,21,24],parameteris:19,parametr:17,parent:4,part:[2,17,22,24],partial:20,particular:[5,13,15,16],partit:[1,2,4,7,8,11,15,17,18,19,20,21,24,25],pass:[2,11,14],path:4,pathbas:18,patriot:22,pattern:25,pch:11,pdf:[2,5,10,25],pdist:2,pedregosa:25,pedrycz:25,penalis:[2,11],peopl:22,perceiv:[3,13],perfect:[3,13,15,17,18],perfectli:7,perform:[2,11,16,18,22,23,24],perhap:17,permut:[1,3,9,13],person:6,personaldevelopmentandhealth:20,pessimist:4,phantom:22,physic:24,pictur:15,pigou:[3,13],pivot:[1,15],pkdd:25,plai:19,plausibl:17,plot:[0,2,7,11,15,19,20,21],plot_num:21,plot_scatt:[5,15,19],plot_seg:5,plt:[5,15,19,21],png:5,point:[2,5,11,14,15,16,17,20,24],poland:20,poli:17,polic:22,policeman:22,pool:24,poor:[3,13],popul:17,popular:15,portug:20,posit:6,possibl:[1,9,15,20],post:[2,23],postprocess:[2,11],power:7,practic:[6,15],precis:[2,11,14,16],precomput:2,predecessor:2,predefin:[2,7,11],predict:[15,16,17,19,21],prefer:[1,6,9],preprocess:[2,18,21],presenc:9,present:18,pretti:5,prevent:[2,7,11],preview:[20,23],previou:[16,24],prim:[2,10,14,24],princess:22,principl:[3,13,25],print:[2,10,11,14,20,22,23,24],probabl:[1,9,25],problem:[1,9,24],proc:[2,10,25],procedur:[2,19,21],process:2,produc:22,product:6,progress:[2,11,14],project:[19,20,22,25],properti:[1,2,5,9,11,25],provid:[2,10,11,17,19,24],psi:[1,9],publish:[2,7],pull:[2,11,14],puriti:[1,9,18],pypi:7,pyplot:[5,15,19,21],python:[7,15,20,22,24,25],python_bind:25,quadrophenia:22,qualiti:[15,17,24],quantifi:[1,2,3,9,13,16,17],question:24,quickli:24,quiroz:[1,9],quit:17,r15:18,rabb:22,rais:[2,11],ram:[2,10,22,25],rand:[1,9,15,16,17,18,20,21,23],rand_scor:[1,9],randn:5,random:[5,6,21],random_st:21,randomli:6,rang:[5,15,16,19],rank:[4,17,18],rate:22,rather:2,raw:[2,11,14,18],rbf:17,reachabl:[2,7,11,14,19],read:[7,18,20,22],read_csv:22,readabl:20,real:[2,9],realli:4,reason:[17,20],recal:[16,24],recognit:25,recommend:[7,15,16,17,24],recomput:[4,24],record:2,recurs:4,red:[5,22],refer:[1,2,3,7,15,16,17,18,19,20,23,24],regard:20,region:15,reimplement:11,rel:7,relat:21,reli:[2,4,15,16,19,22,23],reloc:1,remap:1,remov:[16,18,19,24],rendon:[1,9],rennt:22,repeat:5,replac:19,report:17,repositori:[20,25],repr:22,repres:[1,4,9,14],republ:20,request:[2,14,24],requir:2,research:[1,9,25],resist:[2,4,7,11,13,25],resourc:24,respect:[1,2,5,7,9,11,14,16,18,19,22,24],restart:24,restrict:[17,20],result:[1,2,4,7,9,11,15,16,17,19,21,24],rev:11,reveal:19,review:22,rezaei:[1,9,25],rf16:[18,25],rich:[3,13,17],right:[3,21],ring:18,ring_noisi:18,ring_outli:18,rmd:23,robinhood:3,robust:[2,11],robustifi:[2,7,11,15],rocket:22,romania:20,round:[1,3,17],routin:[11,22,23,25],row:[1,2,9,14,18,20,22],run:[2,4,6,11,16,21,22,24],rushmor:22,russia:20,rworldmap:20,safe:24,sai:[2,10,20],sake:15,same:[1,4,5,9,15,17,22,24],sampl:[3,13,17,20,21],sander:[2,11,14,25],scale:[2,16,17,18,20,24],scatter:[5,15,19,21],scheme:6,schur:[3,13],scienc:[2,4,11,13,25],scikit:[7,15,17,21,24,25],scipi:[2,5,15,22],score:[1,3,7,8,11,13,15,17,18,20],script:21,search:[7,16,22,23,24],searchsort:22,seber:[3,13],sec:22,second:[4,24],secret:22,section:[15,16,17,18,24],see:[1,2,4,5,7,9,10,12,15,16,17,18,20,23,24],seed:21,seem:15,seen:16,segment:5,select:[11,14,21],self:[2,25],sens:17,separ:14,sequenc:15,seri:[1,24],set:[1,2,3,4,5,7,9,11,13,14,15,17,18,19,20,21,23,24,25],set_data_structur:4,set_param:24,setenv:14,setquerytimeparam:2,shape:[1,2,4,5,15,19],shave:22,shortest:14,should:[2,11,15,17],shouldn:15,show:[5,15,19,21,22],show_leaf_count:15,shut:22,side:15,sieranoja:25,sight:22,sigkdd:[2,10,25],sigma:[1,3],sigmoid:17,signific:17,sim:15,similar:[1,7,8,11,15,16,17,18,20,22,23],similarli:[1,9],simpl:[7,22],simplic:[2,5,7,11],singl:[2,9,11,16,17,18,21,24,25],sipu:[16,18,24],site:19,six:25,size:[2,3,4,7,11,13,14,15,21,24],sklearn:[15,21,24],sklearn_kmean:24,slightli:24,slovak:20,slovenia:20,slow:[4,14,24],slower:24,small:[1,2,6,7,11,16,22,24],smaller:[4,17,20],smallest:[2,4,6,7,11,15],smell:22,smile:18,smooth:[2,7,11,14],smp:24,societi:20,softwar:[2,10,25],solut:[1,2,9,17],solv:[7,24],som:25,some:[1,2,4,7,9,14,17,18,24],somehow:[2,7,11],someth:22,sometim:[1,2,7,9,17],somewhat:15,somewher:15,sonar:18,sort:[2,3,6,13,14,24],sort_valu:22,soup:22,sourc:[2,7,10,17,25],south:20,space:[2,10,11,14,15,16,24,25],spain:20,span:[2,5,7,8,11,17,19,24,25],spars:[2,7],spatial:[2,5,25],specif:[20,21],spectral:17,spectral_rbf_5:[17,18],speed:15,sphinx:[15,20,23],spinal:22,spiral:18,splendid:7,split:15,spoiler:16,sqrt:[2,4,24],squad:22,squar:[2,18],squareform:2,ssfindex:20,ssi:20,ssi_2016_categori:20,ssize_t:4,stabl:[2,15,17,25],stage:[2,18],standardis:[2,11],standardscal:21,star:22,stat:20,state:20,statist:[6,16,17,18,25],statistica:[3,13],statlog:18,std:[2,16,17,18],stderr:2,step:19,still:[19,24],sting:22,stop:21,store:[2,22,24],stori:22,str:[2,23],strang:15,strike:22,string:[2,7],stripe:18,structur:[2,24],studi:[17,24,25],style:5,subgroup:15,subject:17,submarin:22,suboptim:14,subplot:[15,19,21],subplots_adjust:21,subset:[1,4,9],subtract:15,suggest:[2,17],suit:[1,7,16,17,18,24,25],suitabl:[2,24],sum:[1,6,9],sum_:[3,4],summari:7,summaris:[1,15,18],support:[2,7,22],surpris:15,sustain:20,sweden:20,switzerland:20,symbol:15,synonym:[2,11,14],synthet:24,syst:14,system:[24,25],tabl:[1,9,22],take:[2,3,11,13,16,22,24],taken:2,tap:22,target:18,task:[2,7,14,24],tataacaaccctgattacatcaagctacgctccggtgcgttgcctcggacgagtgctaatccctccccactgactgtattcatcttgacaata:23,tech:14,temporarili:19,tend:[2,17,19],term:15,terrestri:22,test:[11,17],tetra:18,text:[5,21],thailand:20,than:[2,4,16,20,24],thank:[7,24],thei:[2,3,9,13,16,17,22,24],them:[15,19],themself:2,theoret:[1,9,17,25],theori:25,therefor:[2,5,7,11,24],therein:1,thi:[1,2,4,5,11,14,15,16,17,18,19,20,21,22,23,24],thou:22,thousand:15,thread:[2,7,11,14],three:22,threshold:[2,11,15,17],thrown:4,tile:5,time:[2,3,4,6,7,11,13,14,17,20,21],timestamp:22,tini:[2,16,18,24],tipografia:[3,13],titl:[5,15,19,21,22],tkde:[1,25],to_list:4,to_list_norm:4,tocsr:22,todens:22,togeth:[2,11,15],toi:[7,22],tolist:23,tommi:22,too:[2,14,15],tool:[0,2,7],top:[2,21,22,24],total:[2,3,16,18,24],toward:25,tracker:7,traffic:22,trajectori:[16,18],transact:[1,2,9,11,14,25],transax:21,transform:[1,9,21,22],transit:20,translat:[2,24],trapped_lov:18,treat:2,treatment:2,tree:[2,5,7,8,11,15,17,19,20,21,23,24,25],trouser:22,truncate_mod:15,truth:[1,9,17],ttagagcgcttaaccccacaggaaccgagttcccctcatgtggcaaggttctcccgcctcaggtatcacagaaacaaggtatgtagccctaggctacgagc:23,tune:[15,19],tunisia:20,turkei:20,turn:[2,15,21,24],tutori:7,twist:22,two:[1,2,5,9,15,22,24,25],twodiamond:18,twosplash:18,type:[2,6,22],typic:[2,17],ubuntu:24,uci:[18,25],ukrain:20,ult05:[17,25],ultrametr:[2,11],ultsch:25,unadjust:[1,9],unbal:18,under:[7,19],underli:1,undirect:14,unfortun:15,union:4,uniqu:[2,15,19,22,23],unit:20,unless:[2,24],unlik:5,updat:[4,21],url:25,usabl:[2,7,11],use:[2,4,7,10,11,23,24],used:[1,2,3,6,9,11,13,14,15,17,20,23,24],useful:[6,17,19],usefulness:17,user:[2,15,19,22,25],userid:22,userwarn:21,uses:[3,13,24],using:[2,11,14,25],usual:2,v11:25,valid:[1,9,11,17,20,23,25],valu:[1,2,3,4,6,15,21],vari:21,variabilita:[3,13],variabl:[2,11,14,17],varianc:[2,16,18,21,24],variant:[1,9,15,24],variou:[5,17],veb10:[18,25],vector:[1,2,3,4,5,6,9,11,13,17],verbos:[2,10,11,14,20],veri:[2,6,7,10,11,14,23,24],version:[1,2,7,9,11,15,16,17,18,22,24,25],versu:[1,9],vertex:[2,11],vertic:14,via:7,vietnam:20,vinh10a:25,vinh:[1,9,25],violat:[2,11],visibl:24,visual:[2,11,14,25],voronoi:15,wai:[2,5,17,19,22],wait:22,wallac:22,wanda:22,want:11,war:22,ward:[7,17,18,21,24],warn:[2,21],wdbc:18,weav:[15,20],web:20,websit:[21,22],weight:[2,11,14],welcom:7,well:[2,5,14,15,17],wellb:20,wellbalancedsocieti:20,were:[16,18,19,22,24],what:[2,19],whatev:19,when:[2,19],whenev:1,where:[1,2,3,4,5,6,9,11,13,14,16,22],wherea:15,wherev:18,whether:[2,10,11,14],which:[1,2,9,11,14,15,16,17,19,22,24],which_clust:22,whichev:4,white:20,whole:[2,7,11,22],whose:[2,4,6,11],wide:22,wiki:4,wikipedia:4,window:18,wine:18,wingnut:18,wise:18,within:[7,17],won:22,word:15,work:[2,6],workhors:20,workshop:25,worms_2:[18,24],worms_64:[16,18,24],wors:[16,24],worth:[2,11,15,17],would:[15,22],wrapper:1,wrong:22,wspace:21,wut:[16,18],www:[20,25],x86_64:24,x_1:[3,4,13],x_aniso:21,x_i:[3,4,13],x_j:[3,4,13],x_k:4,x_n:[3,13],x_oecd:20,xlim:21,xnn:25,xperienc:25,xtick:21,y_pred:[9,11,20,21],y_test:11,y_true:9,yeast:18,yellow:22,yemen:20,yet:20,yield:[2,3,13,16,22],ylim:[5,21],you:[4,5,11,14],young:22,your:14,ython:25,ytick:21,zealand:20,zenodo:25,zero:22,zhang:[2,10,25],zhong:25,zigzag:18,zigzag_noisi:18,zigzag_outli:18,zimbabw:20,zimek:[2,11,14,25]},titles:["Python Package genieclust Reference","genieclust.compare_partitions","genieclust.Genie","genieclust.inequity","genieclust.internal","genieclust.plots","genieclust.tools","genieclust: Fast and Robust Hierarchical Clustering with Noise Point Detection","R Package genieclust Reference","comparing_partitions: Pairwise Partition Similarity Scores","emst_mlpack: Euclidean Minimum Spanning Tree","gclust: The Genie++ Hierarchical Clustering Algorithm","genieclust-package: The Genie++ Hierarchical Clustering Algorithm (with Extras)","inequity: Inequity (Inequality) Measures","mst: Minimum Spanning Tree of the Pairwise Distance Graph","Basics","Benchmarks \u2014 Approximate Method","Benchmarks (How Good Is It?)","Benchmarks \u2014 Detailed Results","Clustering with Noise Points Detection","R Interface Examples","Comparing Algorithms on Toy Datasets","Example: Sparse Data and Movie Recommendation","Example: String Data and Grouping of DNA","Timings (How Fast Is It?)","References"],titleterms:{"break":15,"function":24,Ice:15,The:[11,12],algorithm:[11,12,21],also:[11,14,25],ami:18,approxim:16,argument:[9,10,11,13,14],author:12,basic:15,benchmark:[16,17,18],cluster:[7,11,12,19],compar:21,compare_partit:1,comparing_partit:9,comparis:19,comparison:15,data:[22,23],dataset:[17,18,21,24],dendrogram:15,descript:[9,10,11,12,13,14],detail:[9,11,13,14,18],detect:[7,19],distanc:14,dna:23,emst_mlpack:10,euclidean:10,exampl:[9,11,13,14,20,22,23],extra:12,factor:19,fast:[7,24],further:15,gclust:11,geni:[2,11,12],genieclust:[0,1,2,3,4,5,6,7,8,12],good:17,graph:14,group:23,hdbscan:[15,19],hierarch:[7,11,12],how:[17,24],indic:7,inequ:[3,13],interfac:20,intern:4,larg:[17,18,24],mean:15,measur:13,method:16,minimum:[10,14],movi:22,mst:14,nacc:18,nmi:18,nois:[7,19],number:24,packag:[0,8,12],pairwis:[9,14],partit:9,plot:5,point:[7,19],psi:18,python:0,read:15,recommend:22,refer:[0,8,9,10,11,13,14,25],result:18,robust:7,score:9,see:[11,14,25],similar:9,small:[17,18],smooth:19,span:[10,14],spars:22,string:23,summari:[17,18,24],tabl:7,thread:24,time:24,toi:21,tool:6,tree:[10,14],usag:[9,10,11,13,14],valu:[9,10,11,13,14]}}) \ No newline at end of file diff --git a/docs/weave/basics.html b/docs/weave/basics.html index a9aaa0c7..bdab5f52 100644 --- a/docs/weave/basics.html +++ b/docs/weave/basics.html @@ -7,7 +7,7 @@ - Basics — genieclust 0.9.6.dev0 documentation + Basics — genieclust 0.9.6 documentation @@ -66,7 +66,7 @@
    - 0.9.6.dev0 + 0.9.6
    @@ -466,7 +466,7 @@

    Further Reading

    - © Copyright 2020, Marek Gagolewski + © Copyright 2021, Marek Gagolewski

    diff --git a/docs/weave/benchmarks_approx.html b/docs/weave/benchmarks_approx.html index c2e00021..ce57164b 100644 --- a/docs/weave/benchmarks_approx.html +++ b/docs/weave/benchmarks_approx.html @@ -7,7 +7,7 @@ - Benchmarks — Approximate Method — genieclust 0.9.6.dev0 documentation + Benchmarks — Approximate Method — genieclust 0.9.6 documentation @@ -66,7 +66,7 @@
    - 0.9.6.dev0 + 0.9.6
    @@ -514,7 +514,7 @@

    Benchmarks — Approximate Method

    - © Copyright 2020, Marek Gagolewski + © Copyright 2021, Marek Gagolewski

    diff --git a/docs/weave/benchmarks_ar.html b/docs/weave/benchmarks_ar.html index 0e1d0cc5..4bb1cbfe 100644 --- a/docs/weave/benchmarks_ar.html +++ b/docs/weave/benchmarks_ar.html @@ -7,7 +7,7 @@ - Benchmarks (How Good Is It?) — genieclust 0.9.6.dev0 documentation + Benchmarks (How Good Is It?) — genieclust 0.9.6 documentation @@ -66,7 +66,7 @@
    - 0.9.6.dev0 + 0.9.6
    @@ -563,7 +563,7 @@

    Summary

    - © Copyright 2020, Marek Gagolewski + © Copyright 2021, Marek Gagolewski

    diff --git a/docs/weave/benchmarks_details.html b/docs/weave/benchmarks_details.html index 7b324363..9a693719 100644 --- a/docs/weave/benchmarks_details.html +++ b/docs/weave/benchmarks_details.html @@ -7,7 +7,7 @@ - Benchmarks — Detailed Results — genieclust 0.9.6.dev0 documentation + Benchmarks — Detailed Results — genieclust 0.9.6 documentation @@ -66,7 +66,7 @@
    - 0.9.6.dev0 + 0.9.6
    @@ -10832,7 +10832,7 @@

    Summary

    - © Copyright 2020, Marek Gagolewski + © Copyright 2021, Marek Gagolewski

    diff --git a/docs/weave/noise.html b/docs/weave/noise.html index 10a8b60d..254daded 100644 --- a/docs/weave/noise.html +++ b/docs/weave/noise.html @@ -7,7 +7,7 @@ - Clustering with Noise Points Detection — genieclust 0.9.6.dev0 documentation + Clustering with Noise Points Detection — genieclust 0.9.6 documentation @@ -66,7 +66,7 @@
    - 0.9.6.dev0 + 0.9.6
    @@ -365,7 +365,7 @@

    A Comparision with HDBSCAN*

    - © Copyright 2020, Marek Gagolewski + © Copyright 2021, Marek Gagolewski

    diff --git a/docs/weave/r.html b/docs/weave/r.html index d9832a57..3fbb5906 100644 --- a/docs/weave/r.html +++ b/docs/weave/r.html @@ -7,7 +7,7 @@ - R Interface Examples — genieclust 0.9.6.dev0 documentation + R Interface Examples — genieclust 0.9.6 documentation @@ -66,7 +66,7 @@
    - 0.9.6.dev0 + 0.9.6
    @@ -316,7 +316,7 @@

    R Interface Examples

    - © Copyright 2020, Marek Gagolewski + © Copyright 2021, Marek Gagolewski

    diff --git a/docs/weave/sklearn_toy_example.html b/docs/weave/sklearn_toy_example.html index bb0da9fb..98e3f692 100644 --- a/docs/weave/sklearn_toy_example.html +++ b/docs/weave/sklearn_toy_example.html @@ -7,7 +7,7 @@ - Comparing Algorithms on Toy Datasets — genieclust 0.9.6.dev0 documentation + Comparing Algorithms on Toy Datasets — genieclust 0.9.6 documentation @@ -66,7 +66,7 @@
    - 0.9.6.dev0 + 0.9.6
    @@ -356,7 +356,7 @@

    Comparing Algorithms on Toy Datasets

    - © Copyright 2020, Marek Gagolewski + © Copyright 2021, Marek Gagolewski

    diff --git a/docs/weave/sparse.html b/docs/weave/sparse.html index 26e89513..f9215834 100644 --- a/docs/weave/sparse.html +++ b/docs/weave/sparse.html @@ -7,7 +7,7 @@ - Example: Sparse Data and Movie Recommendation — genieclust 0.9.6.dev0 documentation + Example: Sparse Data and Movie Recommendation — genieclust 0.9.6 documentation @@ -66,7 +66,7 @@
    - 0.9.6.dev0 + 0.9.6
    @@ -386,7 +386,7 @@

    Example: Sparse Data and Movie Recommendation

    - © Copyright 2020, Marek Gagolewski + © Copyright 2021, Marek Gagolewski

    diff --git a/docs/weave/string.html b/docs/weave/string.html index 16e2603c..7718c6a7 100644 --- a/docs/weave/string.html +++ b/docs/weave/string.html @@ -7,7 +7,7 @@ - Example: String Data and Grouping of DNA — genieclust 0.9.6.dev0 documentation + Example: String Data and Grouping of DNA — genieclust 0.9.6 documentation @@ -66,7 +66,7 @@
    - 0.9.6.dev0 + 0.9.6
    @@ -266,7 +266,7 @@

    Example: String Data and Grouping of DNA

    - © Copyright 2020, Marek Gagolewski + © Copyright 2021, Marek Gagolewski

    diff --git a/docs/weave/timings.html b/docs/weave/timings.html index 4825a815..05ea245d 100644 --- a/docs/weave/timings.html +++ b/docs/weave/timings.html @@ -7,7 +7,7 @@ - Timings (How Fast Is It?) — genieclust 0.9.6.dev0 documentation + Timings (How Fast Is It?) — genieclust 0.9.6 documentation @@ -66,7 +66,7 @@
    - 0.9.6.dev0 + 0.9.6
    @@ -702,7 +702,7 @@

    Summary

    - © Copyright 2020, Marek Gagolewski + © Copyright 2021, Marek Gagolewski

    diff --git a/docs/z_bibliography.html b/docs/z_bibliography.html index 2ac19f7f..5f658d43 100644 --- a/docs/z_bibliography.html +++ b/docs/z_bibliography.html @@ -7,7 +7,7 @@ - References — genieclust 0.9.6.dev0 documentation + References — genieclust 0.9.6 documentation @@ -65,7 +65,7 @@
    - 0.9.6.dev0 + 0.9.6
    @@ -321,7 +321,7 @@

    See Also

    - © Copyright 2020, Marek Gagolewski + © Copyright 2021, Marek Gagolewski

    diff --git a/genieclust/__init__.py b/genieclust/__init__.py index dfb6e605..1590598b 100644 --- a/genieclust/__init__.py +++ b/genieclust/__init__.py @@ -28,4 +28,4 @@ from . import internal from .genie import Genie, GIc -__version__ = '0.9.6.dev0' # see also ../setup.py +__version__ = '0.9.6' # see also ../setup.py; e.g., '0.9.6.dev0' diff --git a/man/emst_mlpack.Rd b/man/emst_mlpack.Rd index 92a8be44..9c610f27 100644 --- a/man/emst_mlpack.Rd +++ b/man/emst_mlpack.Rd @@ -17,16 +17,10 @@ An object of class \code{mst}, see \code{\link{mst}()} for details. } \description{ Provides access to an implementation of the Dual-Tree Borůvka -algorithm based on kd-trees. It is fast for (very) low-dimensional +algorithm based on kd-trees from MLPACK. It is fast for (very) low-dimensional Euclidean spaces. For higher dimensional spaces (say, over 5 features) -or other metrics, -use the parallelised Prim-like algorithm implemented in \code{\link{mst}()}. -} -\details{ -Calls \code{emstreeR::mlpack_mst()} and converts the result -so that it is compatible with the output of \code{\link{mst}()}. - -If the \code{emstreeR} package is not available, an error is generated. +or other metrics, use the parallelised Prim-like algorithm implemented +in \code{\link{mst}()}. } \references{ March W.B., Ram P., Gray A.G., diff --git a/man/gclust.Rd b/man/gclust.Rd index da86d12b..a092e698 100644 --- a/man/gclust.Rd +++ b/man/gclust.Rd @@ -182,7 +182,7 @@ adjusted_rand_score(y_test, y_pred) pair_sets_index(y_test, y_pred) # Fast for low-dimensional Euclidean spaces: -if (require("emstreeR")) h <- gclust(emst_mlpack(X)) +h <- gclust(emst_mlpack(X)) } \references{ diff --git a/setup.py b/setup.py index 34658230..ce4b3dcd 100644 --- a/setup.py +++ b/setup.py @@ -135,7 +135,7 @@ def build_extensions(self): setuptools.setup( name="genieclust", - version="0.9.6.dev0", # see also genieclust/__init__.py; e.g., 0.9.4.dev0 + version="0.9.6", # see also genieclust/__init__.py; e.g., 0.9.4.dev0 description="The Genie++ Hierarchical Clustering Algorithm (with Extras)", long_description=long_description, long_description_content_type="text/x-rst", diff --git a/src/RcppExports.cpp b/src/RcppExports.cpp index 7fd51b2f..8bda704e 100644 --- a/src/RcppExports.cpp +++ b/src/RcppExports.cpp @@ -1,6 +1,8 @@ // Generated by using Rcpp::compileAttributes() -> do not edit by hand // Generator token: 10BE3573-1514-4C36-9D1C-5A225CD40393 +#include +#include #include using namespace Rcpp; @@ -113,6 +115,17 @@ BEGIN_RCPP return rcpp_result_gen; END_RCPP } +// __emst_mlpack +Rcpp::NumericMatrix __emst_mlpack(Rcpp::NumericMatrix X); +RcppExport SEXP _genieclust___emst_mlpack(SEXP XSEXP) { +BEGIN_RCPP + Rcpp::RObject rcpp_result_gen; + Rcpp::RNGScope rcpp_rngScope_gen; + Rcpp::traits::input_parameter< Rcpp::NumericMatrix >::type X(XSEXP); + rcpp_result_gen = Rcpp::wrap(__emst_mlpack(X)); + return rcpp_result_gen; +END_RCPP +} // __gclust List __gclust(NumericMatrix mst, double gini_threshold, bool verbose); RcppExport SEXP _genieclust___gclust(SEXP mstSEXP, SEXP gini_thresholdSEXP, SEXP verboseSEXP) { @@ -203,6 +216,7 @@ static const R_CallMethodDef CallEntries[] = { {"_genieclust_adjusted_mi_score", (DL_FUNC) &_genieclust_adjusted_mi_score, 2}, {"_genieclust_normalized_accuracy", (DL_FUNC) &_genieclust_normalized_accuracy, 2}, {"_genieclust_pair_sets_index", (DL_FUNC) &_genieclust_pair_sets_index, 2}, + {"_genieclust___emst_mlpack", (DL_FUNC) &_genieclust___emst_mlpack, 1}, {"_genieclust___gclust", (DL_FUNC) &_genieclust___gclust, 3}, {"_genieclust___genie", (DL_FUNC) &_genieclust___genie, 6}, {"_genieclust_mst_default", (DL_FUNC) &_genieclust_mst_default, 5}, diff --git a/src/c_common.h b/src/c_common.h index ec99462f..5c2fefbd 100644 --- a/src/c_common.h +++ b/src/c_common.h @@ -1,6 +1,6 @@ /* Common functions, macros, includes * - * Copyleft (C) 2018-2020, Marek Gagolewski + * Copyleft (C) 2018-2021, Marek Gagolewski * * This program is free software: you can redistribute it and/or modify * it under the terms of the GNU Affero General Public License diff --git a/src/r_compare_partitions.cpp b/src/r_compare_partitions.cpp index cb2b6369..0efab95f 100644 --- a/src/r_compare_partitions.cpp +++ b/src/r_compare_partitions.cpp @@ -1,6 +1,6 @@ /* Partition Similarity Scores * - * Copyleft (C) 2018-2020, Marek Gagolewski + * Copyleft (C) 2018-2021, Marek Gagolewski * * This program is free software: you can redistribute it and/or modify * it under the terms of the GNU Affero General Public License diff --git a/src/r_emst.cpp b/src/r_emst.cpp new file mode 100644 index 00000000..6922c73a --- /dev/null +++ b/src/r_emst.cpp @@ -0,0 +1,50 @@ +/* Calls RcppMLPACK::DualTreeBoruvka::ComputeMST + * + * Copyleft (C) 2018-2021, Marek Gagolewski + * + * This program is free software: you can redistribute it and/or modify + * it under the terms of the GNU Affero General Public License + * Version 3, 19 November 2007, published by the Free Software Foundation. + * This program is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + * GNU Affero General Public License Version 3 for more details. + * You should have received a copy of the License along with this program. + * If this is not the case, refer to . + */ + +#include +// #include +// #include +#include "c_common.h" + + + +// Euclidean MST via MLPACK +// Calls RcppMLPACK::DualTreeBoruvka::ComputeMST +// [[Rcpp::export(".emst_mlpack")]] +Rcpp::NumericMatrix __emst_mlpack(Rcpp::NumericMatrix X) +{ + ssize_t n = X.nrow(); + ssize_t d = X.ncol(); + + // Let _X = transpose(X) + arma::Mat _X(d, n); + for (ssize_t i=0; i _ret; + mlpack::emst::DualTreeBoruvka<>(_X).ComputeMST(_ret); + + Rcpp::NumericMatrix ret(n-1, 3); + for (ssize_t i=0; i 1-based) + ret(i, 1) = _ret(1, i)+1; // greater edge index + ret(i, 2) = _ret(2, i); // distance between the pair of points + GENIECLUST_ASSERT(ret(i, 0) < ret(i, 1)); + GENIECLUST_ASSERT(i == 0 || ret(i-1, 2) <= ret(i, 2)); + } + + return ret; +} diff --git a/src/r_gclust.cpp b/src/r_gclust.cpp index 0f18300f..0d45d365 100644 --- a/src/r_gclust.cpp +++ b/src/r_gclust.cpp @@ -1,6 +1,6 @@ /* The Genie++ Clustering Algorithm - R Wrapper * - * Copyleft (C) 2018-2020, Marek Gagolewski + * Copyleft (C) 2018-2021, Marek Gagolewski * * This program is free software: you can redistribute it and/or modify * it under the terms of the GNU Affero General Public License @@ -14,35 +14,6 @@ */ -// //[[Rcpp::depends(RcppMLPACK)]] -// #include - -// if (use_mlpack) { -// if (distance != "euclidean" && distance != "l2") -// stop("`use_mlpack` can only be used with Euclidean distance"); -// -// std::vector mst_i((n-1)*2); -// std::vector mst_d(n-1); -// -// //mlpack::Log::Info.ignoreInput = !verbose; -// //mlpack::Log::Warn.ignoreInput = !verbose; -// -// arma::Mat X2(REAL(SEXP(X)), n, d, /*copy_aux_mem=*/true, /*strict=*/true); -// mlpack::emst::DualTreeBoruvka<> boruvka(X2.t()); -// arma::mat mst; -// boruvka.ComputeMST(mst); -// for (ssize_t i=0; i(mst_i, mst_d, n, gini_threshold, verbose); -// } - - - - #include "c_common.h" #include "c_matrix.h" #include "c_distance.h" @@ -107,7 +78,7 @@ void __generate_merge(ssize_t n, NumericMatrix links, NumericMatrix merge) } -/* This function was originally part of our `genie` package for R */ +/* Originally, this function was part of our `genie` package for R */ void __generate_order(ssize_t n, NumericMatrix merge, NumericVector order) { std::vector< std::list > relord(n+1); diff --git a/src/r_inequity.cpp b/src/r_inequity.cpp index d6e66a1d..0725cb11 100644 --- a/src/r_inequity.cpp +++ b/src/r_inequity.cpp @@ -1,6 +1,6 @@ /* Economic Inequity (Inequality) Measures. * - * Copyleft (C) 2018-2020, Marek Gagolewski + * Copyleft (C) 2018-2021, Marek Gagolewski * * This program is free software: you can redistribute it and/or modify * it under the terms of the GNU Affero General Public License