From 56cd07fa35f75c677ef61e87da5fb0c0092ef198 Mon Sep 17 00:00:00 2001 From: Leon Wabeke Date: Fri, 3 Jan 2025 10:08:44 +0200 Subject: [PATCH] Modification to dbscan to add test cases and support for the case where number of points <= num dimensions --- src/dbscan.jl | 1 - test/dbscan.jl | 29 +++++++++++++++++++++++++++++ 2 files changed, 29 insertions(+), 1 deletion(-) diff --git a/src/dbscan.jl b/src/dbscan.jl index b34e580e..bfa04bc3 100644 --- a/src/dbscan.jl +++ b/src/dbscan.jl @@ -101,7 +101,6 @@ function dbscan(points::AbstractMatrix, radius::Real; if metric !== nothing # points are point coordinates dim, num_points = size(points) - num_points <= dim && throw(ArgumentError("points has $dim rows and $num_points columns. Must be a D x N matric with D < N")) kdtree = KDTree(points, metric; nntree_kwargs...) data = (kdtree, points) else diff --git a/test/dbscan.jl b/test/dbscan.jl index e35195a4..58959cdb 100644 --- a/test/dbscan.jl +++ b/test/dbscan.jl @@ -14,6 +14,35 @@ include("test_helpers.jl") @test @inferred(dbscan(randn(2, 2), 0.5, metric=nothing, min_neighbors=1)) isa DbscanResult end +@testset "Simple 2D test case" begin + X = [10.0 0.0 10.5 ; + 0.0 10.0 0.1] + R = dbscan(X, 20) + @test nclusters(R) == 1 + R = dbscan(X, 1.0) + @test nclusters(R) == 2 + R = dbscan(X, 0.1) + @test nclusters(R) == 3 +end + +@testset "Simple 2D test case with limited points" begin + X = [10.0 0.0 ; + 0.0 10.0 ] + R = dbscan(X, 20) + @test nclusters(R) == 1 + R = dbscan(X, 1.0) + @test nclusters(R) == 2 +end +@testset "Simple 2D test case with limited points trivial case" begin + X = zeros(2,1) # At minimum dbscan needs a matrix and will not work with just a vector, but matrix could be Nx1 + X[:,1] = [10.0 ; + 0.0 ] + R = dbscan(X, 20) + @test nclusters(R) == 1 + R = dbscan(X, 1.0) + @test nclusters(R) == 1 +end + @testset "clustering synthetic data with 3 clusters" begin Random.seed!(34568)