From 5a3f4b8157f2f44d6bffc6d3296f2583b30e9cb2 Mon Sep 17 00:00:00 2001 From: Shaoliang Nie Date: Mon, 7 Aug 2017 09:48:27 -0400 Subject: [PATCH] Correct signature size calculation According to the description in this file, the signature size equals R * b, not R * n --- src/main/java/info/debatty/java/lsh/LSHMinHash.java | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/src/main/java/info/debatty/java/lsh/LSHMinHash.java b/src/main/java/info/debatty/java/lsh/LSHMinHash.java index beb5812..0f51e2b 100644 --- a/src/main/java/info/debatty/java/lsh/LSHMinHash.java +++ b/src/main/java/info/debatty/java/lsh/LSHMinHash.java @@ -46,7 +46,7 @@ public class LSHMinHash extends LSH { */ public LSHMinHash(final int s, final int b, final int n) { super(s, b); - int signature_size = computeSignatureSize(s, n); + int signature_size = computeSignatureSize(s, b); this.mh = new MinHash(signature_size, n); } @@ -66,7 +66,7 @@ public LSHMinHash(final int s, final int b, final int n) { */ public LSHMinHash(final int s, final int b, final int n, final long seed) { super(s, b); - int signature_size = computeSignatureSize(s, n); + int signature_size = computeSignatureSize(s, b); this.mh = new MinHash(signature_size, n, seed); } @@ -92,7 +92,7 @@ public LSHMinHash(final int s, final int b, final int n, final long seed) { private int computeSignatureSize(final int s, final int n) { int r = (int) Math.ceil(Math.log(1.0 / s) / Math.log(THRESHOLD)) + 1; - return r * s; + return r * b; } /**