From bb7a9df946a78941c83ff2499e0e545f3796dc90 Mon Sep 17 00:00:00 2001 From: Maurice Laveaux Date: Mon, 19 May 2014 12:24:20 +0200 Subject: Also remove @ and # from input text. --- src/analysis/BrandChecker.java | 3 +-- 1 file changed, 1 insertion(+), 2 deletions(-) (limited to 'src') diff --git a/src/analysis/BrandChecker.java b/src/analysis/BrandChecker.java index 0f7fcad..c22d47d 100644 --- a/src/analysis/BrandChecker.java +++ b/src/analysis/BrandChecker.java @@ -129,8 +129,7 @@ public class BrandChecker { * Removes punctuation and urls. */ private String removePunct(String text) { - //text = text.replaceAll("https?://\\S*", ""); - text = text.replaceAll("[.,!?();\"'-]", " "); + text = text.replaceAll("[.,!?();\"'@#-]", " "); return text; } -- cgit v1.2.1