Commit f45686c8 authored by Manuel Segimon
Browse files

Fix punctuation removal in extractWordUsage method

parent 3fc60724
Loading
Loading
Loading
Loading
+1 −1
Original line number Diff line number Diff line
@@ -278,7 +278,7 @@ public class crawler {
                }
            }
        } else {
-            extractWordUsage(web_data.text(), wordUsage);
+            extractWordUsage(web_data.text().replaceAll("\\p{Punct}", ""), wordUsage);
            // System.out.println("Ngrams built successfully. for size:"+MAXNGRAM);
            uncompressedData = wordUsage.serialize();
            compressedData = compress(uncompressedData);