JabRef · lenhard · Oct 3, 2016 · Sep 29, 2016 · Sep 29, 2016 · Sep 29, 2016
diff --git a/CHANGELOG.md b/CHANGELOG.md
@@ -58,6 +58,7 @@ We refer to [GitHub issues](https://github.com/JabRef/jabref/issues) by using `#
 - Improve language quality of the German translation of shared database
 
 ### Fixed
+- Fixed [#1993](https://github.com/JabRef/jabref/issues/1993): Various optimizations regarding search performance
 - Fixed [koppor#160](https://github.com/koppor/jabref/issues/160): Tooltips now working in the main table
 - Fixed [#2054](https://github.com/JabRef/jabref/issues/2054): Ignoring a new version now works as expected
 - Fixed selecting an entry out of multiple duplicates

diff --git a/jabref.install4j b/jabref.install4j
@@ -750,4 +750,9 @@ return true;</string>
   </mediaSets>
   <buildIds buildAll="true" />
   <buildOptions verbose="false" faster="false" disableSigning="false" disableJreBundling="false" debug="false" />
+  <jvmArguments>
+      <arg>-XX:+UseG1GC</arg>
+      <arg>-XX:+UseStringDeduplication</arg>
+      <arg>-XX:StringTableSize=1000003</arg>
+  </jvmArguments>
 </install4j>
diff --git a/src/main/java/net/sf/jabref/model/entry/BibEntry.java b/src/main/java/net/sf/jabref/model/entry/BibEntry.java
@@ -27,6 +27,7 @@
 import net.sf.jabref.model.database.BibDatabaseMode;
 import net.sf.jabref.model.entry.event.EntryEventSource;
 import net.sf.jabref.model.entry.event.FieldChangedEvent;
+import net.sf.jabref.model.strings.LatexToUnicode;
 import net.sf.jabref.model.strings.StringUtil;
 
 import com.google.common.base.Strings;
@@ -52,11 +53,22 @@ public class BibEntry implements Cloneable {
 
     private String type;
     private Map<String, String> fields = new ConcurrentHashMap<>();
-    /*
+
+    /**
      * Map to store the words in every field
      */
     private final Map<String, Set<String>> fieldsAsWords = new HashMap<>();
 
+    /**
+     * Cache that stores latex free versions of fields.
+     */
+    private final Map<String, String> latexFreeFields = new ConcurrentHashMap<>();
+
+    /**
+     * Used to cleanse field values for internal LaTeX-free storage
+     */
+    private LatexToUnicode unicodeConverter = new LatexToUnicode();
+
     // Search and grouping status is stored in boolean fields for quick reference:
     private boolean searchHit;
     private boolean groupHit;
@@ -65,7 +77,7 @@ public class BibEntry implements Cloneable {
 
     private String commentsBeforeEntry = "";
 
-    /*
+    /**
      * Marks whether the complete serialization, which was read from file, should be used.
      *
      * Is set to false, if parts of the entry change. This causes the entry to be serialized based on the internal state (and not based on the old serialization)
@@ -95,7 +107,7 @@ public BibEntry(String id) {
     /**
      * Constructs a new BibEntry with the given ID and given type
      *
-     * @param id The ID to be used
+     * @param id   The ID to be used
      * @param type The type to set. May be null or empty. In that case, DEFAULT_TYPE is used.
      */
     public BibEntry(String id, String type) {
@@ -107,7 +119,7 @@ public BibEntry(String id, String type) {
     }
 
     public Optional<FieldChange> replaceKeywords(KeywordList keywordsToReplace, Optional<Keyword> newValue,
-            Character keywordDelimiter) {
+                                                 Character keywordDelimiter) {
         KeywordList keywordList = getKeywords(keywordDelimiter);
         keywordList.replaceKeywords(keywordsToReplace, newValue);
 
@@ -180,7 +192,6 @@ public String getId() {
 
     /**
      * Sets the cite key AKA citation key AKA BibTeX key.
-     *
      * Note: This is <emph>not</emph> the internal Id of this entry. The internal Id is always present, whereas the BibTeX key might not be present.
      *
      * @param newCiteKey The cite key to set. Must not be null; use {@link #clearCiteKey()} to remove the cite key.
@@ -191,7 +202,6 @@ public void setCiteKey(String newCiteKey) {
 
     /**
      * Returns the cite key AKA citation key AKA BibTeX key, or null if it is not set.
-     *
      * Note: this is <emph>not</emph> the internal Id of this entry. The internal Id is always present, whereas the BibTeX key might not be present.
      */
     @Deprecated
@@ -396,8 +406,9 @@ public void setField(Map<String, String> fields) {
 
     /**
      * Set a field, and notify listeners about the change.
-     * @param name  The field to set
-     * @param value The value to set
+     *
+     * @param name        The field to set
+     * @param value       The value to set
      * @param eventSource Source the event is sent from
      */
     public Optional<FieldChange> setField(String name, String value, EntryEventSource eventSource) {
@@ -421,8 +432,8 @@ public Optional<FieldChange> setField(String name, String value, EntryEventSourc
 
         changed = true;
 
-        fields.put(fieldName, value);
-        fieldsAsWords.remove(fieldName);
+        fields.put(fieldName, value.intern());
+        invalidateFieldCache(fieldName);
 
         FieldChange change = new FieldChange(this, fieldName, oldValue, value);
         eventBus.post(new FieldChangedEvent(change, eventSource));
@@ -460,7 +471,7 @@ public Optional<FieldChange> clearField(String name) {
      * Remove the mapping for the field name, and notify listeners about
      * the change including the {@link EntryEventSource}.
      *
-     * @param name The field to clear.
+     * @param name        The field to clear.
      * @param eventSource the source a new {@link FieldChangedEvent} should be posten from.
      */
     public Optional<FieldChange> clearField(String name, EntryEventSource eventSource) {
@@ -478,7 +489,8 @@ public Optional<FieldChange> clearField(String name, EntryEventSource eventSourc
         changed = true;
 
         fields.remove(fieldName);
-        fieldsAsWords.remove(fieldName);
+        invalidateFieldCache(fieldName);
+
         FieldChange change = new FieldChange(this, fieldName, oldValue.get(), null);
         eventBus.post(new FieldChangedEvent(change, eventSource));
         return Optional.of(change);
@@ -570,7 +582,7 @@ public void setGroupHit(boolean groupHit) {
      * Author1, Author2: Title (Year)
      */
     public String getAuthorTitleYear(int maxCharacters) {
-        String[] s = new String[] {getField(FieldName.AUTHOR).orElse("N/A"), getField(FieldName.TITLE).orElse("N/A"),
+        String[] s = new String[]{getField(FieldName.AUTHOR).orElse("N/A"), getField(FieldName.TITLE).orElse("N/A"),
                 getField(FieldName.YEAR).orElse("N/A")};
 
         String text = s[0] + ": \"" + s[1] + "\" (" + s[2] + ')';
@@ -765,4 +777,21 @@ public Set<String> getFieldAsWords(String field) {
     public Optional<FieldChange> clearCiteKey() {
         return clearField(KEY_FIELD);
     }
+
+    private void invalidateFieldCache(String fieldName) {
+        latexFreeFields.remove(fieldName);
+        fieldsAsWords.remove(fieldName);
+    }
+
+    public Optional<String> getLatexFreeField(String name) {
+        if (!hasField(name)) {
+            return Optional.empty();
+        } else if (latexFreeFields.containsKey(name)) {
+            return Optional.ofNullable(latexFreeFields.get(toLowerCase(name)));
+        } else {
+            String latexFreeField = unicodeConverter.format(getField(name).get()).intern();
+            latexFreeFields.put(name, latexFreeField);
+            return Optional.of(latexFreeField);
+        }
+    }
 }
diff --git a/src/main/java/net/sf/jabref/model/search/rules/ContainBasedSearchRule.java b/src/main/java/net/sf/jabref/model/search/rules/ContainBasedSearchRule.java
@@ -38,8 +38,8 @@ public boolean applyRule(String query, BibEntry bibEntry) {
 
         List<String> unmatchedWords = new SentenceAnalyzer(searchString).getWords();
 
-        for (String fieldContent : bibEntry.getFieldValues()) {
-            String formattedFieldContent = LATEX_TO_UNICODE_FORMATTER.format(fieldContent);
+        for (String fieldKey : bibEntry.getFieldNames()) {
+            String formattedFieldContent = bibEntry.getLatexFreeField(fieldKey).get();
             if (!caseSensitive) {
                 formattedFieldContent = formattedFieldContent.toLowerCase();
             }

diff --git a/src/main/java/net/sf/jabref/model/search/rules/GrammarBasedSearchRule.java b/src/main/java/net/sf/jabref/model/search/rules/GrammarBasedSearchRule.java
@@ -162,7 +162,7 @@ public boolean compare(BibEntry entry) {
             }
 
             for (String field : fieldsKeys) {
-                Optional<String> fieldValue = entry.getField(field);
+                Optional<String> fieldValue = entry.getLatexFreeField(field);
                 if (fieldValue.isPresent()) {
                     if (matchFieldValue(fieldValue.get())) {
                         return true;

diff --git a/src/main/java/net/sf/jabref/model/search/rules/RegexBasedSearchRule.java b/src/main/java/net/sf/jabref/model/search/rules/RegexBasedSearchRule.java
@@ -53,8 +53,7 @@ public boolean applyRule(String query, BibEntry bibEntry) {
         for (String field : bibEntry.getFieldNames()) {
             Optional<String> fieldOptional = bibEntry.getField(field);
             if (fieldOptional.isPresent()) {
-                String fieldContent = RegexBasedSearchRule.LATEX_TO_UNICODE_FORMATTER.format(fieldOptional.get());
-                String fieldContentNoBrackets = RegexBasedSearchRule.LATEX_TO_UNICODE_FORMATTER.format(fieldContent);
+                String fieldContentNoBrackets = bibEntry.getLatexFreeField(field).get();
                 Matcher m = pattern.matcher(fieldContentNoBrackets);
                 if (m.find()) {
                     return true;

diff --git a/src/main/java/net/sf/jabref/model/strings/LatexToUnicode.java b/src/main/java/net/sf/jabref/model/strings/LatexToUnicode.java
@@ -1,21 +1,33 @@
 package net.sf.jabref.model.strings;
 
 import java.util.Map;
+import java.util.regex.Pattern;
 
 public class LatexToUnicode {
 
     private static final Map<String, String> CHARS = HTMLUnicodeConversionMaps.LATEX_UNICODE_CONVERSION_MAP;
     private static final Map<String, String> ACCENTS = HTMLUnicodeConversionMaps.UNICODE_ESCAPED_ACCENTS;
 
+    private static final Pattern AMP_LATEX = Pattern.compile("&|\\\\&");
+    private static final Pattern P_LATEX = Pattern.compile("[\\n]{1,}");
+    private static final Pattern DOLLAR_LATEX = Pattern.compile("\\\\\\$");
+    private static final Pattern DOLLARS_LATEX = Pattern.compile("\\$([^\\$]*)\\$");
+
+    private static final Pattern AMP = Pattern.compile("\\&amp;");
+    private static final Pattern P = Pattern.compile("<p>");
+    private static final Pattern DOLLAR = Pattern.compile("\\&dollar;");
+    private static final Pattern TILDE = Pattern.compile("~");
 
     public String format(String inField) {
         if (inField.isEmpty()) {
             return "";
         }
         int i;
         // TODO: document what does this do
-        String field = inField.replaceAll("&|\\\\&", "&amp;").replaceAll("[\\n]{1,}", "<p>").replace("\\$", "&dollar;") // Replace \$ with &dollar;
-                .replaceAll("\\$([^\\$]*)\\$", "\\{$1\\}");
+        String field = AMP_LATEX.matcher(inField).replaceAll("&amp;");
+        field = P_LATEX.matcher(field).replaceAll("<p>");
+        field = DOLLAR_LATEX.matcher(field).replaceAll("&dollar;");
+        field = DOLLARS_LATEX.matcher(field).replaceAll("\\{$1\\}");
 
         StringBuilder sb = new StringBuilder();
         StringBuilder currentCommand = null;
@@ -187,8 +199,11 @@ public String format(String inField) {
             }
         }
 
-        return sb.toString().replace("&amp;", "&").replace("<p>", "\n").replace("&dollar;", "$").replace("~",
-                "\u00A0");
+        String result = AMP.matcher(sb.toString()).replaceAll("&");
+        result = P.matcher(result).replaceAll("\n");
+        result = DOLLAR.matcher(result).replaceAll("\\$");
+        result = TILDE.matcher(result).replaceAll("\u00A0");
+        return result;
 
     }
 }