aboutsummaryrefslogtreecommitdiffstats
path: root/java/src
diff options
context:
space:
mode:
authorJean Chalard <jchalard@google.com>2012-05-15 11:37:50 -0700
committerAndroid Git Automerger <android-git-automerger@android.com>2012-05-15 11:37:50 -0700
commit47fedb89930c7450885040ab4192f29df8d1f252 (patch)
treedae6bec4e88044e980fd1d0f770358c83640a473 /java/src
parent16c34b1bc5192059eb47986b142a4ac1ced1a468 (diff)
parentf5ac6c725a0e12c1ed796de9f255103b957e1724 (diff)
downloadlatinime-47fedb89930c7450885040ab4192f29df8d1f252.tar.gz
latinime-47fedb89930c7450885040ab4192f29df8d1f252.tar.xz
latinime-47fedb89930c7450885040ab4192f29df8d1f252.zip
am f5ac6c72: Merge "More optimizations" into jb-dev
* commit 'f5ac6c725a0e12c1ed796de9f255103b957e1724': More optimizations
Diffstat (limited to 'java/src')
-rw-r--r--java/src/com/android/inputmethod/latin/makedict/BinaryDictInputOutput.java15
1 files changed, 11 insertions, 4 deletions
diff --git a/java/src/com/android/inputmethod/latin/makedict/BinaryDictInputOutput.java b/java/src/com/android/inputmethod/latin/makedict/BinaryDictInputOutput.java
index 3c818cc56..bb1042324 100644
--- a/java/src/com/android/inputmethod/latin/makedict/BinaryDictInputOutput.java
+++ b/java/src/com/android/inputmethod/latin/makedict/BinaryDictInputOutput.java
@@ -489,10 +489,17 @@ public class BinaryDictInputOutput {
// Merging tails can only be done if there are no attributes. Searching for attributes
// in LatinIME code depends on a total breadth-first ordering, which merging tails
// breaks. If there are no attributes, it should be fine (and reduce the file size)
- // to merge tails, and the following step would be necessary.
- // If eventually the code runs on Android, searching through the whole array each time
- // may be a performance concern.
- list.remove(node);
+ // to merge tails, and removing the node from the list would be necessary. However,
+ // we don't merge tails because breaking the breadth-first ordering would result in
+ // extreme overhead at bigram lookup time (it would make the search function O(n) instead
+ // of the current O(log(n)), where n=number of nodes in the dictionary which is pretty
+ // high).
+ // If no nodes are ever merged, we can't have the same node twice in the list, hence
+ // searching for duplicates is unnecessary. It is also very performance consuming,
+ // since `list' is an ArrayList so it's an O(n) operation that runs on all nodes, making
+ // this simple list.remove operation O(n*n) overall. On Android this overhead is very
+ // high.
+ // For future reference, the code to remove duplicates is simply: list.remove(node);
list.add(node);
final ArrayList<CharGroup> branches = node.mData;
final int nodeSize = branches.size();