1 files changed, 62 insertions, 53 deletions
diff --git a/background_scripts/search_engines.coffee b/background_scripts/search_engines.coffee
index e68cf85d..3c6654e3 100644
--- a/background_scripts/search_engines.coffee
+++ b/background_scripts/search_engines.coffee
@@ -1,49 +1,54 @@
 
-matchesAnyRegexp = (regexps, string) ->
-  for re in regexps
-    return true if re.test string
-  false
-
-# Each completer implements three functions:
+# A completion engine provides search suggestions for a search engine.  A search engine is identified by a
+# "searchUrl", e.g. Settings.get("searchUrl"), or a custom search engine.
+#
+# Each completion engine defines three functions:
+#
+#   1. "match" - This takes a searchUrl, and returns a boolean indicating whether this completion engine can
+#      perform completion for the given search engine.
 #
-#   match:  can this completer be used for this search URL?
-#   getUrl: map these query terms to a completion URL.
-#   parse:  extract suggestions from the resulting (successful) XMLHttpRequest.
+#   2. "getUrl" - This takes a list of query terms (queryTerms) and generates a completion URL, that is, a URL
+#      which will provide completions for this completion engine.
 #
-class Google
+#   3. "parse" - This takes a successful XMLHttpRequest object (the request has completed successfully), and
+#      returns a list of suggestions (a list of strings).
+#
+# The main (only) completion entry point is SearchEngines.complete().  This implements all lookup and caching
+# logic.  It is possible to add new completion engines without changing the SearchEngines infrastructure
+# itself.
+
+# A base class for common regexp-based matching engines.
+class RegexpEngine
+  constructor: (@regexps) ->
+  match: (searchUrl) -> Utils.matchesAnyRegexp @regexps, searchUrl
+
+# Completion engine for English-language Google search.
+class Google extends RegexpEngine
   constructor: ->
-    @regexps = [
-      # We include matches for the major English-speaking TLDs.
+    super [
+      # We match the major English-speaking TLDs.
       new RegExp "^https?://[a-z]+\.google\.(com|ie|co.uk|ca|com.au)/"
-      # NOTE(smblott). A  temporary hack, just for me, and just for development. Will be removed.
-      new RegExp "localhost/.*/booky"
+      new RegExp "localhost/cgi-bin/booky" # Only for smblott.
       ]
 
-  name: "Google"
-  match: (searchUrl) -> matchesAnyRegexp @regexps, searchUrl
-
   getUrl: (queryTerms) ->
     "http://suggestqueries.google.com/complete/search?ss_protocol=legace&client=toolbar&q=#{Utils.createSearchQuery queryTerms}"
 
-  # Returns a list of suggestions (strings).
   parse: (xhr) ->
-    suggestions = xhr?.responseXML?.getElementsByTagName "suggestion"
-    return [] unless suggestions
-    for suggestion in suggestions
-      continue unless suggestion = suggestion.getAttribute "data"
-      suggestion
+    try
+      for suggestion in xhr.responseXML.getElementsByTagName "suggestion"
+        continue unless suggestion = suggestion.getAttribute "data"
+        suggestion
+    catch
+      []
 
-class Youtube
+class Youtube extends RegexpEngine
   constructor: ->
-    @regexps = [ new RegExp "https?://[a-z]+\.youtube\.com/results" ]
-
-  name: "YouTube"
-  match: (searchUrl) -> matchesAnyRegexp @regexps, searchUrl
+    super [ new RegExp "https?://[a-z]+\.youtube\.com/results" ]
 
   getUrl: (queryTerms) ->
     "http://suggestqueries.google.com/complete/search?client=youtube&ds=yt&q=#{Utils.createSearchQuery queryTerms}"
 
-  # Returns a list of suggestions (strings).
   parse: (xhr) ->
     try
       text = xhr.responseText
@@ -56,8 +61,6 @@ class Youtube
 # A dummy search engine which is guaranteed to match any search URL, but never produces completions.  This
 # allows the rest of the logic to be written knowing that there will be a search engine match.
 class DummySearchEngine
-  constructor: ->
-  name: "Dummy"
   match: -> true
   # We return a useless URL which we know will succeed, but which won't generate any network traffic.
   getUrl: -> chrome.runtime.getURL "content_scripts/vimium.css"
@@ -72,15 +75,13 @@ SearchEngines =
     callback? null
 
   # Perform an HTTP GET.
-  #   searchUrl is the search engine's URL, e.g. Settings.get("searchUrl").
-  #   url is the URL to fetch.
-  #   callback will be called with a successful XMLHttpRequest object, or null.
   get: (searchUrl, url, callback) ->
-    @requests ?= {} # Maps searchUrls to any outstanding HTTP request for that search engine.
+    @requests ?= {} # Maps a searchUrl to any outstanding HTTP request for that search engine.
     @cancel searchUrl
 
-    # We cache the results of the most-recent 1000 requests with a one-minute expiry.
-    @requestCache ?= new SimpleCache 1 * 60 * 1000, 1000
+    # We cache the results of the most-recent 100 successfully XMLHttpRequests with a ten-second (ie. very
+    # short) expiry.
+    @requestCache ?= new SimpleCache 10 * 1000, 100
 
     if @requestCache.has url
       callback @requestCache.get url
@@ -88,22 +89,23 @@ SearchEngines =
 
     @requests[searchUrl] = xhr = new XMLHttpRequest()
     xhr.open "GET", url, true
-    xhr.timeout = 500
+    # We set a fairly short timeout.  If we block for too long, then we block *all* completers.
+    xhr.timeout = 300
     xhr.ontimeout = => @cancel searchUrl, callback
     xhr.onerror = => @cancel searchUrl, callback
     xhr.send()
 
     xhr.onreadystatechange = =>
       if xhr.readyState == 4
+        @requests[searchUrl] = null
         if xhr.status == 200
-          @requests[searchUrl] = null
           callback @requestCache.set url, xhr
         else
           callback null
 
-  # Look up the search-completion engine for this search URL.  Because of DummySearchEngine, above, we know
-  # there will always be a match.  Imagining that there may be many search engines, and knowing that this is
-  # called for every character entered, we cache the result.
+  # Look up the search-completion engine for this searchUrl.  Because of DummySearchEngine, above, we know
+  # there will always be a match.  Imagining that there may be many completion engines, and knowing that this
+  # is called for every input event in the vomnibar, we cache the result.
   lookupEngine: (searchUrl) ->
     @engineCache ?= new SimpleCache 30 * 60 * 60 * 1000 # 30 hours (these are small, we can keep them longer).
     if @engineCache.has searchUrl
@@ -114,22 +116,24 @@ SearchEngines =
         return @engineCache.set searchUrl, engine if engine.match searchUrl
 
   # This is the main (actually, the only) entry point.
-  #   searchUrl is the search engine's URL, e.g. Settings.get("searchUrl").
-  #   queryTerms are the queryTerms.
-  #   callback will be applied to a list of suggestion strings (which may be an empty list, if anything goes
-  #   wrong).
+  #  - searchUrl is the search engine's URL, e.g. Settings.get("searchUrl"), or a custome search engine's URL.
+  #    This is only used as a key for determining the relevant completion engine.
+  #  - queryTerms are the queryTerms.
+  #  - callback will be applied to a list of suggestion strings (which may be an empty list, if anything goes
+  #    wrong).
   complete: (searchUrl, queryTerms, callback) ->
+    # We can't complete empty queries.
     return callback [] unless 0 < queryTerms.length
 
-    # Don't try to complete general URLs.
+    # We don't complete URLs.
     return callback [] if 1 == queryTerms.length and Utils.isUrl queryTerms[0]
 
-    # Don't try to complete Javascrip URLs.
-    return callback [] if 0 < queryTerms.length and Utils.hasJavascriptPrefix queryTerms[0]
+    # We don't complete Javascript URLs.
+    return callback [] if Utils.hasJavascriptPrefix queryTerms[0]
 
     # Cache completions.  However, completions depend upon both the searchUrl and the query terms.  So we need
-    # to generate a key.  We mix in some nonsense generated by pwgen. There is the possibility of a key clash,
-    # but it's vanishingly small.
+    # to generate a key.  We mix in some nonsense generated by pwgen. A key clash is possible, but vanishingly
+    # unlikely.
     junk = "//Zi?ei5;o//"
     completionCacheKey = searchUrl + junk + queryTerms.join junk
     @completionCache ?= new SimpleCache 6 * 60 * 60 * 1000, 2000 # Six hours, 2000 entries.
@@ -140,9 +144,14 @@ SearchEngines =
     url = engine.getUrl queryTerms
     @get searchUrl, url, (xhr = null) =>
       if xhr?
-        callback @completionCache.set completionCacheKey, engine.parse xhr
+        # We keep at most three suggestions, the top three.  These are most likely to be useful.
+        callback @completionCache.set completionCacheKey, engine.parse(xhr)[...3]
       else
-        callback []
+        callback @completionCache.set completionCacheKey, callback []
+        # We cache failures, but remove them after just ten minutes.  This (it is hoped) avoids repeated
+        # XMLHttpRequest failures over a short period of time.
+        removeCompletionCacheKey = => @completionCache.set completionCacheKey, null
+        setTimeout removeCompletionCacheKey, 10 * 60 * 1000 # Ten minutes.
 
 root = exports ? window
 root.SearchEngines = SearchEngines