diff --git a/docs/html/pattern-web.html b/docs/html/pattern-web.html index a624585d..b783b638 100644 --- a/docs/html/pattern-web.html +++ b/docs/html/pattern-web.html @@ -83,7 +83,7 @@
The example below downloads an image.
The extension() helper function parses the file extension from a file name:
>>> from pattern.web import URL, extension
->>>
+>>>
>>> url = URL('http://www.clips.ua.ac.be/media/pattern_schema.gif')
>>> f = open('test' + extension(url.page), 'wb') # save as test.gif
>>> f.write(url.download())
@@ -97,7 +97,7 @@ URL mime-type
The URL.mimetype can be used to check the type of document at the given URL. This is more reliable than sniffing the filename extension (which may be omitted).
>>> from pattern.web import URL, MIMETYPE_IMAGE
->>>
+>>>
>>> url = URL('http://www.clips.ua.ac.be/media/pattern_schema.gif')
>>> print url.mimetype in MIMETYPE_IMAGE
@@ -222,7 +222,7 @@ Asynchronous requests
The example below executes a Google query without halting the main program. Instead, it displays a "busy" message (e.g., a progress bar updated in the application's event loop) until request.done.
>>> from pattern.web import asynchronous, time, Google
->>>
+>>>
>>> request = asynchronous(Google().search, 'holy grail', timeout=4)
>>> while not request.done:
>>> time.sleep(0.1)
@@ -236,14 +236,14 @@ Search engine + web services
The SearchEngine object has a number of subclasses that can be used to query different web services (e.g., Google, Wikipedia). SearchEngine.search() returns a list of Result objects for a given query string – similar to a search field and a results page in a browser.
engine = SearchEngine(license=None, throttle=1.0, language=None)
engine.license # Service license key.
engine.throttle # Time between requests (being nice to server).
-engine.language # Restriction for Result.language (e.g., 'en').
+engine.language # Restriction for Result.language (e.g., 'en').
engine.search(query,
type = SEARCH, # SEARCH | IMAGE | NEWS
start = 1, # Starting page.
count = 10, # Results per page.
size = None, # Image size: TINY | SMALL | MEDIUM | LARGE
cached = True) # Cache locally?
Note: SearchEngine.search() takes the same optional parameters as URL.download().
Google, Bing, Twitter, Facebook, Wikipedia, Flickr
-SearchEngine is subclassed by Google, Yahoo, Bing, DuckDuckGo, Twitter, Facebook, Wikipedia, Wiktionary, Wikia, DBPedia, Flickr and Newsfeed. The constructors take the same parameters:
+SearchEngine is subclassed by Google, Bing, DuckDuckGo, Twitter, Facebook, Wikipedia, Wiktionary, Wikia, DBPedia, Flickr and Newsfeed. The constructors take the same parameters:
engine = Google(license=None, throttle=0.5, language=None)
engine = Bing(license=None, throttle=0.5, language=None)
engine = Twitter(license=None, throttle=0.5, language=None)
engine = Facebook(license=None, throttle=1.0, language='en')
engine = Wikipedia(license=None, throttle=5.0, language=None)
engine = Flickr(license=None, throttle=5.0, language=None)
Each search engine has different settings for the search() method. For example, Twitter.search() returns up to 3000 results for a given query (30 queries with 100 results each, or 300 queries with 10 results each). It has a limit of 150 queries per 15 minutes. Each call to search() counts as one query.
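For example, a minimal sketch (the query string is illustrative) that collects as many tweets as possible while staying under the rate limit, catching SearchEngineLimitError if it is exceeded:
>>> from pattern.web import Twitter, SearchEngineLimitError
>>>
>>> engine = Twitter()
>>> tweets = []
>>> try:
>>>     for page in range(1, 31): # 30 queries x 100 results = 3,000.
>>>         tweets.extend(engine.search('holy grail', start=page, count=100))
>>> except SearchEngineLimitError:
>>>     pass # More than 150 queries in 15 minutes.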
@@ -272,14 +272,6 @@ Google, Bing, Twitter, Facebook, Wikipedia, Flickr
0.5
-Yahoo
-SEARCH | NEWS | IMAGE 1 3
-1-1000/count
-1-50
-paid
-0.5
-
-
DuckDuckGo
SEARCH
1
@@ -353,14 +345,13 @@ Google, Bing, Twitter, Facebook, Wikipedia, Flickr
-1 Google, Bing and Yahoo are paid services – see further how to obtain a license key.
+1 Google and Bing are paid services – see further how to obtain a license key.
2 Bing.search(type=NEWS) has a count of 1-15.
-3 Yahoo.search(type=IMAGES) has a count of 1-35.
Web service license key
Some services require a license key. They may work without one, but this implies that you share a public license key (and query limit) with other users of the pattern.web module. If the query limit is exceeded, SearchEngine.search() raises a SearchEngineLimitError.
- Google is a paid service ($1 for 200 queries), with 100 free queries per day. When you obtain a license key (follow the link below), activate "Custom Search API" and "Translate API" under "Services" and look up the key under "API Access".
- Bing is a paid service ($1 for 500 queries), with 5,000 free queries per month.
-- Yahoo is a paid service ($1 for 1250 queries) that requires an OAuth key + secret, which can be passed as a tuple: Yahoo(license=(key, secret)).
-Obtain a license key: Google, Bing, Yahoo, Twitter, Facebook, Flickr.
+Obtain a license key: Google, Bing, Twitter, Facebook, Flickr.
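For example, a minimal sketch (with a hypothetical license key) that passes the key to the constructor and catches the limit error explicitly:
>>> from pattern.web import Google, SearchEngineLimitError
>>>
>>> engine = Google(license='XXXX') # Hypothetical license key.
>>> try:
>>>     results = engine.search('holy grail')
>>> except SearchEngineLimitError:
>>>     print 'query limit exceeded'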
Web service request throttle
A SearchEngine.search() request takes a minimum amount of time to complete, as outlined in the table above. This is intended as etiquette towards the server providing the service. Raise the throttle value if you plan to run multiple queries in batch. Wikipedia requests are especially intensive. If you plan to mine a lot of data from Wikipedia, download the Wikipedia database instead.
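A sketch of a batch setup with a raised throttle (the value and article titles are illustrative):
>>> from pattern.web import Wikipedia
>>>
>>> engine = Wikipedia(throttle=10.0) # Wait at least 10 seconds between requests.
>>> for title in ('cat', 'dog', 'bird'):
>>>     article = engine.search(title, cached=True)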
@@ -379,7 +370,7 @@ Search Engine results
>>> from pattern.web import Bing, SEARCH, plaintext
->>>
+>>>
>>> engine = Bing(license=None) # Enter your license key.
>>> for i in range(1,5):
>>> for result in engine.search('holy handgrenade', type=SEARCH, start=i):
@@ -392,13 +383,13 @@ Search Engine results
Since SearchEngine.search() takes the same optional parameters as URL.download() it is easy to disable local caching, set a proxy server, a throttle (minimum time) or a timeout (maximum time).
>>> from pattern.web import Google
->>>
+>>>
>>> engine = Google(license=None) # Enter your license key.
>>> for result in engine.search('tim', cached=False, proxy=('proxy.com', 'https')):
>>> print result.url
>>> print result.text
Image search
-For Flickr, Bing and Yahoo, image URLs retrieved with search(type=IMAGE) can be filtered by setting the size to TINY, SMALL, MEDIUM, LARGE or None (any size). Images may be subject to copyright.
+For Flickr and Bing, image URLs retrieved with search(type=IMAGE) can be filtered by setting the size to TINY, SMALL, MEDIUM, LARGE or None (any size). Images may be subject to copyright.
For Flickr, use search(copyright=False) to retrieve results with no copyright restrictions (either public domain or Creative Commons by-sa).
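For example, a sketch (the query is illustrative) that retrieves small, copyright-free images from Flickr:
>>> from pattern.web import Flickr, IMAGE, SMALL
>>>
>>> engine = Flickr(license=None) # Enter your license key.
>>> for result in engine.search('kittens', type=IMAGE, size=SMALL, copyright=False):
>>>     print result.url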
For Twitter, each result has a Result.profile property with the URL to the user's profile picture.
@@ -407,7 +398,7 @@ Google translate
Google.translate() returns the translated string in the given language.
Google.identify() returns a (language code, confidence)-tuple for a given string.
>>> from pattern.web import Google
->>>
+>>>
>>> s = "C'est un lapin, lapin de bois. Quoi? Un cadeau."
>>> g = Google()
>>> print g.translate(s, input='fr', output='en', cached=False)
@@ -424,7 +415,7 @@ Twitter search
>>> from pattern.web import Twitter
>>>
>>> t = Twitter()
->>> i = None
+>>> i = None
>>> for j in range(3):
>>> for tweet in t.search('win', start=i, count=10):
>>> print tweet.text
@@ -436,10 +427,10 @@ Twitter streams
Twitter.stream() returns an endless, live stream of Result objects. A Stream is a Python list that accumulates each time Stream.update() is called:
>>> from pattern.web import Twitter, time
->>>
+>>>
>>> s = Twitter().stream('#fail')
>>> for i in range(10):
->>> time.sleep(1)
+>>> time.sleep(1)
>>> s.update(bytes=1024)
>>> print s[-1].text if s else ''
To clear the accumulated list, call Stream.clear().
@@ -477,11 +468,11 @@ Wikipedia article sections
section.string # Section plaintext unicode string.
section.content # Section string minus title.
section.level # Section nested depth (from 0).
-section.links # List of titles of linked articles.
+section.links # List of titles of linked articles.
section.tables # List of WikipediaTable objects.
The following example downloads a Wikipedia article and prints the title of each section, indented according to the section level:
>>> from pattern.web import Wikipedia
->>>
+>>>
>>> article = Wikipedia().search('cat')
>>> for section in article.sections:
>>> print repr(' ' * section.level + section.title)
@@ -525,7 +516,7 @@ DBPedia
DBPedia is a database of structured information mined from Wikipedia and stored as (subject, predicate, object)-triples (e.g., cat is-a animal). DBPedia can be queried with SPARQL, where subject, predicate and/or object can be given as ?variables. The Result objects in the list returned from DBPedia.search() have the variables as additional properties:
>>> from pattern.web import DBPedia
->>>
+>>>
>>> sparql = '\n'.join((
>>> 'prefix dbo: <http://dbpedia.org/ontology/>',
>>> 'select ?person ?place where {',
@@ -547,25 +538,25 @@ Facebook posts, comments & likes
Facebook.search(id, type=COMMENTS) retrieves comments for a given post's Result.id. You can also pass the id of a post or a comment to Facebook.search(id, type=LIKES) to retrieve users that liked it.
>>> from pattern.web import Facebook, NEWS, COMMENTS, LIKES
->>>
+>>>
>>> fb = Facebook(license='your key')
>>> me = fb.profile(id=None) # (id, name, date, gender, locale, likes)-tuple
->>>
+>>>
>>> for post in fb.search(me[0], type=NEWS, count=100):
>>> print repr(post.id)
>>> print repr(post.text)
>>> print repr(post.url)
>>> if post.comments > 0:
->>> print '%i comments' % post.comments
+>>> print '%i comments' % post.comments
>>> print [(r.text, r.author) for r in fb.search(post.id, type=COMMENTS)]
>>> if post.likes > 0:
->>> print '%i likes' % post.likes
+>>> print '%i likes' % post.likes
>>> print [r.author for r in fb.search(post.id, type=LIKES)]
u'530415277_10151455896030278'
u'Tom De Smedt likes CLiPS Research Center'
u'http://www.facebook.com/CLiPS.UA'
-1 likes
+1 likes
[(u'485942414773810', u'CLiPS Research Center')]
...
The maximum count for COMMENTS and LIKES is 1000 (by default, 10).
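For example, a sketch (assuming a valid license key) that retrieves all comments for the post id shown in the output above in a single call:
>>> from pattern.web import Facebook, COMMENTS
>>>
>>> fb = Facebook(license='your key')
>>> comments = fb.search(u'530415277_10151455896030278', type=COMMENTS, count=1000)
>>> print len(comments)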
@@ -575,7 +566,7 @@ RSS + Atom newsfeeds
The Newsfeed object is a wrapper for Mark Pilgrim's Universal Feed Parser. Newsfeed.search() takes the URL of an RSS or Atom news feed and returns a list of Result objects.
>>> from pattern.web import Newsfeed
->>>
+>>>
>>> NATURE = 'http://www.nature.com/nature/current_issue/rss/index.html'
>>> for result in Newsfeed().search(NATURE)[:5]:
>>> print repr(result.title)
@@ -597,7 +588,7 @@ Web sort
sort(
terms = [], # List of search terms.
context = '', # Term used for sorting.
- service = GOOGLE, # GOOGLE | BING | YAHOO | FLICKR
+ service = GOOGLE, # GOOGLE | BING | FLICKR
license = None, # Service license key.
strict = True, # Wrap query in quotes?
prefix = False, # context + term or term + context?
@@ -605,13 +596,13 @@ Web sort
Now let's see who is more dangerous:
>>> from pattern.web import sort
->>>
+>>>
>>> results = sort(terms=[
->>> 'arnold schwarzenegger',
->>> 'chuck norris',
->>> 'dolph lundgren',
+>>> 'arnold schwarzenegger',
+>>> 'chuck norris',
+>>> 'dolph lundgren',
>>> 'steven seagal',
->>> 'sylvester stallone',
+>>> 'sylvester stallone',
>>> 'mickey mouse'], context='dangerous', prefix=True)
>>>
>>> for weight, term in results:
@@ -649,7 +640,7 @@ HTML to plaintext
The following example downloads an HTML document and keeps a minimal amount of formatting (headings, bold, links).
>>> from pattern.web import URL, plaintext
->>>
+>>>
>>> s = URL('http://www.clips.ua.ac.be').download()
>>> s = plaintext(s, keep={'h1':[], 'h2':[], 'strong':[], 'a':['href']})
>>> print s
@@ -742,12 +733,12 @@ Node
>>> from pattern.web import Element
->>>
+>>>
>>> div = Element('<div> <a>1st</a> <a>2nd</a> </div>')
>>> print div('a:first-child')
>>> print div('a:first-child')[0].source
-[Element(tag='a')]
+[Element(tag='a')]
<a>1st</a>
DOM
The top-level element in the Document Object Model.
@@ -756,7 +747,7 @@ DOM
dom.body # <body> Element.
The following example retrieves the most recent reddit entries. The pattern.web module does not include a reddit search engine, but we can parse entries directly from the HTML source. This is called screen scraping, and many websites will strongly dislike it.
>>> from pattern.web import URL, DOM, plaintext
->>>
+>>>
>>> url = URL('http://www.reddit.com/top/')
>>> dom = DOM(url.download(cached=True))
>>> for e in dom('div.entry')[:3]: # Top 3 reddit entries.
@@ -765,13 +756,13 @@ DOM
u'Invisible Kitty'
u'Naturally, he said yes.'
-u"I'd just like to remind everyone that /r/minecraft exists and not everyone wants"
+u"I'd just like to remind everyone that /r/minecraft exists and not everyone wants"
"to have 10 Minecraft posts a day on their front page."
Absolute URLs
Links parsed from the DOM can be relative (e.g., starting with "../" instead of "http://").
To get the absolute URL, you can use the abs() function in combination with URL.redirect:
>>> from pattern.web import URL, DOM, abs
->>>
+>>>
>>> url = URL('http://www.clips.ua.ac.be')
>>> dom = DOM(url.download())
>>> for link in dom('a'):
@@ -783,13 +774,13 @@ PDF Parser
The PDF object (based on PDFMiner) parses the source text from a PDF file.
>>> from pattern.web import URL, PDF
->>>
+>>>
>>> url = URL('http://www.clips.ua.ac.be/sites/default/files/ctrs-002_0.pdf')
>>> pdf = PDF(url.download())
>>> print pdf.string
CLiPS Technical Report series 002 September 7, 2010
-Tom De Smedt, Vincent Van Asch, Walter Daelemans
+Tom De Smedt, Vincent Van Asch, Walter Daelemans
Computational Linguistics & Psycholinguistics Research Center
...
URLs linking to a PDF document can be identified with: URL.mimetype in MIMETYPE_PDF.
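For example (the URL is hypothetical):
>>> from pattern.web import URL, MIMETYPE_PDF
>>>
>>> url = URL('http://www.example.com/paper.pdf') # Hypothetical URL.
>>> print url.mimetype in MIMETYPE_PDF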
@@ -803,7 +794,7 @@ Crawler
crawler.history # Dictionary of (domain, time last visited)-items.
crawler.visited # Dictionary of URLs visited.
crawler.sort # FIFO | LIFO (how new links are queued).
-crawler.done # True when all links have been visited.crawler.push(link, priority=1.0, sort=LIFO)
+crawler.done # True when all links have been visited.
crawler.push(link, priority=1.0, sort=LIFO)
crawler.pop(remove=True)
crawler.next # Yields the next scheduled link = Crawler.pop(False)
crawler.crawl(method=DEPTH) # DEPTH | BREADTH | None.
crawler.priority(link, method=DEPTH)
crawler.follow(link)
@@ -832,7 +823,7 @@ Crawler
>>> from pattern.web import Crawler
>>>
->>> class Polly(Crawler):
+>>> class Polly(Crawler):
>>> def visit(self, link, source=None):
>>> print 'visited:', repr(link.url), 'from:', link.referrer
>>> def fail(self, link):
@@ -852,19 +843,19 @@ Crawler
Crawl function
The crawl() function returns an iterator that yields (Link, source)-tuples. When it is idle (e.g., waiting for the delay on a domain) it yields (None, None).
crawl(
- links = [],
- domains = [],
- delay = 20.0,
- sort = FIFO,
+ links = [],
+ domains = [],
+ delay = 20.0,
+ sort = FIFO,
method = DEPTH, **kwargs)
>>> from pattern.web import crawl
->>>
+>>>
>>> for link, source in crawl('http://www.clips.ua.ac.be/', delay=3, throttle=3):
>>> print link
Link(url=u'http://www.clips.ua.ac.be/')
Link(url=u'http://www.clips.ua.ac.be/#navigation')
-Link(url=u'http://www.clips.ua.ac.be/computational-linguistics')
+Link(url=u'http://www.clips.ua.ac.be/computational-linguistics')
...
@@ -889,7 +880,7 @@ E-mail
The following example retrieves spam e-mails containing the word "wish":
>>> from pattern.web import Mail, GMAIL, SUBJECT
->>>
+>>>
>>> gmail = Mail(username='...', password='...', service=GMAIL)
>>> print gmail.folders.keys()
@@ -914,8 +905,8 @@ Locale
geocode(location) # 'Brussels' => (50.83, 4.33, u'nl', u'Belgium')
This is useful in combination with the geo parameter for Twitter.search() to obtain regional tweets:
>>> from pattern.web import Twitter
->>> from pattern.web.locale import geocode
->>>
+>>> from pattern.web.locale import geocode
+>>>
>>> twitter = Twitter(language='en')
>>> for tweet in twitter.search('restaurant', geo=geocode('Brussels')[:2]):
>>> print tweet.text
diff --git a/examples/01-web/01-google.py b/examples/01-web/01-google.py
index 1fbd2ac7..1fc9c1b4 100644
--- a/examples/01-web/01-google.py
+++ b/examples/01-web/01-google.py
@@ -6,8 +6,8 @@
# The pattern.web module has a SearchEngine class,
# with a SearchEngine.search() method that yields a list of Result objects.
# Each Result has url, title, text, language, author and date properties.
-# Subclasses of SearchEngine include:
-# Google, Bing, Yahoo, Twitter, Facebook, Wikipedia, Wiktionary, Flickr, ...
+# Subclasses of SearchEngine include:
+# Google, Bing, Twitter, Facebook, Wikipedia, Wiktionary, Flickr, ...
# This example retrieves results from Google based on a given query.
# The Google search engine can handle SEARCH type searches.
@@ -17,7 +17,7 @@
# The pattern.web module uses a test account by default,
# with 100 free queries per day shared by all Pattern users.
# If this limit is exceeded, SearchEngineLimitError is raised.
-# You should obtain your own license key at:
+# You should obtain your own license key at:
# https://code.google.com/apis/console/
# Activate "Custom Search API" under "Services" and get the key under "API Access".
# Then use Google(license=[YOUR_KEY]).search().
diff --git a/examples/01-web/11-facebook.py b/examples/01-web/11-facebook.py
index a633cb9c..4924237c 100644
--- a/examples/01-web/11-facebook.py
+++ b/examples/01-web/11-facebook.py
@@ -15,7 +15,7 @@
# 1) Searching for public status updates.
# Search for all status updates that contain the word "horrible".
-try:
+try:
# We'll store the status updates in a Datasheet.
# A Datasheet is a table of rows and columns that can be exported as a CSV-file.
# In the first column, we'll store a unique id for each status update.
@@ -33,7 +33,7 @@
# we get the most recent results instead of those in the local cache.
# Keeping a local cache can also be useful (e.g., while testing)
# because a query is instant when it is executed the second time.
-for status in fb.search("horrible", count=25, cached=False):
+for status in fb.search(262588213843476, count=25, cached=False):
print "=" * 100
print status.id
print status.text
@@ -59,8 +59,8 @@
if license != "":
fb = Facebook(license)
# Facebook.profile() returns a dictionary with author info.
- # By default, this is your own profile.
- # You can also supply the id of another profile,
+ # By default, this is your own profile.
+ # You can also supply the id of another profile,
# or the name of a product page.
me = fb.profile()["id"]
for status in fb.search(me, type=NEWS, count=30, cached=False):
diff --git a/examples/01-web/15-sort.py b/examples/01-web/15-sort.py
index 8134ccfc..0c369253 100644
--- a/examples/01-web/15-sort.py
+++ b/examples/01-web/15-sort.py
@@ -1,29 +1,29 @@
import os, sys; sys.path.insert(0, os.path.join(os.path.dirname(__file__), "..", ".."))
-from pattern.web import GOOGLE, YAHOO, BING, sort
+from pattern.web import GOOGLE, BING, sort
# The pattern.web module includes an interesting sort() algorithm.
# It classifies search terms according to a search engine's total results count.
# When a context is defined, it sorts according to relevancy to the context:
# sort(terms=["black", "green", "red"], context="Darth Vader") =>
-# yields "black" as the best candidate,
+# yields "black" as the best candidate,
# because "black Darth Vader" yields more search results.
results = sort(
terms = [
- "arnold schwarzenegger",
- "chuck norris",
- "dolph lundgren",
+ "arnold schwarzenegger",
+ "chuck norris",
+ "dolph lundgren",
"steven seagal",
- "sylvester stallone",
+ "sylvester stallone",
"mickey mouse",
],
context = "dangerous", # Term used for sorting.
- service = BING, # GOOGLE, YAHOO, BING, ...
+ service = BING, # GOOGLE, BING, ...
license = None, # You should supply your own API license key for the given service.
- strict = True, # Wraps the query in quotes, i.e. 'mac sweet'.
+ strict = True, # Wraps the query in quotes, i.e. 'mac sweet'.
reverse = True, # Reverses term and context: 'sweet mac' instead of 'mac sweet'.
cached = True)
-
+
for weight, term in results:
print "%5.2f" % (weight * 100) + "%", term
\ No newline at end of file
diff --git a/pattern/web/__init__.py b/pattern/web/__init__.py
index b1390eab..343154b1 100644
--- a/pattern/web/__init__.py
+++ b/pattern/web/__init__.py
@@ -58,7 +58,7 @@
MODULE = os.path.dirname(os.path.realpath(__file__))
except:
MODULE = ""
-
+
if sys.version > "3":
long = int
@@ -68,8 +68,8 @@
# assigned to these code points.
GREMLINS = set([
- 0x0152, 0x0153, 0x0160, 0x0161, 0x0178, 0x017E, 0x017D, 0x0192, 0x02C6,
- 0x02DC, 0x2013, 0x2014, 0x201A, 0x201C, 0x201D, 0x201E, 0x2018, 0x2019,
+ 0x0152, 0x0153, 0x0160, 0x0161, 0x0178, 0x017E, 0x017D, 0x0192, 0x02C6,
+ 0x02DC, 0x2013, 0x2014, 0x201A, 0x201C, 0x201D, 0x201E, 0x2018, 0x2019,
0x2020, 0x2021, 0x2022, 0x2026, 0x2030, 0x2039, 0x203A, 0x20AC, 0x2122
])
@@ -81,7 +81,7 @@ def fix(s, ignore=""):
if not isinstance(s, unicode):
s = s.decode("utf-8")
# If this doesn't work,
- # copy & paste string in a Unicode .txt,
+ # copy & paste string in a Unicode .txt,
# and then pass open(f).read() to fix().
u = []
i = 0
@@ -1048,7 +1048,7 @@ def description(self):
@property
def likes(self):
return self.votes
-
+
@property
def retweets(self):
return self.shares
@@ -1077,7 +1077,7 @@ def __setitem__(self, k, v):
def setdefault(self, k, v=None):
return dict.setdefault(self, u(k), self._format(v))
-
+
def update(self, *args, **kwargs):
dict.update(self, [(u(k), self._format(v)) for k, v in dict(*args, **kwargs).items()])
@@ -1233,89 +1233,6 @@ def identify(self, string, **kwargs):
data = u(data.get("language")), float(data.get("confidence"))
return data
-#--- YAHOO -----------------------------------------------------------------------------------------
-# Yahoo! Search is a web search engine owned by Yahoo! Inc.
-# Yahoo! BOSS ("Build Your Own Search Service") is a paid service.
-# http://developer.yahoo.com/search/
-
-YAHOO = "http://yboss.yahooapis.com/ysearch/"
-YAHOO_LICENSE = api.license["Yahoo"]
-
-class Yahoo(SearchEngine):
-
- def __init__(self, license=None, throttle=0.5, language=None):
- SearchEngine.__init__(self, license or YAHOO_LICENSE, throttle, language)
-
- def _authenticate(self, url):
- url.query.update({
- "oauth_version": "1.0",
- "oauth_nonce": oauth.nonce(),
- "oauth_timestamp": oauth.timestamp(),
- "oauth_consumer_key": self.license[0],
- "oauth_signature_method": "HMAC-SHA1"
- })
- url.query["oauth_signature"] = oauth.sign(url.string.split("?")[0], url.query,
- method = url.method,
- secret = self.license[1]
- )
- return url
-
- def search(self, query, type=SEARCH, start=1, count=10, sort=RELEVANCY, size=None, cached=True, **kwargs):
- """ Returns a list of results from Yahoo for the given query.
- - type : SEARCH, IMAGE or NEWS,
- - start: maximum 1000 results => start 1-100 with count=10, 1000/count,
- - count: maximum 50, or 35 for images.
- There is no daily limit, however Yahoo BOSS is a paid service.
- """
- if type not in (SEARCH, IMAGE, NEWS):
- raise SearchEngineTypeError
- if type == SEARCH:
- url = YAHOO + "web"
- if type == IMAGE:
- url = YAHOO + "images"
- if type == NEWS:
- url = YAHOO + "news"
- if not query or count < 1 or start < 1 or start > 1000 / count:
- return Results(YAHOO, query, type)
- # 1) Create request URL.
- url = URL(url, method=GET, query={
- "q": query.replace(" ", "+"),
- "start": 1 + (start-1) * count,
- "count": min(count, type==IMAGE and 35 or 50),
- "format": "json"
- })
- # 2) Restrict language.
- if self.language is not None:
- market = locale.market(self.language)
- if market:
- url.query["market"] = market.lower()
- # 3) Authenticate.
- url = self._authenticate(url)
- # 4) Parse JSON response.
- kwargs.setdefault("unicode", True)
- kwargs.setdefault("throttle", self.throttle)
- try:
- data = url.download(cached=cached, **kwargs)
- except HTTP401Authentication:
- raise HTTP401Authentication("Yahoo %s API is a paid service" % type)
- except HTTP403Forbidden:
- raise SearchEngineLimitError
- data = json.loads(data)
- data = data.get("bossresponse") or {}
- data = data.get({SEARCH:"web", IMAGE:"images", NEWS:"news"}[type], {})
- results = Results(YAHOO, query, type)
- results.total = int(data.get("totalresults") or 0)
- for x in data.get("results", []):
- r = Result(url=None)
- r.url = self.format(x.get("url", x.get("clickurl")))
- r.title = self.format(x.get("title"))
- r.text = self.format(x.get("abstract"))
- r.date = self.format(x.get("date"))
- r.author = self.format(x.get("source"))
- r.language = self.format(x.get("language") and \
- x.get("language").split(" ")[0] or self.language or "")
- results.append(r)
- return results
#--- BING ------------------------------------------------------------------------------------------
# Bing is a web search engine owned by Microsoft.
@@ -1638,12 +1555,12 @@ def search(self, query, type=SEARCH, start=1, count=10, sort=RELEVANCY, size=Non
# If search() is called again with start+1, start from this id.
if isinstance(start, (int, long, float)):
k = (query, kwargs.get("geo"), kwargs.get("date"), int(start), count)
- if results:
- self._pagination[k] = str(int(results[-1].id) - 1)
+ if results:
+ self._pagination[k] = str(int(results[-1].id) - 1)
else:
self._pagination[k] = id
return results
-
+
def profile(self, query, start=1, count=10, **kwargs):
""" Returns a list of results for the given author id, alias or search query.
"""
@@ -1869,13 +1786,13 @@ def index(self, namespace=0, start=None, count=100, cached=True, **kwargs):
start = data.get("query-continue", {}).get("allpages", {})
start = start.get("apcontinue", start.get("apfrom", -1))
raise StopIteration
-
+
# Backwards compatibility.
list = index
def search(self, query, type=SEARCH, start=1, count=10, sort=RELEVANCY, size=None, cached=True, **kwargs):
""" With type=SEARCH, returns a MediaWikiArticle for the given query (case-sensitive).
- With type=ALL, returns a list of results.
+ With type=ALL, returns a list of results.
Each result.title is the title of an article that contains the given query.
"""
if type not in (SEARCH, ALL, "*"):
@@ -2063,7 +1980,7 @@ def plaintext(self, **kwargs):
@property
def html(self):
return self.source
-
+
@property
def src(self):
return self.source
@@ -2100,7 +2017,7 @@ def source(self):
@property
def html(self):
return self.source
-
+
@property
def src(self):
return self.source
@@ -2142,7 +2059,7 @@ def tables(self):
p = self.article._plaintext
f = find_between
for s in f(b[0], b[1], self.source):
- t = self.article.parser.MediaWikiTable(self,
+ t = self.article.parser.MediaWikiTable(self,
title = p((f(r"", "", s) + [""])[0]),
source = b[0] + s + b[1])
# 1) Parse and content and format it as plain text.
@@ -2186,7 +2103,7 @@ def plaintext(self, **kwargs):
@property
def html(self):
return self.source
-
+
@property
def src(self):
return self.source
@@ -2493,7 +2410,7 @@ def search(self, query, type=SPARQL, start=1, count=10, sort=RELEVANCY, size=Non
# Flickr is a popular image hosting and video hosting website.
# http://www.flickr.com/services/api/
-FLICKR = "http://api.flickr.com/services/rest/"
+FLICKR = "https://api.flickr.com/services/rest/"
FLICKR_LICENSE = api.license["Flickr"]
INTERESTING = "interesting"
@@ -2624,23 +2541,22 @@ def _token(self):
"client_secret": "81ff4204e73ecafcd87635a3a3683fbe"
}).download().split("=")[1]
- def search(self, query, type=SEARCH, start=1, count=10, cached=False, **kwargs):
+ def search(self, query, type=NEWS, start=1, count=10, cached=False, **kwargs):
""" Returns a list of results from Facebook public status updates for the given query.
- query: string, or Result.id for NEWS and COMMENTS,
- - type : SEARCH,
+ - type : NEWS,
- start: 1,
- - count: maximum 100 for SEARCH and NEWS, 1000 for COMMENTS and LIKES.
+ - count: maximum 100 for NEWS, 1000 for COMMENTS and LIKES.
There is an hourly limit of +-600 queries (actual amount undisclosed).
"""
- # Facebook.search(type=SEARCH) returns public posts + author.
# Facebook.search(type=NEWS) returns posts for the given author (id | alias | "me").
# Facebook.search(type=COMMENTS) returns comments for the given post id.
# Facebook.search(type=LIKES) returns authors for the given author, post or comments.
# Facebook.search(type=FRIENDS) returns authors for the given author.
# An author is a Facebook user or other entity (e.g., a product page).
- if type not in (SEARCH, NEWS, COMMENTS, LIKES, FRIENDS):
+ if type not in (NEWS, COMMENTS, LIKES, FRIENDS):
raise SearchEngineTypeError
- if type in (SEARCH, NEWS):
+ if type in (NEWS,):
max = 100
if type in (COMMENTS, LIKES):
max = 1000
@@ -2651,15 +2567,6 @@ def search(self, query, type=SEARCH, start=1, count=10, cached=False, **kwargs):
if isinstance(query, FacebookResult):
query = query.id
# 1) Construct request URL.
- if type == SEARCH:
- url = FACEBOOK + type
- url = URL(url, method=GET, query={
- "q": query,
- "type": "post",
- "access_token": self.license,
- "offset": (start-1) * min(count, max),
- "limit": (start-0) * min(count, max)
- })
if type in (NEWS, FEED, COMMENTS, LIKES, FRIENDS):
url = FACEBOOK + (u(query) or "me").replace(FACEBOOK, "") + "/" + type.replace("news", "feed")
url = URL(url, method=GET, query={
@@ -2667,10 +2574,10 @@ def search(self, query, type=SEARCH, start=1, count=10, cached=False, **kwargs):
"offset": (start-1) * min(count, max),
"limit": (start-0) * min(count, max),
})
- if type in (SEARCH, NEWS, FEED):
+ if type in (NEWS, FEED):
url.query["fields"] = ",".join((
- "id", "from", "name", "story", "message", "link", "picture", "created_time", "shares",
- "comments.limit(1).summary(true)",
+ "id", "from", "name", "story", "message", "link", "picture", "created_time", "shares",
+ "comments.limit(1).summary(true)",
"likes.limit(1).summary(true)"
))
# 2) Parse JSON response.
@@ -2737,7 +2644,7 @@ def profile(self, id=None, **kwargs):
locale = data.get("hometown", {}).get("name", ""),
votes = int(data.get("likes", 0)) # (for product pages)
)
-
+
page = profile
#--- PRODUCT REVIEWS -------------------------------------------------------------------------------
@@ -2876,8 +2783,6 @@ def query(string, service=GOOGLE, **kwargs):
service = service.lower()
if service in (GOOGLE, "google", "g"):
engine = Google
- if service in (YAHOO, "yahoo", "y!"):
- engine = Yahoo
if service in (BING, "bing"):
engine = Bing
if service in (DUCKDUCKGO, "duckduckgo", "ddg"):
@@ -2907,7 +2812,6 @@ def query(string, service=GOOGLE, **kwargs):
SERVICES = {
GOOGLE : Google,
- YAHOO : Yahoo,
BING : Bing,
TWITTER : Twitter,
WIKIPEDIA : Wikipedia,
@@ -2924,7 +2828,7 @@ def sort(terms=[], context="", service=GOOGLE, license=None, strict=True, prefix
yields "black" as the best candidate, because "black Darth Vader" is more common in search results.
- terms : list of search terms,
- context : term used for sorting,
- - service : web service name (GOOGLE, YAHOO, BING),
+ - service : web service name (GOOGLE, BING),
- license : web service license id,
- strict : when True the query constructed from term + context is wrapped in quotes.
"""
@@ -3021,7 +2925,7 @@ def traverse(self, visit=lambda node: None):
""" Executes the visit function on this node and each of its child nodes.
"""
visit(self); [node.traverse(visit) for node in self.children]
-
+
def remove(self, child):
""" Removes the given child node (and all nested nodes).
"""
@@ -3043,7 +2947,7 @@ def __str__(self):
return bytestring(self.__unicode__())
def __unicode__(self):
return u(self._p)
-
+
def __call__(self, *args, **kwargs):
pass
@@ -3235,7 +3139,7 @@ def __repr__(self):
def _encode_space(s):
return s.replace(" ", "")
-
+
def _decode_space(s):
return s.replace("", " ")
@@ -3253,11 +3157,11 @@ def __init__(self, s):
s = s.replace(".", " .") # .class
s = s.replace(":", " :") # :pseudo-element
s = s.replace("[", " [") # [attribute="value"]
- s = re.sub(r"\[.*?\]",
- lambda m: re.sub(r" (\#|\.|\:)", "\\1", m.group(0)), s)
- s = re.sub(r"\[.*?\]",
+ s = re.sub(r"\[.*?\]",
+ lambda m: re.sub(r" (\#|\.|\:)", "\\1", m.group(0)), s)
+ s = re.sub(r"\[.*?\]",
lambda m: _encode_space(m.group(0)), s)
- s = re.sub(r":contains\(.*?\)",
+ s = re.sub(r":contains\(.*?\)",
lambda m: _encode_space(m.group(0)), s)
s = s.split(" ")
self.tag, self.id, self.classes, self.pseudo, self.attributes = (
@@ -3297,7 +3201,7 @@ def _first_child(self, e):
for e in e.children:
if isinstance(e, Element):
return e
-
+
def _next_sibling(self, e):
""" Returns the first next sibling Element of the given element.
"""
@@ -3305,7 +3209,7 @@ def _next_sibling(self, e):
e = e.next
if isinstance(e, Element):
return e
-
+
def _previous_sibling(self, e):
""" Returns the last previous sibling Element of the given element.
"""
@@ -3313,7 +3217,7 @@ def _previous_sibling(self, e):
e = e.previous
if isinstance(e, Element):
return e
-
+
def _contains(self, e, s):
""" Returns True if string s occurs in the given element (case-insensitive).
"""
@@ -3383,9 +3287,9 @@ def __init__(self, s):
s = re.sub(r" *\> *", " >", s)
s = re.sub(r" *\< *", " <", s)
s = re.sub(r" *\+ *", " +", s)
- s = re.sub(r"\[.*?\]",
+ s = re.sub(r"\[.*?\]",
lambda m: _encode_space(m.group(0)), s)
- s = re.sub(r":contains\(.*?\)",
+ s = re.sub(r":contains\(.*?\)",
lambda m: _encode_space(m.group(0)), s)
self.append([])
for s in s.split(" "):
@@ -3739,7 +3643,7 @@ class DocumentParserError(Exception):
pass
class DocumentParser(object):
-
+
def __init__(self, path, *args, **kwargs):
""" Parses a text document (e.g., .pdf or .docx),
given as a file path or a string.
@@ -3760,7 +3664,7 @@ def _parse(self, path, *args, **kwargs):
""" Returns a plaintext Unicode string parsed from the given document.
"""
return plaintext(decode_utf8(self.open(path).read()))
-
+
@property
def string(self):
return self.content
@@ -3810,7 +3714,7 @@ class DOCXError(DocumentParserError):
pass
class DOCX(DocumentParser):
-
+
def _parse(self, path, *args, **kwargs):
from docx.docx import opendocx
from docx.docx import getdocumenttext
@@ -3830,7 +3734,7 @@ def parsepdf(path, *args, **kwargs):
""" Returns the content as a Unicode string from the given .pdf file.
"""
return PDF(path, *args, **kwargs).content
-
+
def parsedocx(path, *args, **kwargs):
""" Returns the content as a Unicode string from the given .docx file.
"""
@@ -3853,7 +3757,7 @@ def parsedoc(path, format=None):
return parsehtml(path)
# Brute-force approach if the format is unknown.
for f in (parsepdf, parsedocx, parsehtml):
- try:
+ try:
return f(path)
except:
pass
diff --git a/pattern/web/api.py b/pattern/web/api.py
index 5dfd0d54..882b456c 100644
--- a/pattern/web/api.py
+++ b/pattern/web/api.py
@@ -1,6 +1,6 @@
#--- API LICENSE CONFIGURATION -----------------------------------------------------------------------
# Default license keys used by pattern.web.SearchEngine to contact different API's.
-# Google and Yahoo are paid services for which you need a personal license + payment method.
+# Google is a paid service for which you need a personal license + payment method.
# The default Google license is for testing purposes (= 100 daily queries).
# Wikipedia, Twitter and Facebook are free.
# Bing, Flickr and ProductsWiki use licenses shared among all Pattern users.
@@ -12,9 +12,6 @@
license["Bing"] = \
"VnJEK4HTlntE3SyF58QLkUCLp/78tkYjV1Fl3J7lHa0="
-license["Yahoo"] = \
- ("", "") # OAuth (key, secret)
-
license["DuckDuckGo"] = \
None
diff --git a/test/test.py b/test/test.py
index 40b08a09..3483cb5e 100644
--- a/test/test.py
+++ b/test/test.py
@@ -18,8 +18,8 @@
#---------------------------------------------------------------------------------------------------
# Run all tests.
# pattern.db tests require a valid username and password for MySQL.
-# pattern.web tests require a working internet connection
-# and API license keys (see pattern.web.api.py) for Google and Yahoo API's.
+# pattern.web tests require a working internet connection
+# and an API license key (see pattern.web.api.py) for the Google API.
def suite():
suite = unittest.TestSuite()
diff --git a/test/test_web.py b/test/test_web.py
index 269a6822..95b2d92b 100644
--- a/test/test_web.py
+++ b/test/test_web.py
@@ -15,10 +15,10 @@
#---------------------------------------------------------------------------------------------------
class TestCache(unittest.TestCase):
-
+
def setUp(self):
pass
-
+
def test_cache(self):
# Assert cache unicode.
k, v = "test", u"ünîcødé"
@@ -28,11 +28,11 @@ def test_cache(self):
self.assertEqual(web.cache.age(k), 0)
del web.cache[k]
print("pattern.web.Cache")
-
+
#---------------------------------------------------------------------------------------------------
class TestUnicode(unittest.TestCase):
-
+
def setUp(self):
# Test data with different (or wrong) encodings.
self.strings = (
@@ -43,7 +43,7 @@ def setUp(self):
"ünîcøde",
u"אוניקאָד"
)
-
+
def test_decode_utf8(self):
# Assert unicode.
for s in self.strings:
@@ -55,7 +55,7 @@ def test_encode_utf8(self):
for s in self.strings:
self.assertTrue(isinstance(web.encode_utf8(s), str))
print("pattern.web.encode_utf8()")
-
+
def test_fix(self):
# Assert fix for common Unicode mistakes.
self.assertEqual(web.fix(u"cliché"), u"cliché")
@@ -66,7 +66,7 @@ def test_fix(self):
#---------------------------------------------------------------------------------------------------
class TestURL(unittest.TestCase):
-
+
def setUp(self):
# Test a live URL that has fast response time
self.live = "http://www.google.com/"
@@ -83,7 +83,7 @@ def setUp(self):
"query": {"q": 1},
"anchor": "anchor"
}
-
+
def test_asynchrous(self):
# Assert asynchronous function call (returns 1).
v = web.asynchronous(lambda t: time.sleep(t) or 1, 0.2)
@@ -91,25 +91,25 @@ def test_asynchrous(self):
time.sleep(0.1)
self.assertEqual(v.value, 1)
print("pattern.web.asynchronous()")
-
+
def test_extension(self):
# Assert filename extension.
v = web.extension(os.path.join("pattern", "test", "test-web.py.zip"))
self.assertEqual(v, ".zip")
print("pattern.web.extension()")
-
+
def test_urldecode(self):
# Assert URL decode (inverse of urllib.urlencode).
v = web.urldecode("?user=me&page=1&q=&")
self.assertEqual(v, {"user": "me", "page": 1, "q": None})
print("pattern.web.urldecode()")
-
+
def test_proxy(self):
# Assert URL proxy.
v = web.proxy("www.proxy.com", "https")
self.assertEqual(v, ("www.proxy.com", "https"))
print("pattern.web.proxy()")
-
+
def test_url_parts(self):
# Assert URL._parse and URL.parts{}.
v = web.URL(self.url)
@@ -125,7 +125,7 @@ def test_url_parts(self):
(web.ANCHOR, self.parts["anchor"])):
self.assertEqual(v.parts[a], b)
print("pattern.web.URL.parts")
-
+
def test_url_query(self):
# Assert URL.query and URL.querystring.
v = web.URL(self.url)
@@ -142,7 +142,7 @@ def test_url_query(self):
self.assertEqual(v.query, q[0])
print("pattern.web.URL.query")
print("pattern.web.URL.querystring")
-
+
def test_url_string(self):
# Assert URL._set_string().
v = web.URL("")
@@ -151,7 +151,7 @@ def test_url_string(self):
self.assertEqual(v.parts[web.DOMAIN], "domain.com")
self.assertEqual(v.parts[web.PATH], [])
print("pattern.web.URL.string")
-
+
def test_url(self):
# Assert URL.copy().
v = web.URL(self.url)
@@ -171,7 +171,7 @@ def test_url(self):
self.assertEqual(v.query, self.parts["query"])
self.assertEqual(v.anchor, self.parts["anchor"])
print("pattern.web.URL")
-
+
def test_url_open(self):
# Assert URLError.
v = web.URL(self.live.replace("http://", "htp://"))
@@ -190,7 +190,7 @@ def test_url_open(self):
self.assertTrue(v.open(user_agent=web.MOZILLA, referrer=web.REFERRER) != None)
print("pattern.web.URL.exists")
print("pattern.web.URL.open()")
-
+
def test_url_download(self):
t = time.time()
v = web.URL(self.live).download(cached=False, throttle=0.25, unicode=True)
@@ -200,19 +200,19 @@ def test_url_download(self):
# Assert download rate limiting.
self.assertTrue(t >= 0.25)
print("pattern.web.URL.download()")
-
+
def test_url_mimetype(self):
# Assert URL MIME-type.
v = web.URL(self.live).mimetype
self.assertTrue(v in web.MIMETYPE_WEBPAGE)
print("pattern.web.URL.mimetype")
-
+
def test_url_headers(self):
# Assert URL headers.
v = web.URL(self.live).headers["content-type"].split(";")[0]
self.assertEqual(v, "text/html")
print("pattern.web.URL.headers")
-
+
def test_url_redirect(self):
# Assert URL redirected URL (this depends on where you are).
# In Belgium, it yields "http://www.google.be/".
@@ -233,12 +233,12 @@ def test_abs(self):
v = web.abs(a, base=b)
self.assertEqual(v, b+c+a) # http://domain.com/#anchor
print("pattern.web.abs()")
-
+
def test_base(self):
# Assert base URL domain name.
self.assertEqual(web.base("http://domain.com/home.html"), "domain.com")
print("pattern.web.base()")
-
+
def test_oauth(self):
# Assert OAuth algorithm.
data = {
@@ -247,7 +247,7 @@ def test_oauth(self):
"oauth_nonce": "0",
"oauth_timestamp": 0,
"oauth_consumer_key": "key",
- "oauth_signature_method": "HMAC-SHA1"
+ "oauth_signature_method": "HMAC-SHA1"
}
v = web.oauth.sign("http://yboss.yahooapis.com/ysearch/web", data, secret="secret")
self.assertEqual(v, "RtTu8dxSp3uBzSbsuLAXIWOKfyI=")
@@ -256,10 +256,10 @@ def test_oauth(self):
#---------------------------------------------------------------------------------------------------
class TestPlaintext(unittest.TestCase):
-
+
def setUp(self):
pass
-
+
def test_find_urls(self):
# Assert URL finder with common URL notations.
for url in (
@@ -277,7 +277,7 @@ def test_find_urls(self):
self.assertEqual(web.find_urls("http://domain.net\">domain")[0], "http://domain.net")
self.assertEqual(web.find_urls("domain.com, domain.net"), ["domain.com", "domain.net"])
print("pattern.web.find_urls()")
-
+
def test_find_email(self):
# Assert e-mail finder with common e-mail notations.
s = "firstname.last+name@domain.ac.co.uk"
@@ -288,7 +288,7 @@ def test_find_email(self):
v = web.find_email("("+",".join(s)+")")
self.assertEqual(v, s)
print("pattern.web.find_email()")
-
+
def test_find_between(self):
# Assert search between open tag and close tag.
s = ""
@@ -299,7 +299,7 @@ def test_find_between(self):
v = web.find_between("a", "b", s)
self.assertEqual(v, ["0", "1"])
print("pattern.web.find_between()")
-
+
def test_strip_tags(self):
# Assert HTML parser and tag stripper.
for html, plain in (
@@ -314,19 +314,19 @@ def test_strip_tags(self):
v = web.strip_tags("text", exclude={"a": ["href"]})
self.assertEqual(v, "text")
print("pattern.web.strip_tags()")
-
+
def test_strip_element(self):
# Assert strip elements.
v = web.strip_element("
text ", "p")
self.assertEqual(v, " ")
print("pattern.web.strip_element()")
-
+
def test_strip_between(self):
# Assert strip elements.
v = web.strip_between("
", "
text ")
self.assertEqual(v, " text ")
print("pattern.web.strip_between()")
-
+
def test_strip_javascript(self):
# Assert strip ")
@@ -338,7 +338,7 @@ def test_strip_inline_css(self):
v = web.strip_inline_css(" ")
self.assertEqual(v, " ")
print("pattern.web.strip_inline_css()")
-
+
def test_strip_comments(self):
# Assert strip elements.
v = web.strip_comments(" ")
@@ -350,19 +350,19 @@ def test_strip_forms(self):
v = web.strip_forms(" ")
self.assertEqual(v, " ")
print("pattern.web.strip_forms()")
-
+
def test_encode_entities(self):
# Assert HTML entity encoder (e.g., "&" => "&amp;")
for a, b in (
- ("É", "É"),
- ("&", "&"),
- ("<", "<"),
- (">", ">"),
+ ("É", "É"),
+ ("&", "&"),
+ ("<", "<"),
+ (">", ">"),
('"', """),
("'", "'")):
self.assertEqual(web.encode_entities(a), b)
print("pattern.web.encode_entities()")
-
+
def test_decode_entities(self):
# Assert HTML entity decoder (e.g., "&amp;" => "&")
for a, b in (
@@ -373,7 +373,7 @@ def test_decode_entities(self):
("&foo;", "&foo;")):
self.assertEqual(web.decode_entities(a), b)
print("pattern.web.decode_entities()")
-
+
def test_collapse_spaces(self):
# Assert collapse multiple spaces.
for a, b in (
@@ -386,7 +386,7 @@ def test_collapse_spaces(self):
# Assert preserve indentation.
self.assertEqual(web.collapse_spaces(" . \n", indentation=True), " .")
print("pattern.web.collapse_spaces()")
-
+
def test_collapse_tabs(self):
# Assert collapse multiple tabs to 1 space.
for a, b in (
@@ -398,7 +398,7 @@ def test_collapse_tabs(self):
# Assert preserve indentation.
self.assertEqual(web.collapse_tabs("\t\t .\t\n", indentation=True), "\t\t .")
print("pattern.web.collapse_tabs()")
-
+
def test_collapse_linebreaks(self):
# Assert collapse multiple linebreaks.
for a, b in (
@@ -409,9 +409,9 @@ def test_collapse_linebreaks(self):
(" \n .", "\n .")):
self.assertEqual(web.collapse_linebreaks(a), b)
print("pattern.web.collapse_linebreaks()")
-
+
def test_plaintext(self):
- # Assert plaintext:
+ # Assert plaintext:
# - strip
@@ -744,7 +733,7 @@ def setUp(self):