diff options
| author | Nick Mathewson <nickm@torproject.org> | 2008-07-30 18:39:02 +0000 |
|---|---|---|
| committer | Nick Mathewson <nickm@torproject.org> | 2008-07-30 18:39:02 +0000 |
| commit | 1c5aca9a62b3a637d7fc9053c6ae40dcc5e2c09b (patch) | |
| tree | 334c810a5cacf95c9096ce7235fdcffef25bc60e /rank.py | |
| parent | 7c6d6e28b679fc50b40cf416f0efeaf1d364fc21 (diff) | |
| download | anonbib-1c5aca9a62b3a637d7fc9053c6ae40dcc5e2c09b.tar.gz | |
Do not actually build a URL opener for ranks until we know we have a cache miss. Under some circumstances, building the opener hits the network.
svn:r291
Diffstat (limited to 'rank.py')
| -rw-r--r-- | rank.py | 8 |
1 files changed, 5 insertions, 3 deletions
@@ -56,9 +56,6 @@ def getCite(title, cache=True, update=True, save=True): title = re.sub("[^'a-zA-Z0-9\. \-\/:]", "", title) title = re.sub("'\/", " ", title) - # Make a custom user agent (so that we are not filtered by Google)! - opener = build_opener() - opener.addheaders = [('User-agent', 'Anon.Bib.0.1')] # We rely on google scholar to return the article with this exact title gurl = "http://scholar.google.com/scholar?as_epq=%s&as_occt=title" @@ -70,6 +67,11 @@ def getCite(title, cache=True, update=True, save=True): page = file(join(cache_folder(), md5h(url)),'r').read() elif update: print "Downloading rank for %r."%title + + # Make a custom user agent (so that we are not filtered by Google)! + opener = build_opener() + opener.addheaders = [('User-agent', 'Anon.Bib.0.1')] + page = opener.open(url).read() if save: file(join(cache_folder(), md5h(url)),'w').write(page) else: |
