From ddbfd834af1305e01024f0ef13d0a6f82aa53f74 Mon Sep 17 00:00:00 2001 From: Camil Staps Date: Fri, 8 Dec 2017 13:48:29 +0100 Subject: run.py: don't download missing files --- run.py | 11 +++-------- 1 file changed, 3 insertions(+), 8 deletions(-) diff --git a/run.py b/run.py index 7f0fea9..96fa10e 100755 --- a/run.py +++ b/run.py @@ -4,7 +4,6 @@ import fileinput import json import os from urllib.parse import quote_plus -from urllib.request import urlopen, Request DATADIR = 'data' ERRORFILE = 'errors' @@ -12,13 +11,7 @@ ERRORFILE = 'errors' def get(dbpediaid): outfile = os.path.join(DATADIR, quote_plus(dbpediaid) + '.json') if not os.path.isfile(outfile): - url = 'http://api.nordlys.cc/ec/lookup_id/{}'.format( - quote_plus(dbpediaid.replace('/', '___SLASH')).replace('___SLASH', '/')) - print(url) - result = urlopen(Request(url, - headers={'User-Agent': 'Radboud University'})).read() - with open(outfile, 'w') as f: - f.write(result.decode(encoding='UTF-8')) + return None with open(outfile) as f: return json.load(f) @@ -33,6 +26,8 @@ def run(queries, line, outfile): terms = queries[query].split() try: result = get(dbpediaid) + if result is None: + return for field, values in result.items(): matches = 0 for value in values: -- cgit v1.2.3