fetchquefix

This commit is contained in:
Andreas Stephanides
2017-01-29 14:31:15 +01:00
parent 3761817c75
commit 8770aaf530
2 changed files with 13 additions and 9 deletions

View File

@@ -38,7 +38,7 @@ def process_url(url,tpe, parent_url):
#clogger.debug("process URL of type "+ tpe + ": " + url) #clogger.debug("process URL of type "+ tpe + ": " + url)
if parent_url is not None: if parent_url is not None:
url=fix_link(parent_url, url) url=fix_link(parent_url, url)
put_fetch_queue((0,tpe,url)) put_fetch_queue((0,tpe,url,{"nofollow":False}))
# process a url list # process a url list

View File

@@ -30,35 +30,39 @@ def work_compile():
def queue_url(tpe, url,params={"nofollow": False}): def queue_url(tpe, url,params={"nofollow": False}):
fetch_queue.put((0,tpe,url,params)) fetch_queue.put((False,tpe,url,params))
#param nofollow = True : Don't follow pagination recursively to only fetch an update #param nofollow = True : Don't follow pagination recursively to only fetch an update
def queue_url_upd(tpe, url,params={"nofollow": True}): def queue_url_upd(tpe, url,params={"nofollow": True}):
fetch_queue.put((0,tpe,url,params)) fetch_queue.put((True,tpe,url,params))
# fetch a page from the url list # fetch a page from the url list
def run_fetch(): def run_fetch():
tc, tpe, url,params = fetch_queue.get() try:
tc, tpe, url, p= fetch_queue.get()
except ValueError:
tc, tpe, url= fetch_queue.get()
if tpe is not "dummyarticle" and tpe is not "dummyindex": if tpe is not "dummyarticle" and tpe is not "dummyindex":
rw=fetch_page(url) rw=fetch_page(url)
else: else:
rw="<p> dummytext</p>" rw="<p> dummytext</p>"
compile_queue.put((0, tpe, {"url": url, "sourcetype": tpe, "raw": rw},params)) compile_queue.put((0, tpe, {"url": url, "sourcetype": tpe, "raw": rw},p))
return rw return rw
# fetch_queue.task_done() # fetch_queue.task_done()
#compile something from the compile list #compile something from the compile list
def run_compile(): def run_compile():
tc,tpe,h,params = compile_queue.get() tc,tpe,h, p = compile_queue.get()
h=do_compile(tpe,h) h=do_compile(tpe,h)
process_queue.put((0,tpe, h,params)) process_queue.put((0,tpe, h,p))
return h return h
# compile_queue.task_done() # compile_queue.task_done()
def run_process(): def run_process():
tc,tpe,h,params = process_queue.get() tc,tpe,h,p = process_queue.get()
do_process(tpe, h,params) do_process(tpe, h,p)
return h return h
# process_queue.task_done() # process_queue.task_done()