Use print() function in both Python 2 and Python 3

Legacy __print__ statements are syntax errors in Python 3 but __print()__ function works as expected in both Python 2 and Python 3.
This commit is contained in:
cclauss 2019-01-09 18:00:43 +01:00
parent a0c8029bc3
commit 244f63da64
5 changed files with 84 additions and 79 deletions

View File

@ -22,6 +22,7 @@
#* * #* *
#*************************************************************************** #***************************************************************************
from __future__ import print_function
__title__="buildpdf" __title__="buildpdf"
__author__ = "Yorik van Havre <yorik@uncreated.net>" __author__ = "Yorik van Havre <yorik@uncreated.net>"
__url__ = "http://www.freecadweb.org" __url__ = "http://www.freecadweb.org"
@ -363,19 +364,19 @@ def crawl():
return 1 return 1
elif PDFCONVERTOR == 'htmldoc': elif PDFCONVERTOR == 'htmldoc':
if os.system('htmldoc --version'): if os.system('htmldoc --version'):
print "Error: Htmldoc not found, exiting." print("Error: Htmldoc not found, exiting.")
return 1 return 1
try: try:
from PyPDF2 import PdfFileReader,PdfFileWriter from PyPDF2 import PdfFileReader,PdfFileWriter
except: except:
print "Error: Python-pypdf2 not installed, exiting." print("Error: Python-pypdf2 not installed, exiting.")
# run ######################################################## # run ########################################################
buildpdffiles() buildpdffiles()
joinpdf() joinpdf()
if VERBOSE: print "All done!" if VERBOSE: print("All done!")
return 0 return 0
@ -389,10 +390,10 @@ def buildpdffiles():
for i in templist: for i in templist:
if i[-5:] == '.html': if i[-5:] == '.html':
fileslist.append(i) fileslist.append(i)
print "converting ",len(fileslist)," pages" print("converting ",len(fileslist)," pages")
i = 1 i = 1
for f in fileslist: for f in fileslist:
print i," : ",f print(i," : ",f)
if PDFCONVERTOR == 'pisa': if PDFCONVERTOR == 'pisa':
createpdf_pisa(f[:-5]) createpdf_pisa(f[:-5])
elif PDFCONVERTOR == 'wkhtmltopdf': elif PDFCONVERTOR == 'wkhtmltopdf':
@ -421,7 +422,7 @@ def createpdf_pisa(pagename):
if (not exists(pagename+".pdf",image=True)) or OVERWRTIE: if (not exists(pagename+".pdf",image=True)) or OVERWRTIE:
infile = open(FOLDER + os.sep + pagename+'.html','ro') infile = open(FOLDER + os.sep + pagename+'.html','ro')
outfile = open(FOLDER + os.sep + pagename+'.pdf','wb') outfile = open(FOLDER + os.sep + pagename+'.pdf','wb')
if VERBOSE: print "Converting " + pagename + " to pdf..." if VERBOSE: print("Converting " + pagename + " to pdf...")
pdf = pisa.CreatePDF(infile,outfile,FOLDER,link_callback=fetch_resources) pdf = pisa.CreatePDF(infile,outfile,FOLDER,link_callback=fetch_resources)
outfile.close() outfile.close()
if pdf.err: if pdf.err:
@ -441,7 +442,7 @@ def createpdf_firefox(pagename):
if os.path.exists(FIREFOXPDFFOLDER + os.sep + pagename + ".pdf"): if os.path.exists(FIREFOXPDFFOLDER + os.sep + pagename + ".pdf"):
shutil.move(FIREFOXPDFFOLDER+os.sep+pagename+".pdf",outfile) shutil.move(FIREFOXPDFFOLDER+os.sep+pagename+".pdf",outfile)
else: else:
print "-----------------------------------------> Couldn't find print output!" print("-----------------------------------------> Couldn't find print output!")
def createpdf_htmldoc(pagename): def createpdf_htmldoc(pagename):
@ -458,16 +459,16 @@ def createpdf_wkhtmltopdf(pagename):
infile = FOLDER + os.sep + pagename+'.html' infile = FOLDER + os.sep + pagename+'.html'
outfile = FOLDER + os.sep + pagename+'.pdf' outfile = FOLDER + os.sep + pagename+'.pdf'
cmd = 'wkhtmltopdf -L 5mm --user-style-sheet '+FOLDER+os.sep+'wkhtmltopdf.css '+infile+' '+outfile cmd = 'wkhtmltopdf -L 5mm --user-style-sheet '+FOLDER+os.sep+'wkhtmltopdf.css '+infile+' '+outfile
print cmd print(cmd)
#return os.system(cmd) #return os.system(cmd)
else: else:
print "skipping" print("skipping")
def joinpdf(): def joinpdf():
"creates one pdf file from several others, following order from the cover" "creates one pdf file from several others, following order from the cover"
from PyPDF2 import PdfFileReader,PdfFileWriter from PyPDF2 import PdfFileReader,PdfFileWriter
if VERBOSE: print "Building table of contents..." if VERBOSE: print("Building table of contents...")
result = PdfFileWriter() result = PdfFileWriter()
createCover() createCover()
@ -488,7 +489,7 @@ def joinpdf():
if page == "end": if page == "end":
parent = False parent = False
continue continue
if VERBOSE: print 'Appending',page, "at position",count if VERBOSE: print('Appending',page, "at position",count)
title = page.replace("_"," ") title = page.replace("_"," ")
pdffile = page + ".pdf" pdffile = page + ".pdf"
if exists(pdffile,True): if exists(pdffile,True):
@ -504,16 +505,16 @@ def joinpdf():
result.addBookmark(title,count,parent) result.addBookmark(title,count,parent)
count += numpages count += numpages
else: else:
print "page",pdffile,"not found, aborting." print("page",pdffile,"not found, aborting.")
sys.exit() sys.exit()
if VERBOSE: print "Writing..." if VERBOSE: print("Writing...")
outputfile = open(FOLDER+os.sep+"freecad.pdf",'wb') outputfile = open(FOLDER+os.sep+"freecad.pdf",'wb')
result.write(outputfile) result.write(outputfile)
outputfile.close() outputfile.close()
if VERBOSE: if VERBOSE:
print ' ' print(' ')
print 'Successfully created '+FOLDER+os.sep+'freecad.pdf' print('Successfully created '+FOLDER+os.sep+'freecad.pdf')
def local(page,image=False): def local(page,image=False):
@ -544,7 +545,7 @@ def makeStyleSheet():
def createCover(): def createCover():
"downloads and creates a cover page" "downloads and creates a cover page"
if VERBOSE: print "fetching " + COVER if VERBOSE: print("fetching " + COVER)
data = (urlopen(COVER).read()) data = (urlopen(COVER).read())
path = FOLDER + os.sep + "Cover.svg" path = FOLDER + os.sep + "Cover.svg"
fil = open(path,'wb') fil = open(path,'wb')

View File

@ -22,6 +22,7 @@
#* * #* *
#*************************************************************************** #***************************************************************************
from __future__ import print_function
__title__="wiki2qhelp" __title__="wiki2qhelp"
__author__ = "Yorik van Havre <yorik@uncreated.net>" __author__ = "Yorik van Havre <yorik@uncreated.net>"
__url__ = "http://www.freecadweb.org" __url__ = "http://www.freecadweb.org"
@ -52,10 +53,10 @@ def crawl():
# tests ############################################### # tests ###############################################
if os.system(QHELPCOMPILER +' -v'): if os.system(QHELPCOMPILER +' -v'):
print "Error: QAssistant not fully installed, exiting." print("Error: QAssistant not fully installed, exiting.")
return 1 return 1
if os.system(QCOLLECTIOMGENERATOR +' -v'): if os.system(QCOLLECTIOMGENERATOR +' -v'):
print "Error: QAssistant not fully installed, exiting." print("Error: QAssistant not fully installed, exiting.")
return 1 return 1
# run ######################################################## # run ########################################################
@ -64,22 +65,22 @@ def crawl():
qhcp = createCollProjectFile() qhcp = createCollProjectFile()
shutil.copy("freecad-icon-64.png","localwiki/freecad-icon-64.png") shutil.copy("freecad-icon-64.png","localwiki/freecad-icon-64.png")
if generate(qhcp) or compile(qhp): if generate(qhcp) or compile(qhp):
print "Error at compiling" print("Error at compiling")
return 1 return 1
if VERBOSE: print "All done!" if VERBOSE: print("All done!")
i=raw_input("Copy the files to their correct location in the source tree? y/n (default=no) ") i=raw_input("Copy the files to their correct location in the source tree? y/n (default=no) ")
if i.upper() in ["Y","YES"]: if i.upper() in ["Y","YES"]:
shutil.copy("localwiki/freecad.qch","../../Doc/freecad.qch") shutil.copy("localwiki/freecad.qch","../../Doc/freecad.qch")
shutil.copy("localwiki/freecad.qhc","../../Doc/freecad.qhc") shutil.copy("localwiki/freecad.qhc","../../Doc/freecad.qhc")
else: else:
print 'Files are in localwiki. Test with "assistant -collectionFile localwiki/freecad.qhc"' print('Files are in localwiki. Test with "assistant -collectionFile localwiki/freecad.qhc"')
return 0 return 0
def compile(qhpfile): def compile(qhpfile):
"compiles the whole html doc with qassistant" "compiles the whole html doc with qassistant"
qchfile = FOLDER + os.sep + "freecad.qch" qchfile = FOLDER + os.sep + "freecad.qch"
if not os.system(QHELPCOMPILER + ' '+qhpfile+' -o '+qchfile): if not os.system(QHELPCOMPILER + ' '+qhpfile+' -o '+qchfile):
if VERBOSE: print "Successfully created",qchfile if VERBOSE: print("Successfully created",qchfile)
return 0 return 0
def generate(qhcpfile): def generate(qhcpfile):
@ -93,7 +94,7 @@ def generate(qhcpfile):
about.close() about.close()
qhcfile = FOLDER + os.sep + "freecad.qhc" qhcfile = FOLDER + os.sep + "freecad.qhc"
if not os.system(QCOLLECTIOMGENERATOR+' '+qhcpfile+' -o '+qhcfile): if not os.system(QCOLLECTIOMGENERATOR+' '+qhcpfile+' -o '+qhcfile):
if VERBOSE: print "Successfully created ",qhcfile if VERBOSE: print("Successfully created ",qhcfile)
return 0 return 0
def createCollProjectFile(): def createCollProjectFile():
@ -131,12 +132,12 @@ def createCollProjectFile():
</docFiles> </docFiles>
</QHelpCollectionProject> </QHelpCollectionProject>
''' '''
if VERBOSE: print "Building project file..." if VERBOSE: print("Building project file...")
qfilename = FOLDER + os.sep + "freecad.qhcp" qfilename = FOLDER + os.sep + "freecad.qhcp"
f = open(qfilename,'w') f = open(qfilename,'w')
f.write(qprojectfile) f.write(qprojectfile)
f.close() f.close()
if VERBOSE: print "Done writing qhcp file",qfilename if VERBOSE: print("Done writing qhcp file",qfilename)
return qfilename return qfilename
def buildtoc(): def buildtoc():
@ -182,7 +183,7 @@ def buildtoc():
if not link: link = 'default.html' if not link: link = 'default.html'
return title,link return title,link
if VERBOSE: print "Building table of contents..." if VERBOSE: print("Building table of contents...")
f = open(FOLDER+os.sep+INDEX+'.html') f = open(FOLDER+os.sep+INDEX+'.html')
html = '' html = ''
for line in f: html += line for line in f: html += line
@ -229,7 +230,7 @@ def buildtoc():
f = open(qfilename,'wb') f = open(qfilename,'wb')
f.write(qhelpfile) f.write(qhelpfile)
f.close() f.close()
if VERBOSE: print "Done writing qhp file",qfilename if VERBOSE: print("Done writing qhp file",qfilename)
return qfilename return qfilename
if __name__ == "__main__": if __name__ == "__main__":

View File

@ -22,6 +22,7 @@
#* * #* *
#*************************************************************************** #***************************************************************************
from __future__ import print_function
__title__="buildwikiindex.py" __title__="buildwikiindex.py"
__author__ = "Yorik van Havre <yorik@uncreated.net>" __author__ = "Yorik van Havre <yorik@uncreated.net>"
__url__ = "http://www.freecadweb.org" __url__ = "http://www.freecadweb.org"
@ -60,15 +61,15 @@ def crawl(pagename=[]):
else: else:
if os.path.exists("wikifiles.txt"): if os.path.exists("wikifiles.txt"):
f = open("wikifiles.txt","r") f = open("wikifiles.txt","r")
if VERBOSE: print "Reading existing list..." if VERBOSE: print("Reading existing list...")
for l in f.readlines(): for l in f.readlines():
if l.strip() != "": if l.strip() != "":
if VERBOSE: print "Adding ",l if VERBOSE: print("Adding ",l)
processed.append(l.strip()) processed.append(l.strip())
f.close() f.close()
if os.path.exists("todolist.txt"): if os.path.exists("todolist.txt"):
f = open("todolist.txt","r") f = open("todolist.txt","r")
if VERBOSE: print "Reading existing todo list..." if VERBOSE: print("Reading existing todo list...")
for l in f.readlines(): for l in f.readlines():
if l.strip() != "": if l.strip() != "":
todolist.append(l.strip()) todolist.append(l.strip())
@ -79,19 +80,19 @@ def crawl(pagename=[]):
while todolist: while todolist:
targetpage = todolist.pop() targetpage = todolist.pop()
if (not targetpage in NORETRIEVE): if (not targetpage in NORETRIEVE):
if VERBOSE: print count, ": Scanning ", targetpage if VERBOSE: print(count, ": Scanning ", targetpage)
pages,images = get(targetpage) pages,images = get(targetpage)
count += 1 count += 1
processed.append(targetpage) processed.append(targetpage)
processed.extend(images) processed.extend(images)
if VERBOSE: print "got",len(pages),"links" if VERBOSE: print("got",len(pages),"links")
for p in pages: for p in pages:
if (not (p in todolist)) and (not (p in processed)): if (not (p in todolist)) and (not (p in processed)):
todolist.append(p) todolist.append(p)
if WRITETHROUGH: if WRITETHROUGH:
writeList(processed) writeList(processed)
writeList(todolist,"todolist.txt") writeList(todolist,"todolist.txt")
if VERBOSE: print "Fetched ", count, " pages" if VERBOSE: print("Fetched ", count, " pages")
if not WRITETHROUGH: if not WRITETHROUGH:
writeList(processed) writeList(processed)
if pagename: if pagename:
@ -156,7 +157,7 @@ def getlinks(html):
NORETRIEVE.append(rg) NORETRIEVE.append(rg)
if not rg in NORETRIEVE: if not rg in NORETRIEVE:
pages.append(rg) pages.append(rg)
print "got link: ",rg print("got link: ",rg)
return pages return pages
def getimagelinks(html): def getimagelinks(html):
@ -167,7 +168,7 @@ def getimagelinks(html):
def fetchpage(page): def fetchpage(page):
"retrieves given page from the wiki" "retrieves given page from the wiki"
print "fetching: ",page print("fetching: ",page)
failcount = 0 failcount = 0
while failcount < MAXFAIL: while failcount < MAXFAIL:
try: try:
@ -175,7 +176,7 @@ def fetchpage(page):
return html return html
except HTTPError: except HTTPError:
failcount += 1 failcount += 1
print 'Error: unable to fetch page ' + page print('Error: unable to fetch page ' + page)
sys.exit() sys.exit()
def cleanList(pagelist): def cleanList(pagelist):
@ -193,7 +194,7 @@ def writeList(pages,filename="wikifiles.txt"):
for p in pages: for p in pages:
f.write(p+"\n") f.write(p+"\n")
f.close() f.close()
if VERBOSE: print "written ",filename if VERBOSE: print("written ",filename)
if __name__ == "__main__": if __name__ == "__main__":
crawl(sys.argv[1:]) crawl(sys.argv[1:])

View File

@ -22,6 +22,7 @@
#* * #* *
#*************************************************************************** #***************************************************************************
from __future__ import print_function
__title__="downloadwiki" __title__="downloadwiki"
__author__ = "Yorik van Havre <yorik@uncreated.net>" __author__ = "Yorik van Havre <yorik@uncreated.net>"
__url__ = "http://www.freecadweb.org" __url__ = "http://www.freecadweb.org"
@ -137,7 +138,7 @@ def crawl():
"downloads an entire wiki site" "downloads an entire wiki site"
global processed global processed
processed = [] processed = []
if VERBOSE: print "crawling ", URL, ", saving in ", FOLDER if VERBOSE: print("crawling ", URL, ", saving in ", FOLDER)
if not os.path.isdir(FOLDER): os.mkdir(FOLDER) if not os.path.isdir(FOLDER): os.mkdir(FOLDER)
file = open(FOLDER + os.sep + "wiki.css",'wb') file = open(FOLDER + os.sep + "wiki.css",'wb')
file.write(css) file.write(css)
@ -151,16 +152,16 @@ def crawl():
for l in lfile: locallist.append(l.replace("\n","")) for l in lfile: locallist.append(l.replace("\n",""))
lfile.close() lfile.close()
todolist = locallist[:] todolist = locallist[:]
print "getting",len(todolist),"files..." print("getting",len(todolist),"files...")
count = 1 count = 1
indexpages = get(INDEX) indexpages = get(INDEX)
while todolist: while todolist:
targetpage = todolist.pop() targetpage = todolist.pop()
if VERBOSE: print count, ": Fetching ", targetpage if VERBOSE: print(count, ": Fetching ", targetpage)
get(targetpage) get(targetpage)
count += 1 count += 1
if VERBOSE: print "Fetched ", count, " pages" if VERBOSE: print("Fetched ", count, " pages")
if VERBOSE: print "All done!" if VERBOSE: print("All done!")
return 0 return 0
def get(page): def get(page):
@ -180,7 +181,7 @@ def get(page):
html = cleanimagelinks(html) html = cleanimagelinks(html)
output(html,page) output(html,page)
else: else:
if VERBOSE: print " skipping",page if VERBOSE: print(" skipping",page)
def getlinks(html): def getlinks(html):
"returns a list of wikipage links in html file" "returns a list of wikipage links in html file"
@ -268,7 +269,7 @@ def cleanimagelinks(html,links=None):
def fetchpage(page): def fetchpage(page):
"retrieves given page from the wiki" "retrieves given page from the wiki"
print " fetching: ",page print(" fetching: ",page)
failcount = 0 failcount = 0
while failcount < MAXFAIL: while failcount < MAXFAIL:
try: try:
@ -276,19 +277,19 @@ def fetchpage(page):
return html return html
except HTTPError: except HTTPError:
failcount += 1 failcount += 1
print 'Error: unable to fetch page ' + page print('Error: unable to fetch page ' + page)
def fetchimage(imagelink): def fetchimage(imagelink):
"retrieves given image from the wiki and saves it" "retrieves given image from the wiki and saves it"
if imagelink[0:5] == "File:": if imagelink[0:5] == "File:":
print "Skipping file page link" print("Skipping file page link")
return return
filename = re.findall('.*/(.*)',imagelink)[0] filename = re.findall('.*/(.*)',imagelink)[0]
if not exists(filename,image=True): if not exists(filename,image=True):
failcount = 0 failcount = 0
while failcount < MAXFAIL: while failcount < MAXFAIL:
try: try:
if VERBOSE: print " fetching " + filename if VERBOSE: print(" fetching " + filename)
data = (urlopen(URL + imagelink).read()) data = (urlopen(URL + imagelink).read())
path = local(filename,image=True) path = local(filename,image=True)
file = open(path,'wb') file = open(path,'wb')
@ -298,11 +299,11 @@ def fetchimage(imagelink):
failcount += 1 failcount += 1
else: else:
processed.append(filename) processed.append(filename)
if VERBOSE: print " saving",local(filename,image=True) if VERBOSE: print(" saving",local(filename,image=True))
return return
print 'Error: unable to fetch file ' + filename print('Error: unable to fetch file ' + filename)
else: else:
if VERBOSE: print " skipping",filename if VERBOSE: print(" skipping",filename)
def local(page,image=False): def local(page,image=False):
"returns a local path for a given page/image" "returns a local path for a given page/image"
@ -337,7 +338,7 @@ def output(html,page):
filename = filename.replace("&pagefrom=","+") filename = filename.replace("&pagefrom=","+")
filename = filename.replace("#mw-pages","") filename = filename.replace("#mw-pages","")
filename = filename.replace(".html.html",".html") filename = filename.replace(".html.html",".html")
print " saving",filename print(" saving",filename)
file = open(filename,'wb') file = open(filename,'wb')
file.write(html) file.write(html)
file.close() file.close()

View File

@ -22,6 +22,7 @@
#* * #* *
#*************************************************************************** #***************************************************************************
from __future__ import print_function
__title__="update.py" __title__="update.py"
__author__ = "Yorik van Havre <yorik@uncreated.net>" __author__ = "Yorik van Havre <yorik@uncreated.net>"
__url__ = "http://www.freecadweb.org" __url__ = "http://www.freecadweb.org"
@ -58,70 +59,70 @@ def update(pagename=None):
if not os.path.exists("revisions.txt"): # case 1) if not os.path.exists("revisions.txt"): # case 1)
if not os.path.exists("wikifiles.txt"): if not os.path.exists("wikifiles.txt"):
print "No wikifiles.txt found. Aborting" print("No wikifiles.txt found. Aborting")
sys.exit() sys.exit()
pages = [] pages = []
f = open("wikifiles.txt","r") f = open("wikifiles.txt","r")
if VERBOSE: print "Reading existing list..." if VERBOSE: print("Reading existing list...")
for l in f.readlines(): for l in f.readlines():
if l.strip() != "": if l.strip() != "":
if not "/wiki/" in l: if not "/wiki/" in l:
if VERBOSE: print "Adding ",l.strip() if VERBOSE: print("Adding ",l.strip())
pages.append(l.strip()) pages.append(l.strip())
f.close() f.close()
if VERBOSE: print "Added ",str(len(pages))," entries" if VERBOSE: print("Added ",str(len(pages))," entries")
i = 1 i = 1
revs = [] revs = []
for page in pages: for page in pages:
rev = getRevision(page) rev = getRevision(page)
if VERBOSE: print str(i)," revision: ",rev if VERBOSE: print(str(i)," revision: ",rev)
revs.append(page+":"+rev) revs.append(page+":"+rev)
i += 1 i += 1
writeList(revs,"revisions.txt") writeList(revs,"revisions.txt")
print "All done. Successfully written revisions.txt with ",len(revs)," entries." print("All done. Successfully written revisions.txt with ",len(revs)," entries.")
elif os.path.exists("revisions.txt") and (not os.path.exists("updates.txt")): # case 2) elif os.path.exists("revisions.txt") and (not os.path.exists("updates.txt")): # case 2)
f = open("revisions.txt","r") f = open("revisions.txt","r")
if VERBOSE: print "Reading revisions list..." if VERBOSE: print("Reading revisions list...")
revisions = {} revisions = {}
for l in f.readlines(): for l in f.readlines():
if l.strip() != "": if l.strip() != "":
r = l.strip().split(":") r = l.strip().split(":")
p = ":".join(r[:-1]) p = ":".join(r[:-1])
if VERBOSE: print "Adding ",p if VERBOSE: print("Adding ",p)
revisions[p] = r[1] revisions[p] = r[1]
f.close() f.close()
if VERBOSE: print "Added ",str(len(revisions.keys()))," entries" if VERBOSE: print("Added ",str(len(revisions.keys()))," entries")
updates = [] updates = []
i = 1 i = 1
for page in revisions.keys(): for page in revisions.keys():
rev = getRevision(page) rev = getRevision(page)
if rev != revisions[page]: if rev != revisions[page]:
if VERBOSE: print str(i),page," has a new revision: ",rev if VERBOSE: print(str(i),page," has a new revision: ",rev)
updates.append(page) updates.append(page)
else: else:
if VERBOSE: print str(i),page," is up to date " if VERBOSE: print(str(i),page," is up to date ")
i += 1 i += 1
if updates: if updates:
writeList(updates,"updates.txt") writeList(updates,"updates.txt")
print "All done. Successfully written updates.txt with ",len(updates)," entries." print("All done. Successfully written updates.txt with ",len(updates)," entries.")
else: else:
print "Everything up to date. Nothing to be done." print("Everything up to date. Nothing to be done.")
elif os.path.exists("revisions.txt") and os.path.exists("updates.txt"): # case 3) elif os.path.exists("revisions.txt") and os.path.exists("updates.txt"): # case 3)
if not os.path.exists("wikifiles.txt"): if not os.path.exists("wikifiles.txt"):
print "No wikifiles.txt found. Aborting" print("No wikifiles.txt found. Aborting")
sys.exit() sys.exit()
wikifiles = [] wikifiles = []
f = open("wikifiles.txt","r") f = open("wikifiles.txt","r")
if VERBOSE: print "Reading wikifiles list..." if VERBOSE: print("Reading wikifiles list...")
for l in f.readlines(): for l in f.readlines():
if l.strip() != "": if l.strip() != "":
wikifiles.append(l.strip()) wikifiles.append(l.strip())
f.close() f.close()
if VERBOSE: print "Read ",str(len(wikifiles))," entries" if VERBOSE: print("Read ",str(len(wikifiles))," entries")
f = open("revisions.txt","r") f = open("revisions.txt","r")
if VERBOSE: print "Reading revisions list..." if VERBOSE: print("Reading revisions list...")
revisions = {} revisions = {}
for l in f.readlines(): for l in f.readlines():
if l.strip() != "": if l.strip() != "":
@ -131,25 +132,25 @@ def update(pagename=None):
f.close() f.close()
todo = [] todo = []
f = open("updates.txt","r") f = open("updates.txt","r")
if VERBOSE: print "Reading updates list..." if VERBOSE: print("Reading updates list...")
for l in f.readlines(): for l in f.readlines():
if l.strip() != "": if l.strip() != "":
todo.append(l.strip()) todo.append(l.strip())
f.close() f.close()
if VERBOSE: print str(len(todo))," pages to scan..." if VERBOSE: print(str(len(todo))," pages to scan...")
import buildwikiindex import buildwikiindex
buildwikiindex.WRITETHROUGH = False buildwikiindex.WRITETHROUGH = False
buildwikiindex.VERBOSE = VERBOSE buildwikiindex.VERBOSE = VERBOSE
updates = [] updates = []
for t in todo: for t in todo:
if VERBOSE: print "Scanning ",t if VERBOSE: print("Scanning ",t)
updates.extend(buildwikiindex.crawl(t)) updates.extend(buildwikiindex.crawl(t))
updates = [u for u in updates if not u in wikifiles] updates = [u for u in updates if not u in wikifiles]
if VERBOSE: print str(len(updates))," files to download..." if VERBOSE: print(str(len(updates))," files to download...")
import downloadwiki import downloadwiki
i = 1 i = 1
for u in updates: for u in updates:
if VERBOSE: print i, ": Fetching ", u if VERBOSE: print(i, ": Fetching ", u)
downloadwiki.get(u) downloadwiki.get(u)
if not "/wiki/" in u: if not "/wiki/" in u:
rev = getRevision(u) rev = getRevision(u)
@ -157,26 +158,26 @@ def update(pagename=None):
if not u in wikifiles: if not u in wikifiles:
wikifiles.append(u) wikifiles.append(u)
i += 1 i += 1
if VERBOSE: print "Updating wikifiles and revisions..." if VERBOSE: print("Updating wikifiles and revisions...")
writeList(wikifiles,"wikifiles.txt") writeList(wikifiles,"wikifiles.txt")
updatedrevs = [] updatedrevs = []
for k in revisions.keys(): for k in revisions.keys():
updatedrevs.append(k+":"+revisions[k]) updatedrevs.append(k+":"+revisions[k])
writeList(updatedrevs,"revisions.txt") writeList(updatedrevs,"revisions.txt")
os.remove("updates.txt") os.remove("updates.txt")
if VERBOSE: print "All done!" if VERBOSE: print("All done!")
def getRevision(page): def getRevision(page):
html = fetchPage(page) html = fetchPage(page)
revs = re.findall("wgCurRevisionId\"\:(.*?),",html) revs = re.findall("wgCurRevisionId\"\:(.*?),",html)
if len(revs) == 1: if len(revs) == 1:
return revs[0] return revs[0]
print 'Error: unable to get revision ID of ' + page print('Error: unable to get revision ID of ' + page)
sys.exit() sys.exit()
def fetchPage(page): def fetchPage(page):
"retrieves given page from the wiki" "retrieves given page from the wiki"
print "fetching: ",page print("fetching: ",page)
failcount = 0 failcount = 0
while failcount < MAXFAIL: while failcount < MAXFAIL:
try: try:
@ -184,7 +185,7 @@ def fetchPage(page):
return html return html
except HTTPError: except HTTPError:
failcount += 1 failcount += 1
print 'Error: unable to fetch page ' + page print('Error: unable to fetch page ' + page)
sys.exit() sys.exit()
def writeList(pages,filename): def writeList(pages,filename):
@ -192,7 +193,7 @@ def writeList(pages,filename):
for p in pages: for p in pages:
f.write(p+"\n") f.write(p+"\n")
f.close() f.close()
if VERBOSE: print "written ",filename if VERBOSE: print("written ",filename)
if __name__ == "__main__": if __name__ == "__main__":
update(sys.argv[1:]) update(sys.argv[1:])