also store a complete copy of the document

This commit is contained in:
Albert S. 2018-08-09 21:03:49 +02:00
والد f535372be7
کامیت 6c07601c84

مشاهده پرونده

@@ -60,10 +60,13 @@ def process_pdf(path):
result.append(data)
count += 1
#everything = pagedata()
#everything.page = 0
#everything.content = content.replace("\f", "")
#result.append(everything)
#TODO: temporary hack so that a full-text search (FTS) for several words can match across the whole document
#This of course uses more space, but in practice that is not a big problem.
#Nevertheless, this remains a hack.
everything = pagedata()
everything.page = 0
everything.content = content.replace("\f", "")
result.append(everything)
return result
def process_odt(path):