remove pdf_pagecount()

这个提交包含在:
Albert S. 2018-08-09 23:00:44 +02:00
父节点 07b3479029
当前提交 e006a95673
共有 1 个文件被更改，包括 2 次插入和 5 次删除

查看文件

@ -41,11 +41,8 @@ def strip_irrelevant(content):
result = re.sub(' +', ' ', result)
return result;
def pdf_pagecount(path):
    """Return the page count of the PDF at *path* as reported by ``pdfinfo``.

    ``pdfinfo`` is invoked directly with an argument list (no shell), so a
    path containing spaces, quotes or shell metacharacters is passed through
    verbatim and can never be interpreted as a command.

    Args:
        path: Filesystem path of the PDF file to inspect.

    Returns:
        The number of pages as an ``int``.

    Raises:
        ValueError: If ``pdfinfo`` cannot be started or its output contains
            no parsable ``Pages:`` line (e.g. missing or corrupt file).
    """
    try:
        proc = subprocess.Popen(
            ["pdfinfo", path],
            stdout=subprocess.PIPE,
            stderr=subprocess.PIPE,
        )
    except OSError as err:
        # The old shell pipeline surfaced a missing binary as ValueError
        # (int() on empty output); keep that exception type for callers.
        raise ValueError("could not run pdfinfo: %s" % (err,))
    stdout, _ = proc.communicate()

    # Replaces the former `grep Pages | awk '{print $2}'` stage: take the
    # second whitespace-separated field of the "Pages:" line.
    for line in stdout.splitlines():
        if line.startswith(b"Pages:"):
            fields = line.split()
            if len(fields) > 1:
                return int(fields[1])
    raise ValueError("pdfinfo reported no page count for %r" % (path,))
def process_pdf(path):
result = list()
args=["pdftotext", path, "-"]