8
0
Fork 0
mirror of https://gitlab2.federez.net/re2o/re2o synced 2024-09-19 20:53:09 +00:00
re2o/printer/utils.py
2018-12-06 17:57:37 +01:00

28 lines
844 B
Python

import subprocess
def pdfinfo(file_path):
"""
Uses pdfinfo to extract the PDF meta information.
Returns metainfo in a dictionary.
requires poppler-utils
"""
def _extract(row):
"""Extracts the right hand value from a : delimited row"""
row=row.decode()
return row.split(':', 1)[1].strip()
output = {}
labels = ['Title', 'Author', 'Creator', 'Producer', 'CreationDate', 'ModDate',
'Tagged', 'Pages', 'Encrypted', 'Page size',
'File size', 'Optimized', 'PDF version']
cmd_output = subprocess.check_output(['/usr/bin/pdfinfo', file_path])
for line in cmd_output.splitlines():
for label in labels:
if label in line.decode():
output[label] = _extract(line)
return output