21 lines
778 B
Python
21 lines
778 B
Python
# -*- coding: utf-8 -*-
|
|
|
|
import os
|
|
|
|
from ..utils import get_page_layout, get_text_objects
|
|
|
|
|
|
class BaseParser(object):
|
|
"""Defines a base parser."""
|
|
|
|
def _generate_layout(self, filename, layout_kwargs):
|
|
self.filename = filename
|
|
self.layout_kwargs = layout_kwargs
|
|
self.layout, self.dimensions = get_page_layout(filename, **layout_kwargs)
|
|
self.images = get_text_objects(self.layout, ltype="image")
|
|
self.horizontal_text = get_text_objects(self.layout, ltype="horizontal_text")
|
|
self.vertical_text = get_text_objects(self.layout, ltype="vertical_text")
|
|
self.pdf_width, self.pdf_height = self.dimensions
|
|
self.rootname, __ = os.path.splitext(self.filename)
|
|
self.imagename = "".join([self.rootname, ".png"])
|