paperless-ngx/src/documents/management/commands/document_consumer.py

import datetime
import glob
import langdetect
import os
import random
import re
import subprocess
import time

import pyocr

from PIL import Image

from django.conf import settings
from django.core.management.base import BaseCommand, CommandError
from django.template.defaultfilters import slugify
from django.utils import timezone

from paperless.db import GnuPG

from ...languages import ISO639
from ...models import Document, Sender, Tag


class OCRError(Exception):
    """
    Raised when a document cannot be turned into usable text.

    Derives from ``Exception`` rather than ``BaseException``:
    ``BaseException`` is reserved for interpreter-level signals such as
    ``KeyboardInterrupt`` and ``SystemExit``, and deriving from it would let
    this error slip past ordinary ``except Exception`` handlers.
    """


class Command(BaseCommand):
    """
    Loop over every file found in CONSUMPTION_DIR and:
      1. Convert it to greyscale png(s), one per page
      2. OCR the png(s) with the first OCR tool pyocr reports as available
      3. Store the OCR'd text in the database
      4. Encrypt and store the document at the record's source path
      5. Delete the document and image(s)

    A file is only consumed once its mtime has been unchanged between two
    consecutive passes, so documents still being written are left alone.
    """

    LOOP_TIME = 10  # Seconds

    CONVERT = settings.CONVERT_BINARY
    SCRATCH = settings.SCRATCH_DIR
    CONSUME = settings.CONSUMPTION_DIR

    # First OCR backend pyocr can find, or None when nothing is installed.
    # The None case is reported as a CommandError by _setup() instead of an
    # IndexError while this module is being imported.
    OCR = next(iter(pyocr.get_available_tools()), None)
    DEFAULT_OCR_LANGUAGE = settings.OCR_LANGUAGE
    MEDIA_DOCS = os.path.join(settings.MEDIA_ROOT, "documents")

    PARSER_REGEX_TITLE = re.compile(
        r"^.*/(.*)\.(pdf|jpe?g|png|gif|tiff)$", flags=re.IGNORECASE)
    # The sender/title groups must not cross a "/": otherwise a directory
    # whose name contains " - " would be mistaken for the sender.
    PARSER_REGEX_SENDER_TITLE = re.compile(
        r"^.*/([^/]*) - ([^/]*)\.(pdf|jpe?g|png|gif|tiff)$",
        flags=re.IGNORECASE)

    def __init__(self, *args, **kwargs):

        self.verbosity = 0
        self.stats = {}    # path -> mtime seen on the previous pass
        self._ignore = []  # paths that failed and must not be retried

        super().__init__(*args, **kwargs)

    def handle(self, *args, **options):
        """
        Entry point: validate the environment, then poll the consumption
        directory every LOOP_TIME seconds until interrupted with Ctrl-C.
        """

        self.verbosity = options["verbosity"]

        self._setup()

        try:
            while True:
                self.loop()
                time.sleep(self.LOOP_TIME)
                if self.verbosity > 1:
                    print(".")
        except KeyboardInterrupt:
            print("Exiting")

    def loop(self):
        """
        Make one pass over the consumption directory and consume every
        supported file that is ready.  Files that cannot be converted or
        OCR'd are remembered in ``self._ignore`` and skipped from then on.
        """

        for name in os.listdir(self.CONSUME):

            doc = os.path.join(self.CONSUME, name)

            if not os.path.isfile(doc):
                continue

            if not self.PARSER_REGEX_TITLE.match(doc):
                continue

            if doc in self._ignore:
                continue

            # Skip files whose mtime is still changing; they are picked up
            # on a later pass once they have settled.
            if not self._is_ready(doc):
                continue

            self._render("Consuming {}".format(doc), 1)

            pngs = []
            try:
                pngs = self._get_greyscale(doc)
                text = self._get_ocr(pngs)
            except OCRError:
                self._ignore.append(doc)
                self._render("OCR FAILURE: {}".format(doc), 0)
                # Don't leave the temporary images behind in the scratch
                # directory; the source document itself is kept.
                self._remove_files(pngs)
                continue

            self._store(text, doc)
            self._cleanup(pngs, doc)

    def _setup(self):
        """
        Check the configuration and create the working directories.

        Raises CommandError if the consumption directory is unset or
        missing, or if pyocr found no OCR tool.
        """

        if not self.CONSUME:
            raise CommandError(
                "The CONSUMPTION_DIR settings variable does not appear to be "
                "set."
            )

        if not os.path.exists(self.CONSUME):
            raise CommandError("Consumption directory {} does not exist".format(
                self.CONSUME))

        if self.OCR is None:
            raise CommandError(
                "No OCR tool could be found by pyocr; is tesseract installed?"
            )

        for d in (self.SCRATCH, self.MEDIA_DOCS):
            os.makedirs(d, exist_ok=True)

    def _is_ready(self, doc):
        """
        Detect whether `doc` is ready to consume or if it's still being written
        to by the scanner.

        Returns True when the file's mtime equals the one recorded on the
        previous call for the same path (the record is then dropped), and
        False otherwise, after recording the current mtime.
        """

        t = os.stat(doc).st_mtime

        if self.stats.get(doc) == t:
            del self.stats[doc]
            return True

        self.stats[doc] = t

        return False

    @staticmethod
    def _page_number(path):
        """
        Return the numeric page suffix of a "<prefix>-<n>.png" path, or 0
        for a path without such a suffix.
        """
        m = re.search(r"-(\d+)\.png$", path)
        return int(m.group(1)) if m else 0

    def _get_greyscale(self, doc):
        """
        Convert `doc` into greyscale png(s) inside the scratch directory.

        Returns the generated paths in page order.  Raises OCRError when
        the convert binary produced no image at all.
        """

        self._render("  Generating greyscale image", 2)

        i = random.randint(1000000, 9999999)
        png = os.path.join(self.SCRATCH, "{}.png".format(i))

        subprocess.call((
            self.CONVERT, "-density", "300", "-depth", "8",
            "-type", "grayscale", doc, png
        ))

        pngs = glob.glob(os.path.join(self.SCRATCH, "{}*".format(i)))

        if not pngs:
            raise OCRError("No images were generated for {}".format(doc))

        # Order by page number, not lexicographically: a plain sort would
        # put "-10.png" ahead of "-2.png".
        return sorted(pngs, key=lambda p: (self._page_number(p), p))

    def _get_ocr(self, pngs):
        """
        OCR `pngs` and return the text.

        The images are first parsed with DEFAULT_OCR_LANGUAGE.  If language
        detection on that text points at a different known language, the
        images are parsed again for it.  Raises OCRError when detection or
        the second parse fails, unless settings.FORGIVING_OCR is enabled,
        in which case the first-pass text is returned.
        """

        self._render("  OCRing the document", 2)

        raw_text = self._ocr(pngs, self.DEFAULT_OCR_LANGUAGE)

        try:
            guessed_language = langdetect.detect(raw_text)
        except langdetect.lang_detect_exception.LangDetectException:
            # Raised for blank/feature-less text; handle it like any other
            # unknown language rather than crashing the consumer.
            guessed_language = None

        self._render("    Language detected: {}".format(guessed_language), 2)

        if guessed_language not in ISO639:
            self._render("Language detection failed!", 0)
            if settings.FORGIVING_OCR:
                self._render(
                    "As FORGIVING_OCR is enabled, we're going to make the best "
                    "with what we have.",
                    1
                )
                return raw_text
            raise OCRError

        if ISO639[guessed_language] == self.DEFAULT_OCR_LANGUAGE:
            return raw_text

        try:
            return self._ocr(pngs, ISO639[guessed_language])
        except pyocr.pyocr.tesseract.TesseractError:
            if settings.FORGIVING_OCR:
                self._render(
                    "OCR for {} failed, but we're going to stick with what "
                    "we've got since FORGIVING_OCR is enabled.".format(
                        guessed_language
                    ),
                    0
                )
                return raw_text
            raise OCRError

    def _ocr(self, pngs, lang):
        """
        Run the OCR tool over each image in `pngs` for language `lang` and
        return the combined text with whitespace runs collapsed.
        """

        self._render("    Parsing for {}".format(lang), 2)

        pages = []
        for png in pngs:
            # `png` already includes the scratch directory; joining it on
            # again would break when SCRATCH is a relative path.
            with Image.open(png) as f:
                self._render("    {}".format(f.filename), 3)
                pages.append(self.OCR.image_to_string(f, lang=lang))

        # Pages are joined with a space so words at a page boundary don't
        # fuse together.
        # Strip out excess white space to allow matching to go smoother
        return re.sub(r"\s+", " ", " ".join(pages))

    def _store(self, text, doc):
        """
        Create the Document record for `doc` with `text` as its content,
        attach every Tag that matches the text, and write the encrypted
        file to the record's source path.
        """

        sender, title, file_type = self._parse_file_name(doc)

        lower_text = text.lower()
        relevant_tags = [t for t in Tag.objects.all() if t.matches(lower_text)]

        stats = os.stat(doc)
        # The file's mtime is used for both the created and modified stamps
        mtime = timezone.make_aware(
            datetime.datetime.fromtimestamp(stats.st_mtime))

        self._render("  Saving record to database", 2)

        document = Document.objects.create(
            sender=sender,
            title=title,
            content=text,
            file_type=file_type,
            created=mtime,
            modified=mtime
        )

        if relevant_tags:
            tag_names = ", ".join([t.slug for t in relevant_tags])
            self._render("    Tagging with {}".format(tag_names), 2)
            document.tags.add(*relevant_tags)

        with open(doc, "rb") as unencrypted:
            with open(document.source_path, "wb") as encrypted:
                self._render("  Encrypting", 3)
                encrypted.write(GnuPG.encrypted(unencrypted))

    def _parse_file_name(self, doc):
        """
        We use a crude naming convention to make handling the sender and title
        easier:
          "<sender> - <title>.<suffix>"

        Returns a (sender, title, file_type) tuple; sender is None when the
        name has no "<sender> - " part.  `doc` must match
        PARSER_REGEX_TITLE, which loop() guarantees.
        """

        # First we attempt "<sender> - <title>.<suffix>"
        m = self.PARSER_REGEX_SENDER_TITLE.match(doc)
        if m:
            sender_name, title, file_type = m.groups()
            sender, __ = Sender.objects.get_or_create(
                name=sender_name, defaults={"slug": slugify(sender_name)})
            return sender, title, file_type

        # That didn't work, so we assume sender is None
        m = self.PARSER_REGEX_TITLE.match(doc)
        return None, m.group(1), m.group(2)

    def _remove_files(self, paths):
        """
        Delete every path in `paths`, announcing each at verbosity 2.
        """
        for f in paths:
            self._render("  Deleting {}".format(f), 2)
            os.unlink(f)

    def _cleanup(self, pngs, doc):
        """
        Delete the temporary images in `pngs` and the consumed `doc`.
        """

        # `pngs` already lists every image generated for this document, so
        # there is no need to rebuild a glob from the first file's name.
        self._remove_files(list(pngs) + [doc])

        self._render("", 2)

    def _render(self, text, verbosity):
        """
        Print `text` if the command's verbosity is at least `verbosity`.
        """
        if self.verbosity >= verbosity:
            print(text)
Changed the consumer into a loop 2015-12-26 13:21:33 +00:00			`import datetime`
It works! 2015-12-20 19:23:33 +00:00			`import glob`
Introducing language detection 2016-01-21 12:50:22 -05:00			`import langdetect`
It works! 2015-12-20 19:23:33 +00:00			`import os`
			`import random`
			`import re`
			`import subprocess`
Restructured the consumer into a loop and added a check for scans in-progress 2015-12-21 02:44:24 +00:00			`import time`
It works! 2015-12-20 19:23:33 +00:00
			`import pyocr`

			`from PIL import Image`

			`from django.conf import settings`
Fixed a few consumer bugs and added an exporter Rename exporter to export and fixt some debugging Account for files not matching the sender/title pattern Added a safety note Wrong regex on the name parser Renamed the command to something slightly less ambiguous 2016-01-14 19:47:57 +00:00			`from django.core.management.base import BaseCommand, CommandError`
Actually handle the change to using a Sender model 2016-01-15 02:02:47 +00:00			`from django.template.defaultfilters import slugify`
Changed the consumer into a loop 2015-12-26 13:21:33 +00:00			`from django.utils import timezone`
It works! 2015-12-20 19:23:33 +00:00
pep8 2016-01-23 02:58:03 +00:00			`from paperless.db import GnuPG`

Added language detection 2016-01-23 02:33:29 +00:00			`from ...languages import ISO639`
#11: automatic tagging support 2016-01-28 07:23:11 +00:00			`from ...models import Document, Sender, Tag`
It works! 2015-12-20 19:23:33 +00:00

Added language detection 2016-01-23 02:33:29 +00:00			`class OCRError(BaseException):`
			`pass`


It works! 2015-12-20 19:23:33 +00:00			`class Command(BaseCommand):`
			`"""`
			`Loop over every file found in CONSUMPTION_DIR and:`
Updated the docstring to show what's actually happening 2016-01-10 15:51:38 +00:00			`1. Convert it to a greyscale png`
			`2. Use tesseract on the png`
#12: Support image documents 2016-01-29 23:18:03 +00:00			`3. Encrypt and store the document in the MEDIA_ROOT`
Updated the docstring to show what's actually happening 2016-01-10 15:51:38 +00:00			`4. Store the OCR'd text in the database`
#12: Support image documents 2016-01-29 23:18:03 +00:00			`5. Delete the document and image(s)`
It works! 2015-12-20 19:23:33 +00:00			`"""`

Changed the consumer into a loop 2015-12-26 13:21:33 +00:00			`LOOP_TIME = 10 # Seconds`

It works! 2015-12-20 19:23:33 +00:00			`CONVERT = settings.CONVERT_BINARY`
			`SCRATCH = settings.SCRATCH_DIR`
			`CONSUME = settings.CONSUMPTION_DIR`

			`OCR = pyocr.get_available_tools()[0]`
Added language detection 2016-01-23 02:33:29 +00:00			`DEFAULT_OCR_LANGUAGE = settings.OCR_LANGUAGE`
#12: Support image documents 2016-01-29 23:18:03 +00:00			`MEDIA_DOCS = os.path.join(settings.MEDIA_ROOT, "documents")`
It works! 2015-12-20 19:23:33 +00:00
#12: Support image documents 2016-01-29 23:18:03 +00:00			`PARSER_REGEX_TITLE = re.compile(`
			`r"^./(.)\.(pdf\|jpe?g\|png\|gif\|tiff)$", flags=re.IGNORECASE)`
			`PARSER_REGEX_SENDER_TITLE = re.compile(`
			`r"^./(.) - (.*)\.(pdf\|jpe?g\|png\|gif\|tiff)", flags=re.IGNORECASE)`
Restructured the consumer into a loop and added a check for scans in-progress 2015-12-21 02:44:24 +00:00
It works! 2015-12-20 19:23:33 +00:00			`def __init__(self, args, *kwargs):`
Introducing language detection 2016-01-21 12:50:22 -05:00
It works! 2015-12-20 19:23:33 +00:00			`self.verbosity = 0`
Restructured the consumer into a loop and added a check for scans in-progress 2015-12-21 02:44:24 +00:00			`self.stats = {}`
Added language detection 2016-01-23 02:33:29 +00:00			`self._ignore = []`
Introducing language detection 2016-01-21 12:50:22 -05:00
It works! 2015-12-20 19:23:33 +00:00			`BaseCommand.__init__(self, args, *kwargs)`

			`def handle(self, args, *options):`

			`self.verbosity = options["verbosity"]`

			`self._setup()`

Restructured the consumer into a loop and added a check for scans in-progress 2015-12-21 02:44:24 +00:00			`try:`
			`while True:`
			`self.loop()`
Changed the consumer into a loop 2015-12-26 13:21:33 +00:00			`time.sleep(self.LOOP_TIME)`
			`if self.verbosity > 1:`
			`print(".")`
Restructured the consumer into a loop and added a check for scans in-progress 2015-12-21 02:44:24 +00:00			`except KeyboardInterrupt:`
			`print("Exiting")`

			`def loop(self):`

#12: Support image documents 2016-01-29 23:18:03 +00:00			`for doc in os.listdir(self.CONSUME):`
It works! 2015-12-20 19:23:33 +00:00
#12: Support image documents 2016-01-29 23:18:03 +00:00			`doc = os.path.join(self.CONSUME, doc)`
Restructured the consumer into a loop and added a check for scans in-progress 2015-12-21 02:44:24 +00:00
#12: Support image documents 2016-01-29 23:18:03 +00:00			`if not os.path.isfile(doc):`
It works! 2015-12-20 19:23:33 +00:00			`continue`

#12: Support image documents 2016-01-29 23:18:03 +00:00			`if not re.match(self.PARSER_REGEX_TITLE, doc):`
It works! 2015-12-20 19:23:33 +00:00			`continue`

#12: Support image documents 2016-01-29 23:18:03 +00:00			`if doc in self._ignore:`
Added language detection 2016-01-23 02:33:29 +00:00			`continue`

#12: Support image documents 2016-01-29 23:18:03 +00:00			`if self._is_ready(doc):`
Restructured the consumer into a loop and added a check for scans in-progress 2015-12-21 02:44:24 +00:00			`continue`

#12: Support image documents 2016-01-29 23:18:03 +00:00			`self._render("Consuming {}".format(doc), 1)`
It works! 2015-12-20 19:23:33 +00:00
#12: Support image documents 2016-01-29 23:18:03 +00:00			`pngs = self._get_greyscale(doc)`
Added language detection 2016-01-23 02:33:29 +00:00
			`try:`
			`text = self._get_ocr(pngs)`
			`except OCRError:`
#12: Support image documents 2016-01-29 23:18:03 +00:00			`self._ignore.append(doc)`
			`self._render("OCR FAILURE: {}".format(doc), 0)`
Added language detection 2016-01-23 02:33:29 +00:00			`continue`
It works! 2015-12-20 19:23:33 +00:00
#12: Support image documents 2016-01-29 23:18:03 +00:00			`self._store(text, doc)`
			`self._cleanup(pngs, doc)`
It works! 2015-12-20 19:23:33 +00:00
			`def _setup(self):`
Smarter check positions 2016-01-23 03:42:39 +00:00
			`if not self.CONSUME:`
			`raise CommandError(`
			`"The CONSUMPTION_DIR settings variable does not appear to be "`
			`"set."`
			`)`

			`if not os.path.exists(self.CONSUME):`
			`raise CommandError("Consumption directory {} does not exist".format(`
			`self.CONSUME))`

#12: Support image documents 2016-01-29 23:18:03 +00:00			`for d in (self.SCRATCH, self.MEDIA_DOCS):`
It works! 2015-12-20 19:23:33 +00:00			`try:`
			`os.makedirs(d)`
			`except FileExistsError:`
			`pass`

#12: Support image documents 2016-01-29 23:18:03 +00:00			`def _is_ready(self, doc):`
Restructured the consumer into a loop and added a check for scans in-progress 2015-12-21 02:44:24 +00:00			`"""`
#12: Support image documents 2016-01-29 23:18:03 +00:00			Detect whether `doc` is ready to consume or if it's still being written
Restructured the consumer into a loop and added a check for scans in-progress 2015-12-21 02:44:24 +00:00			`to by the scanner.`
			`"""`

#12: Support image documents 2016-01-29 23:18:03 +00:00			`t = os.stat(doc).st_mtime`
Restructured the consumer into a loop and added a check for scans in-progress 2015-12-21 02:44:24 +00:00
#12: Support image documents 2016-01-29 23:18:03 +00:00			`if self.stats.get(doc) == t:`
			`del(self.stats[doc])`
Restructured the consumer into a loop and added a check for scans in-progress 2015-12-21 02:44:24 +00:00			`return True`

#12: Support image documents 2016-01-29 23:18:03 +00:00			`self.stats[doc] = t`
Restructured the consumer into a loop and added a check for scans in-progress 2015-12-21 02:44:24 +00:00
			`return False`

#12: Support image documents 2016-01-29 23:18:03 +00:00			`def _get_greyscale(self, doc):`
It works! 2015-12-20 19:23:33 +00:00
Added GPG encryption for the PDFs 2016-01-01 16:13:59 +00:00			`self._render(" Generating greyscale image", 2)`

			`i = random.randint(1000000, 9999999)`
It works! 2015-12-20 19:23:33 +00:00			`png = os.path.join(self.SCRATCH, "{}.png".format(i))`

			`subprocess.Popen((`
			`self.CONVERT, "-density", "300", "-depth", "8",`
#12: Support image documents 2016-01-29 23:18:03 +00:00			`"-type", "grayscale", doc, png`
It works! 2015-12-20 19:23:33 +00:00			`)).wait()`

			`return sorted(glob.glob(os.path.join(self.SCRATCH, "{}*".format(i))))`

			`def _get_ocr(self, pngs):`

#12: Support image documents 2016-01-29 23:18:03 +00:00			`self._render(" OCRing the document", 2)`
Added GPG encryption for the PDFs 2016-01-01 16:13:59 +00:00
Added language detection 2016-01-23 02:33:29 +00:00			`raw_text = self._ocr(pngs, self.DEFAULT_OCR_LANGUAGE)`
Introducing language detection 2016-01-21 12:50:22 -05:00
			`guessed_language = langdetect.detect(raw_text)`
Added language detection 2016-01-23 02:33:29 +00:00
			`self._render(" Language detected: {}".format(guessed_language), 2)`

			`if guessed_language not in ISO639:`
			`self._render("Language detection failed!", 0)`
			`if settings.FORGIVING_OCR:`
			`self._render(`
			`"As FORGIVING_OCR is enabled, we're going to make the best "`
			`"with what we have.",`
			`1`
			`)`
			`return raw_text`
			`raise OCRError`

			`if ISO639[guessed_language] == self.DEFAULT_OCR_LANGUAGE:`
Introducing language detection 2016-01-21 12:50:22 -05:00			`return raw_text`

Added language detection 2016-01-23 02:33:29 +00:00			`try:`
			`return self._ocr(pngs, ISO639[guessed_language])`
			`except pyocr.pyocr.tesseract.TesseractError:`
			`if settings.FORGIVING_OCR:`
			`self._render(`
			`"OCR for {} failed, but we're going to stick with what "`
			`"we've got since FORGIVING_OCR is enabled.".format(`
			`guessed_language`
			`),`
			`0`
			`)`
			`return raw_text`
			`raise OCRError`
Introducing language detection 2016-01-21 12:50:22 -05:00
			`def _ocr(self, pngs, lang):`

Added language detection 2016-01-23 02:33:29 +00:00			`self._render(" Parsing for {}".format(lang), 2)`

It works! 2015-12-20 19:23:33 +00:00			`r = ""`
			`for png in pngs:`
			`with Image.open(os.path.join(self.SCRATCH, png)) as f:`
Added GPG encryption for the PDFs 2016-01-01 16:13:59 +00:00			`self._render(" {}".format(f.filename), 3)`
Added language detection 2016-01-23 02:33:29 +00:00			`r += self.OCR.image_to_string(f, lang=lang)`
It works! 2015-12-20 19:23:33 +00:00
#11: automatic tagging support 2016-01-28 07:23:11 +00:00			`# Strip out excess white space to allow matching to go smoother`
			`return re.sub(r"\s+", " ", r)`
It works! 2015-12-20 19:23:33 +00:00
#12: Support image documents 2016-01-29 23:18:03 +00:00			`def _store(self, text, doc):`
It works! 2015-12-20 19:23:33 +00:00
#12: Support image documents 2016-01-29 23:18:03 +00:00			`sender, title, file_type = self._parse_file_name(doc)`
Restructured the consumer into a loop and added a check for scans in-progress 2015-12-21 02:44:24 +00:00
#12: Support image documents 2016-01-29 23:18:03 +00:00			`lower_text = text.lower()`
			`relevant_tags = [t for t in Tag.objects.all() if t.matches(lower_text)]`

			`stats = os.stat(doc)`
Changed the consumer into a loop 2015-12-26 13:21:33 +00:00
Added GPG encryption for the PDFs 2016-01-01 16:13:59 +00:00			`self._render(" Saving record to database", 2)`

#12: Support image documents 2016-01-29 23:18:03 +00:00			`document = Document.objects.create(`
Added GPG encryption for the PDFs 2016-01-01 16:13:59 +00:00			`sender=sender,`
			`title=title,`
			`content=text,`
#12: Support image documents 2016-01-29 23:18:03 +00:00			`file_type=file_type,`
Added GPG encryption for the PDFs 2016-01-01 16:13:59 +00:00			`created=timezone.make_aware(`
			`datetime.datetime.fromtimestamp(stats.st_mtime)),`
			`modified=timezone.make_aware(`
			`datetime.datetime.fromtimestamp(stats.st_mtime))`
Changed the consumer into a loop 2015-12-26 13:21:33 +00:00			`)`
It works! 2015-12-20 19:23:33 +00:00
#11: automatic tagging support 2016-01-28 07:23:11 +00:00			`if relevant_tags:`
			`tag_names = ", ".join([t.slug for t in relevant_tags])`
			`self._render(" Tagging with {}".format(tag_names), 2)`
#12: Support image documents 2016-01-29 23:18:03 +00:00			`document.tags.add(*relevant_tags)`
#11: automatic tagging support 2016-01-28 07:23:11 +00:00
#12: Support image documents 2016-01-29 23:18:03 +00:00			`with open(doc, "rb") as unencrypted:`
			`with open(document.source_path, "wb") as encrypted:`
Added GPG encryption for the PDFs 2016-01-01 16:13:59 +00:00			`self._render(" Encrypting", 3)`
Fixed a few consumer bugs and added an exporter Rename exporter to export and fixt some debugging Account for files not matching the sender/title pattern Added a safety note Wrong regex on the name parser Renamed the command to something slightly less ambiguous 2016-01-14 19:47:57 +00:00			`encrypted.write(GnuPG.encrypted(unencrypted))`
It works! 2015-12-20 19:23:33 +00:00
#12: Support image documents 2016-01-29 23:18:03 +00:00			`def _parse_file_name(self, doc):`
Restructured the consumer into a loop and added a check for scans in-progress 2015-12-21 02:44:24 +00:00			`"""`
			`We use a crude naming convention to make handling the sender and title`
			`easier:`
#12: Support image documents 2016-01-29 23:18:03 +00:00			`"<sender> - <title>.<suffix>"`
Restructured the consumer into a loop and added a check for scans in-progress 2015-12-21 02:44:24 +00:00			`"""`

#12: Support image documents 2016-01-29 23:18:03 +00:00			`# First we attempt "<sender> - <title>.<suffix>"`
			`m = re.match(self.PARSER_REGEX_SENDER_TITLE, doc)`
Restructured the consumer into a loop and added a check for scans in-progress 2015-12-21 02:44:24 +00:00			`if m:`
#12: Support image documents 2016-01-29 23:18:03 +00:00			`sender_name, title, file_type = m.group(1), m.group(2), m.group(3)`
Actually handle the change to using a Sender model 2016-01-15 02:02:47 +00:00			`sender, __ = Sender.objects.get_or_create(`
			`name=sender_name, defaults={"slug": slugify(sender_name)})`
#12: Support image documents 2016-01-29 23:18:03 +00:00			`return sender, title, file_type`
Restructured the consumer into a loop and added a check for scans in-progress 2015-12-21 02:44:24 +00:00
Fixed a few consumer bugs and added an exporter Rename exporter to export and fixt some debugging Account for files not matching the sender/title pattern Added a safety note Wrong regex on the name parser Renamed the command to something slightly less ambiguous 2016-01-14 19:47:57 +00:00			`# That didn't work, so we assume sender is None`
#12: Support image documents 2016-01-29 23:18:03 +00:00			`m = re.match(self.PARSER_REGEX_TITLE, doc)`
			`return None, m.group(1), m.group(2)`
Restructured the consumer into a loop and added a check for scans in-progress 2015-12-21 02:44:24 +00:00
#12: Support image documents 2016-01-29 23:18:03 +00:00			`def _cleanup(self, pngs, doc):`
It works! 2015-12-20 19:23:33 +00:00
			`png_glob = os.path.join(`
			`self.SCRATCH, re.sub(r"^./(\d+)-\d+.png$", "\\1", pngs[0]))`

#12: Support image documents 2016-01-29 23:18:03 +00:00			`for f in list(glob.glob(png_glob)) + [doc]:`
Added GPG encryption for the PDFs 2016-01-01 16:13:59 +00:00			`self._render(" Deleting {}".format(f), 2)`
It works! 2015-12-20 19:23:33 +00:00			`os.unlink(f)`
Added GPG encryption for the PDFs 2016-01-01 16:13:59 +00:00
Fixed a few consumer bugs and added an exporter Rename exporter to export and fixt some debugging Account for files not matching the sender/title pattern Added a safety note Wrong regex on the name parser Renamed the command to something slightly less ambiguous 2016-01-14 19:47:57 +00:00			`self._render("", 2)`

Added GPG encryption for the PDFs 2016-01-01 16:13:59 +00:00			`def _render(self, text, verbosity):`
			`if self.verbosity >= verbosity:`
			`print(text)`