blob: 62269f0d66bd1c696ea8b8235d795f5d5776ea23 [file] [log] [blame]
# text.py
#
# Copyright (C) 2011 Carlos Garcia Campos <carlosgc@gnome.org>
#
# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation; either version 2 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program; if not, write to the Free Software
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
from __future__ import absolute_import, division, print_function
from backends import Backend, register_backend
import subprocess
import os
class Text(Backend):
def __init__(self, name):
Backend.__init__(self, name, '.diff')
self._pdftotext = os.path.join(self._utilsdir, 'pdftotext');
def create_refs(self, doc_path, refs_path, password = None):
out_path = os.path.join(refs_path, 'text')
cmd = [self._pdftotext, doc_path, out_path + '.txt']
if password is not None:
cmd.extend(['-opw', password, '-upw', password])
p = subprocess.Popen(cmd, stderr = subprocess.PIPE)
return self._check_exit_status(p, out_path)
def _create_diff(self, ref_path, result_path):
import difflib
ref = open(ref_path, 'r')
result = open(result_path, 'r')
diff = difflib.unified_diff(ref.readlines(), result.readlines(), ref_path, result_path)
ref.close()
result.close()
diff_file = open(result_path + '.diff', 'w')
diff_file.writelines(diff)
diff_file.close()
register_backend('text', Text)