mirror of https://github.com/muk-it/muk_base
You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
140 lines
6.0 KiB
140 lines
6.0 KiB
###################################################################################
|
|
#
|
|
# Copyright (C) 2018 MuK IT GmbH
|
|
#
|
|
# This program is free software: you can redistribute it and/or modify
|
|
# it under the terms of the GNU Affero General Public License as
|
|
# published by the Free Software Foundation, either version 3 of the
|
|
# License, or (at your option) any later version.
|
|
#
|
|
# This program is distributed in the hope that it will be useful,
|
|
# but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
# GNU Affero General Public License for more details.
|
|
#
|
|
# You should have received a copy of the GNU Affero General Public License
|
|
# along with this program. If not, see <http://www.gnu.org/licenses/>.
|
|
#
|
|
###################################################################################
|
|
|
|
import os
|
|
import io
|
|
import base64
|
|
import shutil
|
|
import urllib
|
|
import logging
|
|
import tempfile
|
|
import mimetypes
|
|
|
|
from subprocess import Popen
|
|
from subprocess import PIPE
|
|
from subprocess import CalledProcessError
|
|
|
|
from contextlib import closing
|
|
|
|
from odoo.tools import config
|
|
from odoo.tools.mimetypes import guess_mimetype
|
|
|
|
_logger = logging.getLogger(__name__)
|
|
|
|
FORMATS = [
|
|
"bib", "doc", "doc6", "doc95", "docbook", "docx", "docx7", "fodt", "html", "latex", "mediawiki",
|
|
"odt", "ooxml", "ott", "pdb", "pdf", "psw", "rtf", "sdw", "sdw4", "sdw3", "stw", "sxw", "text",
|
|
"txt", "uot", "vor", "vor4", "vor3", "wps", "xhtml", "bmp", "emf", "eps", "fodg", "gif", "html",
|
|
"jpg", "met", "odd", "otg", "pbm", "pct", "pdf", "pgm", "png", "ppm", "ras", "std", "svg", "svm",
|
|
"swf", "sxd", "sxd3", "sxd5", "sxw", "tiff", "vor", "vor3", "wmf", "xhtml", "xpm", "bmp", "emf",
|
|
"eps", "fodp", "gif", "html", "jpg", "met", "odg", "odp", "otp", "pbm", "pct", "pdf", "pgm", "png",
|
|
"potm", "pot", "ppm", "pptx", "pps", "ppt", "pwp", "ras", "sda", "sdd", "sdd3", "sdd4", "sxd",
|
|
"sti", "svg", "svm", "swf", "sxi", "tiff", "uop", "vor", "vor3", "vor4", "vor5", "wmf", "xhtml",
|
|
"xpm", "csv", "dbf", "dif", "fods", "html", "ods", "ooxml", "ots", "pdf", "pxl", "sdc", "sdc4",
|
|
"sdc3", "slk", "stc", "sxc", "uos", "vor3", "vor4", "vor", "xhtml", "xls", "xls5", "xls95", "xlt",
|
|
"xlt5", "xlt95", "xlsx",
|
|
]
|
|
|
|
def formats():
|
|
return FORMATS
|
|
|
|
def unoconv_environ():
|
|
env = os.environ.copy()
|
|
uno_path = config.get('uno_path', False)
|
|
if uno_path:
|
|
env['UNO_PATH'] = config['uno_path']
|
|
return env
|
|
|
|
def convert(input_path, output_path, doctype="document", format="pdf"):
|
|
"""
|
|
Convert a file to the given format.
|
|
|
|
:param input_path: The path of the file to convert.
|
|
:param output_path: The path of the output where the converted file is to be saved.
|
|
:param doctype: Specify the document type (document, graphics, presentation, spreadsheet).
|
|
:param format: Specify the output format for the document.
|
|
:raises CalledProcessError: The command returned non-zero exit status 1.
|
|
:raises OSError: This exception is raised when a system function returns a system-related error.
|
|
"""
|
|
try:
|
|
env = unoconv_environ()
|
|
shell = True if os.name in ('nt', 'os2') else False
|
|
args = ['unoconv', '--format=%s' % format, '--output=%s' % output_path, input_path]
|
|
process = Popen(args, stdout=PIPE, env=env, shell=shell)
|
|
outs, errs = process.communicate()
|
|
return_code = process.wait()
|
|
if return_code:
|
|
raise CalledProcessError(return_code, args, outs, errs)
|
|
except CalledProcessError:
|
|
_logger.exception("Error while running unoconv.")
|
|
raise
|
|
except OSError:
|
|
_logger.exception("Error while running unoconv.")
|
|
raise
|
|
|
|
def convert_binary(binary, mimetype=None, filename=None, export="binary", doctype="document", format="pdf"):
|
|
"""
|
|
Converts a binary value to the given format.
|
|
|
|
:param binary: The binary value.
|
|
:param mimetype: The mimetype of the binary value.
|
|
:param filename: The filename of the binary value.
|
|
:param export: The output format (binary, file, base64).
|
|
:param doctype: Specify the document type (document, graphics, presentation, spreadsheet).
|
|
:param format: Specify the output format for the document.
|
|
:return: Returns the output depending on the given format.
|
|
:raises ValueError: The file extension could not be determined or the format is invalid.
|
|
"""
|
|
def get_extension(filename, mimetype):
|
|
if not filename and mimetype:
|
|
return mimetypes.guess_extension(mimetype)
|
|
elif filename:
|
|
return os.path.splitext(filename)[1]
|
|
return None
|
|
if not mimetype and not filename:
|
|
mimetype = guess_mimetype(binary, default=False)
|
|
if not mimetype and filename:
|
|
mimetype = mimetypes.guess_type(urllib.request.pathname2url(filename))[0]
|
|
extension = get_extension(filename, mimetype)
|
|
if not extension:
|
|
raise ValueError("The file extension could not be determined.")
|
|
if format not in FORMATS:
|
|
raise ValueError("Invalid export format.")
|
|
tmp_dir = tempfile.mkdtemp()
|
|
try:
|
|
tmp_wpath = os.path.join(tmp_dir, "tmpfile" + extension)
|
|
tmp_ppath = os.path.join(tmp_dir, "tmpfile." + format)
|
|
if os.name == 'nt':
|
|
tmp_wpath = tmp_wpath.replace("\\", "/")
|
|
tmp_ppath = tmp_ppath.replace("\\", "/")
|
|
with closing(open(tmp_wpath, 'wb')) as file:
|
|
file.write(binary)
|
|
convert(tmp_wpath, tmp_ppath, doctype, format)
|
|
with closing(open(tmp_ppath, 'rb')) as file:
|
|
if export == 'file':
|
|
output = io.BytesIO()
|
|
output.write(file.read())
|
|
output.close()
|
|
return output
|
|
elif export == 'base64':
|
|
return base64.b64encode(file.read())
|
|
else:
|
|
return file.read()
|
|
finally:
|
|
shutil.rmtree(tmp_dir)
|