You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

139 lines
6.0 KiB

7 years ago
  1. ###################################################################################
  2. #
  3. # Copyright (C) 2018 MuK IT GmbH
  4. #
  5. # This program is free software: you can redistribute it and/or modify
  6. # it under the terms of the GNU Affero General Public License as
  7. # published by the Free Software Foundation, either version 3 of the
  8. # License, or (at your option) any later version.
  9. #
  10. # This program is distributed in the hope that it will be useful,
  11. # but WITHOUT ANY WARRANTY; without even the implied warranty of
  12. # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  13. # GNU Affero General Public License for more details.
  14. #
  15. # You should have received a copy of the GNU Affero General Public License
  16. # along with this program. If not, see <http://www.gnu.org/licenses/>.
  17. #
  18. ###################################################################################
  19. import os
  20. import io
  21. import base64
  22. import shutil
  23. import urllib
  24. import logging
  25. import tempfile
  26. import mimetypes
  27. from subprocess import Popen
  28. from subprocess import PIPE
  29. from subprocess import CalledProcessError
  30. from contextlib import closing
  31. from odoo.tools import config
  32. from odoo.tools.mimetypes import guess_mimetype
  33. _logger = logging.getLogger(__name__)
  34. FORMATS = [
  35. "bib", "doc", "doc6", "doc95", "docbook", "docx", "docx7", "fodt", "html", "latex", "mediawiki",
  36. "odt", "ooxml", "ott", "pdb", "pdf", "psw", "rtf", "sdw", "sdw4", "sdw3", "stw", "sxw", "text",
  37. "txt", "uot", "vor", "vor4", "vor3", "wps", "xhtml", "bmp", "emf", "eps", "fodg", "gif", "html",
  38. "jpg", "met", "odd", "otg", "pbm", "pct", "pdf", "pgm", "png", "ppm", "ras", "std", "svg", "svm",
  39. "swf", "sxd", "sxd3", "sxd5", "sxw", "tiff", "vor", "vor3", "wmf", "xhtml", "xpm", "bmp", "emf",
  40. "eps", "fodp", "gif", "html", "jpg", "met", "odg", "odp", "otp", "pbm", "pct", "pdf", "pgm", "png",
  41. "potm", "pot", "ppm", "pptx", "pps", "ppt", "pwp", "ras", "sda", "sdd", "sdd3", "sdd4", "sxd",
  42. "sti", "svg", "svm", "swf", "sxi", "tiff", "uop", "vor", "vor3", "vor4", "vor5", "wmf", "xhtml",
  43. "xpm", "csv", "dbf", "dif", "fods", "html", "ods", "ooxml", "ots", "pdf", "pxl", "sdc", "sdc4",
  44. "sdc3", "slk", "stc", "sxc", "uos", "vor3", "vor4", "vor", "xhtml", "xls", "xls5", "xls95", "xlt",
  45. "xlt5", "xlt95", "xlsx",
  46. ]
  47. def formats():
  48. return FORMATS
  49. def unoconv_environ():
  50. env = os.environ.copy()
  51. uno_path = config.get('uno_path', False)
  52. if uno_path:
  53. env['UNO_PATH'] = config['uno_path']
  54. return env
  55. def convert(input_path, output_path, doctype="document", format="pdf"):
  56. """
  57. Convert a file to the given format.
  58. :param input_path: The path of the file to convert.
  59. :param output_path: The path of the output where the converted file is to be saved.
  60. :param doctype: Specify the document type (document, graphics, presentation, spreadsheet).
  61. :param format: Specify the output format for the document.
  62. :raises CalledProcessError: The command returned non-zero exit status 1.
  63. :raises OSError: This exception is raised when a system function returns a system-related error.
  64. """
  65. try:
  66. env = unoconv_environ()
  67. shell = True if os.name in ('nt', 'os2') else False
  68. args = ['unoconv', '--format=%s' % format, '--output=%s' % output_path, input_path]
  69. process = Popen(args, stdout=PIPE, env=env, shell=shell)
  70. outs, errs = process.communicate()
  71. return_code = process.wait()
  72. if return_code:
  73. raise CalledProcessError(return_code, args, outs, errs)
  74. except CalledProcessError:
  75. _logger.exception("Error while running unoconv.")
  76. raise
  77. except OSError:
  78. _logger.exception("Error while running unoconv.")
  79. raise
  80. def convert_binary(binary, mimetype=None, filename=None, export="binary", doctype="document", format="pdf"):
  81. """
  82. Converts a binary value to the given format.
  83. :param binary: The binary value.
  84. :param mimetype: The mimetype of the binary value.
  85. :param filename: The filename of the binary value.
  86. :param export: The output format (binary, file, base64).
  87. :param doctype: Specify the document type (document, graphics, presentation, spreadsheet).
  88. :param format: Specify the output format for the document.
  89. :return: Returns the output depending on the given format.
  90. :raises ValueError: The file extension could not be determined or the format is invalid.
  91. """
  92. def get_extension(filename, mimetype):
  93. if not filename and mimetype:
  94. return mimetypes.guess_extension(mimetype)
  95. elif filename:
  96. return os.path.splitext(filename)[1]
  97. return None
  98. if not mimetype and not filename:
  99. mimetype = guess_mimetype(binary, default=False)
  100. if not mimetype and filename:
  101. mimetype = mimetypes.guess_type(urllib.request.pathname2url(filename))[0]
  102. extension = get_extension(filename, mimetype)
  103. if not extension:
  104. raise ValueError("The file extension could not be determined.")
  105. if format not in FORMATS:
  106. raise ValueError("Invalid export format.")
  107. tmp_dir = tempfile.mkdtemp()
  108. try:
  109. tmp_wpath = os.path.join(tmp_dir, "tmpfile" + extension)
  110. tmp_ppath = os.path.join(tmp_dir, "tmpfile." + format)
  111. if os.name == 'nt':
  112. tmp_wpath = tmp_wpath.replace("\\", "/")
  113. tmp_ppath = tmp_ppath.replace("\\", "/")
  114. with closing(open(tmp_wpath, 'wb')) as file:
  115. file.write(binary)
  116. convert(tmp_wpath, tmp_ppath, doctype, format)
  117. with closing(open(tmp_ppath, 'rb')) as file:
  118. if export == 'file':
  119. output = io.BytesIO()
  120. output.write(file.read())
  121. output.close()
  122. return output
  123. elif export == 'base64':
  124. return base64.b64encode(file.read())
  125. else:
  126. return file.read()
  127. finally:
  128. shutil.rmtree(tmp_dir)