19.0 vanilla

2026-04-23 00:11:59 +02:00 · 2025-10-03 18:07:25 +02:00 · 2025-10-03 18:07:25 +02:00 · 991d2234ca
commit 991d2234ca
parent 0a7ae8db93
416 changed files with 646602 additions and 300844 deletions
--- a/odoo-bringout-oca-ocb-base/odoo/tools/pdf/signature.py
+++ b/odoo-bringout-oca-ocb-base/odoo/tools/pdf/signature.py
@ -0,0 +1,467 @@
+import base64
+import datetime
+import hashlib
+import io
+from typing import Optional
+from asn1crypto import cms, algos, core, x509
+import logging
+
+try:
+    from cryptography.hazmat.primitives import hashes
+    from cryptography.hazmat.primitives.asymmetric.types import PrivateKeyTypes
+    from cryptography.hazmat.primitives.serialization import Encoding, load_pem_private_key
+    from cryptography.hazmat.primitives.asymmetric import padding
+    from cryptography.x509 import Certificate, load_pem_x509_certificate
+except ImportError:
+    # cryptography 41.0.7 and above is supported
+    hashes = None
+    PrivateKeyTypes = None
+    Encoding = None
+    load_pem_private_key = None
+    padding = None
+    Certificate = None
+    load_pem_x509_certificate = None
+
+from odoo import _
+from odoo.addons.base.models.res_company import ResCompany
+from odoo.addons.base.models.res_users import ResUsers
+from odoo.tools.pdf import PdfReader, PdfWriter, ArrayObject, ByteStringObject, DictionaryObject, NameObject, NumberObject, create_string_object, DecodedStreamObject as StreamObject
+
+_logger = logging.getLogger(__name__)
+
+class PdfSigner:
+    """Class that defines methods uses in the signing process of pdf documents
+
+    The PdfSigner will perform the following operations on a PDF document:
+        - Modifiying the document by adding a signature field via a form,
+        - Performing a cryptographic signature of the document.
+
+    This implementation follows the Adobe PDF Reference (v1.7) (https://ia601001.us.archive.org/1/items/pdf1.7/pdf_reference_1-7.pdf)
+    for the structure of the PDF document,
+    and Digital Signatures in a PDF (https://www.adobe.com/devnet-docs/acrobatetk/tools/DigSig/Acrobat_DigitalSignatures_in_PDF.pdf),
+    for the structure of the signature in a PDF.
+    """
+
+    def __init__(self, stream: io.BytesIO, company: Optional[ResCompany] = None, signing_time=None) -> None:
+        self.signing_time = signing_time
+        self.company = company
+        if not 'clone_document_from_reader' in dir(PdfWriter):
+            _logger.info("PDF signature is supported by Python 3.12 and above")
+            return
+        reader = PdfReader(stream)
+        self.writer = PdfWriter()
+        self.writer.clone_document_from_reader(reader)
+
+
+
+    def sign_pdf(self, visible_signature: bool = False, field_name: str = "Odoo Signature", signer: Optional[ResUsers] = None) -> Optional[io.BytesIO]:
+        """Signs the pdf document using a PdfWriter object
+
+        Returns:
+            Optional[io.BytesIO]: the resulting output stream after the signature has been performed, or None in case of error
+        """
+        if not self.company or not load_pem_x509_certificate:
+            return
+
+        dummy, sig_field_value = self._setup_form(visible_signature, field_name,  signer)
+
+        if not self._perform_signature(sig_field_value):
+            return
+
+        out_stream = io.BytesIO()
+        self.writer.write_stream(out_stream)
+        return out_stream
+
+    def _load_key_and_certificate(self) -> tuple[Optional[PrivateKeyTypes], Optional[Certificate]]:
+        """Loads the private key
+
+        Returns:
+            Optional[PrivateKeyTypes]: a private key object, or None if the key couldn't be loaded.
+        """
+        if "signing_certificate_id" not in self.company._fields \
+            or not self.company.signing_certificate_id.pem_certificate:
+            return None, None
+
+        certificate = self.company.signing_certificate_id
+        cert_bytes = base64.decodebytes(certificate.pem_certificate)
+        private_key_bytes = base64.decodebytes(certificate.private_key_id.content)
+        return load_pem_private_key(private_key_bytes, None), load_pem_x509_certificate(cert_bytes)
+
+    def _setup_form(self, visible_signature: bool, field_name: str, signer: Optional[ResUsers] = None) -> tuple[DictionaryObject, DictionaryObject] | None:
+        """Creates the /AcroForm and populates it with the appropriate field for the signature
+
+        Args:
+            visible_signature (bool): boolean value that determines if the signature should be visible on the document
+            field_name (str): the name of the signature field
+            signer (Optional[ResUsers]): user that will be used in the visuals of the signature field
+
+        Returns:
+            tuple[DictionaryObject, DictionaryObject]: a tuple containing the signature field and the signature content
+        """
+        if "/AcroForm" not in self.writer._root_object:
+            form = DictionaryObject()
+            form.update({
+                NameObject("/SigFlags"): NumberObject(3)
+            })
+            form_ref = self.writer._add_object(form)
+
+            self.writer._root_object.update({
+                NameObject("/AcroForm"): form_ref
+            })
+        else:
+            form = self.writer._root_object["/AcroForm"].get_object()
+
+
+            # SigFlags(3) = SignatureExists = true && AppendOnly = true.
+            # The document contains signed signature and must be modified in incremental mode (see https://github.com/pdf-association/pdf-issues/issues/457)
+            form.update({
+                NameObject("/SigFlags"): NumberObject(3)
+            })
+
+        # Assigning the newly created field to a page
+        page = self.writer.pages[0]
+
+        # Setting up the signature field properties
+        signature_field = DictionaryObject()
+
+        # Metadata of the signature field
+        # /FT = Field Type, here set to /Sig the signature type
+        # /T = name of the field
+        # /Type = type of object, in this case annotation (/Annot)
+        # /Subtype = type of annotation
+        # /F = annotation flags, represented as a 32 bit unsigned integer. 132 corresponds to the Print and Locked flags
+        #   Print : corresponds to printing the signature when the page is printed
+        #   Locked : preventing the annotation properties to be modfied or the annotation to be deletd by the user
+        #   (see section 8.4.2 of the Adobe PDF Reference (v1.7) https://ia601001.us.archive.org/1/items/pdf1.7/pdf_reference_1-7.pdf),
+        # /P = page reference, reference to the page where the signature field is located
+        signature_field.update({
+            NameObject("/FT"): NameObject("/Sig"),
+            NameObject("/T"): create_string_object(field_name),
+            NameObject("/Type"): NameObject("/Annot"),
+            NameObject("/Subtype"): NameObject("/Widget"),
+            NameObject("/F"): NumberObject(132),
+            NameObject("/P"): page.indirect_reference,
+        })
+
+
+        # Creating the appearance (visible elements of the signature)
+        if visible_signature:
+            origin = page.mediabox.upper_right # retrieves the top-right coordinates of the page
+            rect_size = (200, 20) # dimensions of the box (width, height)
+            padding = 5
+
+            # Box that will contain the signature, defined as [x1, y1, x2, y2]
+            # where (x1, y1) is the bottom left coordinates of the box,
+            # and (x2, y2) the top-right coordinates.
+            rect = [
+                origin[0] - rect_size[0] - padding,
+                origin[1] - rect_size[1] - padding,
+                origin[0] - padding,
+                origin[1] - padding
+            ]
+
+            # Here is defined the StreamObject that contains the information about the visible
+            # parts of the signature
+            #
+            # Dictionary contents:
+            # /BBox = coordinates of the 'visible' box, relative to the /Rect definition of the signature field
+            # /Resources = resources needed to properly render the signature,
+            #   /Font = dictionary containing the information about the font used by the signature
+            #       /F1 = font resource, used to define a font that will be usable in the signature
+            stream = StreamObject()
+            stream.update({
+                NameObject("/BBox"): self._create_number_array_object([0, 0, rect_size[0], rect_size[1]]),
+                NameObject("/Resources"): DictionaryObject({
+                    NameObject("/Font"): DictionaryObject({
+                        NameObject("/F1"): DictionaryObject({
+                            NameObject("/Type"): NameObject("/Font"),
+                            NameObject("/Subtype"): NameObject("/Type1"),
+                            NameObject("/BaseFont"): NameObject("/Helvetica")
+                        })
+                    })
+                }),
+                NameObject("/Type"): NameObject("/XObject"),
+                NameObject("/Subtype"): NameObject("/Form")
+            })
+
+            #
+            content = "Digitally signed"
+            content = create_string_object(f'{content} by {signer.name} <{signer.email}>') if signer is not None else create_string_object(content)
+
+            # Setting the parameters used to display the text object of the signature
+            # More details on this subject can be found in the sections 4.3 and 5.3
+            # of the Adobe PDF Reference (v1.7) https://ia601001.us.archive.org/1/items/pdf1.7/pdf_reference_1-7.pdf
+            #
+            # Parameters:
+            # q = saves the the current graphics state on the graphics state stack
+            # 0.5 0 0 0.5 0 0 cm = modification of the current transformation matrix. Here used to scale down the text size by 0.5 in x and y
+            # BT = begin text object
+            # /F1 = reference to the font resource named F1
+            # 12 Tf = set the font size to 12
+            # 0 TL = defines text leading, the space between lines, here set to 0
+            # 0 10 Td = moves the text to the start of the next line, expressed in text space units. Here (x, y) = (0, 10)
+            # (text_content) Tj = renders a text string
+            # ET = end text object
+            # Q = Restore the graphics state by removing the most recently saved state from the stack and making it the current state
+            stream._data = f"q 0.5 0 0 0.5 0 0 cm BT /F1 12 Tf 0 TL 0 10 Td ({content}) Tj ET Q".encode()
+            signature_appearence = DictionaryObject()
+            signature_appearence.update({
+                NameObject("/N"): stream
+            })
+            signature_field.update({
+                NameObject("/AP"): signature_appearence,
+            })
+        else:
+            rect = [0,0,0,0]
+
+        signature_field.update({
+            NameObject("/Rect"): self._create_number_array_object(rect)
+        })
+
+        # Setting up the actual signature contents with placeholders for /Contents and /ByteRange
+        #
+        # Dictionary contents:
+        # /Contents = content of the signature field. The content is a byte string of an object that follows
+        # the Cryptographic Message Syntax (CMS). The object is converted in hexadecimal and stored as bytes.
+        # The /Contents are pre-filled with placeholder values of an arbitrary size (i.e. 8KB) to ensure that
+        # the signature will fit in the "<>" bounds of the field
+        # /ByteRange = an array represented as [offset, length, offset, length, ...] which defines the bytes that
+        # are used when computing the digest of the document. Similarly to the /Contents, the /ByteRange is set to
+        # a placeholder as we aren't yet able to compute the range at this point.
+        # /Type = the type of form field. Here /Sig, the signature field
+        # /Filter
+        # /SubFilter
+        # /M = the timestamp of the signature. Indicates when the document was signed.
+        signature_field_value = DictionaryObject()
+        signature_field_value.update({
+            NameObject("/Contents"): ByteStringObject(b"\0" * 8192),
+            NameObject("/ByteRange"): self._create_number_array_object([0, 0, 0, 0]),
+            NameObject("/Type"): NameObject("/Sig"),
+            NameObject("/Filter"): NameObject("/Adobe.PPKLite"),
+            NameObject("/SubFilter"): NameObject("/adbe.pkcs7.detached"),
+            NameObject("/M"): create_string_object(datetime.datetime.now(datetime.timezone.utc).strftime("D:%Y%m%d%H%M%S")),
+        })
+
+        # Here we add the reference to be written in a specific order. This is needed
+        # by Adobe Acrobat to consider the signature valid.
+        signature_field_ref = self.writer._add_object(signature_field)
+        signature_field_value_ref = self.writer._add_object(signature_field_value)
+
+        # /V = the actual value of the signature field. Used to store the dictionary of the field
+        signature_field.update({
+            NameObject("/V"): signature_field_value_ref
+        })
+
+        # Definition of the fields array linked to the form (/AcroForm)
+        if "/Fields" not in self.writer._root_object:
+            fields = ArrayObject()
+        else:
+            fields = self.writer._root_object["/Fields"].get_object()
+        fields.append(signature_field_ref)
+        form.update({
+            NameObject("/Fields"): fields
+        })
+
+        # The signature field reference is added to the annotations array
+        if "/Annots" not in page:
+            page[NameObject("/Annots")] = ArrayObject()
+        page[NameObject("/Annots")].append(signature_field_ref)
+
+        return signature_field, signature_field_value
+
+    def _get_cms_object(self, digest: bytes) -> Optional[cms.ContentInfo]:
+        """Creates an object that follows the Cryptographic Message Syntax(CMS)
+
+        RFC: https://datatracker.ietf.org/doc/html/rfc5652
+
+        Args:
+            digest (bytes): the digest of the document in bytes
+
+        Returns:
+            cms.ContentInfo: a CMS object containing the information of the signature
+        """
+        private_key, certificate = self._load_key_and_certificate()
+        if private_key == None or certificate == None:
+            return None
+        cert = x509.Certificate.load(
+            certificate.public_bytes(encoding=Encoding.DER))
+        encap_content_info = {
+            'content_type': 'data',
+            'content': None
+        }
+
+        attrs = cms.CMSAttributes([
+            cms.CMSAttribute({
+                'type': 'content_type',
+                'values': ['data']
+            }),
+            cms.CMSAttribute({
+                'type': 'signing_time',
+                'values': [cms.Time({'utc_time': core.UTCTime(self.signing_time or datetime.datetime.now(datetime.timezone.utc))})]
+            }),
+            cms.CMSAttribute({
+                'type': 'cms_algorithm_protection',
+                'values': [
+                        cms.CMSAlgorithmProtection(
+                            {
+                                'mac_algorithm': None,
+                                'digest_algorithm': cms.DigestAlgorithm(
+                                    {'algorithm': 'sha256', 'parameters': None}
+                                ),
+                                'signature_algorithm': cms.SignedDigestAlgorithm({
+                                    'algorithm': 'sha256_rsa',
+                                    'parameters': None
+                                })
+                            }
+                        )
+                ]
+            }),
+            cms.CMSAttribute({
+                'type': 'message_digest',
+                'values': [digest],
+            }),
+        ])
+
+        signed_attrs = private_key.sign(
+            attrs.dump(),
+            padding.PKCS1v15(),
+            hashes.SHA256()
+        )
+
+        signer_info = cms.SignerInfo({
+            'version': "v1",
+            'digest_algorithm': algos.DigestAlgorithm({'algorithm': 'sha256'}),
+            'signature_algorithm': algos.SignedDigestAlgorithm({'algorithm': 'sha256_rsa'}),
+            'signature': signed_attrs,
+            'sid': cms.SignerIdentifier({
+                'issuer_and_serial_number': cms.IssuerAndSerialNumber({
+                    'issuer': cert.issuer,
+                    'serial_number': cert.serial_number
+                })
+            }),
+            'signed_attrs': attrs})
+
+        signed_data = {
+            'version': 'v1',
+            'digest_algorithms': [algos.DigestAlgorithm({'algorithm': 'sha256'})],
+            'encap_content_info': encap_content_info,
+            'certificates': [cert],
+            'signer_infos': [signer_info]
+        }
+
+        return cms.ContentInfo({
+            'content_type': 'signed_data',
+            'content': cms.SignedData(signed_data)
+        })
+
+    def _perform_signature(self, sig_field_value: DictionaryObject) -> bool:
+        """Creates the actual signature content and populate /ByteRange and /Contents properties with meaningful content.
+
+        Args:
+            sig_field_value (DictionaryObject): the value (/V) of the signature field which needs to be modified
+        """
+        pdf_data = self._get_document_data()
+
+        # Computation of the location of the last inserted contents for the signature field
+        signature_field_pos = pdf_data.rfind(b"/FT /Sig")
+        contents_field_pos = pdf_data.find(b"Contents", signature_field_pos)
+
+        # Computing the start and end position of the /Contents <signature> field
+        # to exclude the content of <> (aka the actual signature) from the byte range
+        placeholder_start = contents_field_pos + 9
+        placeholder_end = placeholder_start + len(b"\0" * 8192) * 2 + 2
+
+        # Replacing the placeholder byte range with the actual range
+        # that will be used to compute the document digest
+        placeholder_byte_range = sig_field_value.get("/ByteRange")
+
+        # Here the byte range represents an array [index, length, index, length, ...]
+        # where 'index' represents the index of a byte, and length the number of bytes to take
+        # This array indicates the bytes that are used when computing the digest of the document
+        byte_range = [0, placeholder_start,
+                      placeholder_end, abs(len(pdf_data) - placeholder_end)]
+
+        byte_range = self._correct_byte_range(
+            placeholder_byte_range, byte_range, len(pdf_data))
+
+        sig_field_value.update({
+            NameObject("/ByteRange"): self._create_number_array_object(byte_range)
+        })
+
+        pdf_data = self._get_document_data()
+
+        digest = self._compute_digest_from_byte_range(pdf_data, byte_range)
+
+        cms_content_info = self._get_cms_object(digest)
+
+        if cms_content_info == None:
+            return False
+
+        signature_hex = cms_content_info.dump().hex()
+        signature_hex = signature_hex.ljust(8192 * 2, "0")
+
+        sig_field_value.update({
+            NameObject("/Contents"): ByteStringObject(bytes.fromhex(signature_hex))
+        })
+        return True
+
+    def _get_document_data(self):
+        """Retrieves the bytes of the document from the writer"""
+        output_stream = io.BytesIO()
+        self.writer.write_stream(output_stream)
+        return output_stream.getvalue()
+
+
+    def _correct_byte_range(self, old_range: list[int], new_range: list[int], base_pdf_len: int) -> list[int]:
+        """Corrects the last value of the new byte range
+
+        This function corrects the initial byte range (old_range) which was computed for document containing
+        the placeholder values for the /ByteRange and /Contents fields. This is needed because when updating
+        /ByteRange, the length of the document will change as the byte range will take more bytes of the
+        document, resulting in an invalid byte range.
+
+        Args:
+            old_range (list[int]): the previous byte range
+            new_range (list[int]): the new byte range
+            base_pdf_len (int): the base length of the pdf, before insertion of the actual byte range
+
+        Returns:
+            list[int]: the corrected byte range
+        """
+        # Computing the difference of length of the strings of the old and new byte ranges.
+        # Used to determine if a re-computation of the range is needed or not
+        current_len = len(str(old_range))
+        corrected_len = len(str(new_range))
+        diff = corrected_len - current_len
+
+        if diff == 0:
+            return new_range
+
+        corrected_range = new_range.copy()
+        corrected_range[-1] = abs((base_pdf_len + diff) - new_range[-2])
+        return self._correct_byte_range(new_range, corrected_range, base_pdf_len)
+
+
+    def _compute_digest_from_byte_range(self, data: bytes, byte_range: list[int]) -> bytes:
+        """Computes the digest of the data from a byte range. Uses SHA256 algorithm to compute the hash.
+
+        The byte range is defined as an array [offset, length, offset, length, ...] which corresponds to the bytes from the document
+        that will be used in the computation of the hash.
+
+        i.e. for document = b'example' and byte_range = [0, 1, 6, 1],
+        the hash will be computed from b'ee'
+
+        Args:
+            document (bytes): the data in bytes
+            byte_range (list[int]): the byte range used to compute the digest.
+
+        Returns:
+            bytes: the computed digest
+        """
+        hashed = hashlib.sha256()
+        for i in range(0, len(byte_range), 2):
+            hashed.update(data[byte_range[i]:byte_range[i] + byte_range[i+1]])
+        return hashed.digest()
+
+    def _create_number_array_object(self, array: list[int]) -> ArrayObject:
+        return ArrayObject([NumberObject(item) for item in array])