"""Custom element classes related to document comments.""" from __future__ import annotations import datetime as dt from typing import TYPE_CHECKING, Callable, cast from docx.oxml.ns import nsdecls from docx.oxml.parser import parse_xml from docx.oxml.simpletypes import ST_DateTime, ST_DecimalNumber, ST_String from docx.oxml.xmlchemy import BaseOxmlElement, OptionalAttribute, RequiredAttribute, ZeroOrMore if TYPE_CHECKING: from docx.oxml.table import CT_Tbl from docx.oxml.text.paragraph import CT_P class CT_Comments(BaseOxmlElement): """`w:comments` element, the root element for the comments part. Simply contains a collection of `w:comment` elements, each representing a single comment. Each contained comment is identified by a unique `w:id` attribute, used to reference the comment from the document text. The offset of the comment in this collection is arbitrary; it is essentially a _set_ implemented as a list. """ # -- type-declarations to fill in the gaps for metaclass-added methods -- comment_lst: list[CT_Comment] comment = ZeroOrMore("w:comment") def add_comment(self) -> CT_Comment: """Return newly added `w:comment` child of this `w:comments`. The returned `w:comment` element is the minimum valid value, having a `w:id` value unique within the existing comments and the required `w:author` attribute present but set to the empty string. It's content is limited to a single run containing the necessary annotation reference but no text. Content is added by adding runs to this first paragraph and by adding additional paragraphs as needed. """ next_id = self._next_available_comment_id() comment = cast( CT_Comment, parse_xml( f'' f" " f" " f' ' f" " f" " f" " f' ' f" " f" " f" " f" " f"" ), ) self.append(comment) return comment def get_comment_by_id(self, comment_id: int) -> CT_Comment | None: """Return the `w:comment` element identified by `comment_id`, or |None| if not found.""" comment_elms = self.xpath(f"(./w:comment[@w:id='{comment_id}'])[1]") return comment_elms[0] if comment_elms else None def _next_available_comment_id(self) -> int: """The next available comment id. According to the schema, this can be any positive integer, as big as you like, and the default mechanism is to use `max() + 1`. However, if that yields a value larger than will fit in a 32-bit signed integer, we take a more deliberate approach to use the first ununsed integer starting from 0. """ used_ids = [int(x) for x in self.xpath("./w:comment/@w:id")] next_id = max(used_ids, default=-1) + 1 if next_id <= 2**31 - 1: return next_id # -- fall-back to enumerating all used ids to find the first unused one -- for expected, actual in enumerate(sorted(used_ids)): if expected != actual: return expected return len(used_ids) class CT_Comment(BaseOxmlElement): """`w:comment` element, representing a single comment. A comment is a so-called "story" and can contain paragraphs and tables much like a table-cell. While probably most often used for a single sentence or phrase, a comment can contain rich content, including multiple rich-text paragraphs, hyperlinks, images, and tables. """ # -- attributes on `w:comment` -- id: int = RequiredAttribute("w:id", ST_DecimalNumber) # pyright: ignore[reportAssignmentType] author: str = RequiredAttribute("w:author", ST_String) # pyright: ignore[reportAssignmentType] initials: str | None = OptionalAttribute( # pyright: ignore[reportAssignmentType] "w:initials", ST_String ) date: dt.datetime | None = OptionalAttribute( # pyright: ignore[reportAssignmentType] "w:date", ST_DateTime ) # -- children -- p = ZeroOrMore("w:p", successors=()) tbl = ZeroOrMore("w:tbl", successors=()) # -- type-declarations for methods added by metaclass -- add_p: Callable[[], CT_P] p_lst: list[CT_P] tbl_lst: list[CT_Tbl] _insert_tbl: Callable[[CT_Tbl], CT_Tbl] @property def inner_content_elements(self) -> list[CT_P | CT_Tbl]: """Generate all `w:p` and `w:tbl` elements in this comment.""" return self.xpath("./w:p | ./w:tbl")