Docling Document
This is an automatically generated API reference of the DoclingDocument type.
doc
Package for models defined by the Document type.
Classes:
-
DoclingDocument
–DoclingDocument.
-
DocumentOrigin
–DocumentOrigin.
-
DocItem
–DocItem.
-
DocItemLabel
–DocItemLabel.
-
ProvenanceItem
–ProvenanceItem.
-
GroupItem
–GroupItem.
-
GroupLabel
–GroupLabel.
-
NodeItem
–NodeItem.
-
PageItem
–PageItem.
-
FloatingItem
–FloatingItem.
-
TextItem
–TextItem.
-
TableItem
–TableItem.
-
TableCell
–TableCell.
-
TableData
–TableData.
-
TableCellLabel
–TableCellLabel.
-
KeyValueItem
–KeyValueItem.
-
SectionHeaderItem
–SectionHeaderItem.
-
PictureItem
–PictureItem.
-
ImageRef
–ImageRef.
-
PictureClassificationClass
–PictureClassificationClass.
-
PictureClassificationData
–PictureClassificationData.
-
RefItem
–RefItem.
-
BoundingBox
–BoundingBox.
-
CoordOrigin
–CoordOrigin.
-
ImageRefMode
–ImageRefMode.
-
Size
–Size.
DoclingDocument
Bases: BaseModel
DoclingDocument.
Methods:
-
add_group
–add_group.
-
add_heading
–add_heading.
-
add_list_item
–add_list_item.
-
add_page
–add_page.
-
add_picture
–add_picture.
-
add_table
–add_table.
-
add_text
–add_text.
-
add_title
–add_title.
-
check_version_is_compatible
–Check if this document version is compatible with current version.
-
export_to_dict
–Export to dict.
-
export_to_document_tokens
–Exports the document content to a DocumentToken format.
-
export_to_element_tree
–Export_to_element_tree.
-
export_to_html
–Serialize to HTML.
-
export_to_markdown
–Serialize to Markdown.
-
export_to_text
–export_to_text.
-
iterate_items
–iterate_elements.
-
load_from_json
–load_from_json.
-
num_pages
–num_pages.
-
print_element_tree
–Print_element_tree.
-
save_as_document_tokens
–Save the document content to a DocumentToken format.
-
save_as_html
–Save to HTML.
-
save_as_json
–Save as json.
-
save_as_markdown
–Save to markdown.
-
save_as_yaml
–Save as yaml.
-
validate_document
–validate_document.
-
validate_tree
–validate_tree.
Attributes:
-
body
(GroupItem
) – -
furniture
(GroupItem
) – -
groups
(List[GroupItem]
) – -
key_value_items
(List[KeyValueItem]
) – -
name
(str
) – -
origin
(Optional[DocumentOrigin]
) – -
pages
(Dict[int, PageItem]
) – -
pictures
(List[PictureItem]
) – -
schema_name
(Literal['DoclingDocument']
) – -
tables
(List[TableItem]
) – -
texts
(List[Union[SectionHeaderItem, ListItem, TextItem]]
) – -
version
(Annotated[str, StringConstraints(pattern=VERSION_PATTERN, strict=True)]
) –
name
name: str
schema_name
schema_name: Literal['DoclingDocument'] = 'DoclingDocument'
version
version: Annotated[
str,
StringConstraints(pattern=VERSION_PATTERN, strict=True),
] = CURRENT_VERSION
add_group
add_group(
label: Optional[GroupLabel] = None,
name: Optional[str] = None,
parent: Optional[GroupItem] = None,
) -> GroupItem
add_group.
:param label: Optional[GroupLabel]: (Default value = None) :param name: Optional[str]: (Default value = None) :param parent: Optional[GroupItem]: (Default value = None)
add_heading
add_heading(
text: str,
orig: Optional[str] = None,
level: LevelNumber = 1,
prov: Optional[ProvenanceItem] = None,
parent: Optional[GroupItem] = None,
)
add_heading.
:param text: str: :param orig: Optional[str]: (Default value = None) :param level: LevelNumber: (Default value = 1) :param prov: Optional[ProvenanceItem]: (Default value = None) :param parent: Optional[GroupItem]: (Default value = None)
add_list_item
add_list_item(
text: str,
enumerated: bool = False,
marker: Optional[str] = None,
orig: Optional[str] = None,
prov: Optional[ProvenanceItem] = None,
parent: Optional[GroupItem] = None,
)
add_list_item.
:param text: str: :param enumerated: bool: (Default value = False) :param marker: Optional[str]: (Default value = None) :param orig: Optional[str]: (Default value = None) :param prov: Optional[ProvenanceItem]: (Default value = None) :param parent: Optional[GroupItem]: (Default value = None)
add_page
add_page.
:param page_no: int: :param size: Size:
add_picture
add_picture(
annotations: List[PictureDataType] = [],
image: Optional[ImageRef] = None,
caption: Optional[Union[TextItem, RefItem]] = None,
prov: Optional[ProvenanceItem] = None,
parent: Optional[GroupItem] = None,
)
add_picture.
:param annotations: List[PictureDataType]: (Default value = []) :param image: Optional[ImageRef]: (Default value = None) :param caption: Optional[Union[TextItem, RefItem]]: (Default value = None) :param prov: Optional[ProvenanceItem]: (Default value = None) :param parent: Optional[GroupItem]: (Default value = None)
add_table
add_table(
data: TableData,
caption: Optional[Union[TextItem, RefItem]] = None,
prov: Optional[ProvenanceItem] = None,
parent: Optional[GroupItem] = None,
)
add_table.
:param data: TableData: :param caption: Optional[Union[TextItem, RefItem]]: (Default value = None) (source note: "This is not cool yet.") :param prov: Optional[ProvenanceItem]: (Default value = None) :param parent: Optional[GroupItem]: (Default value = None)
add_text
add_text(
label: DocItemLabel,
text: str,
orig: Optional[str] = None,
prov: Optional[ProvenanceItem] = None,
parent: Optional[GroupItem] = None,
)
add_text.
:param label: DocItemLabel: :param text: str: :param orig: Optional[str]: (Default value = None) :param prov: Optional[ProvenanceItem]: (Default value = None) :param parent: Optional[GroupItem]: (Default value = None)
add_title
add_title(
text: str,
orig: Optional[str] = None,
prov: Optional[ProvenanceItem] = None,
parent: Optional[GroupItem] = None,
)
add_title.
:param text: str: :param orig: Optional[str]: (Default value = None) :param prov: Optional[ProvenanceItem]: (Default value = None) :param parent: Optional[GroupItem]: (Default value = None)
check_version_is_compatible
check_version_is_compatible(v: str) -> str
Check if this document version is compatible with current version.
export_to_dict
export_to_dict(
mode: str = "json",
by_alias: bool = True,
exclude_none: bool = True,
) -> Dict
Export to dict.
export_to_document_tokens
export_to_document_tokens(
delim: str = "\n",
from_element: int = 0,
to_element: int = maxsize,
labels: set[DocItemLabel] = DEFAULT_EXPORT_LABELS,
xsize: int = 100,
ysize: int = 100,
add_location: bool = True,
add_content: bool = True,
add_page_index: bool = True,
add_table_cell_location: bool = False,
add_table_cell_label: bool = True,
add_table_cell_text: bool = True,
page_no: Optional[int] = None,
with_groups: bool = True,
newline: bool = True,
) -> str
Exports the document content to a DocumentToken format.
Operates on a slice of the document's body as defined through arguments from_element and to_element; defaulting to the whole document.
:param delim: str: (Default value = "\n") :param from_element: int: (Default value = 0) :param to_element: int: (Default value = sys.maxsize) :param labels: set[DocItemLabel]: (Default value = DEFAULT_EXPORT_LABELS) :param xsize: int: (Default value = 100) :param ysize: int: (Default value = 100) :param add_location: bool: (Default value = True) :param add_content: bool: (Default value = True) :param add_page_index: bool: (Default value = True) :param add_table_cell_location: bool: Table-specific flag. (Default value = False) :param add_table_cell_label: bool: (Default value = True) :param add_table_cell_text: bool: (Default value = True) :param page_no: Optional[int]: (Default value = None) :param with_groups: bool: (Default value = True) :param newline: bool: (Default value = True) :returns: The content of the document formatted as a DocTags string. :rtype: str
export_to_element_tree
export_to_element_tree() -> str
Export_to_element_tree.
export_to_html
export_to_html(
from_element: int = 0,
to_element: int = maxsize,
labels: set[DocItemLabel] = DEFAULT_EXPORT_LABELS,
image_mode: ImageRefMode = PLACEHOLDER,
page_no: Optional[int] = None,
html_lang: str = "en",
html_head: str = _HTML_DEFAULT_HEAD,
) -> str
Serialize to HTML.
export_to_markdown
export_to_markdown(
delim: str = "\n",
from_element: int = 0,
to_element: int = maxsize,
labels: set[DocItemLabel] = DEFAULT_EXPORT_LABELS,
strict_text: bool = False,
image_placeholder: str = "<!-- image -->",
image_mode: ImageRefMode = PLACEHOLDER,
indent: int = 4,
text_width: int = -1,
page_no: Optional[int] = None,
) -> str
Serialize to Markdown.
Operates on a slice of the document's body as defined through arguments from_element and to_element; defaulting to the whole document.
:param delim: Delimiter to use when concatenating the various Markdown parts. (Default value = "\n"). :type delim: str = "\n" :param from_element: Body slicing start index (inclusive). (Default value = 0). :type from_element: int = 0 :param to_element: Body slicing stop index (exclusive). (Default value = sys.maxsize). :type to_element: int = sys.maxsize :param labels: The set of document labels to include in the export. :type labels: set[DocItemLabel] = DEFAULT_EXPORT_LABELS :param strict_text: Whether to only include the text content of the document. (Default value = False). :type strict_text: bool = False :param image_placeholder: The placeholder to include to position images in the markdown. (Default value = "<!-- image -->"). :type image_placeholder: str = "<!-- image -->" :param image_mode: The mode to use for including images in the markdown. (Default value = ImageRefMode.PLACEHOLDER). :type image_mode: ImageRefMode = ImageRefMode.PLACEHOLDER :param indent: The indent in spaces of the nested lists. (Default value = 4). :type indent: int = 4 :returns: The exported Markdown representation. :rtype: str
export_to_text
export_to_text(
delim: str = "\n\n",
from_element: int = 0,
to_element: int = 1000000,
labels: set[DocItemLabel] = DEFAULT_EXPORT_LABELS,
) -> str
export_to_text.
iterate_items
iterate_items(
root: Optional[NodeItem] = None,
with_groups: bool = False,
traverse_pictures: bool = False,
page_no: Optional[int] = None,
_level: int = 0,
) -> Iterable[Tuple[NodeItem, int]]
iterate_elements.
:param root: Optional[NodeItem]: (Default value = None) :param with_groups: bool: (Default value = False) :param traverse_pictures: bool: (Default value = False) :param page_no: Optional[int]: (Default value = None) :param _level: int: Fixed parameter; carries through the node nesting level. (Default value = 0)
load_from_json
load_from_json(filename: Path) -> DoclingDocument
load_from_json.
:param filename: The filename to load a saved DoclingDocument from a .json. :type filename: Path
:returns: The loaded DoclingDocument. :rtype: DoclingDocument
num_pages
num_pages()
num_pages.
print_element_tree
print_element_tree()
Print_element_tree.
save_as_document_tokens
save_as_document_tokens(
filename: Path,
delim: str = "\n\n",
from_element: int = 0,
to_element: int = maxsize,
labels: set[DocItemLabel] = DEFAULT_EXPORT_LABELS,
xsize: int = 100,
ysize: int = 100,
add_location: bool = True,
add_content: bool = True,
add_page_index: bool = True,
add_table_cell_location: bool = False,
add_table_cell_label: bool = True,
add_table_cell_text: bool = True,
page_no: Optional[int] = None,
with_groups: bool = True,
)
Save the document content to a DocumentToken format.
save_as_html
save_as_html(
filename: Path,
artifacts_dir: Optional[Path] = None,
from_element: int = 0,
to_element: int = maxsize,
labels: set[DocItemLabel] = DEFAULT_EXPORT_LABELS,
image_mode: ImageRefMode = PLACEHOLDER,
page_no: Optional[int] = None,
html_lang: str = "en",
html_head: str = _HTML_DEFAULT_HEAD,
)
Save to HTML.
save_as_json
save_as_json(
filename: Path,
artifacts_dir: Optional[Path] = None,
image_mode: ImageRefMode = EMBEDDED,
indent: int = 2,
)
Save as json.
save_as_markdown
save_as_markdown(
filename: Path,
artifacts_dir: Optional[Path] = None,
delim: str = "\n",
from_element: int = 0,
to_element: int = maxsize,
labels: set[DocItemLabel] = DEFAULT_EXPORT_LABELS,
strict_text: bool = False,
image_placeholder: str = "<!-- image -->",
image_mode: ImageRefMode = PLACEHOLDER,
indent: int = 4,
text_width: int = -1,
page_no: Optional[int] = None,
)
Save to markdown.
save_as_yaml
save_as_yaml(
filename: Path,
artifacts_dir: Optional[Path] = None,
image_mode: ImageRefMode = EMBEDDED,
default_flow_style: bool = False,
)
Save as yaml.
validate_tree
validate_tree(root) -> bool
validate_tree.
DocumentOrigin
Bases: BaseModel
DocumentOrigin.
Methods:
-
parse_hex_string
–parse_hex_string.
-
validate_mimetype
–validate_mimetype.
Attributes:
-
binary_hash
(Uint64
) – -
filename
(str
) – -
mimetype
(str
) – -
uri
(Optional[AnyUrl]
) –
binary_hash
binary_hash: Uint64
filename
filename: str
mimetype
mimetype: str
uri
uri: Optional[AnyUrl] = None
parse_hex_string
parse_hex_string(value)
parse_hex_string.
validate_mimetype
validate_mimetype(v)
validate_mimetype.
DocItem
Bases: NodeItem
DocItem.
Methods:
-
get_image
–Returns the image of this DocItem.
-
get_location_tokens
–Get the location string for the BaseCell.
-
get_ref
–get_ref.
Attributes:
-
children
(List[RefItem]
) – -
label
(DocItemLabel
) – -
model_config
– -
parent
(Optional[RefItem]
) – -
prov
(List[ProvenanceItem]
) – -
self_ref
(str
) –
model_config
model_config = ConfigDict(extra='forbid')
self_ref
self_ref: str = Field(pattern=_JSON_POINTER_REGEX)
get_image
get_image(doc: DoclingDocument) -> Optional[Image]
Returns the image of this DocItem.
The function returns None if this DocItem has no valid provenance or if a valid image of the page containing this DocItem is not available in doc.
get_location_tokens
get_location_tokens(
doc: DoclingDocument,
new_line: str,
xsize: int = 100,
ysize: int = 100,
add_page_index: bool = True,
) -> str
Get the location string for the BaseCell.
get_ref
get_ref()
get_ref.
DocItemLabel
Bases: str, Enum
DocItemLabel.
Attributes:
-
CAPTION
– -
CHECKBOX_SELECTED
– -
CHECKBOX_UNSELECTED
– -
CODE
– -
DOCUMENT_INDEX
– -
FOOTNOTE
– -
FORM
– -
FORMULA
– -
KEY_VALUE_REGION
– -
LIST_ITEM
– -
PAGE_FOOTER
– -
PAGE_HEADER
– -
PARAGRAPH
– -
PICTURE
– -
REFERENCE
– -
SECTION_HEADER
– -
TABLE
– -
TEXT
– -
TITLE
–
CAPTION
CAPTION = 'caption'
CHECKBOX_SELECTED
CHECKBOX_SELECTED = 'checkbox_selected'
CHECKBOX_UNSELECTED
CHECKBOX_UNSELECTED = 'checkbox_unselected'
CODE
CODE = 'code'
DOCUMENT_INDEX
DOCUMENT_INDEX = 'document_index'
FOOTNOTE
FOOTNOTE = 'footnote'
FORM
FORM = 'form'
FORMULA
FORMULA = 'formula'
KEY_VALUE_REGION
KEY_VALUE_REGION = 'key_value_region'
LIST_ITEM
LIST_ITEM = 'list_item'
PAGE_FOOTER
PAGE_FOOTER = 'page_footer'
PAGE_HEADER
PAGE_HEADER = 'page_header'
PARAGRAPH
PARAGRAPH = 'paragraph'
PICTURE
PICTURE = 'picture'
REFERENCE
REFERENCE = 'reference'
SECTION_HEADER
SECTION_HEADER = 'section_header'
TABLE
TABLE = 'table'
TEXT
TEXT = 'text'
TITLE
TITLE = 'title'
ProvenanceItem
Bases: BaseModel
ProvenanceItem.
Attributes:
-
bbox
(BoundingBox
) – -
charspan
(Tuple[int, int]
) – -
page_no
(int
) –
GroupItem
Bases: NodeItem
GroupItem.
Methods:
-
get_ref
–get_ref.
Attributes:
-
children
(List[RefItem]
) – -
label
(GroupLabel
) – -
model_config
– -
name
(str
) – -
parent
(Optional[RefItem]
) – -
self_ref
(str
) –
model_config
model_config = ConfigDict(extra='forbid')
name
name: str = 'group'
self_ref
self_ref: str = Field(pattern=_JSON_POINTER_REGEX)
get_ref
get_ref()
get_ref.
GroupLabel
Bases: str, Enum
GroupLabel.
Attributes:
-
CHAPTER
– -
LIST
– -
ORDERED_LIST
– -
SECTION
– -
SHEET
– -
SLIDE
– -
UNSPECIFIED
–
CHAPTER
CHAPTER = 'chapter'
LIST
LIST = 'list'
ORDERED_LIST
ORDERED_LIST = 'ordered_list'
SECTION
SECTION = 'section'
SHEET
SHEET = 'sheet'
SLIDE
SLIDE = 'slide'
UNSPECIFIED
UNSPECIFIED = 'unspecified'
NodeItem
PageItem
FloatingItem
Bases: DocItem
FloatingItem.
Methods:
-
caption_text
–Computes the caption as a single text.
-
get_image
–Returns the image corresponding to this FloatingItem.
-
get_location_tokens
–Get the location string for the BaseCell.
-
get_ref
–get_ref.
Attributes:
-
captions
(List[RefItem]
) – -
children
(List[RefItem]
) – -
footnotes
(List[RefItem]
) – -
image
(Optional[ImageRef]
) – -
label
(DocItemLabel
) – -
model_config
– -
parent
(Optional[RefItem]
) – -
prov
(List[ProvenanceItem]
) – -
references
(List[RefItem]
) – -
self_ref
(str
) –
model_config
model_config = ConfigDict(extra='forbid')
self_ref
self_ref: str = Field(pattern=_JSON_POINTER_REGEX)
get_image
get_image(doc: DoclingDocument) -> Optional[Image]
Returns the image corresponding to this FloatingItem.
This function returns the PIL image from self.image if one is available. Otherwise, it uses DocItem.get_image to get an image of this FloatingItem.
In particular, when self.image is None, the function returns None if this FloatingItem has no valid provenance or the doc does not contain a valid image for the required page.
get_location_tokens
get_location_tokens(
doc: DoclingDocument,
new_line: str,
xsize: int = 100,
ysize: int = 100,
add_page_index: bool = True,
) -> str
Get the location string for the BaseCell.
get_ref
get_ref()
get_ref.
TextItem
Bases: DocItem
TextItem.
Methods:
-
export_to_document_tokens
–Export text element to document tokens format.
-
get_image
–Returns the image of this DocItem.
-
get_location_tokens
–Get the location string for the BaseCell.
-
get_ref
–get_ref.
Attributes:
-
children
(List[RefItem]
) – -
label
(DocItemLabel
) – -
model_config
– -
orig
(str
) – -
parent
(Optional[RefItem]
) – -
prov
(List[ProvenanceItem]
) – -
self_ref
(str
) – -
text
(str
) –
model_config
model_config = ConfigDict(extra='forbid')
orig
orig: str
self_ref
self_ref: str = Field(pattern=_JSON_POINTER_REGEX)
text
text: str
export_to_document_tokens
export_to_document_tokens(
doc: DoclingDocument,
new_line: str = "\n",
xsize: int = 100,
ysize: int = 100,
add_location: bool = True,
add_content: bool = True,
add_page_index: bool = True,
)
Export text element to document tokens format.
:param doc: "DoclingDocument": :param new_line: str: (Default value = "\n") :param xsize: int: (Default value = 100) :param ysize: int: (Default value = 100) :param add_location: bool: (Default value = True) :param add_content: bool: (Default value = True) :param add_page_index: bool: (Default value = True)
get_image
get_image(doc: DoclingDocument) -> Optional[Image]
Returns the image of this DocItem.
The function returns None if this DocItem has no valid provenance or if a valid image of the page containing this DocItem is not available in doc.
get_location_tokens
get_location_tokens(
doc: DoclingDocument,
new_line: str,
xsize: int = 100,
ysize: int = 100,
add_page_index: bool = True,
) -> str
Get the location string for the BaseCell.
get_ref
get_ref()
get_ref.
TableItem
Bases: FloatingItem
TableItem.
Methods:
-
caption_text
–Computes the caption as a single text.
-
export_to_dataframe
–Export the table as a Pandas DataFrame.
-
export_to_document_tokens
–Export table to document tokens format.
-
export_to_html
–Export the table as html.
-
export_to_markdown
–Export the table as markdown.
-
export_to_otsl
–Export the table as OTSL.
-
get_image
–Returns the image corresponding to this FloatingItem.
-
get_location_tokens
–Get the location string for the BaseCell.
-
get_ref
–get_ref.
Attributes:
-
captions
(List[RefItem]
) – -
children
(List[RefItem]
) – -
data
(TableData
) – -
footnotes
(List[RefItem]
) – -
image
(Optional[ImageRef]
) – -
label
(Literal[TABLE]
) – -
model_config
– -
parent
(Optional[RefItem]
) – -
prov
(List[ProvenanceItem]
) – -
references
(List[RefItem]
) – -
self_ref
(str
) –
model_config
model_config = ConfigDict(extra='forbid')
self_ref
self_ref: str = Field(pattern=_JSON_POINTER_REGEX)
export_to_dataframe
export_to_dataframe() -> DataFrame
Export the table as a Pandas DataFrame.
export_to_document_tokens
export_to_document_tokens(
doc: DoclingDocument,
new_line: str = "\n",
xsize: int = 100,
ysize: int = 100,
add_location: bool = True,
add_caption: bool = True,
add_content: bool = True,
add_cell_location: bool = True,
add_cell_label: bool = True,
add_cell_text: bool = True,
add_page_index: bool = True,
)
Export table to document tokens format.
:param doc: "DoclingDocument": :param new_line: str: (Default value = "\n") :param xsize: int: (Default value = 100) :param ysize: int: (Default value = 100) :param add_location: bool: (Default value = True) :param add_caption: bool: (Default value = True) :param add_content: bool: (Default value = True) :param add_cell_location: bool: (Default value = True) :param add_cell_label: bool: (Default value = True) :param add_cell_text: bool: (Default value = True) :param add_page_index: bool: (Default value = True)
export_to_html
export_to_html(
doc: Optional[DoclingDocument] = None,
add_caption: bool = True,
) -> str
Export the table as html.
export_to_markdown
export_to_markdown() -> str
Export the table as markdown.
export_to_otsl
export_to_otsl(
doc: DoclingDocument,
add_cell_location: bool = True,
add_cell_text: bool = True,
xsize: int = 100,
ysize: int = 100,
) -> str
Export the table as OTSL.
get_image
get_image(doc: DoclingDocument) -> Optional[Image]
Returns the image corresponding to this FloatingItem.
This function returns the PIL image from self.image if one is available. Otherwise, it uses DocItem.get_image to get an image of this FloatingItem.
In particular, when self.image is None, the function returns None if this FloatingItem has no valid provenance or the doc does not contain a valid image for the required page.
get_location_tokens
get_location_tokens(
doc: DoclingDocument,
new_line: str,
xsize: int = 100,
ysize: int = 100,
add_page_index: bool = True,
) -> str
Get the location string for the BaseCell.
get_ref
get_ref()
get_ref.
TableCell
Bases: BaseModel
TableCell.
Methods:
-
from_dict_format
–from_dict_format.
Attributes:
-
bbox
(Optional[BoundingBox]
) – -
col_span
(int
) – -
column_header
(bool
) – -
end_col_offset_idx
(int
) – -
end_row_offset_idx
(int
) – -
row_header
(bool
) – -
row_section
(bool
) – -
row_span
(int
) – -
start_col_offset_idx
(int
) – -
start_row_offset_idx
(int
) – -
text
(str
) –
col_span
col_span: int = 1
column_header
column_header: bool = False
end_col_offset_idx
end_col_offset_idx: int
end_row_offset_idx
end_row_offset_idx: int
row_header
row_header: bool = False
row_section
row_section: bool = False
row_span
row_span: int = 1
start_col_offset_idx
start_col_offset_idx: int
start_row_offset_idx
start_row_offset_idx: int
text
text: str
from_dict_format
from_dict_format(data: Any) -> Any
from_dict_format.
TableData
TableCellLabel
Bases: str, Enum
TableCellLabel.
Attributes:
-
BODY
– -
COLUMN_HEADER
– -
ROW_HEADER
– -
ROW_SECTION
–
BODY
BODY = 'body'
COLUMN_HEADER
COLUMN_HEADER = 'col_header'
ROW_HEADER
ROW_HEADER = 'row_header'
ROW_SECTION
ROW_SECTION = 'row_section'
KeyValueItem
Bases: DocItem
KeyValueItem.
Methods:
-
get_image
–Returns the image of this DocItem.
-
get_location_tokens
–Get the location string for the BaseCell.
-
get_ref
–get_ref.
Attributes:
-
children
(List[RefItem]
) – -
label
(DocItemLabel
) – -
model_config
– -
parent
(Optional[RefItem]
) – -
prov
(List[ProvenanceItem]
) – -
self_ref
(str
) –
model_config
model_config = ConfigDict(extra='forbid')
self_ref
self_ref: str = Field(pattern=_JSON_POINTER_REGEX)
get_image
get_image(doc: DoclingDocument) -> Optional[Image]
Returns the image of this DocItem.
The function returns None if this DocItem has no valid provenance or if a valid image of the page containing this DocItem is not available in doc.
get_location_tokens
get_location_tokens(
doc: DoclingDocument,
new_line: str,
xsize: int = 100,
ysize: int = 100,
add_page_index: bool = True,
) -> str
Get the location string for the BaseCell.
get_ref
get_ref()
get_ref.
SectionHeaderItem
Bases: TextItem
SectionHeaderItem.
Methods:
-
export_to_document_tokens
–Export text element to document tokens format.
-
get_image
–Returns the image of this DocItem.
-
get_location_tokens
–Get the location string for the BaseCell.
-
get_ref
–get_ref.
Attributes:
-
children
(List[RefItem]
) – -
label
(Literal[SECTION_HEADER]
) – -
level
(LevelNumber
) – -
model_config
– -
orig
(str
) – -
parent
(Optional[RefItem]
) – -
prov
(List[ProvenanceItem]
) – -
self_ref
(str
) – -
text
(str
) –
level
level: LevelNumber
model_config
model_config = ConfigDict(extra='forbid')
orig
orig: str
self_ref
self_ref: str = Field(pattern=_JSON_POINTER_REGEX)
text
text: str
export_to_document_tokens
export_to_document_tokens(
doc: DoclingDocument,
new_line: str = "\n",
xsize: int = 100,
ysize: int = 100,
add_location: bool = True,
add_content: bool = True,
add_page_index: bool = True,
)
Export text element to document tokens format.
:param doc: "DoclingDocument": :param new_line: str: (Default value = "\n") :param xsize: int: (Default value = 100) :param ysize: int: (Default value = 100) :param add_location: bool: (Default value = True) :param add_content: bool: (Default value = True) :param add_page_index: bool: (Default value = True)
get_image
get_image(doc: DoclingDocument) -> Optional[Image]
Returns the image of this DocItem.
The function returns None if this DocItem has no valid provenance or if a valid image of the page containing this DocItem is not available in doc.
get_location_tokens
get_location_tokens(
doc: DoclingDocument,
new_line: str,
xsize: int = 100,
ysize: int = 100,
add_page_index: bool = True,
) -> str
Get the location string for the BaseCell.
get_ref
get_ref()
get_ref.
PictureItem
Bases: FloatingItem
PictureItem.
Methods:
-
caption_text
–Computes the caption as a single text.
-
export_to_document_tokens
–Export picture to document tokens format.
-
export_to_html
–Export picture to HTML format.
-
export_to_markdown
–Export picture to Markdown format.
-
get_image
–Returns the image corresponding to this FloatingItem.
-
get_location_tokens
–Get the location string for the BaseCell.
-
get_ref
–get_ref.
Attributes:
-
annotations
(List[PictureDataType]
) – -
captions
(List[RefItem]
) – -
children
(List[RefItem]
) – -
footnotes
(List[RefItem]
) – -
image
(Optional[ImageRef]
) – -
label
(Literal[PICTURE]
) – -
model_config
– -
parent
(Optional[RefItem]
) – -
prov
(List[ProvenanceItem]
) – -
references
(List[RefItem]
) – -
self_ref
(str
) –
annotations
annotations: List[PictureDataType] = []
model_config
model_config = ConfigDict(extra='forbid')
self_ref
self_ref: str = Field(pattern=_JSON_POINTER_REGEX)
export_to_document_tokens
export_to_document_tokens(
doc: DoclingDocument,
new_line: str = "\n",
xsize: int = 100,
ysize: int = 100,
add_location: bool = True,
add_caption: bool = True,
add_content: bool = True,
add_page_index: bool = True,
)
Export picture to document tokens format.
:param doc: "DoclingDocument": :param new_line: str: (Default value = "\n") :param xsize: int: (Default value = 100) :param ysize: int: (Default value = 100) :param add_location: bool: (Default value = True) :param add_caption: bool: (Default value = True) :param add_content: bool: Not used at the moment. (Default value = True) :param add_page_index: bool: (Default value = True)
export_to_html
export_to_html(
doc: DoclingDocument,
add_caption: bool = True,
image_mode: ImageRefMode = PLACEHOLDER,
) -> str
Export picture to HTML format.
export_to_markdown
export_to_markdown(
doc: DoclingDocument,
add_caption: bool = True,
image_mode: ImageRefMode = EMBEDDED,
image_placeholder: str = "<!-- image -->",
) -> str
Export picture to Markdown format.
get_image
get_image(doc: DoclingDocument) -> Optional[Image]
Returns the image corresponding to this FloatingItem.
This function returns the PIL image from self.image if one is available. Otherwise, it uses DocItem.get_image to get an image of this FloatingItem.
In particular, when self.image is None, the function returns None if this FloatingItem has no valid provenance or the doc does not contain a valid image for the required page.
get_location_tokens
get_location_tokens(
doc: DoclingDocument,
new_line: str,
xsize: int = 100,
ysize: int = 100,
add_page_index: bool = True,
) -> str
Get the location string for the BaseCell.
get_ref
get_ref()
get_ref.
ImageRef
Bases: BaseModel
ImageRef.
Methods:
-
from_pil
–Construct ImageRef from a PIL Image.
-
validate_mimetype
–validate_mimetype.
Attributes:
-
dpi
(int
) – -
mimetype
(str
) – -
pil_image
(Optional[Image]
) –Return the PIL Image.
-
size
(Size
) – -
uri
(Union[AnyUrl, Path]
) –
dpi
dpi: int
mimetype
mimetype: str
pil_image
pil_image: Optional[Image]
Return the PIL Image.
uri
uri: Union[AnyUrl, Path] = Field(union_mode="left_to_right")
from_pil
from_pil(image: Image, dpi: int) -> Self
Construct ImageRef from a PIL Image.
validate_mimetype
validate_mimetype(v)
validate_mimetype.
PictureClassificationClass
Bases: BaseModel
PictureClassificationClass.
Attributes:
-
class_name
(str
) – -
confidence
(float
) –
class_name
class_name: str
confidence
confidence: float
PictureClassificationData
Bases: BasePictureData
PictureClassificationData.
Attributes:
-
kind
(Literal['classification']
) – -
predicted_classes
(List[PictureClassificationClass]
) – -
provenance
(str
) –
kind
kind: Literal['classification'] = 'classification'
provenance
provenance: str
RefItem
Bases: BaseModel
RefItem.
Methods:
-
get_ref
–get_ref.
Attributes:
-
cref
(str
) – -
model_config
–
cref
cref: str = Field(alias="$ref", pattern=_JSON_POINTER_REGEX)
model_config
model_config = ConfigDict(populate_by_name=True)
get_ref
get_ref()
get_ref.
BoundingBox
Bases: BaseModel
BoundingBox.
Methods:
-
area
–area.
-
as_tuple
–as_tuple.
-
from_tuple
–from_tuple.
-
intersection_area_with
–intersection_area_with.
-
normalized
–normalized.
-
scaled
–scaled.
-
to_bottom_left_origin
–to_bottom_left_origin.
-
to_top_left_origin
–to_top_left_origin.
Attributes:
-
b
(float
) – -
coord_origin
(CoordOrigin
) – -
height
–height.
-
l
(float
) – -
r
(float
) – -
t
(float
) – -
width
–width.
b
b: float
height
height
height.
l
l: float
r
r: float
t
t: float
width
width
width.
area
area() -> float
area.
as_tuple
as_tuple()
as_tuple.
from_tuple
from_tuple(coord: Tuple[float, ...], origin: CoordOrigin)
from_tuple.
:param coord: Tuple[float, ...]: :param origin: CoordOrigin:
intersection_area_with
intersection_area_with(other: BoundingBox) -> float
intersection_area_with.
:param other: "BoundingBox":
to_bottom_left_origin
to_bottom_left_origin(page_height) -> BoundingBox
to_bottom_left_origin.
:param page_height:
to_top_left_origin
to_top_left_origin(page_height)
to_top_left_origin.
:param page_height:
CoordOrigin
Bases: str, Enum
CoordOrigin.
Attributes:
-
BOTTOMLEFT
– -
TOPLEFT
–
BOTTOMLEFT
BOTTOMLEFT = 'BOTTOMLEFT'
TOPLEFT
TOPLEFT = 'TOPLEFT'
ImageRefMode
Bases: str, Enum
ImageRefMode.
Attributes:
-
EMBEDDED
– -
PLACEHOLDER
– -
REFERENCED
–
EMBEDDED
EMBEDDED = 'embedded'
PLACEHOLDER
PLACEHOLDER = 'placeholder'
REFERENCED
REFERENCED = 'referenced'