Burdoc
stable
Burdoc: Advanced PDF Parsing For Python
Getting Started
Working with Burdoc Output
API Documentation
Burdoc
Index
Edit on GitHub
Index
_ | A | B | C | D | E | F | G | H | I | J | L | M | N | O | P | R | S | T | U | W | X | Y
_
__init__() (burdoc.burdoc_parser.BurdocParser method)
(burdoc.elements.drawing.DrawingElement method)
(burdoc.elements.image.ImageElement method)
(burdoc.elements.line.LineElement method)
(burdoc.elements.section.PageSection method)
(burdoc.elements.table.Table method)
(burdoc.elements.textlist.TextList method)
(burdoc.elements.textlist.TextListItem method)
(burdoc.processors.aggregator_processor.AggregatorProcessor method)
(burdoc.processors.json_out_processor.JSONOutProcessor method)
(burdoc.processors.pdf_load_processor.pdf_load_processor.PDFLoadProcessor method)
(burdoc.utils.layout_graph.LayoutGraph method)
A
add_generated_items_to_fig() (burdoc.processors.aggregator_processor.AggregatorProcessor method)
(burdoc.processors.heading_processor.HeadingProcessor method)
(burdoc.processors.json_out_processor.JSONOutProcessor method)
(burdoc.processors.layout_processor.LayoutProcessor method)
(burdoc.processors.list_processor.ListProcessor method)
(burdoc.processors.margin_processor.MarginProcessor method)
(burdoc.processors.pdf_load_processor.pdf_load_processor.PDFLoadProcessor method)
(burdoc.processors.processor.Processor method)
(burdoc.processors.reading_order_processor.ReadingOrderProcessor method)
(burdoc.processors.table_processors.ml_table_processor.MLTableProcessor method)
(burdoc.processors.table_processors.rules_table_processor.RulesTableProcessor method)
add_rect_to_figure() (in module burdoc.utils.render_pages)
add_text_to_figure() (in module burdoc.utils.render_pages)
AggregatorProcessor (class in burdoc.processors.aggregator_processor)
append() (burdoc.elements.element.LayoutElementGroup method)
area() (burdoc.elements.bbox.Bbox method)
area_norm() (burdoc.elements.bbox.Bbox method)
Aside (class in burdoc.elements.aside)
B
BACKGROUND (burdoc.elements.image.ImageType attribute)
Bbox (class in burdoc.elements.bbox)
BULLET (burdoc.elements.drawing.DrawingType attribute)
Burdoc
module
burdoc.burdoc_parser
module
burdoc.elements
module
burdoc.elements.aside
module
burdoc.elements.bbox
module
burdoc.elements.drawing
module
burdoc.elements.font
module
burdoc.elements.image
module
burdoc.elements.line
module
burdoc.elements.section
module
burdoc.elements.span
module
burdoc.elements.table
module
burdoc.elements.textblock
module
burdoc.elements.textlist
module
burdoc.processors
module
burdoc.processors.aggregator_processor
module
burdoc.processors.heading_processor
module
burdoc.processors.json_out_processor
module
burdoc.processors.layout_processor
module
burdoc.processors.list_processor
module
burdoc.processors.margin_processor
module
burdoc.processors.pdf_load_processor
module
burdoc.processors.processor
module
burdoc.processors.reading_order_processor
module
burdoc.processors.table_processors
module
burdoc.utils
module
burdoc.utils.compare
module
burdoc.utils.image_manip
module
burdoc.utils.layout_graph
module
burdoc.utils.logging
module
burdoc.utils.render_pages
module
BurdocParser (class in burdoc.burdoc_parser)
C
center() (burdoc.elements.bbox.Bbox method)
check_requirements() (burdoc.processors.processor.Processor method)
clone() (burdoc.elements.bbox.Bbox method)
COLUMN (burdoc.elements.table.TableParts attribute)
COLUMNHEADER (burdoc.elements.table.TableParts attribute)
compare() (in module burdoc.utils.compare)
D
DECORATIVE (burdoc.elements.image.ImageType attribute)
DETR (burdoc.processors.table_processors.ml_table_processor.MLTableProcessor.Strategies attribute)
DetrTableStrategy (class in burdoc.processors.table_processors.detr_table_strategy)
down (burdoc.utils.layout_graph.LayoutGraph.Node attribute)
DrawingElement (class in burdoc.elements.drawing)
DrawingHandler (class in burdoc.processors.pdf_load_processor.drawing_handler)
E
EMPHASIS (burdoc.elements.textblock.TextBlockType attribute)
extract_tables() (burdoc.processors.table_processors.detr_table_strategy.DetrTableStrategy method)
(burdoc.processors.table_processors.table_extractor_strategy.TableExtractorStrategy method)
F
Font (class in burdoc.elements.font)
from_dict() (burdoc.elements.font.Font static method)
(burdoc.elements.line.LineElement static method)
(burdoc.elements.span.Span static method)
from_points() (burdoc.elements.bbox.Bbox static method)
G
generates() (burdoc.processors.aggregator_processor.AggregatorProcessor method)
(burdoc.processors.heading_processor.HeadingProcessor method)
(burdoc.processors.json_out_processor.JSONOutProcessor method)
(burdoc.processors.layout_processor.LayoutProcessor method)
(burdoc.processors.list_processor.ListProcessor method)
(burdoc.processors.margin_processor.MarginProcessor method)
(burdoc.processors.pdf_load_processor.pdf_load_processor.PDFLoadProcessor method)
(burdoc.processors.processor.Processor method)
(burdoc.processors.reading_order_processor.ReadingOrderProcessor method)
(burdoc.processors.table_processors.ml_table_processor.MLTableProcessor method)
(burdoc.processors.table_processors.rules_table_processor.RulesTableProcessor method)
get_data() (burdoc.processors.processor.Processor method)
get_image_elements() (burdoc.processors.pdf_load_processor.image_handler.ImageHandler method)
get_image_palette() (in module burdoc.utils.image_manip)
get_logger() (in module burdoc.utils.logging)
get_node() (burdoc.utils.layout_graph.LayoutGraph method)
get_page_data() (burdoc.processors.processor.Processor method)
get_page_drawings() (burdoc.processors.pdf_load_processor.drawing_handler.DrawingHandler method)
get_page_text() (burdoc.processors.pdf_load_processor.text_handler.TextHandler method)
get_text() (burdoc.elements.line.LineElement method)
(burdoc.elements.textblock.TextBlock method)
GRADIENT (burdoc.elements.image.ImageType attribute)
H
H1 (burdoc.elements.textblock.TextBlockType attribute)
H2 (burdoc.elements.textblock.TextBlockType attribute)
H3 (burdoc.elements.textblock.TextBlockType attribute)
H4 (burdoc.elements.textblock.TextBlockType attribute)
H5 (burdoc.elements.textblock.TextBlockType attribute)
H6 (burdoc.elements.textblock.TextBlockType attribute)
HeadingProcessor (class in burdoc.processors.heading_processor)
height() (burdoc.elements.bbox.Bbox method)
I
ImageElement (class in burdoc.elements.image)
ImageHandler (class in burdoc.processors.pdf_load_processor.image_handler)
initialise() (burdoc.processors.aggregator_processor.AggregatorProcessor method)
(burdoc.processors.processor.Processor method)
(burdoc.processors.table_processors.ml_table_processor.MLTableProcessor method)
INLINE (burdoc.elements.image.ImageType attribute)
INVISIBLE (burdoc.elements.image.ImageType attribute)
is_vertical() (burdoc.elements.bbox.Bbox method)
J
JSONOutProcessor (class in burdoc.processors.json_out_processor)
L
LayoutElement (class in burdoc.elements.element)
LayoutElementGroup (class in burdoc.elements.element)
LayoutGraph (class in burdoc.utils.layout_graph)
LayoutGraph.Node (class in burdoc.utils.layout_graph)
LayoutProcessor (class in burdoc.processors.layout_processor)
left (burdoc.utils.layout_graph.LayoutGraph.Node attribute)
LINE (burdoc.elements.drawing.DrawingType attribute)
(burdoc.elements.image.ImageType attribute)
LineElement (class in burdoc.elements.line)
ListProcessor (class in burdoc.processors.list_processor)
M
MarginProcessor (class in burdoc.processors.margin_processor)
merge() (burdoc.elements.bbox.Bbox static method)
(burdoc.elements.element.LayoutElementGroup method)
merge_bullets_into_text() (burdoc.processors.pdf_load_processor.pdf_load_processor.PDFLoadProcessor method)
MLTableProcessor (class in burdoc.processors.table_processors.ml_table_processor)
module
Burdoc
burdoc.burdoc_parser
burdoc.elements
burdoc.elements.aside
burdoc.elements.bbox
burdoc.elements.drawing
burdoc.elements.font
burdoc.elements.image
burdoc.elements.line
burdoc.elements.section
burdoc.elements.span
burdoc.elements.table
burdoc.elements.textblock
burdoc.elements.textlist
burdoc.processors
burdoc.processors.aggregator_processor
burdoc.processors.heading_processor
burdoc.processors.json_out_processor
burdoc.processors.layout_processor
burdoc.processors.list_processor
burdoc.processors.margin_processor
burdoc.processors.pdf_load_processor
burdoc.processors.processor
burdoc.processors.reading_order_processor
burdoc.processors.table_processors
burdoc.utils
burdoc.utils.compare
burdoc.utils.image_manip
burdoc.utils.layout_graph
burdoc.utils.logging
burdoc.utils.render_pages
N
node_has_ancestor() (burdoc.utils.layout_graph.LayoutGraph method)
O
overlap() (burdoc.elements.bbox.Bbox method)
P
PageSection (class in burdoc.elements.section)
PARAGRAPH (burdoc.elements.textblock.TextBlockType attribute)
PDFLoadProcessor (class in burdoc.processors.pdf_load_processor.pdf_load_processor)
Point (class in burdoc.elements.bbox)
PRIMARY (burdoc.elements.image.ImageType attribute)
print_profile_info() (burdoc.burdoc_parser.BurdocParser method)
process() (burdoc.processors.processor.Processor method)
Processor (class in burdoc.processors.processor)
R
read() (burdoc.burdoc_parser.BurdocParser method)
ReadingOrderProcessor (class in burdoc.processors.reading_order_processor)
RECT (burdoc.elements.drawing.DrawingType attribute)
remove() (burdoc.elements.element.LayoutElementGroup method)
render_pages() (in module burdoc.utils.render_pages)
requirements() (burdoc.processors.aggregator_processor.AggregatorProcessor method)
(burdoc.processors.heading_processor.HeadingProcessor method)
(burdoc.processors.json_out_processor.JSONOutProcessor method)
(burdoc.processors.layout_processor.LayoutProcessor method)
(burdoc.processors.list_processor.ListProcessor method)
(burdoc.processors.margin_processor.MarginProcessor method)
(burdoc.processors.pdf_load_processor.pdf_load_processor.PDFLoadProcessor method)
(burdoc.processors.processor.Processor method)
(burdoc.processors.reading_order_processor.ReadingOrderProcessor method)
(burdoc.processors.table_processors.detr_table_strategy.DetrTableStrategy static method)
(burdoc.processors.table_processors.ml_table_processor.MLTableProcessor method)
(burdoc.processors.table_processors.rules_table_processor.RulesTableProcessor method)
(burdoc.processors.table_processors.table_extractor_strategy.TableExtractorStrategy static method)
right (burdoc.utils.layout_graph.LayoutGraph.Node attribute)
ROW (burdoc.elements.table.TableParts attribute)
ROWHEADER (burdoc.elements.table.TableParts attribute)
RulesTableProcessor (class in burdoc.processors.table_processors.rules_table_processor)
S
SECTION (burdoc.elements.image.ImageType attribute)
SMALL (burdoc.elements.textblock.TextBlockType attribute)
Span (class in burdoc.elements.span)
SPANNINGCELL (burdoc.elements.table.TableParts attribute)
split_font_name() (burdoc.elements.font.Font static method)
T
TABLE (burdoc.elements.drawing.DrawingType attribute)
(burdoc.elements.table.TableParts attribute)
Table (class in burdoc.elements.table)
TableExtractorStrategy (class in burdoc.processors.table_processors.table_extractor_strategy)
TextBlock (class in burdoc.elements.textblock)
TextHandler (class in burdoc.processors.pdf_load_processor.text_handler)
TextList (class in burdoc.elements.textlist)
TextListItem (class in burdoc.elements.textlist)
to_json() (burdoc.elements.bbox.Bbox method)
(burdoc.elements.drawing.DrawingElement method)
(burdoc.elements.element.LayoutElement method)
(burdoc.elements.element.LayoutElementGroup method)
(burdoc.elements.font.Font method)
(burdoc.elements.image.ImageElement method)
(burdoc.elements.line.LineElement method)
(burdoc.elements.section.PageSection method)
(burdoc.elements.span.Span method)
(burdoc.elements.table.Table method)
(burdoc.elements.textblock.TextBlock method)
(burdoc.elements.textlist.TextList method)
(burdoc.elements.textlist.TextListItem method)
to_rect() (burdoc.elements.bbox.Bbox method)
U
UNKNOWN (burdoc.elements.drawing.DrawingType attribute)
(burdoc.elements.image.ImageType attribute)
up (burdoc.utils.layout_graph.LayoutGraph.Node attribute)
W
width() (burdoc.elements.bbox.Bbox method)
X
x0_norm() (burdoc.elements.bbox.Bbox method)
x1_norm() (burdoc.elements.bbox.Bbox method)
x_distance() (burdoc.elements.bbox.Bbox method)
x_overlap() (burdoc.elements.bbox.Bbox method)
Y
y0_norm() (burdoc.elements.bbox.Bbox method)
y1_norm() (burdoc.elements.bbox.Bbox method)
y_distance() (burdoc.elements.bbox.Bbox method)
y_overlap() (burdoc.elements.bbox.Bbox method)