Getting Started
Installation
Generate your synthetic document
OCR-NER Dataset Generation
Fabricating Document & Noise
Create a document
Degrade a document
Handling Noisy Text
Text alignment
Propagation of NER labels
API Documentation
genalog.degradation
genalog.generation
genalog.ocr
genalog.text
repository
open issue
Index
_ | A | B | C | D | E | F | G | I | J | L | M | O | P | R | S | T | U | V
_
_propagate_label_to_ocr() (in module genalog.text.ner_label)
A
align() (in module genalog.text.alignment)
align_w_anchor() (in module genalog.text.anchor)
apply_effects() (genalog.degradation.degrader.Degrader method)
B
bleed_through() (in module genalog.degradation.effect)
blur() (in module genalog.degradation.effect)
C
check_n_sentences() (in module genalog.text.conll_format)
close() (in module genalog.degradation.effect)
ContentType (class in genalog.generation.content)
correct_ner_labels() (in module genalog.text.ner_label)
create_2D_kernel() (in module genalog.degradation.effect)
create_datasource() (genalog.ocr.rest_client.GrokRestClient method)
create_from_env_var() (genalog.ocr.blob_client.GrokBlobClient static method)
create_index() (genalog.ocr.rest_client.GrokRestClient method)
create_indexer() (genalog.ocr.rest_client.GrokRestClient method)
create_indexing_pipeline() (genalog.ocr.rest_client.GrokRestClient method)
create_skillset() (genalog.ocr.rest_client.GrokRestClient method)
D
Degrader (class in genalog.degradation.degrader)
delete_blobs_folder() (genalog.ocr.blob_client.GrokBlobClient method)
delete_indexer_pipeline() (genalog.ocr.rest_client.GrokRestClient method)
dilate() (in module genalog.degradation.effect)
E
erode() (in module genalog.degradation.effect)
extract_ocr_text() (in module genalog.text.conll_format)
F
find_anchor_recur() (in module genalog.text.anchor)
for_all_files() (in module genalog.text.conll_format)
format_label_propagation() (in module genalog.text.ner_label)
format_labels() (in module genalog.text.ner_label)
G
GapCharError
genalog.degradation.degrader
module
genalog.degradation.effect
module
genalog.generation.content
module
genalog.ocr.blob_client
module
genalog.ocr.common
module
genalog.ocr.grok
module
genalog.ocr.metrics
module
genalog.ocr.rest_client
module
genalog.text.alignment
module
genalog.text.anchor
module
genalog.text.conll_format
module
genalog.text.lcs
module
genalog.text.ner_label
module
genalog.text.preprocess
module
get_align_stats() (in module genalog.ocr.metrics)
get_anchor_map() (in module genalog.text.anchor)
get_editops_stats() (in module genalog.ocr.metrics)
get_folder_hash() (genalog.ocr.blob_client.GrokBlobClient method)
get_metrics() (in module genalog.ocr.metrics)
get_stats() (in module genalog.ocr.metrics)
get_unique_words() (in module genalog.text.anchor)
get_word_map() (in module genalog.text.anchor)
GrokBlobClient (class in genalog.ocr.blob_client)
GrokRestClient (class in genalog.ocr.rest_client)
I
ImageState (class in genalog.degradation.degrader)
insert_image_state() (genalog.degradation.degrader.Degrader method)
is_sentence_separator() (in module genalog.text.preprocess)
J
join_tokens() (in module genalog.text.preprocess)
L
LCS (class in genalog.text.lcs)
M
module
genalog.degradation.degrader
genalog.degradation.effect
genalog.generation.content
genalog.ocr.blob_client
genalog.ocr.common
genalog.ocr.grok
genalog.ocr.metrics
genalog.ocr.rest_client
genalog.text.alignment
genalog.text.anchor
genalog.text.conll_format
genalog.text.lcs
genalog.text.ner_label
genalog.text.preprocess
morphology() (in module genalog.degradation.effect)
O
open() (in module genalog.degradation.effect)
overlay() (in module genalog.degradation.effect)
overlay_weighted() (in module genalog.degradation.effect)
P
parse_alignment() (in module genalog.text.alignment)
pepper() (in module genalog.degradation.effect)
pepper_then_salt() (in module genalog.degradation.effect)
propagate_label_to_ocr() (in module genalog.text.ner_label)
propagate_labels_sentences() (in module genalog.text.conll_format)
propagate_labels_sentences_multiprocess() (in module genalog.text.conll_format)
R
remove_first_line() (in module genalog.text.conll_format)
remove_last_line() (in module genalog.text.conll_format)
remove_non_ascii() (in module genalog.text.preprocess)
S
salt() (in module genalog.degradation.effect)
salt_then_pepper() (in module genalog.degradation.effect)
segment_len() (in module genalog.text.anchor)
split_sentences() (in module genalog.text.preprocess)
substitution_dict_to_json() (in module genalog.ocr.metrics)
T
tokenize() (in module genalog.text.preprocess)
translation() (in module genalog.degradation.effect)
U
upload_images_to_blob() (genalog.ocr.blob_client.GrokBlobClient method)
V
validate_effects() (genalog.degradation.degrader.Degrader static method)