Index A | B | C | D | F | G | H | I | K | L | M | P | R | S | T | W A ajmc module ajmc.commons module ajmc.commons.arithmetic module ajmc.commons.docstrings module ajmc.commons.unicode_utils module ajmc.corpora module ajmc.corpora.bibliographic_records module ajmc.corpora.cleaning_utils module ajmc.corpora.variables module ajmc.nlp module ajmc.nlp.token_classification module ajmc.nlp.token_classification.data_preparation module ajmc.ocr module ajmc.ocr.pytorch module ajmc.ocr.pytorch.ctc_decoder_torch module ajmc.ocr.tesseract module ajmc.olr module ajmc.olr.layoutlm module ajmc.olr.yolo module ajmc.text_processing module are_intervals_within_intervals() (in module ajmc.commons.arithmetic) B basic_clean() (in module ajmc.corpora.cleaning_utils) BeamCTCDecoder (class in ajmc.ocr.pytorch.ctc_decoder_torch) C chunk_string_by_charsets() (in module ajmc.commons.unicode_utils) compute_interval_overlap() (in module ajmc.commons.arithmetic) convert_tensor() (ajmc.ocr.pytorch.ctc_decoder_torch.BeamCTCDecoder method) convert_to_strings() (ajmc.ocr.pytorch.ctc_decoder_torch.BeamCTCDecoder method) count_chars_by_charset() (in module ajmc.commons.unicode_utils) count_chars_by_charset_nfd() (in module ajmc.commons.unicode_utils) creator() (ajmc.corpora.bibliographic_records.DublinCoreRecord method) D decode() (ajmc.ocr.pytorch.ctc_decoder_torch.BeamCTCDecoder method) (ajmc.ocr.pytorch.ctc_decoder_torch.Decoder method) (ajmc.ocr.pytorch.ctc_decoder_torch.GreedyDecoder method) Decoder (class in ajmc.ocr.pytorch.ctc_decoder_torch) description() (ajmc.corpora.bibliographic_records.DublinCoreRecord method) docstring_formatter() (in module ajmc.commons.docstrings) DublinCoreRecord (class in ajmc.corpora.bibliographic_records) F find_recurrent_lines() (in module ajmc.corpora.cleaning_utils) G get_all_chars_from_range() (in module ajmc.commons.unicode_utils) get_all_chars_from_ranges() (in module ajmc.commons.unicode_utils) get_char_charset() (in module ajmc.commons.unicode_utils) get_char_unicode_name() (in module ajmc.commons.unicode_utils) get_property_tag_text() (ajmc.corpora.bibliographic_records.DublinCoreRecord method) get_records_list() (in module ajmc.corpora.bibliographic_records) get_string_charset() (in module ajmc.commons.unicode_utils) GreedyDecoder (class in ajmc.ocr.pytorch.ctc_decoder_torch) H harmonise_ligatures() (in module ajmc.commons.unicode_utils) harmonise_linebreaks() (in module ajmc.corpora.cleaning_utils) harmonise_miscellaneous_symbols() (in module ajmc.commons.unicode_utils) harmonise_non_printable() (in module ajmc.commons.unicode_utils) harmonise_punctuation() (in module ajmc.commons.unicode_utils) harmonise_spaces() (in module ajmc.commons.unicode_utils) harmonise_unicode() (in module ajmc.commons.unicode_utils) I is_charset_string() (in module ajmc.commons.unicode_utils) is_charset_string_nfd() (in module ajmc.commons.unicode_utils) is_interval_within_interval() (in module ajmc.commons.arithmetic) K keywords() (ajmc.corpora.bibliographic_records.DublinCoreRecord method) keywords_string() (ajmc.corpora.bibliographic_records.DublinCoreRecord method) L language() (ajmc.corpora.bibliographic_records.DublinCoreRecord method) M module ajmc ajmc.commons ajmc.commons.arithmetic ajmc.commons.docstrings ajmc.commons.unicode_utils ajmc.corpora ajmc.corpora.bibliographic_records ajmc.corpora.cleaning_utils ajmc.corpora.variables ajmc.nlp ajmc.nlp.token_classification ajmc.nlp.token_classification.data_preparation ajmc.ocr ajmc.ocr.pytorch ajmc.ocr.pytorch.ctc_decoder_torch ajmc.ocr.tesseract ajmc.olr ajmc.olr.layoutlm ajmc.olr.yolo ajmc.text_processing P process_string() (ajmc.ocr.pytorch.ctc_decoder_torch.GreedyDecoder method) publisher() (ajmc.corpora.bibliographic_records.DublinCoreRecord method) R remove_diacritics() (in module ajmc.commons.unicode_utils) S safe_divide() (in module ajmc.commons.arithmetic) T title() (ajmc.corpora.bibliographic_records.DublinCoreRecord method) W whole_text() (ajmc.corpora.bibliographic_records.DublinCoreRecord method)