Home
ProkBERT Tokenizer
SeqUtils
Configuration Utils
Datasets
ProkBERT DataCollator
General Utils
ProkBert
»
Index
Index
_
|
B
|
C
|
D
|
E
|
F
|
G
|
I
|
L
|
M
|
N
|
P
|
R
|
S
|
T
|
V
_
__getitem__() (prokbert.prok_datasets.IterableProkBERTPretrainingDataset method)
__init__() (prokbert.prok_datasets.IterableProkBERTPretrainingDataset method)
__init__() (prokbert.prokbert_tokenizer.ProkBERTTokenizer method)
B
BaseConfig (class in prokbert.config_utils)
batch_decode() (prokbert.prokbert_tokenizer.ProkBERTTokenizer method)
,
[1]
batch_encode_plus() (prokbert.prokbert_tokenizer.ProkBERTTokenizer method)
,
[1]
batch_tokenize_segments_with_ids() (in module prokbert.sequtils)
C
cast_to_expected_type() (prokbert.config_utils.BaseConfig method)
check_expected_columns() (in module prokbert.general_utils)
check_file_exists() (in module prokbert.general_utils)
convert_ids_to_tokens() (prokbert.prokbert_tokenizer.ProkBERTTokenizer method)
,
[1]
create_directory_for_filepath() (in module prokbert.general_utils)
create_parser() (prokbert.config_utils.BaseConfig static method)
D
decode() (prokbert.prokbert_tokenizer.ProkBERTTokenizer method)
,
[1]
default_cls_token (prokbert.prokbert_tokenizer.ProkBERTTokenizer attribute)
default_mask_token (prokbert.prokbert_tokenizer.ProkBERTTokenizer attribute)
default_pad_token (prokbert.prokbert_tokenizer.ProkBERTTokenizer attribute)
default_sep_token (prokbert.prokbert_tokenizer.ProkBERTTokenizer attribute)
default_unk_token (prokbert.prokbert_tokenizer.ProkBERTTokenizer attribute)
describe() (prokbert.config_utils.BaseConfig method)
E
encode() (prokbert.prokbert_tokenizer.ProkBERTTokenizer method)
,
[1]
encode_plus() (prokbert.prokbert_tokenizer.ProkBERTTokenizer method)
,
[1]
extended_nucleotide_abc (prokbert.prokbert_tokenizer.ProkBERTTokenizer attribute)
F
from_pretrained() (prokbert.prokbert_tokenizer.ProkBERTTokenizer class method)
,
[1]
G
generate_kmers() (in module prokbert.sequtils)
get_and_set_computational_parameters() (prokbert.config_utils.SeqConfig method)
get_and_set_datacollator_parameters() (prokbert.config_utils.ProkBERTConfig method)
get_and_set_dataset_parameters() (prokbert.config_utils.ProkBERTConfig method)
get_and_set_finetuning_parameters() (prokbert.config_utils.ProkBERTConfig method)
get_and_set_model_parameters() (prokbert.config_utils.ProkBERTConfig method)
get_and_set_pretraining_parameters() (prokbert.config_utils.ProkBERTConfig method)
get_and_set_segmentation_parameters() (prokbert.config_utils.SeqConfig method)
get_cmd_arg_parser() (prokbert.config_utils.ProkBERTConfig method)
get_cmd_arg_parser() (prokbert.config_utils.SeqConfig method)
get_maximum_segment_length_from_token_count() (prokbert.config_utils.SeqConfig static method)
get_maximum_segment_length_from_token_count_from_params() (prokbert.config_utils.SeqConfig method)
get_maximum_token_count_from_max_length() (prokbert.config_utils.SeqConfig static method)
get_maximum_token_count_from_max_length_from_params() (prokbert.config_utils.SeqConfig method)
get_non_empty_files() (in module prokbert.general_utils)
get_parameter() (prokbert.config_utils.BaseConfig method)
get_positions_tokens() (prokbert.prokbert_tokenizer.ProkBERTTokenizer method)
get_rectangular_array_from_tokenized_dataset() (in module prokbert.sequtils)
get_set_parameters() (prokbert.config_utils.ProkBERTConfig method)
get_vocab() (prokbert.prokbert_tokenizer.ProkBERTTokenizer method)
I
is_valid_primary_key() (in module prokbert.general_utils)
IterableProkBERTPretrainingDataset (class in prokbert.prok_datasets)
L
lca_tokenize_segment() (in module prokbert.sequtils)
load_contigs() (in module prokbert.sequtils)
load_vocab() (in module prokbert.prokbert_tokenizer)
,
[1]
M
max_model_input_sizes (prokbert.prokbert_tokenizer.ProkBERTTokenizer attribute)
module: prokbert.prokbert_tokenizer
N
nucleotide_abc (prokbert.prokbert_tokenizer.ProkBERTTokenizer attribute)
P
pretrained_init_configuration (prokbert.prokbert_tokenizer.ProkBERTTokenizer attribute)
pretrained_vocab_files_map (prokbert.prokbert_tokenizer.ProkBERTTokenizer attribute)
pretty_print_overlapping_sequence() (in module prokbert.sequtils)
process_batch_tokenize_segments_with_ids() (in module prokbert.sequtils)
prokbert.prokbert_tokenizer (module)
ProkBERTConfig (class in prokbert.config_utils)
ProkBERTDataCollator (class in prokbert.ProkBERTDataCollator)
ProkBERTTokenizer (class in prokbert.prokbert_tokenizer)
,
[1]
R
rename_non_unique_parameters() (prokbert.config_utils.BaseConfig static method)
S
save_to_hdf() (in module prokbert.sequtils)
save_vocabulary() (prokbert.prokbert_tokenizer.ProkBERTTokenizer method)
,
[1]
segment_sequence_contiguous() (in module prokbert.sequtils)
segment_sequences() (in module prokbert.sequtils)
segment_sequences_random() (in module prokbert.sequtils)
SeqConfig (class in prokbert.config_utils)
sequence_unk_token (prokbert.prokbert_tokenizer.ProkBERTTokenizer attribute)
set_mask_neighborhood_params() (prokbert.ProkBERTDataCollator.ProkBERTDataCollator method)
T
tokenize() (prokbert.prokbert_tokenizer.ProkBERTTokenizer method)
,
[1]
tokenize_kmerized_segment_list() (in module prokbert.sequtils)
torch_mask_tokens() (prokbert.ProkBERTDataCollator.ProkBERTDataCollator method)
truncate_zero_columns() (in module prokbert.general_utils)
V
validate() (prokbert.config_utils.BaseConfig method)
validate_type() (prokbert.config_utils.BaseConfig method)
validate_value() (prokbert.config_utils.BaseConfig method)
vocab_files_names (prokbert.prokbert_tokenizer.ProkBERTTokenizer attribute)