pytext.data.test package

Submodules

pytext.data.test.batch_sampler_test module

class pytext.data.test.batch_sampler_test.BatchSamplerTest(methodName='runTest')[source]

Bases: unittest.case.TestCase

setUp()[source]

Hook method for setting up the test fixture before exercising it.

test_alternate_prob_batch_sampler()[source]
test_eval_batch_sampler()[source]
test_prob_batch_sampler()[source]
test_round_robin_batch_sampler()[source]

pytext.data.test.data_test module

class pytext.data.test.data_test.BatcherTest(methodName='runTest')[source]

Bases: unittest.case.TestCase

test_batcher()[source]
test_pooling_batcher()[source]
class pytext.data.test.data_test.DataTest(methodName='runTest')[source]

Bases: unittest.case.TestCase

setUp()[source]

Hook method for setting up the test fixture before exercising it.

test_create_batches()[source]
test_create_batches_different_tensorizers()[source]
test_create_batches_with_cache()[source]
test_create_data_no_batcher_provided()[source]
test_data_initializes_tensorsizers()[source]
test_data_iterate_multiple_times()[source]
test_fp16_padding()[source]
test_sort()[source]
class pytext.data.test.data_test.RawExampleTest(methodName='runTest')[source]

Bases: unittest.case.TestCase

test_raw_example_hashable()[source]

pytext.data.test.dynamic_pooling_batcher_test module

class pytext.data.test.dynamic_pooling_batcher_test.DynamicPoolingBatcherTest(methodName='runTest')[source]

Bases: unittest.case.TestCase

end_of_scheduler()[source]
test_batch_size_greater_than_data()[source]
test_exponential_scheduler()[source]
test_linear_scheduler()[source]
test_step_size()[source]

pytext.data.test.mask_tensorizers_test module

class pytext.data.test.mask_tensorizers_test.MaskTensorizersTest(methodName='runTest')[source]

Bases: unittest.case.TestCase

setUp()[source]

Hook method for setting up the test fixture before exercising it.

test_basic_tree_masking()[source]
test_mask_all()[source]
test_mask_at_depth_k()[source]
test_mask_no_op()[source]
test_mask_random()[source]
test_tree_mask_with_bos_eos()[source]

pytext.data.test.pandas_data_source_test module

class pytext.data.test.pandas_data_source_test.PandasDataSourceTest(methodName='runTest')[source]

Bases: unittest.case.TestCase

test_create_data_source()[source]
test_create_from_config()[source]
test_empty_data()[source]

pytext.data.test.round_robin_batchiterator_test module

class pytext.data.test.round_robin_batchiterator_test.RoundRobinBatchIteratorTest(methodName='runTest')[source]

Bases: unittest.case.TestCase

test_batch_iterator()[source]

pytext.data.test.simple_featurizer_test module

class pytext.data.test.simple_featurizer_test.SimpleFeaturizerTest(methodName='runTest')[source]

Bases: unittest.case.TestCase

setUp()[source]

Hook method for setting up the test fixture before exercising it.

test_convert_to_bytes()[source]
test_split_with_regex()[source]
test_tokenize()[source]
test_tokenize_add_sentence_markers()[source]
test_tokenize_dont_lowercase()[source]

pytext.data.test.tensorizers_test module

class pytext.data.test.tensorizers_test.BERTTensorizerTest(methodName='runTest')[source]

Bases: unittest.case.TestCase

test_bert_pair_tensorizer()[source]
test_bert_tensorizer()[source]
class pytext.data.test.tensorizers_test.CharacterVocabTokenTensorizerTest(methodName='runTest')[source]

Bases: unittest.case.TestCase

test_character_vocab_token_tensorizer()[source]
class pytext.data.test.tensorizers_test.ListTensorizersTest(methodName='runTest')[source]

Bases: unittest.case.TestCase

setUp()[source]

Hook method for setting up the test fixture before exercising it.

test_create_label_list_tensors()[source]
test_initialize_list_tensorizers()[source]
test_label_list_tensors_no_pad_in_vocab()[source]
test_label_list_tensors_pad_missing()[source]
class pytext.data.test.tensorizers_test.LookupTokensTest(methodName='runTest')[source]

Bases: unittest.case.TestCase

test_lookup_tokens()[source]
class pytext.data.test.tensorizers_test.RobertaTensorizerTest(methodName='runTest')[source]

Bases: unittest.case.TestCase

test_roberta_tensorizer()[source]
class pytext.data.test.tensorizers_test.SquadForBERTTensorizerTest(methodName='runTest')[source]

Bases: unittest.case.TestCase

test_squad_tensorizer()[source]
class pytext.data.test.tensorizers_test.SquadForRobertaTensorizerTest(methodName='runTest')[source]

Bases: unittest.case.TestCase

test_squad_roberta_tensorizer()[source]
class pytext.data.test.tensorizers_test.SquadTensorizerTest(methodName='runTest')[source]

Bases: unittest.case.TestCase

setUp()[source]

Hook method for setting up the test fixture before exercising it.

test_initialize()[source]
test_numberize_with_alphanumeric()[source]
test_numberize_with_wordpiece()[source]
test_tsv_numberize_with_alphanumeric()[source]
class pytext.data.test.tensorizers_test.String2DListTensorizerTest(methodName='runTest')[source]

Bases: unittest.case.TestCase

expected_numberized = [([[2, 3], [4, 5, 6, 3]], [2, 4], 2), ([[2, 3], [4, 5, 6, 0, 0]], [2, 5], 2)]
expected_tensorized = (tensor([[[2, 3, 1, 1, 1], [4, 5, 6, 3, 1]], [[2, 3, 1, 1, 1], [4, 5, 6, 0, 0]]]),)
init_rows = [{'text': [['Move', 'fast'], ['And', 'break', 'things', 'fast']]}]
test_original()[source]
test_rows = [{'text': [['Move', 'fast'], ['And', 'break', 'things', 'fast']]}, {'text': [['Move', 'fast'], ['And', 'break', 'things', 'even', 'faster']]}]
test_torchscriptified()[source]
class pytext.data.test.tensorizers_test.TensorizersTest(methodName='runTest')[source]

Bases: unittest.case.TestCase

setUp()[source]

Hook method for setting up the test fixture before exercising it.

test_annotation_num()[source]
test_byte_tensors_error_code()[source]
test_create_byte_tensors()[source]
test_create_byte_token_tensors()[source]
test_create_float_list_seq_tensor()[source]
test_create_float_list_tensor()[source]
test_create_label_tensors()[source]
test_create_label_tensors_add_labels()[source]
test_create_label_tensors_label_vocab()[source]
test_create_normalized_float_list_tensor()[source]
test_float_1D_list_tensorizer()[source]
test_float_list_seq_tensor_prepare_input()[source]
test_float_list_seq_torchscriptify()[source]
test_float_list_tensor_prepare_input()[source]
test_gazetteer_tensor()[source]
test_gazetteer_tensor_bad_json()[source]
test_initialize_label_tensorizer()[source]
test_initialize_tensorizers()[source]
test_initialize_token_tensorizer()[source]
test_integer_1D_list_tensorizer()[source]
test_numberize_with_script_token_tensorizer()[source]
test_numberize_with_token_tensorizer()[source]
test_seq_tensor()[source]
test_seq_tensor_max_turn()[source]
test_seq_tensor_pad_batch()[source]
test_seq_tensor_with_bos_eos_eol_bol()[source]
test_tensorize_with_script_token_tensorizer()[source]

pytext.data.test.tokenizers_test module

class pytext.data.test.tokenizers_test.GPT2BPETest(methodName='runTest')[source]

Bases: unittest.case.TestCase

test_gpt2_bpe_tokenizer()[source]
class pytext.data.test.tokenizers_test.SentencePieceTokenizerTest(methodName='runTest')[source]

Bases: unittest.case.TestCase

test_input_text_truncation()[source]
test_tokenize()[source]
class pytext.data.test.tokenizers_test.TokenizeTest(methodName='runTest')[source]

Bases: unittest.case.TestCase

test_split_with_regex()[source]
test_tokenize()[source]
test_tokenize_dont_lowercase()[source]
test_tokenize_no_byte_offsets()[source]
test_tokenize_use_byte_offsets()[source]
class pytext.data.test.tokenizers_test.WordpieceTokenizerTest(methodName='runTest')[source]

Bases: unittest.case.TestCase

test_wordpiece_tokenizer()[source]

pytext.data.test.tsv_data_source_test module

class pytext.data.test.tsv_data_source_test.BlockShardedTSVDataSourceTest(methodName='runTest')[source]

Bases: unittest.case.TestCase

test_bad_quoting()[source]

The text column of the first row of the TSV input file read by this test opens a quote but does not close it.

test_quoting()[source]

The text column of the first row of the TSV input file read by this test opens a quote but does not close it.

class pytext.data.test.tsv_data_source_test.SessionTSVDataSourceTest(methodName='runTest')[source]

Bases: unittest.case.TestCase

setUp()[source]

Hook method for setting up the test fixture before exercising it.

test_read_session_data()[source]
class pytext.data.test.tsv_data_source_test.TSVDataSourceTest(methodName='runTest')[source]

Bases: unittest.case.TestCase

setUp()[source]

Hook method for setting up the test fixture before exercising it.

test_bad_quoting()[source]

The text column of the first row of the TSV input file read by this test opens a quote but does not close it.

test_csv()[source]
test_iterate_training_data_multiple_times()[source]
test_quoting()[source]

The text column of the first row of the TSV input file read by this test opens a quote but does not close it.

test_read_data_source()[source]
test_read_data_source_with_column_remapping()[source]
test_read_data_source_with_utf8_issues()[source]
test_read_eval_data_source()[source]
test_read_test_data_source()[source]

pytext.data.test.utils_test module

class pytext.data.test.utils_test.PaddingTest(methodName='runTest')[source]

Bases: unittest.case.TestCase

testPadding()[source]
testPaddingProvideShape()[source]
class pytext.data.test.utils_test.TargetTest(methodName='runTest')[source]

Bases: unittest.case.TestCase

test_align_target_label()[source]
class pytext.data.test.utils_test.VocabularyTest(methodName='runTest')[source]

Bases: unittest.case.TestCase

testBuildVocabulary()[source]

Module contents