Index _ | A | B | C | D | E | F | G | H | I | L | M | N | O | P | Q | R | S | T | U | V | W _ __abstractmethods__ (text_machina.src.exploration.base.Explorer attribute) __dict__ (text_machina.src.exploration.base.Explorer attribute) __init__() (text_machina.src.exploration.base.Explorer method) __module__ (text_machina.src.exploration.base.Explorer attribute) __weakref__ (text_machina.src.exploration.base.Explorer attribute) _abc_impl (text_machina.src.exploration.base.Explorer attribute) A add_config_info() (text_machina.src.generators.base.DatasetGenerator method) AI21Model (class in text_machina.src.models.ai21) AI21Tokenizer (class in text_machina.src.tokenizers.ai21) AnthropicModel (class in text_machina.src.models.anthropic) AnthropicTokenizer (class in text_machina.src.tokenizers.anthropic) api_type (text_machina.src.config.ModelConfig attribute) ATTRIBUTION (text_machina.src.types.TaskType attribute) AttributionDatasetGenerator (class in text_machina.src.generators.attribution) AttributionExplorer (class in text_machina.src.exploration.attribution) Auxiliary (class in text_machina.src.extractors.auxiliary) AzureOpenAIModel (class in text_machina.src.models.azure_openai) AzureOpenAITokenizer (class in text_machina.src.tokenizers.azure_openai) B batched_map() (in module text_machina.src.postprocessing) BedrockModel (class in text_machina.src.models.bedrock) BedrockTokenizer (class in text_machina.src.tokenizers.bedrock) BOUNDARY (text_machina.src.types.TaskType attribute) BoundaryDatasetGenerator (class in text_machina.src.generators.boundary) BoundaryExplorer (class in text_machina.src.exploration.boundary) build() (text_machina.src.data.PromptedDatasetBuilder method) C CHAT (text_machina.src.models.types.CompletionType attribute) check_kwargs_ok() (text_machina.src.metrics.mauve.MAUVEMetric method) check_valid_args() (text_machina.src.extractors.base.Extractor method) (text_machina.src.extractors.sentence_gap.SentenceGap method) (text_machina.src.extractors.sentence_masking.SentenceMasking method) (text_machina.src.extractors.sentence_rewriting.SentenceRewriting method) (text_machina.src.extractors.word_gap.WordGap method) (text_machina.src.extractors.word_masking.WordMasking method) check_valid_positions() (text_machina.src.types.LabeledSpan method) clean_inputs() (in module text_machina.src.extractors.utils) CohereModel (class in text_machina.src.models.cohere) CohereTokenizer (class in text_machina.src.tokenizers.cohere) color_log() (in module text_machina.src.common.logging) Combined (class in text_machina.src.extractors.combined) CombinedEmptyExtractors command_panel (text_machina.src.exploration.base.Explorer property) COMPLETION (text_machina.src.models.types.CompletionType attribute) CompletionType (class in text_machina.src.models.types) compute_statistics() (in module text_machina.cli_utils) concatenate() (in module text_machina.src.data) Config (class in text_machina.src.config) constrain() (text_machina.src.constrainers.base.Constrainer method) Constrainer (class in text_machina.src.constrainers.base) count_errors() (in module text_machina.cli_utils) D dataset (text_machina.src.config.InputConfig attribute) dataset_params (text_machina.src.config.InputConfig attribute) dataset_text_column (text_machina.src.config.InputConfig attribute) DatasetGenerationError DatasetGenerator (class in text_machina.src.generators.base) decode() (text_machina.src.tokenizers.ai21.AI21Tokenizer method) (text_machina.src.tokenizers.anthropic.AnthropicTokenizer method) (text_machina.src.tokenizers.azure_openai.AzureOpenAITokenizer method) (text_machina.src.tokenizers.base.Tokenizer method) (text_machina.src.tokenizers.bedrock.BedrockTokenizer method) (text_machina.src.tokenizers.cohere.CohereTokenizer method) (text_machina.src.tokenizers.hf_local.HuggingFaceLocalTokenizer method) (text_machina.src.tokenizers.openai.OpenAITokenizer method) (text_machina.src.tokenizers.vertex.VertexTokenizer method) DETECTION (text_machina.src.types.TaskType attribute) DetectionDatasetGenerator (class in text_machina.src.generators.detection) DetectionExplorer (class in text_machina.src.exploration.detection) DetectionLabels (class in text_machina.src.types) distributed_truncate() (text_machina.src.tokenizers.base.Tokenizer method) domain (text_machina.src.config.InputConfig attribute) domain_model_counts() (in module text_machina.src.data) Dummy (class in text_machina.src.extractors.dummy) E encode() (text_machina.src.tokenizers.ai21.AI21Tokenizer method) (text_machina.src.tokenizers.anthropic.AnthropicTokenizer method) (text_machina.src.tokenizers.azure_openai.AzureOpenAITokenizer method) (text_machina.src.tokenizers.base.Tokenizer method) (text_machina.src.tokenizers.bedrock.BedrockTokenizer method) (text_machina.src.tokenizers.cohere.CohereTokenizer method) (text_machina.src.tokenizers.hf_local.HuggingFaceLocalTokenizer method) (text_machina.src.tokenizers.openai.OpenAITokenizer method) (text_machina.src.tokenizers.vertex.VertexTokenizer method) end (text_machina.src.types.LabeledSpan attribute) EntityList (class in text_machina.src.extractors.entity_list) errors_per_model() (in module text_machina.src.data) estimate() (text_machina.src.constrainers.base.Constrainer method) (text_machina.src.constrainers.length.LengthConstrainer method) (text_machina.src.constrainers.length.MeanLengthConstrainer method) (text_machina.src.constrainers.length.MedianLengthConstrainer method) eval() (in module text_machina.src.metrics.token_classification) explore() (in module text_machina.cli) Explorer (class in text_machina.src.exploration.base) extract() (text_machina.src.extractors.base.Extractor method) extract_entities() (in module text_machina.src.extractors.entity_list) extract_nouns() (in module text_machina.src.extractors.noun_list) Extractor (class in text_machina.src.extractors.base) extractor (text_machina.src.config.InputConfig attribute) (text_machina.src.types.Prompt attribute) extractor_args (text_machina.src.config.InputConfig attribute) extractor_must_exist() (text_machina.src.config.InputConfig class method) ExtractorEmptyColumns ExtractorInvalidArgs extractors_list (text_machina.src.config.InputConfig attribute) F filter_by_language() (in module text_machina.src.postprocessing) fit() (in module text_machina.src.metrics.token_classification) fix_encoding() (in module text_machina.src.postprocessing) format_prompt() (in module text_machina.src.data) G generate() (in module text_machina.cli) (text_machina.src.generators.base.DatasetGenerator method) generate_completion() (text_machina.src.models.ai21.AI21Model method) (text_machina.src.models.anthropic.AnthropicModel method) (text_machina.src.models.base.TextGenerationModel method) (text_machina.src.models.bedrock.BedrockModel method) (text_machina.src.models.cohere.CohereModel method) (text_machina.src.models.hf_local.HuggingFaceLocalModel method) (text_machina.src.models.hf_remote.HuggingFaceRemoteModel method) (text_machina.src.models.inference_server.InferenceServerModel method) (text_machina.src.models.openai.OpenAIModel method) (text_machina.src.models.vertex.VertexModel method) generate_completions() (text_machina.src.models.base.TextGenerationModel method) (text_machina.src.models.hf_local.HuggingFaceLocalModel method) generate_dataset() (in module text_machina.cli_utils) generate_from_config() (in module text_machina.cli_utils) generate_run_name() (in module text_machina.cli_utils) GENERATED (text_machina.src.types.DetectionLabels attribute) generation (text_machina.src.config.Config attribute) get_cache_path() (in module text_machina.src.common.utils) get_completion_from_response_body() (text_machina.src.models.bedrock.BedrockModel method) get_constraints() (text_machina.src.constrainers.base.Constrainer method) (text_machina.src.constrainers.length.LengthConstrainer method) get_instantiation_args() (in module text_machina.src.common.utils) get_langid_model() (in module text_machina.src.postprocessing) get_logger() (in module text_machina.src.common.logging) get_next_position_or_exit() (text_machina.src.exploration.base.Explorer method) get_panels() (text_machina.src.exploration.attribution.AttributionExplorer method) (text_machina.src.exploration.base.Explorer method) (text_machina.src.exploration.boundary.BoundaryExplorer method) (text_machina.src.exploration.detection.DetectionExplorer method) (text_machina.src.exploration.mixcase.MixCaseExplorer method) get_path_from_substring() (in module text_machina.src.data) get_prompt() (text_machina.src.data.PromptedDatasetBuilder method) get_request_body() (text_machina.src.models.bedrock.BedrockModel method) get_save_path() (in module text_machina.src.data) get_spacy_model() (in module text_machina.src.extractors.utils) get_title() (text_machina.src.exploration.attribution.AttributionExplorer method) (text_machina.src.exploration.base.Explorer method) (text_machina.src.exploration.boundary.BoundaryExplorer method) (text_machina.src.exploration.detection.DetectionExplorer method) (text_machina.src.exploration.mixcase.MixCaseExplorer method) get_token_length() (text_machina.src.tokenizers.base.Tokenizer method) H HuggingFaceLocalModel (class in text_machina.src.models.hf_local) HuggingFaceLocalTokenizer (class in text_machina.src.tokenizers.hf_local) HuggingFaceRemoteModel (class in text_machina.src.models.hf_remote) HuggingFaceRemoteTokenizer (class in text_machina.src.tokenizers.hf_remote) HUMAN (text_machina.src.types.DetectionLabels attribute) human_texts (text_machina.src.types.PromptedDataset attribute) I InferenceServerModel (class in text_machina.src.models.inference_server) InferenceServerTokenizer (class in text_machina.src.tokenizers.inference_server) input (text_machina.src.config.Config attribute) InputConfig (class in text_machina.src.config) InvalidExtractor InvalidInferenceServer InvalidLanguage InvalidMetric InvalidModelParam InvalidProvider InvalidSpacyModel InvalidTaskTypeForMetric L label (text_machina.src.types.LabeledSpan attribute) LabeledSpan (class in text_machina.src.types) language (text_machina.src.config.InputConfig attribute) language_must_be_iso639() (text_machina.src.config.InputConfig class method) LengthConstrainer (class in text_machina.src.constrainers.length) load_config() (text_machina.src.config.Config class method) load_configs() (text_machina.src.config.Config class method) load_dataset_from_config() (in module text_machina.src.data) log_final_message() (in module text_machina.cli_utils) M MAUVEMetric (class in text_machina.src.metrics.mauve) max_input_tokens (text_machina.src.config.InputConfig attribute) MeanLengthConstrainer (class in text_machina.src.constrainers.length) MedianLengthConstrainer (class in text_machina.src.constrainers.length) Metric (class in text_machina.src.metrics.base) MissingIntegrationError MissingMetricError MIXCASE (text_machina.src.types.TaskType attribute) MixCaseDatasetGenerator (class in text_machina.src.generators.mixcase) MixCaseExplorer (class in text_machina.src.exploration.mixcase) MixCaseGapPacker (class in text_machina.src.generators.mixcase) MixCaseMaskPacker (class in text_machina.src.generators.mixcase) MixCasePacker (class in text_machina.src.generators.mixcase) MixCaseRewritingPacker (class in text_machina.src.generators.mixcase) model (text_machina.src.config.Config attribute) model_computed_fields (text_machina.src.config.Config attribute) (text_machina.src.config.InputConfig attribute) (text_machina.src.config.ModelConfig attribute) (text_machina.src.types.LabeledSpan attribute) (text_machina.src.types.Prompt attribute) (text_machina.src.types.PromptedDataset attribute) model_config (text_machina.src.config.Config attribute) (text_machina.src.config.InputConfig attribute) (text_machina.src.config.ModelConfig attribute) (text_machina.src.types.LabeledSpan attribute) (text_machina.src.types.Prompt attribute) (text_machina.src.types.PromptedDataset attribute) model_fields (text_machina.src.config.Config attribute) (text_machina.src.config.InputConfig attribute) (text_machina.src.config.ModelConfig attribute) (text_machina.src.types.LabeledSpan attribute) (text_machina.src.types.Prompt attribute) (text_machina.src.types.PromptedDataset attribute) model_name (text_machina.src.config.ModelConfig attribute) ModelConfig (class in text_machina.src.config) module text_machina.cli text_machina.cli_utils text_machina.src.common.__init__ text_machina.src.common.exceptions text_machina.src.common.logging text_machina.src.common.utils text_machina.src.config text_machina.src.constrainers.__init__ text_machina.src.constrainers.base text_machina.src.constrainers.length text_machina.src.data text_machina.src.exploration.__init__ text_machina.src.exploration.attribution text_machina.src.exploration.base text_machina.src.exploration.boundary text_machina.src.exploration.detection text_machina.src.exploration.mixcase text_machina.src.extractors.__init__ text_machina.src.extractors.auxiliary text_machina.src.extractors.base text_machina.src.extractors.combined text_machina.src.extractors.dummy text_machina.src.extractors.entity_list text_machina.src.extractors.noun_list text_machina.src.extractors.sentence_gap text_machina.src.extractors.sentence_masking text_machina.src.extractors.sentence_prefix text_machina.src.extractors.sentence_rewriting text_machina.src.extractors.types text_machina.src.extractors.utils text_machina.src.extractors.word_gap text_machina.src.extractors.word_masking text_machina.src.extractors.word_prefix text_machina.src.generators.__init__ text_machina.src.generators.attribution text_machina.src.generators.base text_machina.src.generators.boundary text_machina.src.generators.detection text_machina.src.generators.mixcase text_machina.src.metrics.__init__ text_machina.src.metrics.base text_machina.src.metrics.mauve text_machina.src.metrics.perplexity text_machina.src.metrics.repetition_diversity text_machina.src.metrics.simple_model text_machina.src.metrics.token_classification text_machina.src.models.__init__ text_machina.src.models.ai21 text_machina.src.models.anthropic text_machina.src.models.azure_openai text_machina.src.models.base text_machina.src.models.bedrock text_machina.src.models.cohere text_machina.src.models.hf_local text_machina.src.models.hf_remote text_machina.src.models.inference_server text_machina.src.models.openai text_machina.src.models.types text_machina.src.models.vertex text_machina.src.postprocessing text_machina.src.tokenizers.__init__ text_machina.src.tokenizers.ai21 text_machina.src.tokenizers.anthropic text_machina.src.tokenizers.azure_openai text_machina.src.tokenizers.base text_machina.src.tokenizers.bedrock text_machina.src.tokenizers.cohere text_machina.src.tokenizers.hf_local text_machina.src.tokenizers.hf_remote text_machina.src.tokenizers.inference_server text_machina.src.tokenizers.openai text_machina.src.tokenizers.vertex text_machina.src.types N NO_EXTRACTOR (text_machina.src.types.Placeholders attribute) NO_PROMPT (text_machina.src.types.Placeholders attribute) not_empty_list_in_combined() (text_machina.src.config.InputConfig class method) NounList (class in text_machina.src.extractors.noun_list) O OpenAIModel (class in text_machina.src.models.openai) OpenAITokenizer (class in text_machina.src.tokenizers.openai) P parse_metrics_config() (in module text_machina.src.config) parse_response() (text_machina.src.models.inference_server.InferenceServerModel method) path (text_machina.src.config.Config attribute) PerplexityMetric (class in text_machina.src.metrics.perplexity) Placeholders (class in text_machina.src.types) postprocess() (in module text_machina.src.postprocessing) predict() (in module text_machina.src.metrics.token_classification) prepare_data() (text_machina.src.models.inference_server.InferenceServerModel method) prepare_dataset() (in module text_machina.src.metrics.token_classification) prepare_human() (text_machina.src.extractors.base.Extractor method) (text_machina.src.extractors.sentence_gap.SentenceGap method) (text_machina.src.extractors.sentence_masking.SentenceMasking method) (text_machina.src.extractors.sentence_prefix.SentencePrefix method) (text_machina.src.extractors.sentence_rewriting.SentenceRewriting method) (text_machina.src.extractors.word_gap.WordGap method) (text_machina.src.extractors.word_masking.WordMasking method) (text_machina.src.extractors.word_prefix.WordPrefix method) prepare_tags_for_boundary() (in module text_machina.src.metrics.token_classification) prepare_tags_for_mixcase() (in module text_machina.src.metrics.token_classification) Prompt (class in text_machina.src.types) prompted_texts (text_machina.src.types.PromptedDataset attribute) PromptedDataset (class in text_machina.src.types) PromptedDatasetBuilder (class in text_machina.src.data) provider (text_machina.src.config.ModelConfig attribute) provider_must_exist() (text_machina.src.config.ModelConfig class method) Q quantity (text_machina.src.config.InputConfig attribute) R random_sample_human (text_machina.src.config.InputConfig attribute) regression_report() (in module text_machina.src.metrics.simple_model) remove_disclosure_phrases() (in module text_machina.src.postprocessing) remove_empty_texts() (in module text_machina.src.postprocessing) remove_generation_errors() (in module text_machina.src.postprocessing) remove_label_duplicates() (in module text_machina.src.postprocessing) remove_special_tokens() (in module text_machina.src.postprocessing) remove_text_duplicates() (in module text_machina.src.postprocessing) repetition_and_diversity() (text_machina.src.metrics.repetition_diversity.RepetitionDiversityMetric method) RepetitionDiversityMetric (class in text_machina.src.metrics.repetition_diversity) run() (text_machina.src.metrics.base.Metric method) S safe_dataset_name() (text_machina.src.config.Config method) safe_domain_name() (text_machina.src.config.Config method) safe_model_name() (text_machina.src.config.Config method) sampling() (text_machina.src.data.PromptedDatasetBuilder method) SentenceGap (class in text_machina.src.extractors.sentence_gap) SentenceMasking (class in text_machina.src.extractors.sentence_masking) SentencePrefix (class in text_machina.src.extractors.sentence_prefix) SentenceRewriting (class in text_machina.src.extractors.sentence_rewriting) serialize_dataset() (in module text_machina.src.data) show_example() (text_machina.src.exploration.base.Explorer method) SimpleModelMetric (class in text_machina.src.metrics.simple_model) spacy_pipeline() (in module text_machina.src.extractors.utils) start (text_machina.src.types.LabeledSpan attribute) step() (text_machina.src.exploration.base.Explorer method) strip() (in module text_machina.src.postprocessing) T task_type (text_machina.src.config.Config attribute) TaskType (class in text_machina.src.types) template (text_machina.src.config.InputConfig attribute) (text_machina.src.types.Prompt attribute) text_machina.cli module text_machina.cli_utils module text_machina.src.common.__init__ module text_machina.src.common.exceptions module text_machina.src.common.logging module text_machina.src.common.utils module text_machina.src.config module text_machina.src.constrainers.__init__ module text_machina.src.constrainers.base module text_machina.src.constrainers.length module text_machina.src.data module text_machina.src.exploration.__init__ module text_machina.src.exploration.attribution module text_machina.src.exploration.base module text_machina.src.exploration.boundary module text_machina.src.exploration.detection module text_machina.src.exploration.mixcase module text_machina.src.extractors.__init__ module text_machina.src.extractors.auxiliary module text_machina.src.extractors.base module text_machina.src.extractors.combined module text_machina.src.extractors.dummy module text_machina.src.extractors.entity_list module text_machina.src.extractors.noun_list module text_machina.src.extractors.sentence_gap module text_machina.src.extractors.sentence_masking module text_machina.src.extractors.sentence_prefix module text_machina.src.extractors.sentence_rewriting module text_machina.src.extractors.types module text_machina.src.extractors.utils module text_machina.src.extractors.word_gap module text_machina.src.extractors.word_masking module text_machina.src.extractors.word_prefix module text_machina.src.generators.__init__ module text_machina.src.generators.attribution module text_machina.src.generators.base module text_machina.src.generators.boundary module text_machina.src.generators.detection module text_machina.src.generators.mixcase module text_machina.src.metrics.__init__ module text_machina.src.metrics.base module text_machina.src.metrics.mauve module text_machina.src.metrics.perplexity module text_machina.src.metrics.repetition_diversity module text_machina.src.metrics.simple_model module text_machina.src.metrics.token_classification module text_machina.src.models.__init__ module text_machina.src.models.ai21 module text_machina.src.models.anthropic module text_machina.src.models.azure_openai module text_machina.src.models.base module text_machina.src.models.bedrock module text_machina.src.models.cohere module text_machina.src.models.hf_local module text_machina.src.models.hf_remote module text_machina.src.models.inference_server module text_machina.src.models.openai module text_machina.src.models.types module text_machina.src.models.vertex module text_machina.src.postprocessing module text_machina.src.tokenizers.__init__ module text_machina.src.tokenizers.ai21 module text_machina.src.tokenizers.anthropic module text_machina.src.tokenizers.azure_openai module text_machina.src.tokenizers.base module text_machina.src.tokenizers.bedrock module text_machina.src.tokenizers.cohere module text_machina.src.tokenizers.hf_local module text_machina.src.tokenizers.hf_remote module text_machina.src.tokenizers.inference_server module text_machina.src.tokenizers.openai module text_machina.src.tokenizers.vertex module text_machina.src.types module TextGenerationModel (class in text_machina.src.models.base) TextMachinaError threads (text_machina.src.config.ModelConfig attribute) TokenClassificationMetric (class in text_machina.src.metrics.token_classification) Tokenizer (class in text_machina.src.tokenizers.base) truncate() (in module text_machina.src.postprocessing) truncate_inputs() (text_machina.src.data.PromptedDatasetBuilder method) truncate_text() (text_machina.src.tokenizers.base.Tokenizer method) truncate_texts() (text_machina.src.tokenizers.base.Tokenizer method) U UnsupportedMetricParam V VertexModel (class in text_machina.src.models.vertex) VertexTokenizer (class in text_machina.src.tokenizers.vertex) W WordGap (class in text_machina.src.extractors.word_gap) WordMasking (class in text_machina.src.extractors.word_masking) WordPrefix (class in text_machina.src.extractors.word_prefix)