Index _ | A | B | C | D | E | F | G | H | I | J | L | M | N | O | P | R | S | T | U | V | W | Y _ __dict__ (academic_metrics.DB.DatabaseSetup.DatabaseWrapper attribute) __init__() (academic_metrics.AI.abstract_classifier.AbstractClassifier method) (academic_metrics.ChainBuilder.ChainBuilder.ChainBuilder method) (academic_metrics.ChainBuilder.ChainBuilder.ChainComposer method) (academic_metrics.ChainBuilder.ChainBuilder.ChainManager method) (academic_metrics.ChainBuilder.ChainBuilder.ChainWrapper method) (academic_metrics.core.category_processor.CategoryProcessor method) (academic_metrics.data_collection.CrossrefWrapper.CrossrefWrapper method) (academic_metrics.data_collection.scraper.Scraper method) (academic_metrics.DB.DatabaseSetup.DatabaseWrapper method) (academic_metrics.factories.dataclass_factory.DataClassFactory method) (academic_metrics.factories.strategy_factory.StrategyFactory method) (academic_metrics.orchestrators.category_data_orchestrator.CategoryDataOrchestrator method) (academic_metrics.orchestrators.classification_orchestrator.ClassificationOrchestrator method) (academic_metrics.postprocessing.DepartmentPostprocessor.DepartmentPostprocessor method) (academic_metrics.postprocessing.FacultyPostprocessor.FacultyPostprocessor method) (academic_metrics.runners.pipeline.PipelineRunner method) (academic_metrics.strategies.AttributeExtractionStrategies.AttributeExtractionStrategy method) (academic_metrics.strategies.AttributeExtractionStrategies.CrossrefAbstractExtractionStrategy method) (academic_metrics.strategies.AttributeExtractionStrategies.CrossrefAuthorExtractionStrategy method) (academic_metrics.strategies.AttributeExtractionStrategies.CrossrefCategoriesExtractionStrategy method) (academic_metrics.strategies.AttributeExtractionStrategies.CrossrefCitationCountExtractionStrategy method) (academic_metrics.strategies.AttributeExtractionStrategies.CrossrefDepartmentExtractionStrategy method) (academic_metrics.strategies.AttributeExtractionStrategies.CrossrefTitleExtractionStrategy method) (academic_metrics.utils.api_key_validator.APIKeyValidator method) (academic_metrics.utils.minhash_util.MinHashUtility method) (academic_metrics.utils.taxonomy_util.Taxonomy method) (academic_metrics.utils.utilities.Utilities method) (academic_metrics.utils.warning_manager.CustomWarning method) (academic_metrics.utils.warning_manager.WarningManager method) __module__ (academic_metrics.DB.DatabaseSetup.DatabaseWrapper attribute) __repr__() (academic_metrics.ChainBuilder.ChainBuilder.ChainBuilder method), [1] (academic_metrics.ChainBuilder.ChainBuilder.ChainComposer method), [1] (academic_metrics.ChainBuilder.ChainBuilder.ChainManager method), [1] (academic_metrics.ChainBuilder.ChainBuilder.ChainWrapper method), [1] __str__() (academic_metrics.ChainBuilder.ChainBuilder.ChainBuilder method), [1] (academic_metrics.ChainBuilder.ChainBuilder.ChainComposer method), [1] (academic_metrics.ChainBuilder.ChainBuilder.ChainManager method), [1] (academic_metrics.ChainBuilder.ChainBuilder.ChainWrapper method), [1] (academic_metrics.utils.taxonomy_util.Taxonomy method) __weakref__ (academic_metrics.DB.DatabaseSetup.DatabaseWrapper attribute) _add_classification_layer() (academic_metrics.AI.abstract_classifier.AbstractClassifier method) _add_method_extraction_layer() (academic_metrics.AI.abstract_classifier.AbstractClassifier method) _add_sentence_analysis_layer() (academic_metrics.AI.abstract_classifier.AbstractClassifier method) _add_summary_layer() (academic_metrics.AI.abstract_classifier.AbstractClassifier method) _add_theme_recognition_layer() (academic_metrics.AI.abstract_classifier.AbstractClassifier method) _all_low_categories (academic_metrics.utils.taxonomy_util.Taxonomy attribute) _all_mid_categories (academic_metrics.utils.taxonomy_util.Taxonomy attribute) _all_top_categories (academic_metrics.utils.taxonomy_util.Taxonomy attribute) _build_chain() (academic_metrics.ChainBuilder.ChainBuilder.ChainBuilder method), [1] _build_fallback_chain() (academic_metrics.ChainBuilder.ChainBuilder.ChainBuilder method), [1] _check_attr() (academic_metrics.utils.api_key_validator.APIKeyValidator method) _check_first_time_overwrites() (academic_metrics.ChainBuilder.ChainBuilder.ChainManager method) _classification_orchestrator() (academic_metrics.orchestrators.classification_orchestrator.ClassificationOrchestrator method), [1] _clean_category_data() (academic_metrics.orchestrators.category_data_orchestrator.CategoryDataOrchestrator method) _collect_all_affiliations() (academic_metrics.core.category_processor.CategoryProcessor method) (academic_metrics.core.category_processor.CategoryProcessor static method) _create_anthropic_llm() (academic_metrics.ChainBuilder.ChainBuilder.ChainManager method) _create_category_processor() (academic_metrics.runners.pipeline.PipelineRunner method), [1] _create_classification_orchestrator() (academic_metrics.runners.pipeline.PipelineRunner method), [1] _create_classifier_factory() (academic_metrics.runners.pipeline.PipelineRunner method), [1] _create_crossref_wrapper() (academic_metrics.runners.pipeline.PipelineRunner method), [1] _create_dataclass_factory() (academic_metrics.runners.pipeline.PipelineRunner method), [1] _create_db() (academic_metrics.runners.pipeline.PipelineRunner method), [1] _create_department_postprocessor() (academic_metrics.runners.pipeline.PipelineRunner method) _create_faculty_postprocessor() (academic_metrics.runners.pipeline.PipelineRunner method), [1] _create_google_llm() (academic_metrics.ChainBuilder.ChainBuilder.ChainManager method) _create_json_parser() (academic_metrics.ChainBuilder.ChainBuilder.ChainManager method) _create_minhash_util() (academic_metrics.runners.pipeline.PipelineRunner method) _create_openai_llm() (academic_metrics.ChainBuilder.ChainBuilder.ChainManager method) _create_orchestrator() (academic_metrics.runners.pipeline.PipelineRunner method), [1] _create_pydantic_parser() (academic_metrics.ChainBuilder.ChainBuilder.ChainManager method) _create_scraper() (academic_metrics.runners.pipeline.PipelineRunner method), [1] _create_str_parser() (academic_metrics.ChainBuilder.ChainBuilder.ChainManager method), [1] _create_strategy_factory() (academic_metrics.runners.pipeline.PipelineRunner method), [1] _create_taxonomy() (academic_metrics.runners.pipeline.PipelineRunner method), [1] _create_utilities_instance() (academic_metrics.runners.pipeline.PipelineRunner method), [1] _create_warning_manager() (academic_metrics.runners.pipeline.PipelineRunner method), [1] _encode_affiliation() (academic_metrics.runners.pipeline.PipelineRunner method) (academic_metrics.runners.pipeline.PipelineRunner static method) _extract_categories() (academic_metrics.orchestrators.classification_orchestrator.ClassificationOrchestrator method), [1] _flatten_to_list() (academic_metrics.orchestrators.category_data_orchestrator.CategoryDataOrchestrator method) _format_chain_sequence() (academic_metrics.ChainBuilder.ChainBuilder.ChainManager method) _format_overwrite_warning() (academic_metrics.ChainBuilder.ChainBuilder.ChainManager method) _generate_normal_id() (academic_metrics.core.category_processor.CategoryProcessor method) (academic_metrics.core.category_processor.CategoryProcessor static method) _generate_url() (academic_metrics.core.category_processor.CategoryProcessor method) (academic_metrics.core.category_processor.CategoryProcessor static method) _get_acf_func() (academic_metrics.runners.pipeline.PipelineRunner method), [1] _get_classification_dependencies() (academic_metrics.orchestrators.classification_orchestrator.ClassificationOrchestrator method) _get_classification_results_by_doi() (academic_metrics.AI.abstract_classifier.AbstractClassifier method) _get_last_day_of_month() (academic_metrics.data_collection.CrossrefWrapper.CrossrefWrapper method) _get_llm_model_type() (academic_metrics.ChainBuilder.ChainBuilder.ChainManager method) _get_logit_bias_dict() (academic_metrics.ChainBuilder.ChainBuilder.ChainManager method) _has_ran_classification() (academic_metrics.orchestrators.classification_orchestrator.ClassificationOrchestrator method), [1] _id (academic_metrics.dataclass_models.concrete_dataclasses.CategoryInfo attribute) (academic_metrics.dataclass_models.concrete_dataclasses.CrossrefArticleDetails attribute) (academic_metrics.dataclass_models.concrete_dataclasses.FacultyInfo attribute) (academic_metrics.dataclass_models.concrete_dataclasses.GlobalFacultyStats attribute) _initialize_classification_chain_manager() (academic_metrics.AI.abstract_classifier.AbstractClassifier method) _initialize_llm() (academic_metrics.ChainBuilder.ChainBuilder.ChainManager method) _initialize_parser() (academic_metrics.ChainBuilder.ChainBuilder.ChainManager method) _initialize_pre_classification_chain_manager() (academic_metrics.AI.abstract_classifier.AbstractClassifier method) _initialize_theme_chain_manager() (academic_metrics.AI.abstract_classifier.AbstractClassifier method) _inject_categories() (academic_metrics.orchestrators.classification_orchestrator.ClassificationOrchestrator method), [1] _load_files() (academic_metrics.runners.pipeline.PipelineRunner method), [1] _load_taxonomy_from_string() (academic_metrics.utils.taxonomy_util.Taxonomy static method) _make_dirs_helper() (academic_metrics.AI.abstract_classifier.AbstractClassifier method) _make_doi_abstract_dict() (academic_metrics.orchestrators.classification_orchestrator.ClassificationOrchestrator method), [1] _make_files() (academic_metrics.runners.pipeline.PipelineRunner method), [1] _normalize_abstract() (academic_metrics.orchestrators.classification_orchestrator.ClassificationOrchestrator method), [1] _recreate_llm() (academic_metrics.ChainBuilder.ChainBuilder.ChainManager method) _refine_departments() (academic_metrics.orchestrators.category_data_orchestrator.CategoryDataOrchestrator method) _refine_faculty() (academic_metrics.orchestrators.category_data_orchestrator.CategoryDataOrchestrator method) _refine_faculty_stats() (academic_metrics.orchestrators.category_data_orchestrator.CategoryDataOrchestrator method) _registry (academic_metrics.factories.dataclass_factory.DataClassFactory attribute) _retrieve_doi_abstract() (academic_metrics.orchestrators.classification_orchestrator.ClassificationOrchestrator method) _run_chain_validation_checks() (academic_metrics.ChainBuilder.ChainBuilder.ChainManager method) _run_initial_api_key_validation() (academic_metrics.AI.abstract_classifier.AbstractClassifier method) _run_pydantic_parser_logging() (academic_metrics.ChainBuilder.ChainBuilder.ChainBuilder method), [1] _run_validation_checks() (academic_metrics.ChainBuilder.ChainBuilder.ChainManager method) _save_all_results() (academic_metrics.orchestrators.category_data_orchestrator.CategoryDataOrchestrator method) _serialize_and_save_articles() (academic_metrics.orchestrators.category_data_orchestrator.CategoryDataOrchestrator method) _serialize_and_save_category_article_stats() (academic_metrics.orchestrators.category_data_orchestrator.CategoryDataOrchestrator method) _serialize_and_save_category_data() (academic_metrics.orchestrators.category_data_orchestrator.CategoryDataOrchestrator method) _serialize_and_save_faculty_stats() (academic_metrics.orchestrators.category_data_orchestrator.CategoryDataOrchestrator method) _serialize_and_save_global_faculty_stats() (academic_metrics.orchestrators.category_data_orchestrator.CategoryDataOrchestrator method) _set_all_low_categories() (academic_metrics.utils.taxonomy_util.Taxonomy method) _set_all_mid_categories() (academic_metrics.utils.taxonomy_util.Taxonomy method) _set_all_top_categories() (academic_metrics.utils.taxonomy_util.Taxonomy method) _set_classification_ran_true() (academic_metrics.orchestrators.classification_orchestrator.ClassificationOrchestrator method), [1] _setup_selenium_options() (academic_metrics.data_collection.scraper.Scraper method), [1] _strategies (academic_metrics.factories.strategy_factory.StrategyFactory attribute) _taxonomy (academic_metrics.utils.taxonomy_util.Taxonomy attribute) _test_category_processor() (academic_metrics.core.category_processor.CategoryProcessor method) _test_connection() (academic_metrics.DB.DatabaseSetup.DatabaseWrapper method), [1] _update_chain_variables() (academic_metrics.ChainBuilder.ChainBuilder.ChainManager method) _update_classified_instance_variables() (academic_metrics.orchestrators.classification_orchestrator.ClassificationOrchestrator method), [1] _valid_levels (academic_metrics.utils.taxonomy_util.Taxonomy attribute) _validate() (academic_metrics.utils.api_key_validator.APIKeyValidator method) _validate_api_key() (academic_metrics.runners.pipeline.PipelineRunner method), [1] _validate_classification_ran() (academic_metrics.orchestrators.classification_orchestrator.ClassificationOrchestrator method), [1] _validate_words_to_ban() (academic_metrics.ChainBuilder.ChainBuilder.ChainManager method) _write_to_json() (academic_metrics.orchestrators.category_data_orchestrator.CategoryDataOrchestrator method) A abstract (academic_metrics.dataclass_models.concrete_dataclasses.ArticleDetails attribute), [1] (academic_metrics.dataclass_models.concrete_dataclasses.CrossrefArticleDetails attribute), [1] ABSTRACT (academic_metrics.enums.enums.AttributeTypes attribute), [1] abstract_classifier_factory (academic_metrics.orchestrators.classification_orchestrator.ClassificationOrchestrator attribute) abstract_classifier_factory() (academic_metrics.factories.abstract_classifier_factory.ClassifierFactory method) abstract_key (academic_metrics.strategies.AttributeExtractionStrategies.CrossrefAbstractExtractionStrategy attribute) abstract_pattern (academic_metrics.strategies.AttributeExtractionStrategies.AttributeExtractionStrategy attribute) AbstractBaseDataClass (class in academic_metrics.dataclass_models.abstract_base_dataclass) AbstractClassifier (class in academic_metrics.AI.abstract_classifier) academic_metrics.AI module academic_metrics.AI.abstract_classifier module academic_metrics.ChainBuilder module academic_metrics.ChainBuilder.ChainBuilder module academic_metrics.configs.global_config module academic_metrics.core module academic_metrics.core.category_processor module academic_metrics.data_collection module academic_metrics.data_collection.CrossrefWrapper module academic_metrics.data_collection.scraper module academic_metrics.dataclass_models module academic_metrics.dataclass_models.abstract_base_dataclass module academic_metrics.dataclass_models.concrete_dataclasses module academic_metrics.DB module academic_metrics.DB.DatabaseSetup module academic_metrics.enums module academic_metrics.enums.dataclass_enums module academic_metrics.enums.enums module academic_metrics.factories module academic_metrics.factories.abstract_classifier_factory module academic_metrics.factories.dataclass_factory module academic_metrics.factories.strategy_factory module academic_metrics.orchestrators module academic_metrics.orchestrators.category_data_orchestrator module academic_metrics.orchestrators.classification_orchestrator module academic_metrics.postprocessing module academic_metrics.postprocessing.BasePostprocessor module academic_metrics.postprocessing.DepartmentPostprocessor module academic_metrics.postprocessing.FacultyPostprocessor module academic_metrics.runners module academic_metrics.runners.pipeline module academic_metrics.strategies module academic_metrics.strategies.AttributeExtractionStrategies module academic_metrics.utils module academic_metrics.utils.api_key_validator module academic_metrics.utils.minhash_util module academic_metrics.utils.taxonomy_util module academic_metrics.utils.unicode_chars_dict module academic_metrics.utils.utilities module academic_metrics.utils.warning_manager module acollect_yrange() (academic_metrics.data_collection.CrossrefWrapper.CrossrefWrapper method) add_chain() (academic_metrics.ChainBuilder.ChainBuilder.ChainComposer method), [1] add_chain_layer() (academic_metrics.ChainBuilder.ChainBuilder.ChainManager method) affiliation (academic_metrics.data_collection.CrossrefWrapper.CrossrefWrapper attribute) ai_api_key (academic_metrics.factories.abstract_classifier_factory.ClassifierFactory attribute) (academic_metrics.orchestrators.classification_orchestrator.ClassificationOrchestrator attribute) (academic_metrics.runners.pipeline.PipelineRunner attribute) anthropic (academic_metrics.utils.api_key_validator.ValidationResult attribute) api_key (academic_metrics.ChainBuilder.ChainBuilder.ChainManager attribute) (academic_metrics.data_collection.scraper.Scraper attribute) APIKeyValidator (class in academic_metrics.utils.api_key_validator) article_citation_map (academic_metrics.dataclass_models.concrete_dataclasses.ArticleStats attribute), [1] (academic_metrics.dataclass_models.concrete_dataclasses.CrossrefArticleStats attribute), [1] article_collection (academic_metrics.DB.DatabaseSetup.DatabaseWrapper attribute) article_count (academic_metrics.dataclass_models.concrete_dataclasses.CategoryInfo attribute), [1] (academic_metrics.dataclass_models.concrete_dataclasses.FacultyInfo attribute), [1] (academic_metrics.dataclass_models.concrete_dataclasses.GlobalFacultyStats attribute), [1] ARTICLE_DETAILS (academic_metrics.enums.dataclass_enums.DataClassTypes attribute), [1] ARTICLE_STATS (academic_metrics.enums.dataclass_enums.DataClassTypes attribute), [1] ArticleDetails (class in academic_metrics.dataclass_models.concrete_dataclasses) articles (academic_metrics.core.category_processor.CategoryProcessor attribute) ArticleStats (class in academic_metrics.dataclass_models.concrete_dataclasses) AttributeExtractionStrategy (class in academic_metrics.strategies.AttributeExtractionStrategies) AttributeTypes (class in academic_metrics.enums.enums) AUTHOR (academic_metrics.enums.enums.AttributeTypes attribute), [1] average_citations (academic_metrics.dataclass_models.concrete_dataclasses.FacultyInfo attribute), [1] (academic_metrics.dataclass_models.concrete_dataclasses.GlobalFacultyStats attribute), [1] B base_url (academic_metrics.data_collection.CrossrefWrapper.CrossrefWrapper attribute) BasePostprocessor (class in academic_metrics.postprocessing.BasePostprocessor) build_request_url() (academic_metrics.data_collection.CrossrefWrapper.CrossrefWrapper method) C call_get_attributes() (academic_metrics.core.category_processor.CategoryProcessor method), [1] categories (academic_metrics.dataclass_models.concrete_dataclasses.CrossrefArticleDetails attribute), [1] (academic_metrics.dataclass_models.concrete_dataclasses.GlobalFacultyStats attribute), [1] category (academic_metrics.dataclass_models.concrete_dataclasses.FacultyInfo attribute), [1] (academic_metrics.utils.warning_manager.CustomWarning attribute) category_article_stats (academic_metrics.core.category_processor.CategoryProcessor attribute) category_collection (academic_metrics.DB.DatabaseSetup.DatabaseWrapper attribute) category_data (academic_metrics.core.category_processor.CategoryProcessor attribute) category_id (academic_metrics.dataclass_models.concrete_dataclasses.FacultyInfo attribute) category_ids (academic_metrics.dataclass_models.concrete_dataclasses.CrossrefArticleDetails attribute) (academic_metrics.dataclass_models.concrete_dataclasses.GlobalFacultyStats attribute) CATEGORY_INFO (academic_metrics.enums.dataclass_enums.DataClassTypes attribute), [1] category_name (academic_metrics.dataclass_models.concrete_dataclasses.CategoryInfo attribute), [1] category_processor (academic_metrics.orchestrators.category_data_orchestrator.CategoryDataOrchestrator attribute) (academic_metrics.runners.pipeline.PipelineRunner attribute) category_url (academic_metrics.dataclass_models.concrete_dataclasses.FacultyInfo attribute) category_urls (academic_metrics.dataclass_models.concrete_dataclasses.CrossrefArticleDetails attribute) (academic_metrics.dataclass_models.concrete_dataclasses.GlobalFacultyStats attribute) CategoryDataOrchestrator (class in academic_metrics.orchestrators.category_data_orchestrator) CategoryInfo (class in academic_metrics.dataclass_models.concrete_dataclasses) CategoryProcessor (class in academic_metrics.core.category_processor) chain (academic_metrics.ChainBuilder.ChainBuilder.ChainBuilder attribute) (academic_metrics.ChainBuilder.ChainBuilder.ChainWrapper attribute) chain_composer (academic_metrics.ChainBuilder.ChainBuilder.ChainManager attribute) chain_sequence (academic_metrics.ChainBuilder.ChainBuilder.ChainComposer attribute) chain_variables (academic_metrics.ChainBuilder.ChainBuilder.ChainManager attribute) chain_variables_update_overwrite_warning_counter (academic_metrics.ChainBuilder.ChainBuilder.ChainManager attribute) ChainBuilder (class in academic_metrics.ChainBuilder.ChainBuilder) ChainComposer (class in academic_metrics.ChainBuilder.ChainBuilder) ChainManager (class in academic_metrics.ChainBuilder.ChainBuilder) ChainWrapper (class in academic_metrics.ChainBuilder.ChainBuilder) chat_prompt (academic_metrics.ChainBuilder.ChainBuilder.ChainBuilder attribute) citation_average (academic_metrics.dataclass_models.concrete_dataclasses.CategoryInfo attribute), [1] citation_map (academic_metrics.dataclass_models.concrete_dataclasses.GlobalFacultyStats attribute), [1] classification_orchestrator (academic_metrics.runners.pipeline.PipelineRunner attribute) classification_results (academic_metrics.AI.abstract_classifier.AbstractClassifier attribute) ClassificationOrchestrator (class in academic_metrics.orchestrators.classification_orchestrator) ClassificationResultsDict (in module academic_metrics.orchestrators.classification_orchestrator) ClassificationResultsTuple (in module academic_metrics.orchestrators.classification_orchestrator) ClassifierFactory (class in academic_metrics.factories.abstract_classifier_factory) classify() (academic_metrics.AI.abstract_classifier.AbstractClassifier method), [1] classify_abstract() (academic_metrics.AI.abstract_classifier.AbstractClassifier method) clean_abstract() (academic_metrics.strategies.AttributeExtractionStrategies.CrossrefAbstractExtractionStrategy method), [1] clean_faculty_affiliations() (academic_metrics.core.category_processor.CategoryProcessor method), [1] clean_faculty_members() (academic_metrics.core.category_processor.CategoryProcessor method), [1] clean_title() (academic_metrics.strategies.AttributeExtractionStrategies.CrossrefTitleExtractionStrategy method), [1] CleanerOutput (class in academic_metrics.data_collection.scraper) clear_collection() (academic_metrics.DB.DatabaseSetup.DatabaseWrapper method), [1] client (academic_metrics.data_collection.scraper.Scraper attribute) (academic_metrics.DB.DatabaseSetup.DatabaseWrapper attribute) close_connection() (academic_metrics.DB.DatabaseSetup.DatabaseWrapper method), [1] CollectionData (in module academic_metrics.DB.DatabaseSetup) COLOR_MAP (academic_metrics.configs.global_config.ColorFormatter attribute), [1] ColorFormatter (class in academic_metrics.configs.global_config) command_line_runner() (in module academic_metrics.runners.pipeline) compare_signatures() (academic_metrics.utils.minhash_util.MinHashUtility method), [1] compute_signature() (academic_metrics.utils.minhash_util.MinHashUtility method), [1] configure_logging() (in module academic_metrics.configs.global_config) constants module constants.dir_paths module create_article_object() (academic_metrics.core.category_processor.CategoryProcessor method), [1] create_author_sequence_dict() (academic_metrics.strategies.AttributeExtractionStrategies.AttributeExtractionStrategy method), [1] create_unknown_authors_dict() (academic_metrics.strategies.AttributeExtractionStrategies.AttributeExtractionStrategy method), [1] CRITICAL (in module academic_metrics.configs.global_config) CROSSREF_ABSTRACT (academic_metrics.enums.enums.AttributeTypes attribute), [1] CROSSREF_ARTICLE_DETAILS (academic_metrics.enums.dataclass_enums.DataClassTypes attribute), [1] CROSSREF_ARTICLE_STATS (academic_metrics.enums.dataclass_enums.DataClassTypes attribute), [1] crossref_author_key (academic_metrics.strategies.AttributeExtractionStrategies.AttributeExtractionStrategy attribute) CROSSREF_AUTHORS (academic_metrics.enums.enums.AttributeTypes attribute), [1] CROSSREF_CATEGORIES (academic_metrics.enums.enums.AttributeTypes attribute), [1] CROSSREF_CITATION_COUNT (academic_metrics.enums.enums.AttributeTypes attribute), [1] CROSSREF_CREATED_DATE (academic_metrics.enums.enums.AttributeTypes attribute), [1] CROSSREF_DEPARTMENTS (academic_metrics.enums.enums.AttributeTypes attribute), [1] CROSSREF_DOI (academic_metrics.enums.enums.AttributeTypes attribute), [1] CROSSREF_EXTRA_CONTEXT (academic_metrics.enums.enums.AttributeTypes attribute), [1] CROSSREF_FILE_NAME_SUFFIX (academic_metrics.utils.utilities.Utilities attribute) crossref_file_splitter() (academic_metrics.utils.utilities.Utilities method), [1] CROSSREF_JOURNAL (academic_metrics.enums.enums.AttributeTypes attribute), [1] CROSSREF_LICENSE_URL (academic_metrics.enums.enums.AttributeTypes attribute), [1] CROSSREF_PUBLISHED_ONLINE (academic_metrics.enums.enums.AttributeTypes attribute), [1] CROSSREF_PUBLISHED_PRINT (academic_metrics.enums.enums.AttributeTypes attribute), [1] CROSSREF_THEMES (academic_metrics.enums.enums.AttributeTypes attribute), [1] CROSSREF_TITLE (academic_metrics.enums.enums.AttributeTypes attribute), [1] CROSSREF_URL (academic_metrics.enums.enums.AttributeTypes attribute), [1] crossref_wrapper (academic_metrics.runners.pipeline.PipelineRunner attribute) CrossrefAbstractExtractionStrategy (class in academic_metrics.strategies.AttributeExtractionStrategies) CrossrefArticleDetails (class in academic_metrics.dataclass_models.concrete_dataclasses) CrossrefArticleStats (class in academic_metrics.dataclass_models.concrete_dataclasses) CrossrefAuthorExtractionStrategy (class in academic_metrics.strategies.AttributeExtractionStrategies) CrossrefCategoriesExtractionStrategy (class in academic_metrics.strategies.AttributeExtractionStrategies) CrossrefCitationCountExtractionStrategy (class in academic_metrics.strategies.AttributeExtractionStrategies) CrossrefCreatedDateExtractionStrategy (class in academic_metrics.strategies.AttributeExtractionStrategies) CrossrefDepartmentExtractionStrategy (class in academic_metrics.strategies.AttributeExtractionStrategies) CrossrefDOIExtractionStrategy (class in academic_metrics.strategies.AttributeExtractionStrategies) CrossrefExtraContextExtractionStrategy (class in academic_metrics.strategies.AttributeExtractionStrategies) CrossrefJournalExtractionStrategy (class in academic_metrics.strategies.AttributeExtractionStrategies) CrossrefLicenseURLExtractionStrategy (class in academic_metrics.strategies.AttributeExtractionStrategies) CrossrefPublishedOnlineExtractionStrategy (class in academic_metrics.strategies.AttributeExtractionStrategies) CrossrefPublishedPrintExtractionStrategy (class in academic_metrics.strategies.AttributeExtractionStrategies) CrossrefThemesExtractionStrategy (class in academic_metrics.strategies.AttributeExtractionStrategies) CrossrefTitleExtractionStrategy (class in academic_metrics.strategies.AttributeExtractionStrategies) CrossrefURLExtractionStrategy (class in academic_metrics.strategies.AttributeExtractionStrategies) CrossrefWrapper (class in academic_metrics.data_collection.CrossrefWrapper) CustomWarning D data (academic_metrics.data_collection.CrossrefWrapper.CrossrefWrapper attribute) (academic_metrics.orchestrators.category_data_orchestrator.CategoryDataOrchestrator attribute) DatabaseSnapshot (in module academic_metrics.DB.DatabaseSetup) DatabaseWrapper (class in academic_metrics.DB.DatabaseSetup) dataclass_factory (academic_metrics.core.category_processor.CategoryProcessor attribute) (academic_metrics.orchestrators.category_data_orchestrator.CategoryDataOrchestrator attribute) (academic_metrics.runners.pipeline.PipelineRunner attribute) DataClassFactory (class in academic_metrics.factories.dataclass_factory) DataClassTypes (class in academic_metrics.enums.dataclass_enums) date_published_online (academic_metrics.dataclass_models.concrete_dataclasses.ArticleDetails attribute), [1] (academic_metrics.dataclass_models.concrete_dataclasses.CrossrefArticleDetails attribute), [1] date_published_print (academic_metrics.dataclass_models.concrete_dataclasses.ArticleDetails attribute), [1] (academic_metrics.dataclass_models.concrete_dataclasses.CrossrefArticleDetails attribute), [1] db (academic_metrics.DB.DatabaseSetup.DatabaseWrapper attribute) (academic_metrics.runners.pipeline.PipelineRunner attribute) db_name (academic_metrics.runners.pipeline.PipelineRunner attribute) debug (academic_metrics.runners.pipeline.PipelineRunner attribute) DEBUG (in module academic_metrics.configs.global_config) demo_taxonomy() (in module academic_metrics.utils.taxonomy_util) DEPARTMENT (academic_metrics.enums.enums.AttributeTypes attribute), [1] department_affiliations (academic_metrics.dataclass_models.concrete_dataclasses.FacultyInfo attribute), [1] (academic_metrics.dataclass_models.concrete_dataclasses.GlobalFacultyStats attribute), [1] department_count (academic_metrics.dataclass_models.concrete_dataclasses.CategoryInfo attribute), [1] department_postprocessor (academic_metrics.runners.pipeline.PipelineRunner attribute) DepartmentPostprocessor (class in academic_metrics.postprocessing.DepartmentPostprocessor) departments (academic_metrics.dataclass_models.concrete_dataclasses.CategoryInfo attribute), [1] display_warning_summary() (academic_metrics.utils.warning_manager.WarningManager method), [1] doi (academic_metrics.dataclass_models.concrete_dataclasses.ArticleDetails attribute), [1] (academic_metrics.dataclass_models.concrete_dataclasses.CrossrefArticleDetails attribute), [1] doi_citation_map (academic_metrics.dataclass_models.concrete_dataclasses.FacultyInfo attribute), [1] doi_list (academic_metrics.dataclass_models.concrete_dataclasses.CategoryInfo attribute), [1] dois (academic_metrics.dataclass_models.concrete_dataclasses.FacultyInfo attribute), [1] (academic_metrics.dataclass_models.concrete_dataclasses.GlobalFacultyStats attribute), [1] download_url (academic_metrics.dataclass_models.concrete_dataclasses.ArticleDetails attribute), [1] (academic_metrics.dataclass_models.concrete_dataclasses.CrossrefArticleDetails attribute), [1] duplicate_postprocessor() (academic_metrics.postprocessing.BasePostprocessor.BasePostprocessor method), [1] E END_RECORD (academic_metrics.enums.enums.AttributeTypes attribute), [1] entry_id (academic_metrics.utils.warning_manager.CustomWarning attribute) ERROR (in module academic_metrics.configs.global_config) extend (academic_metrics.orchestrators.category_data_orchestrator.CategoryDataOrchestrator attribute) (academic_metrics.runners.pipeline.SaveOfflineKwargs attribute) extra_context (academic_metrics.data_collection.scraper.CleanerOutput attribute), [1] extract_attribute() (academic_metrics.strategies.AttributeExtractionStrategies.AttributeExtractionStrategy method), [1] (academic_metrics.strategies.AttributeExtractionStrategies.CrossrefAbstractExtractionStrategy method), [1] (academic_metrics.strategies.AttributeExtractionStrategies.CrossrefAuthorExtractionStrategy method), [1] (academic_metrics.strategies.AttributeExtractionStrategies.CrossrefCategoriesExtractionStrategy method), [1] (academic_metrics.strategies.AttributeExtractionStrategies.CrossrefCitationCountExtractionStrategy method), [1] (academic_metrics.strategies.AttributeExtractionStrategies.CrossrefCreatedDateExtractionStrategy method) (academic_metrics.strategies.AttributeExtractionStrategies.CrossrefDepartmentExtractionStrategy method), [1] (academic_metrics.strategies.AttributeExtractionStrategies.CrossrefDOIExtractionStrategy method) (academic_metrics.strategies.AttributeExtractionStrategies.CrossrefExtraContextExtractionStrategy method) (academic_metrics.strategies.AttributeExtractionStrategies.CrossrefJournalExtractionStrategy method) (academic_metrics.strategies.AttributeExtractionStrategies.CrossrefLicenseURLExtractionStrategy method) (academic_metrics.strategies.AttributeExtractionStrategies.CrossrefPublishedOnlineExtractionStrategy method) (academic_metrics.strategies.AttributeExtractionStrategies.CrossrefPublishedPrintExtractionStrategy method) (academic_metrics.strategies.AttributeExtractionStrategies.CrossrefThemesExtractionStrategy method) (academic_metrics.strategies.AttributeExtractionStrategies.CrossrefTitleExtractionStrategy method), [1] (academic_metrics.strategies.AttributeExtractionStrategies.CrossrefURLExtractionStrategy method) extract_classified_categories() (academic_metrics.AI.abstract_classifier.AbstractClassifier method) extract_sets() (academic_metrics.postprocessing.BasePostprocessor.BasePostprocessor method), [1] F faculty (academic_metrics.dataclass_models.concrete_dataclasses.CategoryInfo attribute), [1] faculty_affiliations (academic_metrics.dataclass_models.concrete_dataclasses.ArticleDetails attribute), [1] (academic_metrics.dataclass_models.concrete_dataclasses.CrossrefArticleDetails attribute), [1] faculty_collection (academic_metrics.DB.DatabaseSetup.DatabaseWrapper attribute) faculty_count (academic_metrics.dataclass_models.concrete_dataclasses.CategoryInfo attribute), [1] FACULTY_INFO (academic_metrics.enums.dataclass_enums.DataClassTypes attribute), [1] faculty_members (academic_metrics.dataclass_models.concrete_dataclasses.ArticleDetails attribute), [1] (academic_metrics.dataclass_models.concrete_dataclasses.CrossrefArticleDetails attribute), [1] faculty_postprocessor (academic_metrics.orchestrators.category_data_orchestrator.CategoryDataOrchestrator attribute) (academic_metrics.runners.pipeline.PipelineRunner attribute) faculty_stats (academic_metrics.core.category_processor.CategoryProcessor attribute) (academic_metrics.dataclass_models.concrete_dataclasses.FacultyStats attribute), [1] FACULTY_STATS (academic_metrics.enums.dataclass_enums.DataClassTypes attribute), [1] FacultyInfo (class in academic_metrics.dataclass_models.concrete_dataclasses) FacultyPostprocessor (class in academic_metrics.postprocessing.FacultyPostprocessor) FacultyStats (class in academic_metrics.dataclass_models.concrete_dataclasses) fallback_chain (academic_metrics.ChainBuilder.ChainBuilder.ChainBuilder attribute) (academic_metrics.ChainBuilder.ChainBuilder.ChainWrapper attribute) fallback_parser (academic_metrics.ChainBuilder.ChainBuilder.ChainBuilder attribute) (academic_metrics.ChainBuilder.ChainBuilder.ChainWrapper attribute) FallbackParserType (class in academic_metrics.ChainBuilder.ChainBuilder) fetch_data() (academic_metrics.data_collection.CrossrefWrapper.CrossrefWrapper method) fetch_data_for_multiple_years() (academic_metrics.data_collection.CrossrefWrapper.CrossrefWrapper method), [1] files (academic_metrics.dataclass_models.concrete_dataclasses.CategoryInfo attribute), [1] final_article_data (academic_metrics.orchestrators.category_data_orchestrator.CategoryDataOrchestrator attribute) final_article_stats_data (academic_metrics.orchestrators.category_data_orchestrator.CategoryDataOrchestrator attribute) final_category_data (academic_metrics.orchestrators.category_data_orchestrator.CategoryDataOrchestrator attribute) final_data_process() (academic_metrics.data_collection.CrossrefWrapper.CrossrefWrapper method), [1] final_faculty_data (academic_metrics.orchestrators.category_data_orchestrator.CategoryDataOrchestrator attribute) final_global_faculty_data (academic_metrics.orchestrators.category_data_orchestrator.CategoryDataOrchestrator attribute) FirstCallRequired (in module academic_metrics.ChainBuilder.ChainBuilder) fix_counts() (academic_metrics.DB.DatabaseSetup.DatabaseWrapper method) format() (academic_metrics.configs.global_config.ColorFormatter method) from_year (academic_metrics.data_collection.CrossrefWrapper.CrossrefWrapper attribute) G generate_coeeficients() (academic_metrics.utils.minhash_util.MinHashUtility method) generate_coefficients() (academic_metrics.utils.minhash_util.MinHashUtility method) generate_error_id() (academic_metrics.strategies.AttributeExtractionStrategies.AttributeExtractionStrategy method), [1] generate_hash_functions() (academic_metrics.utils.minhash_util.MinHashUtility method), [1] generate_signatures() (academic_metrics.postprocessing.BasePostprocessor.BasePostprocessor method), [1] get_abstract() (academic_metrics.data_collection.scraper.Scraper method) get_all_data() (academic_metrics.DB.DatabaseSetup.DatabaseWrapper method), [1] get_articles() (academic_metrics.core.category_processor.CategoryProcessor method), [1] get_attributes() (academic_metrics.utils.utilities.Utilities method), [1] get_author_name() (academic_metrics.strategies.AttributeExtractionStrategies.CrossrefAuthorExtractionStrategy method), [1] get_author_obj() (academic_metrics.strategies.AttributeExtractionStrategies.AttributeExtractionStrategy method), [1] get_authors_as_list() (academic_metrics.strategies.AttributeExtractionStrategies.AttributeExtractionStrategy method), [1] get_category_article_stats() (academic_metrics.core.category_processor.CategoryProcessor method), [1] get_category_data() (academic_metrics.core.category_processor.CategoryProcessor method), [1] get_chain() (academic_metrics.ChainBuilder.ChainBuilder.ChainBuilder method), [1] get_chain_sequence() (academic_metrics.ChainBuilder.ChainBuilder.ChainManager method), [1] get_chain_variables() (academic_metrics.ChainBuilder.ChainBuilder.ChainManager method), [1] get_classification_results_by_doi() (academic_metrics.AI.abstract_classifier.AbstractClassifier method), [1] get_classification_results_dict() (academic_metrics.AI.abstract_classifier.AbstractClassifier method) get_crossref_author_affils() (academic_metrics.strategies.AttributeExtractionStrategies.AttributeExtractionStrategy method), [1] get_dataclass() (academic_metrics.factories.dataclass_factory.DataClassFactory class method) (academic_metrics.factories.dataclass_factory.DataClassFactory method) get_dois() (academic_metrics.DB.DatabaseSetup.DatabaseWrapper method), [1] get_duplicate_utilities() (academic_metrics.postprocessing.BasePostprocessor.BasePostprocessor method), [1] get_excel_report() (in module academic_metrics.runners.pipeline) get_faculty_stats() (academic_metrics.core.category_processor.CategoryProcessor method), [1] get_fallback_chain() (academic_metrics.ChainBuilder.ChainBuilder.ChainBuilder method), [1] get_fallback_parser_type() (academic_metrics.ChainBuilder.ChainBuilder.ChainWrapper method), [1] get_final_article_data() (academic_metrics.orchestrators.category_data_orchestrator.CategoryDataOrchestrator method) get_final_article_stats_data() (academic_metrics.orchestrators.category_data_orchestrator.CategoryDataOrchestrator method) get_final_category_data() (academic_metrics.orchestrators.category_data_orchestrator.CategoryDataOrchestrator method) get_final_faculty_data() (academic_metrics.orchestrators.category_data_orchestrator.CategoryDataOrchestrator method) get_final_global_faculty_data() (academic_metrics.orchestrators.category_data_orchestrator.CategoryDataOrchestrator method) get_full_results() (academic_metrics.utils.api_key_validator.APIKeyValidator method) get_global_faculty_stats() (academic_metrics.core.category_processor.CategoryProcessor method), [1] get_low_categories() (academic_metrics.utils.taxonomy_util.Taxonomy method) get_mid_cat_for_low_cat() (academic_metrics.utils.taxonomy_util.Taxonomy method) get_mid_categories() (academic_metrics.utils.taxonomy_util.Taxonomy method) get_most_frequent_value_variation() (academic_metrics.postprocessing.BasePostprocessor.BasePostprocessor method) get_most_frequent_variation() (academic_metrics.postprocessing.BasePostprocessor.BasePostprocessor method) get_package_data_dir() (in module constants.dir_paths) get_parser_type() (academic_metrics.ChainBuilder.ChainBuilder.ChainWrapper method), [1] get_raw_classification_outputs() (academic_metrics.AI.abstract_classifier.AbstractClassifier method), [1] get_raw_theme_results() (academic_metrics.AI.abstract_classifier.AbstractClassifier method), [1] get_refined_faculty_name() (academic_metrics.dataclass_models.concrete_dataclasses.FacultyStats method) get_result_list() (academic_metrics.data_collection.CrossrefWrapper.CrossrefWrapper method), [1] get_results_for_api_key() (academic_metrics.utils.api_key_validator.APIKeyValidator method) get_strategy() (academic_metrics.factories.strategy_factory.StrategyFactory class method) (academic_metrics.factories.strategy_factory.StrategyFactory method) get_taxonomy() (academic_metrics.utils.taxonomy_util.Taxonomy method) get_top_cat_for_mid_cat() (academic_metrics.utils.taxonomy_util.Taxonomy method) get_top_categories() (academic_metrics.utils.taxonomy_util.Taxonomy method) get_unclassified_abstracts() (academic_metrics.orchestrators.classification_orchestrator.ClassificationOrchestrator method), [1] get_unclassified_details_dict() (academic_metrics.orchestrators.classification_orchestrator.ClassificationOrchestrator method), [1] get_unclassified_doi_abstract_dict() (academic_metrics.orchestrators.classification_orchestrator.ClassificationOrchestrator method), [1] get_unclassified_dois() (academic_metrics.orchestrators.classification_orchestrator.ClassificationOrchestrator method), [1] get_unclassified_item_count() (academic_metrics.orchestrators.classification_orchestrator.ClassificationOrchestrator method), [1] get_unclassified_items() (academic_metrics.orchestrators.classification_orchestrator.ClassificationOrchestrator method), [1] global_faculty_stats (academic_metrics.core.category_processor.CategoryProcessor attribute) GLOBAL_FACULTY_STATS (academic_metrics.enums.dataclass_enums.DataClassTypes attribute), [1] GlobalFacultyStats (class in academic_metrics.dataclass_models.concrete_dataclasses) google (academic_metrics.utils.api_key_validator.ValidationResult attribute) H hash_fns (academic_metrics.utils.minhash_util.MinHashUtility attribute) html_to_markdown() (academic_metrics.strategies.AttributeExtractionStrategies.AttributeExtractionStrategy method), [1] I INFO (in module academic_metrics.configs.global_config) initialize_categories() (academic_metrics.core.category_processor.CategoryProcessor method), [1] insert_articles() (academic_metrics.DB.DatabaseSetup.DatabaseWrapper method), [1] insert_categories() (academic_metrics.DB.DatabaseSetup.DatabaseWrapper method), [1] insert_faculty() (academic_metrics.DB.DatabaseSetup.DatabaseWrapper method), [1] is_registered() (academic_metrics.factories.dataclass_factory.DataClassFactory class method) (academic_metrics.factories.dataclass_factory.DataClassFactory method) is_valid() (academic_metrics.utils.api_key_validator.APIKeyValidator method) is_valid_category() (academic_metrics.AI.abstract_classifier.AbstractClassifier method) (academic_metrics.utils.taxonomy_util.Taxonomy method) J journal (academic_metrics.dataclass_models.concrete_dataclasses.ArticleDetails attribute), [1] (academic_metrics.dataclass_models.concrete_dataclasses.CrossrefArticleDetails attribute), [1] journals (academic_metrics.dataclass_models.concrete_dataclasses.GlobalFacultyStats attribute), [1] L large_prime (academic_metrics.utils.minhash_util.MinHashUtility attribute) license_url (academic_metrics.dataclass_models.concrete_dataclasses.ArticleDetails attribute), [1] (academic_metrics.dataclass_models.concrete_dataclasses.CrossrefArticleDetails attribute), [1] llm (academic_metrics.ChainBuilder.ChainBuilder.ChainBuilder attribute) (academic_metrics.ChainBuilder.ChainBuilder.ChainManager attribute) llm_kwargs (academic_metrics.ChainBuilder.ChainBuilder.ChainManager attribute) llm_model (academic_metrics.ChainBuilder.ChainBuilder.ChainManager attribute) llm_model_type (academic_metrics.ChainBuilder.ChainBuilder.ChainManager attribute) llm_temperature (academic_metrics.ChainBuilder.ChainBuilder.ChainManager attribute) locate_academic_metrics_root() (in module constants.dir_paths) locate_src_root() (in module constants.dir_paths) log_extraction_warning() (academic_metrics.strategies.AttributeExtractionStrategies.AttributeExtractionStrategy method), [1] log_file_path (academic_metrics.ChainBuilder.ChainBuilder.ChainBuilder attribute) (academic_metrics.core.category_processor.CategoryProcessor attribute) (academic_metrics.factories.dataclass_factory.DataClassFactory attribute) (academic_metrics.orchestrators.category_data_orchestrator.CategoryDataOrchestrator attribute) LOG_LEVEL (in module academic_metrics.configs.global_config) LOG_TO_CONSOLE (in module academic_metrics.configs.global_config) log_warning() (academic_metrics.utils.warning_manager.WarningManager method) logger (academic_metrics.ChainBuilder.ChainBuilder.ChainBuilder attribute) (academic_metrics.ChainBuilder.ChainBuilder.ChainComposer attribute) (academic_metrics.ChainBuilder.ChainBuilder.ChainManager attribute) (academic_metrics.ChainBuilder.ChainBuilder.ChainWrapper attribute) (academic_metrics.core.category_processor.CategoryProcessor attribute) (academic_metrics.data_collection.CrossrefWrapper.CrossrefWrapper attribute) (academic_metrics.DB.DatabaseSetup.DatabaseWrapper attribute) (academic_metrics.factories.abstract_classifier_factory.ClassifierFactory attribute) (academic_metrics.factories.dataclass_factory.DataClassFactory attribute) (academic_metrics.orchestrators.category_data_orchestrator.CategoryDataOrchestrator attribute) (academic_metrics.runners.pipeline.PipelineRunner attribute) (academic_metrics.strategies.AttributeExtractionStrategies.AttributeExtractionStrategy attribute) (academic_metrics.utils.taxonomy_util.Taxonomy attribute) low_category_urls (academic_metrics.dataclass_models.concrete_dataclasses.CrossrefArticleDetails attribute) (academic_metrics.dataclass_models.concrete_dataclasses.GlobalFacultyStats attribute) low_level_categories (academic_metrics.dataclass_models.concrete_dataclasses.CrossrefArticleDetails attribute), [1] (academic_metrics.dataclass_models.concrete_dataclasses.GlobalFacultyStats attribute), [1] M main() (in module academic_metrics.runners.pipeline) make_files (academic_metrics.runners.pipeline.SaveOfflineKwargs attribute) make_files() (academic_metrics.utils.utilities.Utilities method) MAX_CONCURRENT_REQUESTS (academic_metrics.data_collection.CrossrefWrapper.CrossrefWrapper attribute) message (academic_metrics.utils.warning_manager.CustomWarning attribute) mid_category_urls (academic_metrics.dataclass_models.concrete_dataclasses.CrossrefArticleDetails attribute) (academic_metrics.dataclass_models.concrete_dataclasses.GlobalFacultyStats attribute) mid_level_categories (academic_metrics.dataclass_models.concrete_dataclasses.CrossrefArticleDetails attribute), [1] (academic_metrics.dataclass_models.concrete_dataclasses.GlobalFacultyStats attribute), [1] minhash_util (academic_metrics.postprocessing.BasePostprocessor.BasePostprocessor attribute) MinHashUtility (class in academic_metrics.utils.minhash_util) missing_abstracts_file (academic_metrics.strategies.AttributeExtractionStrategies.AttributeExtractionStrategy attribute) missing_authors_file (academic_metrics.strategies.AttributeExtractionStrategies.CrossrefAuthorExtractionStrategy attribute) model_computed_fields (academic_metrics.data_collection.scraper.CleanerOutput attribute) model_config (academic_metrics.data_collection.scraper.CleanerOutput attribute) model_fields (academic_metrics.data_collection.scraper.CleanerOutput attribute) module academic_metrics.AI academic_metrics.AI.abstract_classifier academic_metrics.ChainBuilder academic_metrics.ChainBuilder.ChainBuilder academic_metrics.configs.global_config academic_metrics.core academic_metrics.core.category_processor academic_metrics.data_collection academic_metrics.data_collection.CrossrefWrapper academic_metrics.data_collection.scraper academic_metrics.dataclass_models academic_metrics.dataclass_models.abstract_base_dataclass academic_metrics.dataclass_models.concrete_dataclasses academic_metrics.DB academic_metrics.DB.DatabaseSetup academic_metrics.enums academic_metrics.enums.dataclass_enums academic_metrics.enums.enums academic_metrics.factories academic_metrics.factories.abstract_classifier_factory academic_metrics.factories.dataclass_factory academic_metrics.factories.strategy_factory academic_metrics.orchestrators academic_metrics.orchestrators.category_data_orchestrator academic_metrics.orchestrators.classification_orchestrator academic_metrics.postprocessing academic_metrics.postprocessing.BasePostprocessor academic_metrics.postprocessing.DepartmentPostprocessor academic_metrics.postprocessing.FacultyPostprocessor academic_metrics.runners academic_metrics.runners.pipeline academic_metrics.strategies academic_metrics.strategies.AttributeExtractionStrategies academic_metrics.utils academic_metrics.utils.api_key_validator academic_metrics.utils.minhash_util academic_metrics.utils.taxonomy_util academic_metrics.utils.unicode_chars_dict academic_metrics.utils.utilities academic_metrics.utils.warning_manager constants constants.dir_paths mongodb_uri (academic_metrics.runners.pipeline.PipelineRunner attribute) N name (academic_metrics.dataclass_models.concrete_dataclasses.FacultyInfo attribute), [1] (academic_metrics.dataclass_models.concrete_dataclasses.GlobalFacultyStats attribute), [1] num_hashes (academic_metrics.utils.minhash_util.MinHashUtility attribute) O offline (academic_metrics.runners.pipeline.SaveOfflineKwargs attribute) openai (academic_metrics.utils.api_key_validator.ValidationResult attribute) options (academic_metrics.data_collection.scraper.Scraper attribute) output_dir_path (academic_metrics.orchestrators.category_data_orchestrator.CategoryDataOrchestrator attribute) P page_content (academic_metrics.data_collection.scraper.CleanerOutput attribute), [1] parser (academic_metrics.ChainBuilder.ChainBuilder.ChainBuilder attribute) (academic_metrics.ChainBuilder.ChainBuilder.ChainWrapper attribute) ParserType (class in academic_metrics.ChainBuilder.ChainBuilder) ParserUnion (in module academic_metrics.ChainBuilder.ChainBuilder) PipelineRunner (class in academic_metrics.runners.pipeline) postprocessor (academic_metrics.ChainBuilder.ChainBuilder.ChainManager attribute) (academic_metrics.ChainBuilder.ChainBuilder.ChainWrapper attribute) preprocessor (academic_metrics.ChainBuilder.ChainBuilder.ChainManager attribute) (academic_metrics.ChainBuilder.ChainBuilder.ChainWrapper attribute) print_chain_sequence() (academic_metrics.ChainBuilder.ChainBuilder.ChainManager method), [1] print_chain_variables() (academic_metrics.ChainBuilder.ChainBuilder.ChainManager method), [1] print_full_results() (academic_metrics.utils.api_key_validator.APIKeyValidator method) print_results_for_api_key() (academic_metrics.utils.api_key_validator.APIKeyValidator method) process() (academic_metrics.DB.DatabaseSetup.DatabaseWrapper method), [1] process_data_list() (academic_metrics.core.category_processor.CategoryProcessor method), [1] process_items() (academic_metrics.data_collection.CrossrefWrapper.CrossrefWrapper method) process_value_pair() (academic_metrics.postprocessing.BasePostprocessor.BasePostprocessor method), [1] processed_sets_list (academic_metrics.postprocessing.BasePostprocessor.BasePostprocessor attribute) R raw_classification_outputs (academic_metrics.AI.abstract_classifier.AbstractClassifier attribute) raw_results (academic_metrics.data_collection.scraper.Scraper attribute) raw_theme_outputs (academic_metrics.AI.abstract_classifier.AbstractClassifier attribute) refine_faculty_stats() (academic_metrics.dataclass_models.concrete_dataclasses.FacultyStats method) register_dataclass() (academic_metrics.factories.dataclass_factory.DataClassFactory class method) (academic_metrics.factories.dataclass_factory.DataClassFactory method) register_strategy() (academic_metrics.factories.strategy_factory.StrategyFactory class method) (academic_metrics.factories.strategy_factory.StrategyFactory method) remove_near_duplicates() (academic_metrics.postprocessing.BasePostprocessor.BasePostprocessor method), [1] (academic_metrics.postprocessing.DepartmentPostprocessor.DepartmentPostprocessor method) (academic_metrics.postprocessing.FacultyPostprocessor.FacultyPostprocessor method) remove_update_attribute() (academic_metrics.postprocessing.BasePostprocessor.BasePostprocessor method), [1] run() (academic_metrics.ChainBuilder.ChainBuilder.ChainComposer method), [1] (academic_metrics.ChainBuilder.ChainBuilder.ChainManager method) run_afetch_yrange() (academic_metrics.data_collection.CrossrefWrapper.CrossrefWrapper method) run_all_process() (academic_metrics.data_collection.CrossrefWrapper.CrossrefWrapper method) (academic_metrics.DB.DatabaseSetup.DatabaseWrapper method), [1] run_chain() (academic_metrics.ChainBuilder.ChainBuilder.ChainWrapper method), [1] run_classification() (academic_metrics.orchestrators.classification_orchestrator.ClassificationOrchestrator method), [1] run_crossref_before_file_load (academic_metrics.runners.pipeline.SaveOfflineKwargs attribute) run_orchestrator() (academic_metrics.orchestrators.category_data_orchestrator.CategoryDataOrchestrator method) run_pipeline() (academic_metrics.runners.pipeline.PipelineRunner method), [1] S save_classification_results() (academic_metrics.AI.abstract_classifier.AbstractClassifier method), [1] SAVE_OFFLINE_KWARGS (academic_metrics.runners.pipeline.PipelineRunner attribute), [1] save_raw_classification_results() (academic_metrics.AI.abstract_classifier.AbstractClassifier method), [1] save_raw_results() (academic_metrics.data_collection.scraper.Scraper method), [1] save_raw_theme_results() (academic_metrics.AI.abstract_classifier.AbstractClassifier method), [1] SaveOfflineKwargs (class in academic_metrics.runners.pipeline) scraper (academic_metrics.runners.pipeline.PipelineRunner attribute) Scraper (class in academic_metrics.data_collection.scraper) semaphore (academic_metrics.data_collection.CrossrefWrapper.CrossrefWrapper attribute) serialize_to_json() (academic_metrics.data_collection.CrossrefWrapper.CrossrefWrapper method) service (academic_metrics.data_collection.scraper.Scraper attribute) set_author_sequence_dict() (academic_metrics.strategies.AttributeExtractionStrategies.AttributeExtractionStrategy method), [1] set_log_to_console() (in module academic_metrics.configs.global_config) set_params() (academic_metrics.dataclass_models.abstract_base_dataclass.AbstractBaseDataClass method), [1] (academic_metrics.dataclass_models.concrete_dataclasses.ArticleStats method) (academic_metrics.dataclass_models.concrete_dataclasses.CrossrefArticleStats method) (academic_metrics.dataclass_models.concrete_dataclasses.FacultyStats method) set_words_to_ban() (academic_metrics.ChainBuilder.ChainBuilder.ChainManager method) setup_chain() (academic_metrics.data_collection.scraper.Scraper method) standardize_attribute() (academic_metrics.postprocessing.BasePostprocessor.BasePostprocessor method), [1] standardize_values_across_sets() (academic_metrics.postprocessing.BasePostprocessor.BasePostprocessor method), [1] standardized_data_update() (academic_metrics.postprocessing.BasePostprocessor.BasePostprocessor method), [1] strategy_factory (academic_metrics.orchestrators.category_data_orchestrator.CategoryDataOrchestrator attribute) (academic_metrics.runners.pipeline.PipelineRunner attribute) (academic_metrics.utils.utilities.Utilities attribute) StrategyFactory (class in academic_metrics.factories.strategy_factory) T taxonomy (academic_metrics.factories.abstract_classifier_factory.ClassifierFactory attribute) (academic_metrics.orchestrators.classification_orchestrator.ClassificationOrchestrator attribute) (academic_metrics.runners.pipeline.PipelineRunner attribute) Taxonomy (class in academic_metrics.utils.taxonomy_util) taxonomy_util (academic_metrics.core.category_processor.CategoryProcessor attribute) TaxonomyDict (in module academic_metrics.utils.taxonomy_util) TaxonomyLevel (in module academic_metrics.utils.taxonomy_util) tc_count (academic_metrics.dataclass_models.concrete_dataclasses.ArticleDetails attribute), [1] (academic_metrics.dataclass_models.concrete_dataclasses.CategoryInfo attribute), [1] (academic_metrics.dataclass_models.concrete_dataclasses.CrossrefArticleDetails attribute), [1] tc_list (academic_metrics.dataclass_models.concrete_dataclasses.CategoryInfo attribute) test_run() (academic_metrics.runners.pipeline.PipelineRunner method) themes (academic_metrics.dataclass_models.concrete_dataclasses.CategoryInfo attribute), [1] (academic_metrics.dataclass_models.concrete_dataclasses.CrossrefArticleDetails attribute), [1] (academic_metrics.dataclass_models.concrete_dataclasses.GlobalFacultyStats attribute), [1] title (academic_metrics.dataclass_models.concrete_dataclasses.CrossrefArticleDetails attribute), [1] TITLE (academic_metrics.enums.enums.AttributeTypes attribute), [1] title_key (academic_metrics.strategies.AttributeExtractionStrategies.CrossrefTitleExtractionStrategy attribute) titles (academic_metrics.dataclass_models.concrete_dataclasses.CategoryInfo attribute), [1] (academic_metrics.dataclass_models.concrete_dataclasses.FacultyInfo attribute), [1] (academic_metrics.dataclass_models.concrete_dataclasses.GlobalFacultyStats attribute), [1] to_dict() (academic_metrics.dataclass_models.abstract_base_dataclass.AbstractBaseDataClass method), [1] to_year (academic_metrics.data_collection.CrossrefWrapper.CrossrefWrapper attribute) tokenize() (academic_metrics.utils.minhash_util.MinHashUtility method), [1] top_category_urls (academic_metrics.dataclass_models.concrete_dataclasses.CrossrefArticleDetails attribute) (academic_metrics.dataclass_models.concrete_dataclasses.GlobalFacultyStats attribute) top_level_categories (academic_metrics.dataclass_models.concrete_dataclasses.CrossrefArticleDetails attribute), [1] (academic_metrics.dataclass_models.concrete_dataclasses.GlobalFacultyStats attribute), [1] total_citations (academic_metrics.dataclass_models.concrete_dataclasses.FacultyInfo attribute), [1] (academic_metrics.dataclass_models.concrete_dataclasses.GlobalFacultyStats attribute), [1] U unclassified_abstracts (academic_metrics.orchestrators.classification_orchestrator.ClassificationOrchestrator attribute) unclassified_details (academic_metrics.orchestrators.classification_orchestrator.ClassificationOrchestrator attribute) unclassified_doi_abstract_dict (academic_metrics.orchestrators.classification_orchestrator.ClassificationOrchestrator attribute) unclassified_dois (academic_metrics.orchestrators.classification_orchestrator.ClassificationOrchestrator attribute) unclassified_item_count (academic_metrics.orchestrators.classification_orchestrator.ClassificationOrchestrator attribute) unclassified_items (academic_metrics.orchestrators.classification_orchestrator.ClassificationOrchestrator attribute) unknown_authors (academic_metrics.strategies.AttributeExtractionStrategies.CrossrefAuthorExtractionStrategy attribute) unknown_authors_dict (academic_metrics.strategies.AttributeExtractionStrategies.AttributeExtractionStrategy attribute) unknown_authors_file (academic_metrics.strategies.AttributeExtractionStrategies.AttributeExtractionStrategy attribute) update_category() (academic_metrics.DB.DatabaseSetup.DatabaseWrapper method), [1] update_category_article_stats() (academic_metrics.core.category_processor.CategoryProcessor method), [1] update_category_stats() (academic_metrics.core.category_processor.CategoryProcessor method), [1] update_faculty() (academic_metrics.DB.DatabaseSetup.DatabaseWrapper method), [1] update_faculty_stats() (academic_metrics.core.category_processor.CategoryProcessor method), [1] update_global_faculty_stats() (academic_metrics.core.category_processor.CategoryProcessor method), [1] url (academic_metrics.dataclass_models.concrete_dataclasses.CategoryInfo attribute), [1] (academic_metrics.dataclass_models.concrete_dataclasses.CrossrefArticleDetails attribute) utilities (academic_metrics.orchestrators.classification_orchestrator.ClassificationOrchestrator attribute) (academic_metrics.runners.pipeline.PipelineRunner attribute) Utilities (class in academic_metrics.utils.utilities) utils (academic_metrics.core.category_processor.CategoryProcessor attribute) (academic_metrics.orchestrators.category_data_orchestrator.CategoryDataOrchestrator attribute) V ValidationResult (class in academic_metrics.utils.api_key_validator) value_to_remove() (academic_metrics.postprocessing.BasePostprocessor.BasePostprocessor method), [1] value_variations (academic_metrics.postprocessing.BasePostprocessor.BasePostprocessor attribute) W WARNING (in module academic_metrics.configs.global_config) warning_count (academic_metrics.utils.warning_manager.WarningManager attribute) warning_manager (academic_metrics.core.category_processor.CategoryProcessor attribute) (academic_metrics.orchestrators.category_data_orchestrator.CategoryDataOrchestrator attribute) (academic_metrics.runners.pipeline.PipelineRunner attribute) (academic_metrics.strategies.AttributeExtractionStrategies.AttributeExtractionStrategy attribute) (academic_metrics.utils.utilities.Utilities attribute) WarningManager (class in academic_metrics.utils.warning_manager) warnings (academic_metrics.utils.warning_manager.WarningManager attribute) WC_PATTERN (academic_metrics.enums.enums.AttributeTypes attribute), [1] write_missing_authors_file() (academic_metrics.strategies.AttributeExtractionStrategies.AttributeExtractionStrategy method), [1] Y years (academic_metrics.data_collection.CrossrefWrapper.CrossrefWrapper attribute)