MANIFEST.in
README.rst
pyproject.toml
requirements.txt
data_gatherer/__init__.py
data_gatherer/classifier.py
data_gatherer/data_fetcher.py
data_gatherer/data_gatherer.py
data_gatherer/env.py
data_gatherer/logger_setup.py
data_gatherer/mcp.py
data_gatherer/resources_loader.py
data_gatherer/selenium_setup.py
data_gatherer.egg-info/PKG-INFO
data_gatherer.egg-info/SOURCES.txt
data_gatherer.egg-info/dependency_links.txt
data_gatherer.egg-info/entry_points.txt
data_gatherer.egg-info/requires.txt
data_gatherer.egg-info/top_level.txt
data_gatherer/config/data_repos_ontology.json
data_gatherer/config/open_bio_data_repos.json
data_gatherer/config/retrieval_patterns.json
data_gatherer/llm/__init__.py
data_gatherer/llm/batch_storage.py
data_gatherer/llm/llm_client.py
data_gatherer/llm/local_model_client.py
data_gatherer/llm/response_schema.py
data_gatherer/parser/__init__.py
data_gatherer/parser/base_parser.py
data_gatherer/parser/grobid_pdf_parser.py
data_gatherer/parser/html_parser.py
data_gatherer/parser/pdf_parser.py
data_gatherer/parser/xml_parser.py
data_gatherer/prompts/__init__.py
data_gatherer/prompts/prompt_manager.py
data_gatherer/prompts/prompt_templates/GEMINI_FDR_FewShot.json
data_gatherer/prompts/prompt_templates/GEMINI_RTR_FewShot.json
data_gatherer/prompts/prompt_templates/GPT_FDR_FewShot.json
data_gatherer/prompts/prompt_templates/GPT_FDR_FewShot_CitationType.json
data_gatherer/prompts/prompt_templates/GPT_FDR_FewShot_Descr.json
data_gatherer/prompts/prompt_templates/GPT_FDR_FewShot_Syn.json
data_gatherer/prompts/prompt_templates/GPT_FDR_FewShot_shortDescr.json
data_gatherer/prompts/prompt_templates/GPT_FewShot.json
data_gatherer/prompts/prompt_templates/GPT_RTR_FewShot_CitationType.json
data_gatherer/prompts/prompt_templates/Ollama_FewShot.json
data_gatherer/prompts/prompt_templates/T5_primer.json
data_gatherer/prompts/prompt_templates/metadata_prompts/gemini_metadata_extract.json
data_gatherer/prompts/prompt_templates/metadata_prompts/gpt_metadata_extract.json
data_gatherer/prompts/prompt_templates/metadata_prompts/portkey_gemini_metadata_extract.json
data_gatherer/retriever/__init__.py
data_gatherer/retriever/base_retriever.py
data_gatherer/retriever/embeddings_retriever.py
data_gatherer/retriever/html_retriever.py
data_gatherer/retriever/xml_retriever.py
tests/test_data_fetcher_methods.py
tests/test_orchestrator.py
tests/test_parser_utils.py