LICENSE
README.md
pyproject.toml
src/perla_extract/__init__.py
src/perla_extract/allowed_journals.csv
src/perla_extract/configuration.py
src/perla_extract/constants.py
src/perla_extract/evaluations.py
src/perla_extract/export.py
src/perla_extract/llm_call.py
src/perla_extract/optimizer.py
src/perla_extract/papersbot_new.py
src/perla_extract/pipeline.py
src/perla_extract/postprocessing.py
src/perla_extract/pydantic_model_reduced.py
src/perla_extract.egg-info/PKG-INFO
src/perla_extract.egg-info/SOURCES.txt
src/perla_extract.egg-info/dependency_links.txt
src/perla_extract.egg-info/entry_points.txt
src/perla_extract.egg-info/requires.txt
src/perla_extract.egg-info/top_level.txt
src/perla_extract/data/extractions/claude-opus-4-1-20250805/10.1002--adfm.201500335.json
src/perla_extract/data/extractions/claude-opus-4-1-20250805/10.1002--adfm.201904856.json
src/perla_extract/data/extractions/claude-opus-4-1-20250805/10.1002--adfm.202212698.json
src/perla_extract/data/extractions/claude-opus-4-1-20250805/10.1002--adma.202302143.json
src/perla_extract/data/extractions/claude-opus-4-1-20250805/10.1002--adma.202305822.json
src/perla_extract/data/extractions/claude-opus-4-1-20250805/10.1002--solr.201900370.json
src/perla_extract/data/extractions/claude-opus-4-1-20250805/10.1002--solr.202100879.json
src/perla_extract/data/extractions/claude-opus-4-1-20250805/10.1002--solr.202300438.json
src/perla_extract/data/extractions/claude-opus-4-1-20250805/10.1002--solr.202300817.json
src/perla_extract/data/extractions/claude-opus-4-1-20250805/10.1016--j.jallcom.2023.170970.json
src/perla_extract/data/extractions/claude-opus-4-1-20250805/10.1016--j.jmst.2021.03.045.json
src/perla_extract/data/extractions/claude-opus-4-1-20250805/10.1016--j.matlet.2016.07.004.json
src/perla_extract/data/extractions/claude-opus-4-1-20250805/10.1016--j.matt.2023.09.006.json
src/perla_extract/data/extractions/claude-opus-4-1-20250805/10.1016--j.nanoen.2016.05.023.json
src/perla_extract/data/extractions/claude-opus-4-1-20250805/10.1016--j.nanoen.2022.107416.json
src/perla_extract/data/extractions/claude-opus-4-1-20250805/10.1021--acs.chemmater.8b01521.json
src/perla_extract/data/extractions/claude-opus-4-1-20250805/10.1021--acsaelm.4c02297.json
src/perla_extract/data/extractions/claude-opus-4-1-20250805/10.1021--acsaem.4c02660.json
src/perla_extract/data/extractions/claude-opus-4-1-20250805/10.1021--acsaem.9b01928.json
src/perla_extract/data/extractions/claude-opus-4-1-20250805/10.1038--nmat4014.json
src/perla_extract/data/extractions/claude-opus-4-1-20250805/10.1038--s41467-020-20272-3.json
src/perla_extract/data/extractions/claude-opus-4-1-20250805/10.1038--s41467-021-27740-4.json
src/perla_extract/data/extractions/claude-opus-4-1-20250805/10.1038--s41467-023-36141-8.json
src/perla_extract/data/extractions/claude-opus-4-1-20250805/10.1038--s41560-022-01061-2.json
src/perla_extract/data/extractions/claude-opus-4-1-20250805/10.1038--s41560-022-01102-w.json
src/perla_extract/data/extractions/claude-opus-4-1-20250805/10.1038--s41563-025-02163-4.json
src/perla_extract/data/extractions/claude-opus-4-1-20250805/10.1039--c5dt02388b.json
src/perla_extract/data/extractions/claude-opus-4-1-20250805/10.1039--c5ta00568j.json
src/perla_extract/data/extractions/claude-opus-4-1-20250805/10.1039--c7nr04692h.json
src/perla_extract/data/extractions/claude-opus-4-1-20250805/10.1126--science.adf0194.json
src/perla_extract/data/extractions/claude-opus-4-20250514/10.1002--adfm.201500335.json
src/perla_extract/data/extractions/claude-opus-4-20250514/10.1002--adfm.201904856.json
src/perla_extract/data/extractions/claude-opus-4-20250514/10.1002--adfm.202212698.json
src/perla_extract/data/extractions/claude-opus-4-20250514/10.1002--adma.202302143.json
src/perla_extract/data/extractions/claude-opus-4-20250514/10.1002--adma.202305822.json
src/perla_extract/data/extractions/claude-opus-4-20250514/10.1002--solr.201900370.json
src/perla_extract/data/extractions/claude-opus-4-20250514/10.1002--solr.202100879.json
src/perla_extract/data/extractions/claude-opus-4-20250514/10.1002--solr.202300438.json
src/perla_extract/data/extractions/claude-opus-4-20250514/10.1002--solr.202300817.json
src/perla_extract/data/extractions/claude-opus-4-20250514/10.1016--j.jallcom.2023.170970.json
src/perla_extract/data/extractions/claude-opus-4-20250514/10.1016--j.jmst.2021.03.045.json
src/perla_extract/data/extractions/claude-opus-4-20250514/10.1016--j.matlet.2016.07.004.json
src/perla_extract/data/extractions/claude-opus-4-20250514/10.1016--j.matt.2023.09.006.json
src/perla_extract/data/extractions/claude-opus-4-20250514/10.1016--j.nanoen.2016.05.023.json
src/perla_extract/data/extractions/claude-opus-4-20250514/10.1016--j.nanoen.2022.107416.json
src/perla_extract/data/extractions/claude-opus-4-20250514/10.1021--acs.chemmater.8b01521.json
src/perla_extract/data/extractions/claude-opus-4-20250514/10.1021--acsaelm.4c02297.json
src/perla_extract/data/extractions/claude-opus-4-20250514/10.1021--acsaem.4c02660.json
src/perla_extract/data/extractions/claude-opus-4-20250514/10.1021--acsaem.9b01928.json
src/perla_extract/data/extractions/claude-opus-4-20250514/10.1038--nmat4014.json
src/perla_extract/data/extractions/claude-opus-4-20250514/10.1038--s41467-020-20272-3.json
src/perla_extract/data/extractions/claude-opus-4-20250514/10.1038--s41467-021-27740-4.json
src/perla_extract/data/extractions/claude-opus-4-20250514/10.1038--s41467-023-36141-8.json
src/perla_extract/data/extractions/claude-opus-4-20250514/10.1038--s41560-022-01061-2.json
src/perla_extract/data/extractions/claude-opus-4-20250514/10.1038--s41560-022-01102-w.json
src/perla_extract/data/extractions/claude-opus-4-20250514/10.1038--s41563-025-02163-4.json
src/perla_extract/data/extractions/claude-opus-4-20250514/10.1039--c5dt02388b.json
src/perla_extract/data/extractions/claude-opus-4-20250514/10.1039--c5ta00568j.json
src/perla_extract/data/extractions/claude-opus-4-20250514/10.1039--c7nr04692h.json
src/perla_extract/data/extractions/claude-opus-4-20250514/10.1126--science.adf0194.json
src/perla_extract/data/extractions/claude-sonnet-4-20250514/10.1002--adfm.201500335.json
src/perla_extract/data/extractions/claude-sonnet-4-20250514/10.1002--adfm.201904856.json
src/perla_extract/data/extractions/claude-sonnet-4-20250514/10.1002--adfm.202212698.json
src/perla_extract/data/extractions/claude-sonnet-4-20250514/10.1002--adma.202302143.json
src/perla_extract/data/extractions/claude-sonnet-4-20250514/10.1002--adma.202305822.json
src/perla_extract/data/extractions/claude-sonnet-4-20250514/10.1002--solr.201900370.json
src/perla_extract/data/extractions/claude-sonnet-4-20250514/10.1002--solr.202100879.json
src/perla_extract/data/extractions/claude-sonnet-4-20250514/10.1002--solr.202300438.json
src/perla_extract/data/extractions/claude-sonnet-4-20250514/10.1002--solr.202300817.json
src/perla_extract/data/extractions/claude-sonnet-4-20250514/10.1016--j.jallcom.2023.170970.json
src/perla_extract/data/extractions/claude-sonnet-4-20250514/10.1016--j.jmst.2021.03.045.json
src/perla_extract/data/extractions/claude-sonnet-4-20250514/10.1016--j.matlet.2016.07.004.json
src/perla_extract/data/extractions/claude-sonnet-4-20250514/10.1016--j.matt.2023.09.006.json
src/perla_extract/data/extractions/claude-sonnet-4-20250514/10.1016--j.nanoen.2016.05.023.json
src/perla_extract/data/extractions/claude-sonnet-4-20250514/10.1016--j.nanoen.2022.107416.json
src/perla_extract/data/extractions/claude-sonnet-4-20250514/10.1021--acs.chemmater.8b01521.json
src/perla_extract/data/extractions/claude-sonnet-4-20250514/10.1021--acsaelm.4c02297.json
src/perla_extract/data/extractions/claude-sonnet-4-20250514/10.1021--acsaem.4c02660.json
src/perla_extract/data/extractions/claude-sonnet-4-20250514/10.1021--acsaem.9b01928.json
src/perla_extract/data/extractions/claude-sonnet-4-20250514/10.1038--nmat4014.json
src/perla_extract/data/extractions/claude-sonnet-4-20250514/10.1038--s41467-020-20272-3.json
src/perla_extract/data/extractions/claude-sonnet-4-20250514/10.1038--s41467-021-27740-4.json
src/perla_extract/data/extractions/claude-sonnet-4-20250514/10.1038--s41467-023-36141-8.json
src/perla_extract/data/extractions/claude-sonnet-4-20250514/10.1038--s41560-022-01061-2.json
src/perla_extract/data/extractions/claude-sonnet-4-20250514/10.1038--s41560-022-01102-w.json
src/perla_extract/data/extractions/claude-sonnet-4-20250514/10.1038--s41563-025-02163-4.json
src/perla_extract/data/extractions/claude-sonnet-4-20250514/10.1039--c5dt02388b.json
src/perla_extract/data/extractions/claude-sonnet-4-20250514/10.1039--c5ta00568j.json
src/perla_extract/data/extractions/claude-sonnet-4-20250514/10.1039--c7nr04692h.json
src/perla_extract/data/extractions/claude-sonnet-4-20250514/10.1126--science.adf0194.json
src/perla_extract/data/extractions/gpt-4.1-2025-04-14/10.1002--adfm.201500335.json
src/perla_extract/data/extractions/gpt-4.1-2025-04-14/10.1002--adfm.201904856.json
src/perla_extract/data/extractions/gpt-4.1-2025-04-14/10.1002--adfm.202212698.json
src/perla_extract/data/extractions/gpt-4.1-2025-04-14/10.1002--adma.202302143.json
src/perla_extract/data/extractions/gpt-4.1-2025-04-14/10.1002--adma.202305822.json
src/perla_extract/data/extractions/gpt-4.1-2025-04-14/10.1002--solr.201900370.json
src/perla_extract/data/extractions/gpt-4.1-2025-04-14/10.1002--solr.202100879.json
src/perla_extract/data/extractions/gpt-4.1-2025-04-14/10.1002--solr.202300438.json
src/perla_extract/data/extractions/gpt-4.1-2025-04-14/10.1002--solr.202300817.json
src/perla_extract/data/extractions/gpt-4.1-2025-04-14/10.1016--j.jallcom.2023.170970.json
src/perla_extract/data/extractions/gpt-4.1-2025-04-14/10.1016--j.jmst.2021.03.045.json
src/perla_extract/data/extractions/gpt-4.1-2025-04-14/10.1016--j.matlet.2016.07.004.json
src/perla_extract/data/extractions/gpt-4.1-2025-04-14/10.1016--j.matt.2023.09.006.json
src/perla_extract/data/extractions/gpt-4.1-2025-04-14/10.1016--j.nanoen.2016.05.023.json
src/perla_extract/data/extractions/gpt-4.1-2025-04-14/10.1016--j.nanoen.2022.107416.json
src/perla_extract/data/extractions/gpt-4.1-2025-04-14/10.1021--acs.chemmater.8b01521.json
src/perla_extract/data/extractions/gpt-4.1-2025-04-14/10.1021--acsaelm.4c02297.json
src/perla_extract/data/extractions/gpt-4.1-2025-04-14/10.1021--acsaem.4c02660.json
src/perla_extract/data/extractions/gpt-4.1-2025-04-14/10.1021--acsaem.9b01928.json
src/perla_extract/data/extractions/gpt-4.1-2025-04-14/10.1038--nmat4014.json
src/perla_extract/data/extractions/gpt-4.1-2025-04-14/10.1038--s41467-020-20272-3.json
src/perla_extract/data/extractions/gpt-4.1-2025-04-14/10.1038--s41467-021-27740-4.json
src/perla_extract/data/extractions/gpt-4.1-2025-04-14/10.1038--s41467-023-36141-8.json
src/perla_extract/data/extractions/gpt-4.1-2025-04-14/10.1038--s41560-022-01061-2.json
src/perla_extract/data/extractions/gpt-4.1-2025-04-14/10.1038--s41560-022-01102-w.json
src/perla_extract/data/extractions/gpt-4.1-2025-04-14/10.1038--s41563-025-02163-4.json
src/perla_extract/data/extractions/gpt-4.1-2025-04-14/10.1039--c5dt02388b.json
src/perla_extract/data/extractions/gpt-4.1-2025-04-14/10.1039--c5ta00568j.json
src/perla_extract/data/extractions/gpt-4.1-2025-04-14/10.1039--c7nr04692h.json
src/perla_extract/data/extractions/gpt-4.1-2025-04-14/10.1126--science.adf0194.json
src/perla_extract/data/extractions/gpt-4o-2024-08-06/10.1002--adfm.201500335.json
src/perla_extract/data/extractions/gpt-4o-2024-08-06/10.1002--adfm.201904856.json
src/perla_extract/data/extractions/gpt-4o-2024-08-06/10.1002--adfm.202212698.json
src/perla_extract/data/extractions/gpt-4o-2024-08-06/10.1002--adma.202302143.json
src/perla_extract/data/extractions/gpt-4o-2024-08-06/10.1002--adma.202305822.json
src/perla_extract/data/extractions/gpt-4o-2024-08-06/10.1002--solr.201900370.json
src/perla_extract/data/extractions/gpt-4o-2024-08-06/10.1002--solr.202100879.json
src/perla_extract/data/extractions/gpt-4o-2024-08-06/10.1002--solr.202300438.json
src/perla_extract/data/extractions/gpt-4o-2024-08-06/10.1002--solr.202300817.json
src/perla_extract/data/extractions/gpt-4o-2024-08-06/10.1016--j.jallcom.2023.170970.json
src/perla_extract/data/extractions/gpt-4o-2024-08-06/10.1016--j.jmst.2021.03.045.json
src/perla_extract/data/extractions/gpt-4o-2024-08-06/10.1016--j.matlet.2016.07.004.json
src/perla_extract/data/extractions/gpt-4o-2024-08-06/10.1016--j.matt.2023.09.006.json
src/perla_extract/data/extractions/gpt-4o-2024-08-06/10.1016--j.nanoen.2016.05.023.json
src/perla_extract/data/extractions/gpt-4o-2024-08-06/10.1016--j.nanoen.2022.107416.json
src/perla_extract/data/extractions/gpt-4o-2024-08-06/10.1021--acs.chemmater.8b01521.json
src/perla_extract/data/extractions/gpt-4o-2024-08-06/10.1021--acsaelm.4c02297.json
src/perla_extract/data/extractions/gpt-4o-2024-08-06/10.1021--acsaem.4c02660.json
src/perla_extract/data/extractions/gpt-4o-2024-08-06/10.1021--acsaem.9b01928.json
src/perla_extract/data/extractions/gpt-4o-2024-08-06/10.1038--nmat4014.json
src/perla_extract/data/extractions/gpt-4o-2024-08-06/10.1038--s41467-020-20272-3.json
src/perla_extract/data/extractions/gpt-4o-2024-08-06/10.1038--s41467-021-27740-4.json
src/perla_extract/data/extractions/gpt-4o-2024-08-06/10.1038--s41467-023-36141-8.json
src/perla_extract/data/extractions/gpt-4o-2024-08-06/10.1038--s41560-022-01061-2.json
src/perla_extract/data/extractions/gpt-4o-2024-08-06/10.1038--s41560-022-01102-w.json
src/perla_extract/data/extractions/gpt-4o-2024-08-06/10.1038--s41563-025-02163-4.json
src/perla_extract/data/extractions/gpt-4o-2024-08-06/10.1039--c5dt02388b.json
src/perla_extract/data/extractions/gpt-4o-2024-08-06/10.1039--c5ta00568j.json
src/perla_extract/data/extractions/gpt-4o-2024-08-06/10.1039--c7nr04692h.json
src/perla_extract/data/extractions/gpt-4o-2024-08-06/10.1126--science.adf0194.json
src/perla_extract/data/extractions/gpt-5-2025-08-07/10.1002--adfm.201500335.json
src/perla_extract/data/extractions/gpt-5-2025-08-07/10.1002--adfm.201904856.json
src/perla_extract/data/extractions/gpt-5-2025-08-07/10.1002--adfm.202212698.json
src/perla_extract/data/extractions/gpt-5-2025-08-07/10.1002--adma.202302143.json
src/perla_extract/data/extractions/gpt-5-2025-08-07/10.1002--adma.202305822.json
src/perla_extract/data/extractions/gpt-5-2025-08-07/10.1002--solr.201900370.json
src/perla_extract/data/extractions/gpt-5-2025-08-07/10.1002--solr.202100879.json
src/perla_extract/data/extractions/gpt-5-2025-08-07/10.1002--solr.202300438.json
src/perla_extract/data/extractions/gpt-5-2025-08-07/10.1002--solr.202300817.json
src/perla_extract/data/extractions/gpt-5-2025-08-07/10.1016--j.jallcom.2023.170970.json
src/perla_extract/data/extractions/gpt-5-2025-08-07/10.1016--j.jmst.2021.03.045.json
src/perla_extract/data/extractions/gpt-5-2025-08-07/10.1016--j.matlet.2016.07.004.json
src/perla_extract/data/extractions/gpt-5-2025-08-07/10.1016--j.matt.2023.09.006.json
src/perla_extract/data/extractions/gpt-5-2025-08-07/10.1016--j.nanoen.2016.05.023.json
src/perla_extract/data/extractions/gpt-5-2025-08-07/10.1016--j.nanoen.2022.107416.json
src/perla_extract/data/extractions/gpt-5-2025-08-07/10.1021--acs.chemmater.8b01521.json
src/perla_extract/data/extractions/gpt-5-2025-08-07/10.1021--acsaelm.4c02297.json
src/perla_extract/data/extractions/gpt-5-2025-08-07/10.1021--acsaem.4c02660.json
src/perla_extract/data/extractions/gpt-5-2025-08-07/10.1021--acsaem.9b01928.json
src/perla_extract/data/extractions/gpt-5-2025-08-07/10.1038--nmat4014.json
src/perla_extract/data/extractions/gpt-5-2025-08-07/10.1038--s41467-020-20272-3.json
src/perla_extract/data/extractions/gpt-5-2025-08-07/10.1038--s41467-021-27740-4.json
src/perla_extract/data/extractions/gpt-5-2025-08-07/10.1038--s41467-023-36141-8.json
src/perla_extract/data/extractions/gpt-5-2025-08-07/10.1038--s41560-022-01061-2.json
src/perla_extract/data/extractions/gpt-5-2025-08-07/10.1038--s41560-022-01102-w.json
src/perla_extract/data/extractions/gpt-5-2025-08-07/10.1038--s41563-025-02163-4.json
src/perla_extract/data/extractions/gpt-5-2025-08-07/10.1039--c5dt02388b.json
src/perla_extract/data/extractions/gpt-5-2025-08-07/10.1039--c5ta00568j.json
src/perla_extract/data/extractions/gpt-5-2025-08-07/10.1039--c7nr04692h.json
src/perla_extract/data/extractions/gpt-5-2025-08-07/10.1126--science.adf0194.json
src/perla_extract/data/extractions/gpt-5-mini-2025-08-07/10.1002--adfm.201500335.json
src/perla_extract/data/extractions/gpt-5-mini-2025-08-07/10.1002--adfm.201904856.json
src/perla_extract/data/extractions/gpt-5-mini-2025-08-07/10.1002--adfm.202212698.json
src/perla_extract/data/extractions/gpt-5-mini-2025-08-07/10.1002--adma.202302143.json
src/perla_extract/data/extractions/gpt-5-mini-2025-08-07/10.1002--adma.202305822.json
src/perla_extract/data/extractions/gpt-5-mini-2025-08-07/10.1002--solr.201900370.json
src/perla_extract/data/extractions/gpt-5-mini-2025-08-07/10.1002--solr.202100879.json
src/perla_extract/data/extractions/gpt-5-mini-2025-08-07/10.1002--solr.202300438.json
src/perla_extract/data/extractions/gpt-5-mini-2025-08-07/10.1002--solr.202300817.json
src/perla_extract/data/extractions/gpt-5-mini-2025-08-07/10.1016--j.jallcom.2023.170970.json
src/perla_extract/data/extractions/gpt-5-mini-2025-08-07/10.1016--j.jmst.2021.03.045.json
src/perla_extract/data/extractions/gpt-5-mini-2025-08-07/10.1016--j.matlet.2016.07.004.json
src/perla_extract/data/extractions/gpt-5-mini-2025-08-07/10.1016--j.matt.2023.09.006.json
src/perla_extract/data/extractions/gpt-5-mini-2025-08-07/10.1016--j.nanoen.2016.05.023.json
src/perla_extract/data/extractions/gpt-5-mini-2025-08-07/10.1016--j.nanoen.2022.107416.json
src/perla_extract/data/extractions/gpt-5-mini-2025-08-07/10.1021--acs.chemmater.8b01521.json
src/perla_extract/data/extractions/gpt-5-mini-2025-08-07/10.1021--acsaelm.4c02297.json
src/perla_extract/data/extractions/gpt-5-mini-2025-08-07/10.1021--acsaem.4c02660.json
src/perla_extract/data/extractions/gpt-5-mini-2025-08-07/10.1021--acsaem.9b01928.json
src/perla_extract/data/extractions/gpt-5-mini-2025-08-07/10.1038--nmat4014.json
src/perla_extract/data/extractions/gpt-5-mini-2025-08-07/10.1038--s41467-020-20272-3.json
src/perla_extract/data/extractions/gpt-5-mini-2025-08-07/10.1038--s41467-021-27740-4.json
src/perla_extract/data/extractions/gpt-5-mini-2025-08-07/10.1038--s41467-023-36141-8.json
src/perla_extract/data/extractions/gpt-5-mini-2025-08-07/10.1038--s41560-022-01061-2.json
src/perla_extract/data/extractions/gpt-5-mini-2025-08-07/10.1038--s41560-022-01102-w.json
src/perla_extract/data/extractions/gpt-5-mini-2025-08-07/10.1038--s41563-025-02163-4.json
src/perla_extract/data/extractions/gpt-5-mini-2025-08-07/10.1039--c5dt02388b.json
src/perla_extract/data/extractions/gpt-5-mini-2025-08-07/10.1039--c5ta00568j.json
src/perla_extract/data/extractions/gpt-5-mini-2025-08-07/10.1039--c7nr04692h.json
src/perla_extract/data/extractions/gpt-5-mini-2025-08-07/10.1126--science.adf0194.json
src/perla_extract/data/extractions/humans/Bear/10.1002--adma.202400105.json
src/perla_extract/data/extractions/humans/Bear/10.1002--advs.201903009.json
src/perla_extract/data/extractions/humans/Bear/10.1002--aenm.201701640.json
src/perla_extract/data/extractions/humans/Bear/10.1002--smll.201704007.json
src/perla_extract/data/extractions/humans/Bear/10.1002--smtd.201900511.json
src/perla_extract/data/extractions/humans/Bear/10.1002--solr.201900370.json
src/perla_extract/data/extractions/humans/Bear/10.1002--solr.202000740.json
src/perla_extract/data/extractions/humans/Bear/10.1002--solr.202100879.json
src/perla_extract/data/extractions/humans/Bear/10.1016--j.jallcom.2018.08.279.json
src/perla_extract/data/extractions/humans/Bear/10.1016--j.jechem.2019.03.023.json
src/perla_extract/data/extractions/humans/Bear/10.1016--j.jechem.2023.07.002.json
src/perla_extract/data/extractions/humans/Bear/10.1016--j.matlet.2016.07.004.json
src/perla_extract/data/extractions/humans/Bear/10.1016--j.nanoen.2016.05.023.json
src/perla_extract/data/extractions/humans/Bear/10.1021--acs.jpclett.1c04241.json
src/perla_extract/data/extractions/humans/Bear/10.1021--acsaem.0c02405.json
src/perla_extract/data/extractions/humans/Bear/10.1039--c5dt02388b.json
src/perla_extract/data/extractions/humans/Bear/10.1039--c5nr05563f.json
src/perla_extract/data/extractions/humans/Bear/10.1039--c6ee02139e.json
src/perla_extract/data/extractions/humans/Bear/10.1039--c7nr04692h.json
src/perla_extract/data/extractions/humans/Bear/10.1039--c9tc03259b.json
src/perla_extract/data/extractions/humans/Bear/10.1186--s11671-017-1992-1.json
src/perla_extract/data/extractions/humans/Bear/10.1246--cl.150984.json
src/perla_extract/data/extractions/humans/Bee/10.1002--adfm.201500335.json
src/perla_extract/data/extractions/humans/Bee/10.1002--adfm.201904856.json
src/perla_extract/data/extractions/humans/Bee/10.1002--adma.202302143.json
src/perla_extract/data/extractions/humans/Bee/10.1002--advs.201903009.json
src/perla_extract/data/extractions/humans/Bee/10.1002--aenm.201802051.json
src/perla_extract/data/extractions/humans/Bee/10.1002--aenm.201802346.json
src/perla_extract/data/extractions/humans/Bee/10.1002--aenm.202000566.json
src/perla_extract/data/extractions/humans/Bee/10.1002--cptc.201900245.json
src/perla_extract/data/extractions/humans/Bee/10.1002--solr.202100454.json
src/perla_extract/data/extractions/humans/Bee/10.1002--solr.202100879.json
src/perla_extract/data/extractions/humans/Bee/10.1016--j.jechem.2023.09.023.json
src/perla_extract/data/extractions/humans/Bee/10.1021--acsaem.9b01928.json
src/perla_extract/data/extractions/humans/Bee/10.1021--acsami.7b01038.json
src/perla_extract/data/extractions/humans/Bee/10.1021--acsnano.7b02015.json
src/perla_extract/data/extractions/humans/Bee/10.1038--s41467-024-53953-4.json
src/perla_extract/data/extractions/humans/Bee/10.1039--c4ta04179h.json
src/perla_extract/data/extractions/humans/Bee/10.1039--c5ee03874j.json
src/perla_extract/data/extractions/humans/Bee/10.1039--c6ra25149h.json
src/perla_extract/data/extractions/humans/Bee/10.1039--c9se00513g.json
src/perla_extract/data/extractions/humans/Bee/10.1039--d1ta04330g.json
src/perla_extract/data/extractions/humans/Bee/10.1557--s43578-021-00155-z.json
src/perla_extract/data/extractions/humans/Consensus/10.1002--adfm.201500335.json
src/perla_extract/data/extractions/humans/Consensus/10.1002--adfm.201904856.json
src/perla_extract/data/extractions/humans/Consensus/10.1002--adfm.202212698.json
src/perla_extract/data/extractions/humans/Consensus/10.1002--adma.202302143.json
src/perla_extract/data/extractions/humans/Consensus/10.1002--cphc.201500456.json
src/perla_extract/data/extractions/humans/Consensus/10.1002--solr.201900370.json
src/perla_extract/data/extractions/humans/Consensus/10.1002--solr.202100879.json
src/perla_extract/data/extractions/humans/Consensus/10.1016--j.matlet.2016.07.004.json
src/perla_extract/data/extractions/humans/Consensus/10.1016--j.nanoen.2016.05.023.json
src/perla_extract/data/extractions/humans/Consensus/10.1016--j.nanoen.2022.107416.json
src/perla_extract/data/extractions/humans/Consensus/10.1021--acs.chemmater.8b01521.json
src/perla_extract/data/extractions/humans/Consensus/10.1021--acsaem.9b01928.json
src/perla_extract/data/extractions/humans/Consensus/10.1039--c5dt02388b.json
src/perla_extract/data/extractions/humans/Consensus/10.1039--c5ta00568j.json
src/perla_extract/data/extractions/humans/Consensus/10.1039--c7nr04692h.json
src/perla_extract/data/extractions/humans/Dove/10.1002--adfm.201500335.json
src/perla_extract/data/extractions/humans/Dove/10.1002--adma.202400105.json
src/perla_extract/data/extractions/humans/Dove/10.1002--aenm.201701640.json
src/perla_extract/data/extractions/humans/Dove/10.1002--smtd.201900511.json
src/perla_extract/data/extractions/humans/Dove/10.1016--j.jcou.2019.04.001.json
src/perla_extract/data/extractions/humans/Dove/10.1016--j.jechem.2019.03.023.json
src/perla_extract/data/extractions/humans/Dove/10.1016--j.jechem.2023.07.002.json
src/perla_extract/data/extractions/humans/Dove/10.1016--j.matlet.2016.07.004.json
src/perla_extract/data/extractions/humans/Dove/10.1016--j.nanoen.2016.05.023.json
src/perla_extract/data/extractions/humans/Dove/10.1016--j.nanoen.2022.107416.json
src/perla_extract/data/extractions/humans/Dove/10.1016--j.synthmet.2017.08.007.json
src/perla_extract/data/extractions/humans/Dove/10.1021--acsaem.9b01928.json
src/perla_extract/data/extractions/humans/Dove/10.1021--acsami.7b01038.json
src/perla_extract/data/extractions/humans/Dove/10.1021--acsmaterialslett.3c00337.json
src/perla_extract/data/extractions/humans/Dove/10.1038--s41467-024-53953-4.json
src/perla_extract/data/extractions/humans/Dove/10.1039--c5nr05563f.json
src/perla_extract/data/extractions/humans/Dove/10.1039--c7nr04692h.json
src/perla_extract/data/extractions/humans/Dove/10.1039--c8ee02252f.json
src/perla_extract/data/extractions/humans/Dove/10.1039--c9se00513g.json
src/perla_extract/data/extractions/humans/Dove/10.1039--c9tc03259b.json
src/perla_extract/data/extractions/humans/Dove/10.1186--s11671-017-1992-1.json
src/perla_extract/data/extractions/humans/Dove/10.1246--cl.150984.json
src/perla_extract/data/extractions/humans/Dove/10.1557--s43578-021-00155-z.json
src/perla_extract/data/extractions/humans/Fox/10.1002--adfm.201904856.json
src/perla_extract/data/extractions/humans/Fox/10.1002--adfm.202002342.json
src/perla_extract/data/extractions/humans/Fox/10.1002--adfm.202212698.json
src/perla_extract/data/extractions/humans/Fox/10.1002--aenm.201802051.json
src/perla_extract/data/extractions/humans/Fox/10.1002--aenm.201802346.json
src/perla_extract/data/extractions/humans/Fox/10.1002--aenm.202000566.json
src/perla_extract/data/extractions/humans/Fox/10.1002--aenm.202303742.json
src/perla_extract/data/extractions/humans/Fox/10.1002--cptc.201900245.json
src/perla_extract/data/extractions/humans/Fox/10.1002--solr.201800012.json
src/perla_extract/data/extractions/humans/Fox/10.1002--solr.202000718.json
src/perla_extract/data/extractions/humans/Fox/10.1002--solr.202100454.json
src/perla_extract/data/extractions/humans/Fox/10.1016--j.joule.2018.10.003.json
src/perla_extract/data/extractions/humans/Fox/10.1016--j.nanoen.2022.107416.json
src/perla_extract/data/extractions/humans/Fox/10.1021--acs.jpcc.5b07950.json
src/perla_extract/data/extractions/humans/Fox/10.1021--acsnano.7b02015.json
src/perla_extract/data/extractions/humans/Fox/10.1038--s41467-024-53953-4.json
src/perla_extract/data/extractions/humans/Fox/10.1039--c4ta04179h.json
src/perla_extract/data/extractions/humans/Fox/10.1039--c4ta05373g.json
src/perla_extract/data/extractions/humans/Fox/10.1039--c5ee03874j.json
src/perla_extract/data/extractions/humans/Fox/10.1039--c6ra25149h.json
src/perla_extract/data/extractions/humans/Fox/10.1039--c7ta04225f.json
src/perla_extract/data/extractions/humans/Fox/10.1039--d1ta04330g.json
src/perla_extract/data/extractions/humans/Hawk/10.1002--adfm.202212698.json
src/perla_extract/data/extractions/humans/Hawk/10.1002--adma.202400105.json
src/perla_extract/data/extractions/humans/Hawk/10.1002--aenm.201701640.json
src/perla_extract/data/extractions/humans/Hawk/10.1002--aenm.202303742.json
src/perla_extract/data/extractions/humans/Hawk/10.1002--cptc.201900245.json
src/perla_extract/data/extractions/humans/Hawk/10.1002--smll.201704007.json
src/perla_extract/data/extractions/humans/Hawk/10.1002--solr.202000740.json
src/perla_extract/data/extractions/humans/Hawk/10.1002--solr.202100879.json
src/perla_extract/data/extractions/humans/Hawk/10.1007--s11696-017-0373-7.json
src/perla_extract/data/extractions/humans/Hawk/10.1016--j.apsusc.2019.144478.json
src/perla_extract/data/extractions/humans/Hawk/10.1016--j.jcou.2019.04.001.json
src/perla_extract/data/extractions/humans/Hawk/10.1016--j.jechem.2023.07.002.json
src/perla_extract/data/extractions/humans/Hawk/10.1016--j.jechem.2023.09.023.json
src/perla_extract/data/extractions/humans/Hawk/10.1016--j.nanoen.2016.05.023.json
src/perla_extract/data/extractions/humans/Hawk/10.1016--j.nanoen.2022.107416.json
src/perla_extract/data/extractions/humans/Hawk/10.1016--j.synthmet.2017.08.007.json
src/perla_extract/data/extractions/humans/Hawk/10.1021--acsami.7b01038.json
src/perla_extract/data/extractions/humans/Hawk/10.1021--acsmaterialslett.3c00337.json
src/perla_extract/data/extractions/humans/Hawk/10.1039--D3TA02030D.json
src/perla_extract/data/extractions/humans/Hawk/10.1039--c8ee02252f.json
src/perla_extract/data/extractions/humans/Hawk/10.1039--c9tc03259b.json
src/perla_extract/data/extractions/humans/Kit/10.1002--adfm.201904856.json
src/perla_extract/data/extractions/humans/Kit/10.1002--adfm.202212698.json
src/perla_extract/data/extractions/humans/Kit/10.1002--advs.201903009.json
src/perla_extract/data/extractions/humans/Kit/10.1002--aenm.202303742.json
src/perla_extract/data/extractions/humans/Kit/10.1002--smll.201704007.json
src/perla_extract/data/extractions/humans/Kit/10.1002--smtd.201900511.json
src/perla_extract/data/extractions/humans/Kit/10.1002--solr.201900370.json
src/perla_extract/data/extractions/humans/Kit/10.1002--solr.202000740.json
src/perla_extract/data/extractions/humans/Kit/10.1016--j.jallcom.2018.08.279.json
src/perla_extract/data/extractions/humans/Kit/10.1021--acs.chemmater.6b02744.json
src/perla_extract/data/extractions/humans/Kit/10.1021--acs.chemmater.8b01521.json
src/perla_extract/data/extractions/humans/Kit/10.1021--acsaem.0c02405.json
src/perla_extract/data/extractions/humans/Kit/10.1021--acsmaterialslett.3c00337.json
src/perla_extract/data/extractions/humans/Kit/10.1039--c5dt02388b.json
src/perla_extract/data/extractions/humans/Kit/10.1039--c5ta00568j.json
src/perla_extract/data/extractions/humans/Kit/10.1039--c6ee02139e.json
src/perla_extract/data/extractions/humans/Kit/10.1039--c7nr04692h.json
src/perla_extract/data/extractions/humans/Kit/10.1039--c8nr09353a.json
src/perla_extract/data/extractions/humans/Kit/10.1186--s11671-017-1992-1.json
src/perla_extract/data/extractions/humans/Kit/10.1246--cl.150984.json
src/perla_extract/data/extractions/humans/Lark/10.1002--adfm.202212698.json
src/perla_extract/data/extractions/humans/Lark/10.1002--adma.202400105.json
src/perla_extract/data/extractions/humans/Lark/10.1002--aenm.202303742.json
src/perla_extract/data/extractions/humans/Lark/10.1002--cptc.201900245.json
src/perla_extract/data/extractions/humans/Lark/10.1002--smll.201704007.json
src/perla_extract/data/extractions/humans/Lark/10.1002--solr.201900370.json
src/perla_extract/data/extractions/humans/Lark/10.1002--solr.202000740.json
src/perla_extract/data/extractions/humans/Lark/10.1002--solr.202100879.json
src/perla_extract/data/extractions/humans/Lark/10.1016--j.jallcom.2018.08.279.json
src/perla_extract/data/extractions/humans/Lark/10.1016--j.jcou.2019.04.001.json
src/perla_extract/data/extractions/humans/Lark/10.1016--j.jechem.2023.07.002.json
src/perla_extract/data/extractions/humans/Lark/10.1016--j.jechem.2023.09.023.json
src/perla_extract/data/extractions/humans/Lark/10.1016--j.matlet.2016.07.004.json
src/perla_extract/data/extractions/humans/Lark/10.1016--j.nanoen.2016.05.023.json
src/perla_extract/data/extractions/humans/Lark/10.1016--j.nanoen.2022.107416.json
src/perla_extract/data/extractions/humans/Lark/10.1016--j.synthmet.2017.08.007.json
src/perla_extract/data/extractions/humans/Lark/10.1021--acsami.7b01038.json
src/perla_extract/data/extractions/humans/Lark/10.1021--acsmaterialslett.3c00337.json
src/perla_extract/data/extractions/humans/Lark/10.1039--D3TA02030D.json
src/perla_extract/data/extractions/humans/Lark/10.1039--c8ee02252f.json
src/perla_extract/data/extractions/humans/Lark/10.1039--c9tc03259b.json
src/perla_extract/data/extractions/humans/Otto/10.1002--smll.201704007.json
src/perla_extract/data/extractions/humans/Otto/10.1002--solr.201800012.json
src/perla_extract/data/extractions/humans/Otto/10.1002--solr.202000718.json
src/perla_extract/data/extractions/humans/Otto/10.1016--j.nanoen.2022.107416.json
src/perla_extract/data/extractions/humans/Otto/10.1021--acs.jpclett.1c04241.json
src/perla_extract/data/extractions/humans/Otto/10.1039--c4ta05373g.json
src/perla_extract/data/extractions/humans/Otto/10.1039--c5dt02388b.json
src/perla_extract/data/extractions/humans/Otto/10.1039--c5ta00568j.json
src/perla_extract/data/extractions/humans/Otto/10.1039--c6ee02139e.json
src/perla_extract/data/extractions/humans/Otto/10.1039--c7ta04225f.json
src/perla_extract/data/extractions/humans/Otto/10.1039--c8nr09353a.json
src/perla_extract/data/extractions/humans/Panda/10.1002--adfm.201500335.json
src/perla_extract/data/extractions/humans/Panda/10.1002--aenm.201802346.json
src/perla_extract/data/extractions/humans/Panda/10.1002--cphc.201500456.json
src/perla_extract/data/extractions/humans/Panda/10.1002--solr.202100454.json
src/perla_extract/data/extractions/humans/Panda/10.1007--s11696-017-0373-7.json
src/perla_extract/data/extractions/humans/Panda/10.1016--j.apsusc.2019.144478.json
src/perla_extract/data/extractions/humans/Panda/10.1016--j.jechem.2019.03.023.json
src/perla_extract/data/extractions/humans/Panda/10.1016--j.jechem.2023.07.002.json
src/perla_extract/data/extractions/humans/Panda/10.1016--j.nanoen.2016.05.023.json
src/perla_extract/data/extractions/humans/Panda/10.1016--j.synthmet.2017.08.007.json
src/perla_extract/data/extractions/humans/Panda/10.1021--acsaem.9b01928.json
src/perla_extract/data/extractions/humans/Panda/10.1021--acsami.7b01038.json
src/perla_extract/data/extractions/humans/Panda/10.1021--acsmaterialslett.3c00337.json
src/perla_extract/data/extractions/humans/Panda/10.1039--c4ta04179h.json
src/perla_extract/data/extractions/humans/Panda/10.1039--c5nr05563f.json
src/perla_extract/data/extractions/humans/Panda/10.1039--c9se00513g.json
src/perla_extract/data/extractions/humans/Panda/10.1039--c9tc03259b.json
src/perla_extract/data/extractions/humans/Panda/10.1039--d1ta04330g.json
src/perla_extract/data/extractions/humans/Panda/10.1557--s43578-021-00155-z.json
src/perla_extract/data/extractions/humans/Robin/10.1002--adfm.202002342.json
src/perla_extract/data/extractions/humans/Robin/10.1002--adma.202302143.json
src/perla_extract/data/extractions/humans/Robin/10.1002--aenm.201802051.json
src/perla_extract/data/extractions/humans/Robin/10.1002--aenm.202000566.json
src/perla_extract/data/extractions/humans/Robin/10.1002--aenm.202303742.json
src/perla_extract/data/extractions/humans/Robin/10.1002--cphc.201500456.json
src/perla_extract/data/extractions/humans/Robin/10.1002--cptc.201900245.json
src/perla_extract/data/extractions/humans/Robin/10.1002--solr.201800012.json
src/perla_extract/data/extractions/humans/Robin/10.1002--solr.202000718.json
src/perla_extract/data/extractions/humans/Robin/10.1016--j.jechem.2023.09.023.json
src/perla_extract/data/extractions/humans/Robin/10.1016--j.joule.2018.10.003.json
src/perla_extract/data/extractions/humans/Robin/10.1021--acs.chemmater.6b02744.json
src/perla_extract/data/extractions/humans/Robin/10.1021--acs.chemmater.8b01521.json
src/perla_extract/data/extractions/humans/Robin/10.1021--acs.jpcc.5b07950.json
src/perla_extract/data/extractions/humans/Robin/10.1021--acs.jpclett.1c04241.json
src/perla_extract/data/extractions/humans/Robin/10.1021--acsnano.7b02015.json
src/perla_extract/data/extractions/humans/Robin/10.1039--c4ta05373g.json
src/perla_extract/data/extractions/humans/Robin/10.1039--c5ee03874j.json
src/perla_extract/data/extractions/humans/Robin/10.1039--c5ta00568j.json
src/perla_extract/data/extractions/humans/Robin/10.1039--c6ra25149h.json
src/perla_extract/data/extractions/humans/Robin/10.1039--c7ta04225f.json
src/perla_extract/data/extractions/humans/Robin/10.1039--c8nr09353a.json
src/perla_extract/data/extractions/humans/Seal/10.1002--adfm.202002342.json
src/perla_extract/data/extractions/humans/Seal/10.1002--adfm.202212698.json
src/perla_extract/data/extractions/humans/Seal/10.1002--adma.202400105.json
src/perla_extract/data/extractions/humans/Seal/10.1002--advs.201903009.json
src/perla_extract/data/extractions/humans/Seal/10.1002--cphc.201500456.json
src/perla_extract/data/extractions/humans/Seal/10.1002--cptc.201900245.json
src/perla_extract/data/extractions/humans/Seal/10.1002--solr.202000740.json
src/perla_extract/data/extractions/humans/Seal/10.1002--solr.202100454.json
src/perla_extract/data/extractions/humans/Seal/10.1007--s11696-017-0373-7.json
src/perla_extract/data/extractions/humans/Seal/10.1016--j.apsusc.2019.144478.json
src/perla_extract/data/extractions/humans/Seal/10.1016--j.joule.2018.10.003.json
src/perla_extract/data/extractions/humans/Seal/10.1016--j.nanoen.2016.05.023.json
src/perla_extract/data/extractions/humans/Seal/10.1016--j.synthmet.2017.08.007.json
src/perla_extract/data/extractions/humans/Seal/10.1021--acs.chemmater.6b02744.json
src/perla_extract/data/extractions/humans/Seal/10.1021--acs.chemmater.8b01521.json
src/perla_extract/data/extractions/humans/Seal/10.1021--acs.jpcc.5b07950.json
src/perla_extract/data/extractions/humans/Seal/10.1021--acsaem.0c02405.json
src/perla_extract/data/extractions/humans/Seal/10.1021--acsaem.9b01928.json
src/perla_extract/data/extractions/humans/Seal/10.1039--c5nr05563f.json
src/perla_extract/data/extractions/humans/Seal/10.1039--c9se00513g.json
src/perla_extract/data/ground_truth/dev/10.1002--adfm.201500335.json
src/perla_extract/data/ground_truth/dev/10.1002--adfm.201904856.json
src/perla_extract/data/ground_truth/dev/10.1002--adma.202302143.json
src/perla_extract/data/ground_truth/dev/10.1002--solr.201900370.json
src/perla_extract/data/ground_truth/dev/10.1016--j.matlet.2016.07.004.json
src/perla_extract/data/ground_truth/dev/10.1016--j.nanoen.2016.05.023.json
src/perla_extract/data/ground_truth/dev/10.1021--acs.chemmater.8b01521.json
src/perla_extract/data/ground_truth/dev/10.1021--acsaem.9b01928.json
src/perla_extract/data/ground_truth/dev/10.1039--c5dt02388b.json
src/perla_extract/data/ground_truth/dev/10.1039--c7nr04692h.json
src/perla_extract/data/ground_truth/test/10.1002--adfm.202212698.json
src/perla_extract/data/ground_truth/test/10.1002--adma.202305822.json
src/perla_extract/data/ground_truth/test/10.1002--solr.202100879.json
src/perla_extract/data/ground_truth/test/10.1002--solr.202300438.json
src/perla_extract/data/ground_truth/test/10.1002--solr.202300817.json
src/perla_extract/data/ground_truth/test/10.1016--j.jallcom.2023.170970.json
src/perla_extract/data/ground_truth/test/10.1016--j.jmst.2021.03.045.json
src/perla_extract/data/ground_truth/test/10.1016--j.matt.2023.09.006.json
src/perla_extract/data/ground_truth/test/10.1016--j.nanoen.2022.107416.json
src/perla_extract/data/ground_truth/test/10.1021--acsaelm.4c02297.json
src/perla_extract/data/ground_truth/test/10.1021--acsaem.4c02660.json
src/perla_extract/data/ground_truth/test/10.1038--nmat4014.json
src/perla_extract/data/ground_truth/test/10.1038--s41467-020-20272-3.json
src/perla_extract/data/ground_truth/test/10.1038--s41467-021-27740-4.json
src/perla_extract/data/ground_truth/test/10.1038--s41467-023-36141-8.json
src/perla_extract/data/ground_truth/test/10.1038--s41560-022-01061-2.json
src/perla_extract/data/ground_truth/test/10.1038--s41560-022-01102-w.json
src/perla_extract/data/ground_truth/test/10.1038--s41563-025-02163-4.json
src/perla_extract/data/ground_truth/test/10.1039--c5ta00568j.json
src/perla_extract/data/ground_truth/test/10.1126--science.adf0194.json
src/perla_extract/papersbot/feeds.txt
src/perla_extract/papersbot/hf_utils.py
src/perla_extract/papersbot/match_pdf.py
src/perla_extract/papersbot/nomad_utils.py
src/perla_extract/papersbot/papersbot.py
src/perla_extract/papersbot/proc_abstracts.py
src/perla_extract/papersbot/utils.py
src/perla_extract/preprocessing/__init__.py
src/perla_extract/preprocessing/base.py
src/perla_extract/preprocessing/marker_processor.py
src/perla_extract/preprocessing/nougat_processor.py
src/perla_extract/preprocessing/pdf_utils.py
src/perla_extract/preprocessing/preprocessor.py
src/perla_extract/preprocessing/pymupdf_processor.py
src/perla_extract/preprocessing/utils.py
tests/test_data_accessibility.py