diff --git a/tools/aoptk/.shed.yml b/tools/aoptk/.shed.yml
index a44aadf1..9824bac6 100644
--- a/tools/aoptk/.shed.yml
+++ b/tools/aoptk/.shed.yml
@@ -4,13 +4,13 @@ remote_repository_url: "https://github.com/rdurnik/aoptk"
 homepage_url: "https://github.com/rdurnik/aoptk"
 categories:
   - Machine Learning
-description: "AOP-toolkit (aoptk) is a Python package designed to support the development of Adverse Outcome Pathways (AOPs) that require extensive data mining."
+description: "AOP-toolkit (aoptk) is a Python package designed to support data mining and analysis of toxicological outcomes."
 long_description: |
-  "AOP-toolkit (aoptk) is a Python package developed to support the construction of Adverse Outcome Pathways (AOPs) that require extensive mining and integration of toxicological data from heterogeneous sources. It enables researchers to collect literature from databases such as PubMed and Europe PMC, extract relevant information from full-text publications, and analyze complex, unstructured data using large language models. The toolkit also provides functionality for normalizing chemical names across publications, helping ensure consistency and interoperability."
+  AOP-toolkit (aoptk) is a Python package for mining and analyzing toxicological and biomedical literature. Originally developed to support the construction of Adverse Outcome Pathways (AOPs), it provides general-purpose tools for retrieving, processing, and analyzing scientific publications.
 auto_tool_repositories:
   name_template: "{{ tool_id }}"
   description_template: "{{ tool_name }} tool from the aoptk package"
 suite:
   name: suite_aoptk
-  description: AOP-toolkit (aoptk) is a Python package developed to support the construction of Adverse Outcome Pathways (AOPs) that require extensive mining and integration of toxicological data from heterogeneous sources.
+  description: AOP-toolkit (aoptk) is a Python package for mining and analyzing toxicological and biomedical literature. Originally developed to support the construction of Adverse Outcome Pathways (AOPs), it provides general-purpose tools for retrieving, processing, and analyzing scientific publications.
   type: repository_suite_definition
\ No newline at end of file
diff --git a/tools/aoptk/aoptk_chemical_identifier.xml b/tools/aoptk/aoptk_chemical_identifier.xml
index 2d5b66e8..2f530247 100644
--- a/tools/aoptk/aoptk_chemical_identifier.xml
+++ b/tools/aoptk/aoptk_chemical_identifier.xml
@@ -6,19 +6,21 @@
 
     <requirements>
         <expand macro="requirements"/>
+        <expand macro="email_credentials"/>
     </requirements>
  
     <command detect_errors="exit_code"><![CDATA[
         chemical-identifier
             --query '$query'
-            --literature_database "$literature_database"
+            --literature_database "$literature_database_pubmed_europepmc"
             --chemical_database "$chemical_database"
             --outdir .
             \${EMAIL:+--email \$EMAIL}
     ]]></command>
 
     <inputs>
-        <expand macro="inputs"/>
+        <expand macro="query"/>
+        <expand macro="literature_database_pubmed_europepmc"/>
         <param argument="--chemical_database" type="data" format="xlsx" label="Chemical database" help="Custom chemical database with toxicologically relevant chemicals. Excel file with single column: chemical_name. Examples can be found in Citations." />
     </inputs>
 
@@ -31,13 +33,13 @@
         <!-- Hint: You can use [ctrl+alt+t] after defining the inputs/outputs to auto-scaffold some basic test cases. -->
         <test>
            <param name="query" value="hepg2 thioacetamide"/>
-           <param name="literature_database" value="pubmed"/>
+           <param name="literature_database_pubmed_europepmc" value="pubmed"/>
            <param name="chemical_database" location="https://zenodo.org/records/16532456/files/tg_gates.xlsx?download=1"/>
            <output name="Chemicals_per_publication" file="chemicals_per_publication_test.xlsx" compare="sim_size" delta="100"/>
         </test>
         <test>
             <param name="query" value="hepg2 thioacetamide spheroid"/>
-            <param name="literature_database" value="europepmc"/>
+            <param name="literature_database_pubmed_europepmc" value="europepmc"/>
             <param name="chemical_database" location="https://zenodo.org/records/16532456/files/tg_gates.xlsx?download=1"/>
             <output name="Publications_per_chemical" file="publications_per_chemical.xlsx" compare="sim_size" delta="100"/>
         </test>
diff --git a/tools/aoptk/aoptk_chemical_matching.xml b/tools/aoptk/aoptk_chemical_matching.xml
new file mode 100644
index 00000000..3f027850
--- /dev/null
+++ b/tools/aoptk/aoptk_chemical_matching.xml
@@ -0,0 +1,58 @@
+<tool id="aoptk_match_chemicals" name="aoptk match chemicals" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="25.1" license="MIT">
+    <description>Match chemical entities.</description>
+    <macros>
+        <import>macros.xml</import>
+    </macros>
+
+    <requirements>
+        <expand macro="requirements"/>
+    </requirements>
+ 
+    <command detect_errors="exit_code"><![CDATA[
+        python3 '${match_chemicals}'
+    ]]></command>
+
+<configfiles>
+<configfile name="match_chemicals">
+import os
+import pandas as pd
+
+chemicals_df_1 = pd.read_csv("$input_file_1", sep="\t")
+chemicals_df_2 = pd.read_csv("$input_file_2", sep="\t")
+merged_files = chemicals_df_1.merge(
+    chemicals_df_2,
+    left_on="heading",
+    right_on="heading",
+    how="outer",
+)
+merged_files.to_csv("merged_chemicals.tsv", sep="\t", index=False)
+
+</configfile>
+</configfiles>
+
+    <inputs>
+        <param name="input_file_1" type="data" format="tabular" label="TSV with heading column." help="Input tsv file with heading column." />
+        <param name="input_file_2" type="data" format="tabular" label="TSV with heading column." help="Input tsv file with heading column." />
+    </inputs>
+
+    <outputs>
+        <data name="merged_chemicals" format="tabular" from_work_dir="merged_chemicals.tsv" label="Merged chemicals with heading." />
+    </outputs>
+
+    <tests> <!-- Test file names are resolved relative to the test-data directory. -->
+        <test>
+            <param name="input_file_1" value="normalized.tsv"/>
+            <param name="input_file_2" value="normalized.tsv"/>
+            <output name="merged_chemicals" file="normalized.tsv" compare="sim_size" delta="100"/>
+        </test>
+    </tests>
+
+    <help><![CDATA[
+Chemical Matching
+===================
+
+Tool to match chemical entities.
+
+    ]]></help>
+
+</tool>
\ No newline at end of file
diff --git a/tools/aoptk/aoptk_chemical_normalization_llm.xml b/tools/aoptk/aoptk_chemical_normalization_llm.xml
new file mode 100644
index 00000000..9ab43265
--- /dev/null
+++ b/tools/aoptk/aoptk_chemical_normalization_llm.xml
@@ -0,0 +1,62 @@
+<tool id="aoptk_normalize_chemicals_llm" name="aoptk normalize chemicals llm" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="25.1" license="MIT">
+    <description>Normalize chemical entities using LLMs.</description>
+    <macros>
+        <import>macros.xml</import>
+    </macros>
+
+    <requirements>
+        <expand macro="requirements"/>
+        <expand macro="openai_api_key_credentials"/>
+    </requirements>
+ 
+    <command detect_errors="exit_code"><![CDATA[
+        python3 '${normalize_chemicals_llm}'
+    ]]></command>
+
+<configfiles>
+<configfile name="normalize_chemicals_llm">
+import os
+from aoptk.text_generation_api import TextGenerationAPI
+from aoptk.chemical import Chemical
+import pandas as pd
+
+openai_key = os.environ.get("OPENAI_KEY")
+text_generation_api = TextGenerationAPI(model="$llm_model", api_key=openai_key)
+chemical_list = pd.read_csv("$chemical_list", sep="\t")["chemical"].tolist()
+chemicals = pd.read_csv("$chemicals", sep="\t")
+chemicals["chemical"] = chemicals["chemical"].apply(
+    lambda x: TextGenerationAPI(model="$llm_model", api_key=openai_key).normalize_chemical(chemical=Chemical(x), chemical_list=chemical_list)
+    )
+chemicals["heading"] = chemicals["chemical"].apply(lambda chem: chem.heading)
+chemicals.to_csv("normalized_chemicals.tsv", sep="\t", index=False)
+
+</configfile>
+</configfiles>
+
+    <inputs>
+        <expand macro="llm_models"/>
+        <param name="chemicals" type="data" format="tabular" label="TSV with chemical column." help="Input tsv file with chemical column." />
+        <param name="chemical_list" type="data" format="tabular" label="TSV with chemical list." help="Input tsv file with chemical list." />
+    </inputs>
+
+    <outputs>
+        <data name="normalized_chemicals" format="tabular" from_work_dir="normalized_chemicals.tsv" label="Chemicals with heading generated." />
+    </outputs>
+
+    <tests> <!-- Test file names are resolved relative to the test-data directory. -->
+        <test>
+            <param name="chemicals" value="chemicals.tsv"/>
+            <param name="chemical_list" value="chemicals.tsv"/>
+            <output name="normalized_chemicals" file="normalized.tsv" compare="sim_size" delta="100"/>
+        </test>
+    </tests>
+
+    <help><![CDATA[
+Chemical Normalization LLMs
+===========================
+
+Tool to normalize chemical entities using LLMs. Using LLM to match a given chemical against a provided chemical list.
+
+    ]]></help>
+
+</tool>
\ No newline at end of file
diff --git a/tools/aoptk/aoptk_chemical_normalization_mesh.xml b/tools/aoptk/aoptk_chemical_normalization_mesh.xml
new file mode 100644
index 00000000..ef204e6a
--- /dev/null
+++ b/tools/aoptk/aoptk_chemical_normalization_mesh.xml
@@ -0,0 +1,55 @@
+<tool id="aoptk_normalize_chemicals_mesh" name="aoptk normalize chemicals mesh" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="25.1" license="MIT">
+    <description>Normalize chemical entities using MeshTerms.</description>
+    <macros>
+        <import>macros.xml</import>
+    </macros>
+
+    <requirements>
+        <expand macro="requirements"/>
+    </requirements>
+ 
+    <command detect_errors="exit_code"><![CDATA[
+        python3 '${normalize_chemicals_mesh}'
+    ]]></command>
+
+<configfiles>
+<configfile name="normalize_chemicals_mesh">
+from aoptk.chemical import Chemical
+from aoptk.normalization.mesh_terms import MeshTerms
+import os
+import pandas as pd
+
+chemicals = pd.read_csv("$input_file", sep="\t")
+chemicals["chemical"] = chemicals["chemical"].apply(
+    lambda x: MeshTerms().normalize_chemical(Chemical(x))
+    )
+chemicals["heading"] = chemicals["chemical"].apply(lambda chem: chem.heading)
+chemicals.to_csv("normalized_chemicals.tsv", sep="\t", index=False)
+
+</configfile>
+</configfiles>
+
+    <inputs>
+        <param name="input_file" type="data" format="tabular" label="TSV with chemical column." help="Input tsv file with chemical column." />
+    </inputs>
+
+    <outputs>
+        <data name="normalized_chemicals" format="tabular" from_work_dir="normalized_chemicals.tsv" label="Chemicals with heading generated." />
+    </outputs>
+
+    <tests> <!-- Test file names are resolved relative to the test-data directory. -->
+        <test>
+            <param name="input_file" value="chemicals.tsv"/>
+            <output name="normalized_chemicals" file="normalized.tsv" compare="sim_size" delta="100"/>
+        </test>
+    </tests>
+
+    <help><![CDATA[
+Chemical Normalization MeSH Terms
+=================================
+
+Tool to normalize chemical entities using MeSH Terms.
+
+    ]]></help>
+
+</tool>
\ No newline at end of file
diff --git a/tools/aoptk/aoptk_chemical_normalization_pubchem.xml b/tools/aoptk/aoptk_chemical_normalization_pubchem.xml
new file mode 100644
index 00000000..ee1bd67a
--- /dev/null
+++ b/tools/aoptk/aoptk_chemical_normalization_pubchem.xml
@@ -0,0 +1,55 @@
+<tool id="aoptk_normalize_chemicals_pubchem" name="aoptk normalize chemicals pubchem" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="25.1" license="MIT">
+    <description>Normalize chemical entities using PubChem API.</description>
+    <macros>
+        <import>macros.xml</import>
+    </macros>
+
+    <requirements>
+        <expand macro="requirements"/>
+    </requirements>
+ 
+    <command detect_errors="exit_code"><![CDATA[
+        python3 '${normalize_chemicals_pubchem}'
+    ]]></command>
+
+<configfiles>
+<configfile name="normalize_chemicals_pubchem">
+from aoptk.normalization.pubchem_api import PubChemAPI
+from aoptk.chemical import Chemical
+import os
+import pandas as pd
+
+chemicals = pd.read_csv("$input_file", sep="\t")
+chemicals["chemical"] = chemicals["chemical"].apply(
+    lambda x: PubChemAPI().normalize_chemical(Chemical(x))
+    )
+chemicals["heading"] = chemicals["chemical"].apply(lambda chem: chem.heading)
+chemicals.to_csv("normalized_chemicals.tsv", sep="\t", index=False)
+
+</configfile>
+</configfiles>
+
+    <inputs>
+        <param name="input_file" type="data" format="tabular" label="TSV with chemical column." help="Input tsv file with chemical column." />
+    </inputs>
+
+    <outputs>
+        <data name="normalized_chemicals" format="tabular" from_work_dir="normalized_chemicals.tsv" label="Chemicals with heading generated." />
+    </outputs>
+
+    <tests> <!-- Test file names are resolved relative to the test-data directory. -->
+        <test>
+            <param name="input_file" value="chemicals.tsv"/>
+            <output name="normalized_chemicals" file="normalized.tsv" compare="sim_size" delta="100"/>
+        </test>
+    </tests>
+
+    <help><![CDATA[
+Chemical Normalization PubChem
+==============================
+
+Tool to normalize chemical entities using PubChem API.
+
+    ]]></help>
+
+</tool>
\ No newline at end of file
diff --git a/tools/aoptk/aoptk_download_abstracts.xml b/tools/aoptk/aoptk_download_abstracts.xml
new file mode 100644
index 00000000..0294deea
--- /dev/null
+++ b/tools/aoptk/aoptk_download_abstracts.xml
@@ -0,0 +1,74 @@
+<tool id="aoptk_download_abstracts" name="aoptk download abstracts" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="25.1" license="MIT">
+    <description>Download abstracts for a list of publication IDs.</description>
+    <macros>
+        <import>macros.xml</import>
+    </macros>
+
+    <requirements>
+        <expand macro="requirements"/>
+        <expand macro="email_credentials"/>
+    </requirements>
+ 
+    <command detect_errors="exit_code"><![CDATA[
+        python3 '${download_abstracts}'
+    ]]></command>
+
+    <configfiles>
+        <configfile name="download_abstracts">
+from aoptk.literature.databases.pubmed import PubMed
+from aoptk.literature.databases.europepmc import EuropePMC
+from aoptk.literature.abstract import Abstract
+from Bio import Entrez
+import os
+
+with open("$input_file", "r") as f:
+    ids = [line.strip() for line in f.readlines()]
+email = os.environ.get("EMAIL")
+
+
+if "${literature_database_pubmed_europepmc}" == "pubmed":
+    Entrez.email = email    
+    pubmed = PubMed.__new__(PubMed)
+    pubmed.id_list = ids
+    abstracts = pubmed.get_abstracts()
+elif "${literature_database_pubmed_europepmc}" == "europepmc":
+    europepmc = EuropePMC("")
+    europepmc.id_list = ids
+    abstracts = europepmc.get_abstracts()
+else:
+    raise ValueError("Select valid database.")
+
+for abstract in abstracts:
+    with open(f"{abstract.publication_id}.txt", "w") as f:
+        f.write(abstract.text)
+
+    </configfile>
+    </configfiles>
+
+    <inputs>
+        <expand macro="literature_database_pubmed_europepmc"/>
+        <param name="input_file" type="data" format="txt" label="List of IDs to search for." help="Input text file with IDs to search for." />
+    </inputs>
+
+    <outputs>
+    <collection name="abstracts" type="list" label="Downloaded abstracts">
+        <discover_datasets pattern="(?P&lt;designation&gt;.*)$" format="txt" visible="false" />
+    </collection>
+    </outputs>
+
+    <tests> <!-- Test file names are resolved relative to the test-data directory. -->
+        <test>
+            <param name="input_file" value="ids.txt"/>
+            <output_collection name="abstracts" type="list" count="2"/>
+        </test>
+    </tests>
+
+    <help><![CDATA[
+Download Abstracts
+===================
+
+Tool to download publication abstracts.
+
+    ]]></help>
+
+</tool>
\ No newline at end of file
diff --git a/tools/aoptk/aoptk_download_fulltext.xml b/tools/aoptk/aoptk_download_fulltext.xml
new file mode 100644
index 00000000..4b6f3b5d
--- /dev/null
+++ b/tools/aoptk/aoptk_download_fulltext.xml
@@ -0,0 +1,76 @@
+<tool id="aoptk_download_publications" name="aoptk download publications" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="25.1" license="MIT">
+    <description>Download full texts for a list of publication IDs.</description>
+    <macros>
+        <import>macros.xml</import>
+    </macros>
+
+    <requirements>
+        <expand macro="requirements"/>
+        <expand macro="email_credentials"/>
+    </requirements>
+ 
+    <command detect_errors="exit_code"><![CDATA[
+        python3 '${download_publications}'
+    ]]></command>
+
+    <configfiles>
+        <configfile name="download_publications">
+from aoptk.literature.databases.pmc import PMC
+from aoptk.literature.databases.europepmc import EuropePMC
+from Bio import Entrez
+import os
+
+with open("$input_file", "r") as f:
+    ids = [line.strip() for line in f.readlines()]
+email = os.environ.get("EMAIL")
+
+
+if "${literature_database_europepmc_pmc}" == "pmc":
+    Entrez.email = email
+    pmc = PMC("", storage = "./", figure_storage="./figures")
+    pmc.id_list = ids
+    publications = pmc.get_publications()
+elif "${literature_database_europepmc_pmc}" == "europepmc":
+    europepmc = EuropePMC("", storage = "./", figure_storage="./figures")
+    europepmc.id_list = ids
+    publications = europepmc.get_publications()
+else:
+    raise ValueError("Select valid database.")
+
+for publication in publications:
+    with open(f"{publication.publication_id}.txt", "w") as f:
+        f.write(publication.full_text)
+
+    </configfile>
+    </configfiles>
+
+    <inputs>
+        <expand macro="literature_database_europepmc_pmc"/>
+        <param name="input_file" type="data" format="txt" label="List of IDs to search for." help="Input text file with IDs to search for." />
+    </inputs>
+
+    <outputs>
+    <collection name="full_texts" type="list" label="Downloaded full texts">
+        <discover_datasets pattern="(?P&lt;designation&gt;.*)$" format="txt" visible="false" />
+    </collection>
+    <collection name="figures" type="list" label="Downloaded figures">
+        <discover_datasets directory="figures" pattern="(?P&lt;designation&gt;.*)$" format="data" visible="false" />
+    </collection>
+    </outputs>
+
+    <tests> <!-- Test file names are resolved relative to the test-data directory. -->
+        <test>
+            <param name="input_file" value="ids.txt"/>
+            <output_collection name="full_texts" type="list" count="2"/>
+        </test>
+    </tests>
+
+    <help><![CDATA[
+Download Publications
+=====================
+
+Tool to download publications.
+
+    ]]></help>
+
+</tool>
\ No newline at end of file
diff --git a/tools/aoptk/aoptk_download_pdf.xml b/tools/aoptk/aoptk_download_pdf.xml
new file mode 100644
index 00000000..4df1a824
--- /dev/null
+++ b/tools/aoptk/aoptk_download_pdf.xml
@@ -0,0 +1,55 @@
+<tool id="aoptk_download_pdfs" name="aoptk download PDFs" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="25.1" license="MIT">
+    <description>Download PDFs for a list of publication IDs.</description>
+    <macros>
+        <import>macros.xml</import>
+    </macros>
+
+    <requirements>
+        <expand macro="requirements"/>
+    </requirements>
+ 
+    <command detect_errors="exit_code"><![CDATA[
+        python3 '${download_pdfs}'
+    ]]></command>
+
+    <configfiles>
+        <configfile name="download_pdfs">
+from aoptk.literature.databases.pmc import PMC
+import os
+
+with open("$input_file", "r") as f:
+    ids = [line.strip() for line in f.readlines()]
+
+pmc = PMC("", storage = "./")
+pmc.id_list = ids
+pdfs = pmc.get_pdfs()
+
+    </configfile>
+    </configfiles>
+
+    <inputs>
+        <param name="input_file" type="data" format="txt" label="List of IDs to search for." help="Input text file with IDs to search for." />
+    </inputs>
+
+    <outputs>
+    <collection name="pdfs" type="list" label="Downloaded PDFs">
+        <discover_datasets pattern="(?P&lt;designation&gt;.*)$" format="pdf" visible="false" />
+    </collection>
+    </outputs>
+
+    <tests> <!-- Test file names are resolved relative to the test-data directory. -->
+        <test>
+            <param name="input_file" value="ids.txt"/>
+            <output_collection name="pdfs" type="list" count="2"/>
+        </test>
+    </tests>
+
+    <help><![CDATA[
+Download PDFs
+===================
+
+Tool to download PDFs for a list of publication IDs.
+
+    ]]></help>
+
+</tool>
\ No newline at end of file
diff --git a/tools/aoptk/aoptk_find_chemicals.xml b/tools/aoptk/aoptk_find_chemicals.xml
new file mode 100644
index 00000000..6c45b081
--- /dev/null
+++ b/tools/aoptk/aoptk_find_chemicals.xml
@@ -0,0 +1,73 @@
+<tool id="aoptk_find_chemicals" name="aoptk find chemicals" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="25.1" license="MIT">
+    <description>Detect chemicals in text.</description>
+    <macros>
+        <import>macros.xml</import>
+    </macros>
+
+    <requirements>
+        <expand macro="requirements"/>
+        <expand macro="openai_api_key_credentials"/>
+    </requirements>
+ 
+    <command detect_errors="exit_code"><![CDATA[
+        python3 '${find_chemicals}'
+    ]]></command>
+
+<configfiles>
+<configfile name="find_chemicals">
+import os
+from aoptk.text_generation_api import TextGenerationAPI
+from aoptk.literature.pdf import PDF
+from aoptk.literature.pymupdf_parser import PymupdfParser
+
+publication_id = os.path.splitext("$input_file.element_identifier")[0]
+openai_key = os.environ.get("OPENAI_KEY")
+text_generation_api = TextGenerationAPI(model="$llm_model", api_key=openai_key)
+
+if "${input_file.ext}" == "pdf":
+    text = PymupdfParser([PDF("$input_file")]).get_publications()[0].full_text
+    chemicals = text_generation_api.find_chemicals(text)
+
+elif "${input_file.ext}" == "txt":
+    with open("$input_file", "r") as f_in:
+        text = f_in.read()
+        chemicals = text_generation_api.find_chemicals(text)
+else:
+    raise ValueError(f"Unsupported input file format: {input_ext}")
+
+with open("chemicals.tsv", "w") as f_out:
+    f_out.write("id\tchemical\n")
+    for chemical in chemicals:
+        f_out.write(f"{publication_id}\t{chemical.name}\n")
+</configfile>
+</configfiles>
+
+    <inputs>
+        <expand macro="llm_models"/>
+        <expand macro="prompt_specification"/>
+        <param name="input_file" type="data" format="txt,pdf" label="Text to analyze" help="Input text file or PDF." />
+        <param argument="effect" type="text" value="" label="Effect to search" help="Specify the effect you want to search for.">
+            <validator type="regex">[0-9a-zA-Z]+</validator>
+        </param>
+    </inputs>
+
+    <outputs>
+        <data name="chemicals" format="tabular" from_work_dir="chemicals.tsv" label="Chemicals identified in text." />
+    </outputs>
+
+    <tests> <!-- Test file names are resolved relative to the test-data directory. -->
+        <test>
+            <param name="input_file" value="text.tsv"/>
+            <output name="chemicals" file="chemicals.tsv" compare="sim_size" delta="100"/>
+        </test>
+    </tests>
+
+    <help><![CDATA[
+Chemical Identification
+=======================
+
+Tool to identify chemical entities in a given text.
+
+    ]]></help>
+
+</tool>
\ No newline at end of file
diff --git a/tools/aoptk/aoptk_find_chemicals_non_llm.xml b/tools/aoptk/aoptk_find_chemicals_non_llm.xml
new file mode 100644
index 00000000..2b1619a5
--- /dev/null
+++ b/tools/aoptk/aoptk_find_chemicals_non_llm.xml
@@ -0,0 +1,65 @@
+<tool id="aoptk_find_chemicals_non_llm" name="aoptk find chemicals non llm" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="25.1" license="MIT">
+    <description>Detect chemicals in text.</description>
+    <macros>
+        <import>macros.xml</import>
+    </macros>
+
+    <requirements>
+        <expand macro="requirements"/>
+    </requirements>
+ 
+    <command detect_errors="exit_code"><![CDATA[
+        python3 '${find_chemicals_non_llm}'
+    ]]></command>
+
+<configfiles>
+<configfile name="find_chemicals_non_llm">
+from aoptk.spacy_text_processor import SpacyText
+from aoptk.literature.pdf import PDF
+from aoptk.literature.pymupdf_parser import PymupdfParser
+import os
+
+publication_id = os.path.splitext("$input_file.element_identifier")[0]
+
+if "${input_file.ext}" == "pdf":
+    text = PymupdfParser([PDF("$input_file")]).get_publications()[0].full_text
+    chemicals = SpacyText().find_chemical(text)
+
+elif "${input_file.ext}" == "txt":
+    with open("$input_file", "r") as f_in:
+        text = f_in.read()
+        chemicals = SpacyText().find_chemical(text)
+else:
+    raise ValueError(f"Unsupported input file format: {input_ext}")
+
+with open("chemicals.tsv", "w") as f_out:
+    f_out.write("id\tchemical\n")
+    for chemical in chemicals:
+        f_out.write(f"{publication_id}\t{chemical.name}\n")
+</configfile>
+</configfiles>
+
+    <inputs>
+        <param name="input_file" type="data" format="txt,pdf" label="Text to analyze" help="Input text file or PDF." />
+    </inputs>
+
+    <outputs>
+        <data name="chemicals" format="tabular" from_work_dir="chemicals.tsv" label="Chemicals identified in text." />
+    </outputs>
+
+    <tests> <!-- Test file names are resolved relative to the test-data directory. -->
+        <test>
+            <param name="input_file" value="text.tsv"/>
+            <output name="chemicals" file="chemicals.tsv" compare="sim_size" delta="100"/>
+        </test>
+    </tests>
+
+    <help><![CDATA[
+Chemical Identification
+=======================
+
+Tool to identify chemical entities in a given text.
+
+    ]]></help>
+
+</tool>
\ No newline at end of file
diff --git a/tools/aoptk/aoptk_find_relationships_non_llm.xml b/tools/aoptk/aoptk_find_relationships_non_llm.xml
new file mode 100644
index 00000000..12f8b20d
--- /dev/null
+++ b/tools/aoptk/aoptk_find_relationships_non_llm.xml
@@ -0,0 +1,84 @@
+<tool id="aoptk_find_relationships_text_non_llm" name="aoptk find relationships text non llm" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="25.1" license="MIT">
+    <description>Detect relationships between chemicals and effects in text.</description>
+    <macros>
+        <import>macros.xml</import>
+    </macros>
+
+    <requirements>
+        <expand macro="requirements"/>
+    </requirements>
+ 
+    <command detect_errors="exit_code"><![CDATA[
+        python3 '${find_relationships_text_non_llm}'
+    ]]></command>
+
+<configfiles>
+<configfile name="find_relationships_text_non_llm">
+import os
+import sys
+
+os.environ.setdefault("TORCHINDUCTOR_CACHE_DIR", os.path.join(os.getcwd(), ".torchinductor_cache"))
+os.makedirs(os.environ["TORCHINDUCTOR_CACHE_DIR"], exist_ok=True)
+
+from aoptk.spacy_text_processor import SpacyText
+from aoptk.relationships.zero_shot_classification_single import ZeroShotClassificationSingle
+from aoptk.literature.pdf import PDF
+from aoptk.literature.pymupdf_parser import PymupdfParser
+
+publication_id = os.path.splitext("$input_file.element_identifier")[0]
+effects = ["${effect}"]
+email = os.environ.get("EMAIL")
+
+if "${input_file.ext}" == "pdf":
+    text = PymupdfParser([PDF("$input_file")]).get_publications()[0].full_text
+    chemicals = SpacyText().find_chemical(text)
+    relationships = ZeroShotClassificationSingle().find_relationships(
+    text=text, chemicals=chemicals, effects=effects
+)
+
+elif "${input_file.ext}" == "txt":
+    with open("$input_file", "r") as f_in:
+        text = f_in.read()
+        chemicals = SpacyText().find_chemical(text)
+        relationships = ZeroShotClassificationSingle().find_relationships(
+        text=text, chemicals=chemicals, effects=effects
+    )
+
+else:
+    raise ValueError(f"Unsupported input file format: ${input_file.ext}")
+
+with open("relationships.tsv", "w") as f_out:
+    f_out.write("id\tchemical\teffect\trelationship\n")
+    for relationship in relationships:
+        f_out.write(f"{publication_id}\t{relationship.chemical}\t{relationship.effect}\t{relationship.relationship_type}\n")
+</configfile>
+</configfiles>
+
+    <inputs>
+        <param name="input_file" type="data" format="txt,pdf" label="Text to analyze" help="Input text file or PDF." />
+        <param argument="effect" type="text" value="" label="Effect to search" help="Specify the effect you want to search for.">
+            <validator type="regex">[0-9a-zA-Z]+</validator>
+        </param>
+    </inputs>
+
+    <outputs>
+        <data name="relationships" format="tabular" from_work_dir="relationships.tsv" label="Relationships identified in text." />
+    </outputs>
+
+    <tests> <!-- Test file names are resolved relative to the test-data directory. -->
+        <test>
+            <param name="input_file" value="text.tsv"/>
+            <param name="effect" value="liver fibrosis"/>
+            <output name="relationships" file="relationships.tsv" compare="sim_size" delta="100"/>
+        </test>
+    </tests>
+
+    <help><![CDATA[
+Relationship Identification
+===========================
+
+Tool to identify relationships between chemicals and effects in a given text.
+
+    ]]></help>
+
+</tool>
\ No newline at end of file
diff --git a/tools/aoptk/aoptk_find_relationships_text.xml b/tools/aoptk/aoptk_find_relationships_text.xml
new file mode 100644
index 00000000..2545c60f
--- /dev/null
+++ b/tools/aoptk/aoptk_find_relationships_text.xml
@@ -0,0 +1,86 @@
+<tool id="aoptk_find_relationships_text" name="aoptk find relationships text" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="25.1" license="MIT">
+    <description>Detect relationships between chemicals and effects in text.</description>
+    <macros>
+        <import>macros.xml</import>
+    </macros>
+
+    <requirements>
+        <expand macro="requirements"/>
+        <expand macro="openai_api_key_credentials"/>
+    </requirements>
+ 
+    <command detect_errors="exit_code"><![CDATA[
+        python3 '${find_relationships_text}'
+    ]]></command>
+
+<configfiles>
+<configfile name="find_relationships_text">
+import os
+from aoptk.text_generation_api import TextGenerationAPI
+from aoptk.relationship_type import Causative
+from aoptk.relationship_type import Inhibitive
+from aoptk.relationship_type import RelationshipType
+from aoptk.relationships.relationship import Relationship
+from aoptk.effect import Effect
+
+publication_id = os.path.splitext("$input_file.element_identifier")[0]
+effects = ["${effect}"]
+openai_key = os.environ.get("OPENAI_KEY")
+text_generation_api = TextGenerationAPI(model="$llm_model", api_key=openai_key)
+text_generation_api.specification_relationship_text_prompt="$prompt_specification"
+
+if "${input_file.ext}" == "pdf":
+    text = PymupdfParser([PDF("$input_file")]).inject_text_generation(TextGenerationAPI(model="redhatai-scout")).get_publications()[0].full_text
+    chemicals = text_generation_api.find_chemicals(text)
+    relationships = text_generation_api.find_relationships_in_text(
+    text=text, chemicals=chemicals, effects=effects
+)
+
+elif "${input_file.ext}" == "txt":
+    with open("$input_file", "r") as f_in:
+        text = f_in.read()
+        chemicals = text_generation_api.find_chemicals(text)
+        relationships = text_generation_api.find_relationships_in_text(
+        text=text, chemicals=chemicals, effects=effects
+    )
+
+else:
+    raise ValueError(f"Unsupported input file format: ${input_file.ext}")
+    
+with open("relationships.tsv", "w") as f_out:
+    f_out.write("id\tchemical\teffect\trelationship\n")
+    for relationship in relationships:
+        f_out.write(f"{publication_id}\t{relationship.chemical}\t{relationship.effect}\t{relationship.relationship_type}\n")
+</configfile>
+</configfiles>
+
+    <inputs>
+        <expand macro="llm_models"/>
+        <expand macro="prompt_specification"/>
+        <param name="input_file" type="data" format="txt,pdf" label="Text to analyze" help="Input text file or PDF." />
+        <param argument="effect" type="text" value="" label="Effect to search" help="Specify the effect you want to search for.">
+            <validator type="regex">[0-9a-zA-Z]+</validator>
+        </param>
+    </inputs>
+
+    <outputs>
+        <data name="relationships" format="tabular" from_work_dir="relationships.tsv" label="Relationships identified in text." />
+    </outputs>
+
+    <tests> <!-- Test file names are resolved relative to the test-data directory. -->
+        <test>
+            <param name="input_file" value="text.tsv"/>
+            <param name="effect" value="liver fibrosis"/>
+            <output name="relationships" file="relationships.tsv" compare="sim_size" delta="100"/>
+        </test>
+    </tests>
+
+    <help><![CDATA[
+Relationship Identification in Text
+===================================
+
+Tool to identify relationships between chemicals and effects in a given text.
+
+    ]]></help>
+
+</tool>
\ No newline at end of file
diff --git a/tools/aoptk/aoptk_find_relationships_text_images.xml b/tools/aoptk/aoptk_find_relationships_text_images.xml
new file mode 100644
index 00000000..88cb1295
--- /dev/null
+++ b/tools/aoptk/aoptk_find_relationships_text_images.xml
@@ -0,0 +1,107 @@
+<tool id="aoptk_find_relationships_text_images" name="aoptk find relationships text images" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="25.1" license="MIT">
+    <description>Detect relationships between chemicals and effects in text and images.</description>
+    <macros>
+        <import>macros.xml</import>
+    </macros>
+
+    <requirements>
+        <expand macro="requirements"/>
+        <expand macro="openai_api_key_credentials"/>
+    </requirements>
+
+    <command detect_errors="exit_code"><![CDATA[
+        python3 '${find_relationships_text_images}'
+    ]]></command>
+
+    <!-- Python driver rendered by Cheetah: collects the text plus an LLM description of every figure, then asks the text model for chemical/effect relationships and writes them to relationships.tsv. -->
+    <configfiles>
+        <configfile name="find_relationships_text_images">
+#import json
+## Free-text values are rendered with json.dumps so that quotes typed by
+## the user cannot terminate the Python string literal early.
+import os
+
+from aoptk.literature.pdf import PDF
+from aoptk.literature.pymupdf_parser import PymupdfParser
+from aoptk.text_generation_api import TextGenerationAPI
+
+publication_id = os.path.splitext(${json.dumps(str($input_file.element_identifier))})[0]
+effects = [${json.dumps(str($effect))}]
+openai_key = os.environ.get("OPENAI_KEY")
+
+text_generation_api = TextGenerationAPI(model="$llm_model", api_key=openai_key)
+text_generation_api.specification_relationship_text_prompt = ${json.dumps(str($prompt_specification))}
+## One authenticated client serves every image-to-text request.
+image_api = TextGenerationAPI(model="$llm_models_images", api_key=openai_key)
+
+## (name, path) pairs of the optional image collection; read for txt input only.
+supplied_images = [
+#if $input_images
+#for $supplied_image in $input_images
+    (${json.dumps(str($supplied_image.element_identifier))}, "$supplied_image"),
+#end for
+#end if
+]
+
+if "${input_file.ext}" == "pdf":
+    publication = PymupdfParser([PDF("$input_file")]).inject_text_generation(image_api).get_publications()[0]
+    text = publication.full_text
+    for image in publication.images:
+        text_image = image_api.convert_image(image_path=image.path, text=publication.full_text)
+        text += f"\n\n{image.name}:\n{text_image}"
+elif "${input_file.ext}" == "txt":
+    with open("$input_file", "r") as f_in:
+        source_text = f_in.read()
+    text = source_text
+    if supplied_images:
+        text += "\n\n\n\nALSO ANALYZE THESE FIGURES CONVERTED TO TEXT:"
+    for image_name, image_path in supplied_images:
+        text_image = image_api.convert_image(image_path=image_path, text=source_text)
+        text += f"\n\n{image_name}:\n{text_image}"
+else:
+    raise ValueError(f"Unsupported input file format: ${input_file.ext}")
+
+chemicals = text_generation_api.find_chemicals(text)
+relationships = text_generation_api.find_relationships_in_text(
+    text=text, chemicals=chemicals, effects=effects
+)
+
+with open("relationships.tsv", "w") as f_out:
+    f_out.write("id\tchemical\teffect\trelationship\n")
+    for relationship in relationships:
+        f_out.write(f"{publication_id}\t{relationship.chemical}\t{relationship.effect}\t{relationship.relationship_type}\n")
+        </configfile>
+    </configfiles>
+
+    <inputs>
+        <expand macro="llm_models"/>
+        <expand macro="prompt_specification"/>
+        <expand macro="llm_models_images"/>
+        <param name="input_file" type="data" format="txt,pdf" label="Text to analyze" help="Input text file or PDF." />
+        <param name="input_images" type="data_collection" collection_type="list" format="png,jpg,jpeg,gif,tif,tiff,bmp,webp" optional="true" label="Images to analyze" help="Input collection (folder) of image files. Only used with a text input; figures of a PDF are taken from the PDF itself." />
+        <param argument="effect" type="text" value="" label="Effect to search" help="Specify the effect you want to search for.">
+            <validator type="regex">[0-9a-zA-Z]+</validator>
+        </param>
+    </inputs>
+
+    <outputs>
+        <data name="relationships" format="tabular" from_work_dir="relationships.tsv" label="Relationships identified in text." />
+    </outputs>
+
+    <tests>
+        <test>
+            <param name="input_file" value="text.txt" ftype="txt"/>
+            <param name="effect" value="liver fibrosis"/>
+            <output name="relationships" file="relationships.tsv" compare="sim_size" delta="100"/>
+        </test>
+    </tests>
+
+    <help><![CDATA[
+Relationship Identification in Text and Images
+==============================================
+
+Tool to identify relationships between chemicals and effects in a given text and its figures.
+
+    ]]></help>
+
+</tool>
\ No newline at end of file
diff --git a/tools/aoptk/aoptk_parse_pdf.xml b/tools/aoptk/aoptk_parse_pdf.xml
new file mode 100644
index 00000000..798c1240
--- /dev/null
+++ b/tools/aoptk/aoptk_parse_pdf.xml
@@ -0,0 +1,65 @@
+<tool id="aoptk_parse_pdf" name="aoptk parse PDF" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="25.1" license="MIT">
+    <description>Parse PDF files.</description>
+    <macros>
+        <import>macros.xml</import>
+    </macros>
+
+    <requirements>
+        <expand macro="requirements"/>
+        <expand macro="openai_api_key_credentials"/>
+    </requirements>
+
+    <command detect_errors="exit_code"><![CDATA[
+        python3 '${parse_pdf}'
+    ]]></command>
+
+    <!-- Python driver rendered by Cheetah: extracts the full text of the first publication parsed from the PDF into parsed_text.txt. -->
+    <configfiles>
+        <configfile name="parse_pdf">
+import os
+
+from aoptk.literature.pdf import PDF
+from aoptk.literature.pymupdf_parser import PymupdfParser
+from aoptk.text_generation_api import TextGenerationAPI
+
+if "${input_file.ext}" != "pdf":
+    raise ValueError(f"Unsupported input file format: ${input_file.ext}")
+
+parser = PymupdfParser([PDF("$input_file")])
+## Text generation is only injected when an API key is present.
+openai_key = os.environ.get("OPENAI_KEY")
+if openai_key:
+    parser = parser.inject_text_generation(TextGenerationAPI(model="$llm_models_images", api_key=openai_key))
+
+publications = parser.get_publications()
+## Fixed file name: from_work_dir takes a literal path, not a glob pattern.
+with open("parsed_text.txt", "w") as f_out:
+    f_out.write(publications[0].full_text)
+        </configfile>
+    </configfiles>
+
+    <inputs>
+        <param name="input_file" type="data" format="pdf" label="PDF to parse" help="Input PDF." />
+        <expand macro="llm_models_images"/>
+    </inputs>
+
+    <outputs>
+        <data name="text" format="txt" from_work_dir="parsed_text.txt" label="Parsed text." />
+    </outputs>
+
+    <tests>
+        <test>
+            <param name="input_file" value="text.pdf"/>
+            <output name="text" file="text.txt" compare="sim_size" delta="100"/>
+        </test>
+    </tests>
+
+    <help><![CDATA[
+Parse PDF
+===================
+
+Tool to parse PDF files. API key for LLMs is optional and only needed for PDFs that are scanned images.
+
+    ]]></help>
+
+</tool>
\ No newline at end of file
diff --git a/tools/aoptk/aoptk_publication_tracker.xml b/tools/aoptk/aoptk_publication_tracker.xml
index b20a13ab..05e4a82d 100644
--- a/tools/aoptk/aoptk_publication_tracker.xml
+++ b/tools/aoptk/aoptk_publication_tracker.xml
@@ -6,6 +6,7 @@
 
     <requirements>
         <expand macro="requirements"/>
+        <expand macro="email_credentials"/>
     </requirements>
 
     <command detect_errors="exit_code"><![CDATA[
@@ -16,13 +17,15 @@
             --master 'master.${master.ext}'
             --code '$code'
             --query '$query'
             --database '$literature_database'
             --outdir .
             \${EMAIL:+--email \$EMAIL}
     ]]></command>
 
     <inputs>
-        <expand macro="inputs"/>
+        <expand macro="query"/>
+        <!-- The former "inputs" macro also carried the database selector; it is now a macro of its own and must be expanded explicitly. Its param is still named literature_database. -->
+        <expand macro="literature_database_pubmed_europepmc"/>
         <param argument="--code" type="text" value="" label="Your search code" help="Type your search code. E.g., 1.1. or 1.2.1.">
             <sanitizer invalid_char="">
                 <valid initial="string.digits">
diff --git a/tools/aoptk/aoptk_query_literature.xml b/tools/aoptk/aoptk_query_literature.xml
new file mode 100644
index 00000000..095cf849
--- /dev/null
+++ b/tools/aoptk/aoptk_query_literature.xml
@@ -0,0 +1,74 @@
+<tool id="aoptk_query_literature" name="aoptk query literature" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="25.1" license="MIT">
+    <description>Query literature for a list of publication IDs.</description>
+    <macros>
+        <import>macros.xml</import>
+    </macros>
+
+    <requirements>
+        <expand macro="requirements"/>
+        <expand macro="email_credentials"/>
+    </requirements>
+
+    <command detect_errors="exit_code"><![CDATA[
+        python3 '${query_literature}'
+    ]]></command>
+
+    <configfiles>
+        <configfile name="query_literature">
+#import json
+import os
+
+from Bio import Entrez
+
+from aoptk.literature.databases.europepmc import EuropePMC
+from aoptk.literature.databases.pmc import PMC
+from aoptk.literature.databases.pubmed import PubMed
+
+## json.dumps keeps quotes in the search term (e.g. quoted phrases) from
+## terminating the Python string literal.
+query = ${json.dumps(str($query))}
+## The selector macro names its param literature_database.
+database = "${literature_database}"
+
+clients = {"pubmed": PubMed, "europepmc": EuropePMC, "pmc": PMC}
+if database not in clients:
+    raise ValueError("Select valid database.")
+
+## The e-mail is only handed to Entrez for PubMed and PMC.
+if database in ("pubmed", "pmc"):
+    Entrez.email = os.environ.get("EMAIL")
+
+ids = clients[database](query).get_id()
+
+with open("ids.txt", "w") as f_out:
+    for publication_id in ids:
+        f_out.write(f"{publication_id}\n")
+        </configfile>
+    </configfiles>
+
+    <inputs>
+        <expand macro="query"/>
+        <expand macro="literature_database_pubmed_europepmc_pmc"/>
+    </inputs>
+
+    <outputs>
+        <data name="ids" format="txt" from_work_dir="ids.txt" label="List of IDs." />
+    </outputs>
+
+    <tests>
+        <test>
+            <param name="query" value="hepg2 thioacetamide"/>
+            <param name="literature_database" value="pubmed"/>
+            <output name="ids" file="ids.txt" compare="sim_size" delta="100"/>
+        </test>
+    </tests>
+
+    <help><![CDATA[
+Download IDs
+===================
+
+Tool to download publication IDs.
+
+    ]]></help>
+
+</tool>
\ No newline at end of file
diff --git a/tools/aoptk/macros.xml b/tools/aoptk/macros.xml
index 5c0881e5..3826a7a0 100644
--- a/tools/aoptk/macros.xml
+++ b/tools/aoptk/macros.xml
@@ -1,18 +1,30 @@
 <macros>
-    <token name="@TOOL_VERSION@">0.1.6</token>
+    <token name="@TOOL_VERSION@">0.2.0</token>
     <token name="@VERSION_SUFFIX@">0</token>
 
     <xml name="requirements">
         <requirement type="package" version="@TOOL_VERSION@">aoptk</requirement>
+    </xml>
+
+    <xml name="email_credentials"> <!-- Optional e-mail credential, injected into the job as the EMAIL environment variable. -->
         <credentials name="email_credentials" 
                      label="Your e-mail address" 
                      version="1.0"
                      description="E-mail is required to follow NCBI/PubMed guidelines.">
             <variable name="email" inject_as_env="EMAIL" optional="true"/>
-          </credentials>
+        </credentials>
+    </xml>
+
+    <xml name="openai_api_key_credentials"> <!-- Optional OpenAI key credential, injected into the job as the OPENAI_KEY environment variable. -->
+        <credentials name="openai_api_key_credentials" 
+                     label="Your OpenAI API key" 
+                     version="1.0"
+                     description="OpenAI API key is required to use the OpenAI API.">
+            <variable name="openai_key" inject_as_env="OPENAI_KEY" optional="true"/>
+        </credentials>
     </xml>
 
-    <xml name="inputs">
+    <xml name="query">
         <param argument="--query" type="text" value="" label="Your search term" help="Type your search term as you would in PubMed/Europe PMC.">
             <sanitizer invalid_char="">
                 <valid initial="string.letters,string.digits">
@@ -82,11 +94,109 @@
             </sanitizer>
             <validator type="regex">[0-9a-zA-Z_ ()*'"[\]\[\]\-:.\[\]α-ωΑ-Ω]+</validator>
         </param>
+    </xml>
+
+    <xml name="literature_database_pubmed_europepmc"> <!-- PubMed / Europe PMC selector. The param is named literature_database, so tools read it as $literature_database rather than under the macro's name. -->
         <param name="literature_database" type="select" label="Select which database to search." help="PubMed only accepts searches with up to 10 000 results. No limit for Europe PMC.">
             <option value="pubmed" selected="true">PubMed</option>
             <option value="europepmc">EuropePMC</option>
         </param>
     </xml>
+    <xml name="literature_database_pubmed_europepmc_pmc"> <!-- PubMed / Europe PMC / PMC selector. The param is named literature_database, so tools read it as $literature_database rather than under the macro's name. -->
+        <param name="literature_database" type="select" label="Select which database to search." help="PubMed only accepts searches with up to 10 000 results. No limit for Europe PMC and PMC.">
+            <option value="pubmed" selected="true">PubMed</option>
+            <option value="europepmc">EuropePMC</option>
+            <option value="pmc">PMC</option>
+        </param>
+    </xml>
+    <xml name="literature_database_europepmc_pmc"> <!-- Europe PMC / PMC selector (no PubMed option). The param is named literature_database. -->
+        <param name="literature_database" type="select" label="Select which database to search." help="No limit on the number of results for Europe PMC and PMC.">
+            <option value="europepmc">EuropePMC</option>
+            <option value="pmc">PMC</option>
+        </param>
+    </xml>
+    <xml name="llm_models"> <!-- Text model selector; the param is named llm_model (singular), so tools read it as $llm_model. -->
+        <param name="llm_model" type="select" label="Select LLM model." help="Choose the LLM to use for relationship detection.">
+            <option value="gpt-oss-120b">GPT OSS 120B</option>
+        </param>
+    </xml>
+    <xml name="llm_models_images"> <!-- Image model selector; the param shares the macro's name, so tools read it as $llm_models_images. -->
+        <param name="llm_models_images" type="select" label="Select LLM model to handle image data." help="Choose the LLM to use for image data processing.">
+            <option value="redhatai-scout">RedHatAI Scout</option>
+        </param>
+    </xml>
+    <xml name="prompt_specification"> <!-- Free-text prompt addition. The double quote is not whitelisted because tool scripts place the value inside a double-quoted Python string literal; the validator mirrors the sanitizer whitelist. -->
+        <param argument="--prompt_specification" type="text" value="" label="Prompt specification" help="Modify the prompt.">
+            <sanitizer invalid_char="">
+                <valid initial="string.letters,string.digits">
+                    <add value="_" />
+                    <add value=" " />
+                    <add value="&apos;" />
+                    <add value="." />
+                    <add value="(" />
+                    <add value=")" />
+                    <add value="*" />
+                    <add value="[" />
+                    <add value="]" />
+                    <add value="-" />
+                    <add value=":" />
+                    <add value="/" />
+                    <!-- Lowercase Greek letters -->
+                    <add value="α" />
+                    <add value="β" />
+                    <add value="γ" />
+                    <add value="δ" />
+                    <add value="ε" />
+                    <add value="ζ" />
+                    <add value="η" />
+                    <add value="θ" />
+                    <add value="ι" />
+                    <add value="κ" />
+                    <add value="λ" />
+                    <add value="μ" />
+                    <add value="ν" />
+                    <add value="ξ" />
+                    <add value="ο" />
+                    <add value="π" />
+                    <add value="ρ" />
+                    <add value="σ" />
+                    <add value="τ" />
+                    <add value="υ" />
+                    <add value="φ" />
+                    <add value="χ" />
+                    <add value="ψ" />
+                    <add value="ω" />
+                    <!-- Uppercase Greek letters -->
+                    <add value="Α" />
+                    <add value="Β" />
+                    <add value="Γ" />
+                    <add value="Δ" />
+                    <add value="Ε" />
+                    <add value="Ζ" />
+                    <add value="Η" />
+                    <add value="Θ" />
+                    <add value="Ι" />
+                    <add value="Κ" />
+                    <add value="Λ" />
+                    <add value="Μ" />
+                    <add value="Ν" />
+                    <add value="Ξ" />
+                    <add value="Ο" />
+                    <add value="Π" />
+                    <add value="Ρ" />
+                    <add value="Σ" />
+                    <add value="Τ" />
+                    <add value="Υ" />
+                    <add value="Φ" />
+                    <add value="Χ" />
+                    <add value="Ψ" />
+                    <add value="Ω" />
+                </valid>
+            </sanitizer>
+            <validator type="regex">[0-9a-zA-Z_ ()*'\[\]\-:/.α-ωΑ-Ω]+</validator>
+        </param>
+    </xml>
+
 
 
 <token name="@init_scores@">
diff --git a/tools/aoptk/test-data/chemicals.tsv b/tools/aoptk/test-data/chemicals.tsv
new file mode 100644
index 00000000..a373f17c
--- /dev/null
+++ b/tools/aoptk/test-data/chemicals.tsv
@@ -0,0 +1,4 @@
+id	chemical
+123	thioacetamide
+456	acetaminophen
+789	paracetamol
\ No newline at end of file
diff --git a/tools/aoptk/test-data/ids.txt b/tools/aoptk/test-data/ids.txt
new file mode 100644
index 00000000..45504114
--- /dev/null
+++ b/tools/aoptk/test-data/ids.txt
@@ -0,0 +1,2 @@
+41480994
+PMC12930283
\ No newline at end of file
diff --git a/tools/aoptk/test-data/normalized.tsv b/tools/aoptk/test-data/normalized.tsv
new file mode 100644
index 00000000..774b0683
--- /dev/null
+++ b/tools/aoptk/test-data/normalized.tsv
@@ -0,0 +1,4 @@
+heading	chemical
+thioacetamide	thioacetamide
+acetaminophen	acetaminophen
+acetaminophen	paracetamol
\ No newline at end of file
diff --git a/tools/aoptk/test-data/relationships.tsv b/tools/aoptk/test-data/relationships.tsv
new file mode 100644
index 00000000..62e0c8a8
--- /dev/null
+++ b/tools/aoptk/test-data/relationships.tsv
@@ -0,0 +1,2 @@
+id	chemical	effect	relationship
+text	thioacetamide	liver fibrosis	positive
\ No newline at end of file
diff --git a/tools/aoptk/test-data/text.pdf b/tools/aoptk/test-data/text.pdf
new file mode 100644
index 00000000..4fc5b3dc
Binary files /dev/null and b/tools/aoptk/test-data/text.pdf differ
diff --git a/tools/aoptk/test-data/text.txt b/tools/aoptk/test-data/text.txt
new file mode 100644
index 00000000..5b5f97da
--- /dev/null
+++ b/tools/aoptk/test-data/text.txt
@@ -0,0 +1 @@
+Thioacetamide is a chemical that causes liver fibrosis.
\ No newline at end of file