Spaces:
Running
on
Zero
Running
on
Zero
"""Prompt templates used for problems in the ether0 dataset.""" | |
# ruff: noqa: E501, W505 | |
NAME_IUPAC_PROMPTS = [ | |
"What are the SMILES from the IUPAC name: {iupac}?", | |
"Could you please tell me the SMILES representation for {iupac}?", | |
"I have {iupac}. What would its SMILES be?", | |
"Provide the SMILES string for the molecule named {iupac}.", | |
"Convert this IUPAC name into a SMILES format: {iupac}.", | |
"Give me the SMILES notation for the compound {iupac}.", | |
"What SMILES corresponds to the IUPAC chemical name {iupac}?", | |
"How can I represent {iupac} as a SMILES string?", | |
"Generate the SMILES structure for this compound: {iupac}.", | |
"If the molecule is called {iupac}, what's the SMILES representation?", | |
] | |
NAME_SMILES_PROMPTS = [ | |
"What is the IUPAC name of this molecule: {smiles}?", | |
"Could you please tell me the IUPAC name for the compound represented by the SMILES string: {smiles}?", | |
"I have a molecule here with the SMILES notation {smiles}. What would its IUPAC name be?", | |
"I'm working with a chemical compound, and its SMILES representation is {smiles}. Can you help me determine its IUPAC name?", | |
"What is the correct IUPAC nomenclature for a molecule with the SMILES code {smiles}?", | |
"I'm trying to identify a compound. Its SMILES string is {smiles}. What's its IUPAC name?", | |
"If I provide you with the SMILES string of a molecule, which is {smiles}, could you generate its IUPAC name for me?", | |
"I've encountered a molecule in my research, denoted by the SMILES {smiles}. I'd appreciate it if you could tell me its IUPAC name.", | |
"Can you derive the IUPAC name from this SMILES representation: {smiles}?", | |
"For a compound with the structural representation given by the SMILES {smiles}, what is the corresponding IUPAC name?", | |
] | |
REACTION_PROMPTS = [ | |
"What is the product of this reaction? {rxn_smiles}", | |
"If {rxn_smiles} are allowed to react, what would the resulting molecule be in SMILES format?", | |
"Can you predict the outcome of this chemical reaction? {rxn_smiles}", | |
"I have a reaction scheme here: {rxn_smiles}. What will be generated as the product?", | |
"Assuming the reaction {rxn_smiles} goes to completion, what is the SMILES representation of the product?", | |
"In this reaction: {rxn_smiles}, what compound is formed?", | |
"Given the reactants and conditions in {rxn_smiles}, what is the expected product?", | |
"After performing the reaction {rxn_smiles}, what would I obtain as the main product?", | |
"If I mix these reactants under the specified conditions, {rxn_smiles}, what is the SMILES of the product?", | |
"Please provide the SMILES string of the product for this reaction: {rxn_smiles}", | |
] | |
NAME_REACTION_PROMPTS = [ | |
"What is the name of this reaction?\n{rxn_smiles}", | |
"I have a reaction here with {rxn_smiles}. Can you tell me its commonly used name?", | |
"Given the reaction represented by {rxn_smiles}, what is the standard name associated with it?", | |
"If I were to describe this reaction, {rxn_smiles}, in a textbook, what reaction name would I use?", | |
"I'm trying to identify this reaction: {rxn_smiles}. What is its well-known name?", | |
"The reaction {rxn_smiles} is taking place. What's the name of this type of transformation?", | |
"I came across this reaction pathway: {rxn_smiles}. Do you know the name it generally goes by?", | |
"In the context of organic chemistry, what is the established name for the reaction shown here: {rxn_smiles}?", | |
"I'm writing a lab report and need to name this reaction, {rxn_smiles}. What should I call it?", | |
"Can you identify the name of the reaction that follows this scheme: {rxn_smiles}?", | |
] | |
COMPLETE_MOL_PROMPTS = [ | |
"I have a partial molecule represented by the SMILES string {smiles}. What is a valid completion of this molecule, providing only the remaining characters in SMILES format?", | |
"Given the incomplete SMILES fragment {smiles}, can you suggest a realistic ending to complete the molecule? Please provide only the additional SMILES characters needed.", | |
"I'm working with a molecule that's partially described as {smiles}. What sequence of SMILES characters would you add to make it a complete, valid molecule?", | |
"The beginning of a molecule's SMILES representation is {smiles}. How would you finish this SMILES string to represent a viable chemical compound? Only provide the continuation of the SMILES.", | |
"Imagine you need to complete the SMILES string {smiles}. What's a plausible way to extend it to form a complete molecule, expressed as the remaining SMILES characters?", | |
"If I give you the partial SMILES {smiles}, what's a reasonable way to finish it off to create a valid molecule? Respond with just the additional SMILES characters.", | |
"I'm trying to construct a molecule, and I have the start of its SMILES: {smiles}. Could you provide a completion for it, ensuring the final molecule is realistic? Only give me the rest of the SMILES string.", | |
"Here's a fragment of a SMILES string: {smiles}. What would be a chemically sound way to complete it? Respond with the missing portion of the SMILES representation.", | |
"Suppose you have the incomplete molecular structure {smiles} in SMILES. How would you complete it to represent a real molecule, adding only the necessary SMILES characters?", | |
"I have an unfinished molecule represented by the SMILES fragment {smiles}. Can you help me complete it by suggesting the remaining SMILES characters needed to make it a valid chemical structure?", | |
] | |
MOL_FORMULA_PROMPTS = [ | |
"A compound with formula {formula} was isolated from {source}. What is a plausible SMILES for it given this organism?", | |
"{source} makes a compound with this formula: {formula}. What SMILES structure might correspond to it?", | |
"In {source}, I found a substance with formula {formula}. What biosynthetically plausible SMILES might this represent?", | |
"Analysis of {source} revealed a compound ({formula}). What SMILES structure aligns with this organism's metabolism?", | |
"The organism {source} contains a compound with formula {formula}. What's a likely SMILES based on its biochemistry?", | |
"A {formula} compound was extracted from {source}. Based on this organism, what's a probable SMILES structure?", | |
"What SMILES could have the formula {formula} and be isolated from {source}?", | |
"What would be a biologically relevant SMILES for a {formula} compound isolated from the organism {source}?", | |
"The organism {source} produced a compound with formula {formula}, what SMILES structure makes biosynthetic sense?", | |
"A {formula} metabolite from {source} was identified. What's a biologically plausible compound for this (as SMILES)?", | |
] | |
FUNCTIONAL_GROUP_PROMPTS = [ | |
"Propose a compound with molecular formula {formula} that contains the following functional groups: {functional_group}.", | |
"Suggest a SMILES structure for a molecule with formula {formula} and the following functional groups: {functional_group}.", | |
"Given that a compound has formula {formula}, propose SMILES for one that also contains these groups: {functional_group}", | |
"Provide a reasonable SMILES for a chemical with molecular formula {formula} and these groups: {functional_group}.", | |
"Generate a SMILES representation for a molecule containing groups: {functional_group}. It should also have formula {formula}.", | |
"Identify a plausible SMILES for a chemical compound with formula {formula} containing these groups: {functional_group}.", | |
] | |
PROPERTY_TRIPLET_PROMPTS = [ | |
"I have a molecule {smiles1} with a {property} of {value1}. Which of these similar molecules will most likely {change} this property?\n{options}", | |
"Given a molecule ({smiles1}) having a {property} of {value1}, select the modified molecule below that would {change} this property significantly:\n{options}", | |
"Molecule {smiles1} currently exhibits {property} of {value1}. Which modifications from the list below would effectively {change} it?\n{options}", | |
"If molecule {smiles1} has a {property} value of {value1}, which of the following options would best {change} this property?\n{options}", | |
"Considering {smiles1} has a measured {property} of {value1}, which candidate modification listed would most effectively {change} this property?\n{options}", | |
"Molecule {smiles1} demonstrates a {property} of {value1}. Which similar molecule below is best suited to {change} this characteristic?\n{options}", | |
"Given molecule {smiles1} with {property} at {value1}, identify which molecule among the following options would {change} it most effectively:\n{options}", | |
"Starting from molecule {smiles1}, which shows a {property} of {value1}, choose the structural change below that would notably {change} this property:\n{options}", | |
"The molecule {smiles1} has a {property} of {value1}. Which molecule listed would optimally {change} this value?\n{options}", | |
"Given a {property} of {value1} for molecule {smiles1}, pick the best molecule from below to {change} this property:\n{options}", | |
] | |
# I have a molecule {smiles1} which is not a blood-brain barrier penetrating. Which of these similar molecules will most likely have this property?\n{options}", | |
PROPERTY_TRIPLET_PROMPTS_CAT = [ | |
"I have a molecule {smiles1} which {rel} {property}. Which of these similar molecules will most likely {irel} this property?\n{options}", | |
"Given molecule {smiles1} that {rel} {property}, which molecule below is likely to {irel} this property?\n{options}", | |
"Molecule {smiles1} currently {rel} {property}. Choose from these similar molecules the one most likely to {irel} this property:\n{options}", | |
"Considering {smiles1} {rel} {property}, identify which of the following candidates will most likely {irel} the characteristic:\n{options}", | |
"Given that molecule {smiles1} {rel} {property}, select from below the molecule most expected to {irel} this characteristic:\n{options}", | |
"Starting from molecule {smiles1} which {rel} {property}, determine which listed molecule is most likely to {irel} this property:\n{options}", | |
"If molecule {smiles1} {rel} {property}, which of these related structures will most probably {irel} that property?\n{options}", | |
"Given molecule {smiles1} {rel} {property}, select the similar molecule listed below most likely to {irel} this property:\n{options}", | |
] | |
# Which of the following options likely is a blood-brain barrier penetrating molecule? | |
# Which of the following options likely is not a blood-brain barrier penetrating molecule? | |
# Which of the following molecules is likely to not be blood-brain barrier penetrating? | |
PROPERTY_PROMPTS_CAT = [ | |
"Which of the following options likely is{rel} a {property} molecule?\n{options}", | |
"Which of the following molecules is likely to{rel} be {property}?\n{options}", | |
"Identify the molecule below that likely is{rel} a {property} molecule:\n{options}", | |
"From the list below, select the molecule most likely to{rel} be {property}:\n{options}", | |
"Choose the molecule from the options below that most probably is{rel} {property}:\n{options}", | |
"Among the following, which molecule likely is{rel} considered {property}?\n{options}", | |
"Select the molecule below most expected to{rel} have {property} properties:\n{options}", | |
"From these molecules, identify the one most likely to{rel} possess {property}:\n{options}", | |
"Which candidate below most probably is{rel} classified as a {property} molecule?\n{options}", | |
] | |
PROPERTY_PROMPTS = [ | |
"Which of the following molecules likely has a {property} of {value}?\n{options}", | |
"Identify the molecule below expected to have a {property} around {value}:\n{options}", | |
"From these options, select the molecule most likely exhibiting {property} of {value}:\n{options}", | |
"Determine which of the following molecules likely shows a {property} near {value}:\n{options}", | |
"Choose the molecule that would most plausibly have a {property} of {value} from the list below:\n{options}", | |
"Among the following, which molecule is predicted to have a {property} close to {value}?\n{options}", | |
"Given the choices below, pick the molecule most likely to possess a {property} of {value}:\n{options}", | |
"Select the molecule from these candidates that probably has a {property} of {value}:\n{options}", | |
"Which molecule listed here is most likely to have a {property} approximately equal to {value}?\n{options}", | |
"Identify which of the following molecules will most likely have a {property} of {value}:\n{options}", | |
] | |
RETRO_PROMPTS = [ | |
"Propose a 1-step synthesis for the molecule {smiles} using likely purchasable reactants.", | |
"Given the molecule {smiles}, suggest a 1-step synthesis using commercially available starting materials.", | |
"What is a plausible 1-step reaction for the molecule {smiles} using common reactants?", | |
"Suggest a commercially feasible one-step route to synthesize {smiles}.", | |
"Outline a practical single-step synthetic method to prepare the molecule {smiles}.", | |
"Design a straightforward 1-step reaction scheme for synthesizing {smiles} using commercially available reagents.", | |
"Identify a likely accessible precursor and reaction for a single-step synthesis of {smiles}.", | |
"Provide a realistic single-step synthetic pathway to obtain {smiles} from common chemicals.", | |
"Propose a viable one-step synthetic route toward the molecule {smiles} starting from purchasable precursors.", | |
"Suggest one plausible reaction step to generate {smiles} using standard, commercially sourced reactants.", | |
] | |
ORACLE_SOLUBILITY_PROMPTS = { | |
"tanimoto": [ | |
"Propose a small change to {smiles} to {direction} its solubility by about 1 logS.", | |
"Suggest a minimal structural modification to {smiles} that would {direction} its solubility by approximately 1 logS unit.", | |
"What minor alteration could be made to {smiles} to {direction} its solubility by roughly 1 logS?", | |
"Design a small molecular change to {smiles} that would {direction} its solubility by about 1 logS while maintaining overall similarity.", | |
"Identify a small structural adjustment to {smiles} that would {direction} its aqueous solubility by approximately 1 logS unit.", | |
], | |
"scaffold": [ | |
"Change {smiles} to {direction} its solubility by about 1 logS, but keep its scaffold", | |
"Modify {smiles} to {direction} its solubility by approximately 1 logS while preserving the core scaffold structure.", | |
"Suggest alterations to {smiles} that would {direction} its solubility by about 1 logS unit without changing the molecular scaffold.", | |
"How could {smiles} be transformed to {direction} its solubility by roughly 1 logS while maintaining its scaffold?", | |
"Design a derivative of {smiles} with {direction}d solubility (by about 1 logS) that retains the same molecular scaffold.", | |
], | |
"groups": [ | |
"Adjust {smiles} to {direction} its solubility by about 1 logS, but keep the following groups intact: {pretty_groups}", | |
"Modify {smiles} to achieve a {direction} in solubility of approximately 1 logS while preserving these functional groups: {pretty_groups}", | |
"How would you alter {smiles} to {direction} its solubility by about 1 logS unit without changing these key groups: {pretty_groups}?", | |
"Suggest structural changes to {smiles} that would {direction} its solubility by roughly 1 logS while maintaining these groups: {pretty_groups}", | |
"Design a variant of {smiles} with {direction}d solubility (by about 1 logS) that retains all of these intact functional groups: {pretty_groups}", | |
], | |
} | |
SMILES_FROM_FORMULA_PROMPTS = [ | |
"Propose a molecule that has the following formula: {formula}.", | |
"Generate a SMILES representation for a compound with the formula {formula}.", | |
"What is a plausible SMILES for a compound with the formula {formula}?", | |
"Given the formula {formula}, can you suggest a possible SMILES structure?", | |
"Create a SMILES representation for a molecule that corresponds to the formula {formula}.", | |
"Identify a potential SMILES for a compound with the molecular formula {formula}.", | |
"What SMILES structure could correspond to the formula {formula}?", | |
"Generate a plausible SMILES for a compound with the formula {formula}.", | |
"Given the formula {formula}, what would be a reasonable SMILES representation?", | |
"Propose a SMILES structure for a molecule with the formula {formula}.", | |
"Generate a SMILES representation for a compound with the formula {formula}.", | |
] | |