Benchmark Sets
Browse retrosynthesis benchmark datasets with ground-truth routes
| Name | Description | Targets | Stock |
|---|---|---|---|
SMILES
CCCCn1nc(C#N)c(-c2ccccc2N)c1CCCS(=O)(=O)c1ccccc1
InChIKey
CZGOEYCNDUSNNH-UHFFFAOYSA-N
Route Signature
33d496aa881d539d5ba26287118383803d71115bb988d42cd88b78414c588a47
Synthesis route with 7 steps
Route tree structure (JSON format)
{
"route": {
"id": "cmisc0b0j04am7qdd72gj8qdx",
"signature": "33d496aa881d539d5ba26287118383803d71115bb988d42cd88b78414c588a47",
"length": 7,
"isConvergent": false
},
"target": {
"id": "cmisc0b0j04al7qddnrkvizum",
"benchmarkSetId": "cmisc09u000007qddhq6eczgb",
"targetId": "n5-01104",
"moleculeId": "tdm1bfvcomiprf4z1w81rm0b",
"routeLength": 7,
"isConvergent": false,
"metadata": "{}",
"molecule": {
"id": "tdm1bfvcomiprf4z1w81rm0b",
"inchikey": "CZGOEYCNDUSNNH-UHFFFAOYSA-N",
"smiles": "CCCCn1nc(C#N)c(-c2ccccc2N)c1CCCS(=O)(=O)c1ccccc1"
},
"hasAcceptableRoutes": true,
"acceptableRoutesCount": 1
},
"rootNode": {
"id": "cmisc0b0k04an7qddis89a6mg",
"routeId": "cmisc0b0j04am7qdd72gj8qdx",
"moleculeId": "tdm1bfvcomiprf4z1w81rm0b",
"parentId": null,
"reactionStepId": "rccvpjcj9mcqs7xx4v72mck8",
"isLeaf": false,
"molecule": {
"id": "tdm1bfvcomiprf4z1w81rm0b",
"inchikey": "CZGOEYCNDUSNNH-UHFFFAOYSA-N",
"smiles": "CCCCn1nc(C#N)c(-c2ccccc2N)c1CCCS(=O)(=O)c1ccccc1"
},
"reactionStep": {
"id": "rccvpjcj9mcqs7xx4v72mck8",
"reactionHash": "836fc6d240867bda42feadaedc9734a061fc21bc63581eb2db01b9d403ed6aa3",
"template": null,
"metadata": "{\"ID\":\"US20090075980A1;1470;680896\",\"rsmi\":\"Br[c:10]1[c:7]([C:8]#[N:9])[n:6][n:5]([CH2:4][CH2:3][CH2:2][CH3:1])[c:18]1[CH2:19][CH2:20][CH2:21][S:22](=[O:23])(=[O:24])[c:25]1[cH:26][cH:27][cH:28][cH:29][cH:30]1.OB(O)[c:11]1[c:12]([NH2:13])[cH:14][cH:15][cH:16][cH:17]1>CCOC(C)=O.Cc1ccccc1.Cl.O=C(/C=C/c1ccccc1)/C=C/c1ccccc1.O=C(/C=C/c1ccccc1)/C=C/c1ccccc1.O=C(/C=C/c1ccccc1)/C=C/c1ccccc1.O=P(O)(O)O.[K+].[K+].[K+].[Pd].[Pd]>[CH3:1][CH2:2][CH2:3][CH2:4][n:5]1[n:6][c:7]([C:8]#[N:9])[c:10](-[c:11]2[c:12]([NH2:13])[cH:14][cH:15][cH:16][cH:17]2)[c:18]1[CH2:19][CH2:20][CH2:21][S:22](=[O:23])(=[O:24])[c:25]1[cH:26][cH:27][cH:28][cH:29][cH:30]1\"}"
},
"children": [
{
"id": "cmisc0b0k04ao7qdd7kwjaz3i",
"routeId": "cmisc0b0j04am7qdd72gj8qdx",
"moleculeId": "w4mknxrt2hwlzc7gkudpxtdl",
"parentId": "cmisc0b0k04an7qddis89a6mg",
"reactionStepId": "but4dh67hendbi5m6kx8fadb",
"isLeaf": false,
"molecule": {
"id": "w4mknxrt2hwlzc7gkudpxtdl",
"inchikey": "HEIHCDYKIBDBLU-UHFFFAOYSA-N",
"smiles": "CCCCn1nc(C#N)c(Br)c1CCCS(=O)(=O)c1ccccc1"
},
"reactionStep": {
"id": "but4dh67hendbi5m6kx8fadb",
"reactionHash": "f6fbe230280dae30d72065155bdb21dec4d19beac711b661b2bfb7a4566baa8c",
"template": null,
"metadata": "{\"ID\":\"US20090075980A1;1469;680895\",\"rsmi\":\"Br[Br:11].[CH3:1][CH2:2][CH2:3][CH2:4][n:5]1[n:6][c:7]([C:8]#[N:9])[cH:10][c:12]1[CH2:13][CH2:14][CH2:15][S:16](=[O:17])(=[O:18])[c:19]1[cH:20][cH:21][cH:22][cH:23][cH:24]1>CC(=O)O.CC(=O)O.O=S(O)(O)=S.[K+].[Na+].[Na+]>[CH3:1][CH2:2][CH2:3][CH2:4][n:5]1[n:6][c:7]([C:8]#[N:9])[c:10]([Br:11])[c:12]1[CH2:13][CH2:14][CH2:15][S:16](=[O:17])(=[O:18])[c:19]1[cH:20][cH:21][cH:22][cH:23][cH:24]1\"}"
},
"children": [
{
"id": "cmisc0b0k04aq7qdd1o3t3v4m",
"routeId": "cmisc0b0j04am7qdd72gj8qdx",
"moleculeId": "q30x62ijpb42sfoxl7crkizy",
"parentId": "cmisc0b0k04ao7qdd7kwjaz3i",
"reactionStepId": null,
"isLeaf": true,
"molecule": {
"id": "q30x62ijpb42sfoxl7crkizy",
"inchikey": "GDTBXPJZTBHREO-UHFFFAOYSA-N",
"smiles": "BrBr"
},
"reactionStep": null,
"children": []
},
{
"id": "cmisc0b0k04ar7qdd503jv1wy",
"routeId": "cmisc0b0j04am7qdd72gj8qdx",
"moleculeId": "q9z2jt2t0njpz5pa0pyh8w5j",
"parentId": "cmisc0b0k04ao7qdd7kwjaz3i",
"reactionStepId": "rzhx1nz7b972pvs1h7um3n90",
"isLeaf": false,
"molecule": {
"id": "q9z2jt2t0njpz5pa0pyh8w5j",
"inchikey": "MNSQXCKTGBCVME-UHFFFAOYSA-N",
"smiles": "CCCCn1nc(C#N)cc1CCCS(=O)(=O)c1ccccc1"
},
"reactionStep": {
"id": "rzhx1nz7b972pvs1h7um3n90",
"reactionHash": "463438d47cb649042c77c3c7eb2aaec21c58c9029e7dfac33d32c0d1f196c324",
"template": null,
"metadata": "{\"ID\":\"US20090075980A1;1468;680894\",\"rsmi\":\"O=[C:8]([c:7]1[n:6][n:5]([CH2:4][CH2:3][CH2:2][CH3:1])[c:11]([CH2:12][CH2:13][CH2:14][S:15](=[O:16])(=[O:17])[c:18]2[cH:19][cH:20][cH:21][cH:22][cH:23]2)[cH:10]1)[NH2:9]>O=P(Cl)(Cl)Cl.N.O>[CH3:1][CH2:2][CH2:3][CH2:4][n:5]1[n:6][c:7]([C:8]#[N:9])[cH:10][c:11]1[CH2:12][CH2:13][CH2:14][S:15](=[O:16])(=[O:17])[c:18]1[cH:19][cH:20][cH:21][cH:22][cH:23]1\"}"
},
"children": [
{
"id": "cmisc0b0l04as7qddrrx6sq9v",
"routeId": "cmisc0b0j04am7qdd72gj8qdx",
"moleculeId": "fhir02gagl2to5copsegbwyn",
"parentId": "cmisc0b0k04ar7qdd503jv1wy",
"reactionStepId": "pxqfu63dghopj2z6mb1yb0pf",
"isLeaf": false,
"molecule": {
"id": "fhir02gagl2to5copsegbwyn",
"inchikey": "SRUJRCRWAOVHEG-UHFFFAOYSA-N",
"smiles": "CCCCn1nc(C(N)=O)cc1CCCS(=O)(=O)c1ccccc1"
},
"reactionStep": {
"id": "pxqfu63dghopj2z6mb1yb0pf",
"reactionHash": "17a2842d658bc793a75606fef79a7d1051e187c0dc6f05cad1b1e8db09245fb4",
"template": null,
"metadata": "{\"ID\":\"US20090075980A1;1467;680893\",\"rsmi\":\"O[C:8]([c:7]1[n:6][n:5]([CH2:4][CH2:3][CH2:2][CH3:1])[c:12]([CH2:13][CH2:14][CH2:15][S:16](=[O:17])(=[O:18])[c:19]2[cH:20][cH:21][cH:22][cH:23][cH:24]2)[cH:11]1)=[O:10].[NH3:9]>CN(C)C=O.ClCCl.O=C(Cl)C(=O)Cl.Cl>[CH3:1][CH2:2][CH2:3][CH2:4][n:5]1[n:6][c:7]([C:8]([NH2:9])=[O:10])[cH:11][c:12]1[CH2:13][CH2:14][CH2:15][S:16](=[O:17])(=[O:18])[c:19]1[cH:20][cH:21][cH:22][cH:23][cH:24]1\"}"
},
"children": [
{
"id": "cmisc0b0l04at7qddx82j6qz7",
"routeId": "cmisc0b0j04am7qdd72gj8qdx",
"moleculeId": "rgje08kz8rcl6tsq6yh96z0r",
"parentId": "cmisc0b0l04as7qddrrx6sq9v",
"reactionStepId": "g3ry1rx1edoq7c4lyq8i1hrl",
"isLeaf": false,
"molecule": {
"id": "rgje08kz8rcl6tsq6yh96z0r",
"inchikey": "SIMUECUFERWAPD-UHFFFAOYSA-N",
"smiles": "CCCCn1nc(C(=O)O)cc1CCCS(=O)(=O)c1ccccc1"
},
"reactionStep": {
"id": "g3ry1rx1edoq7c4lyq8i1hrl",
"reactionHash": "e5fd577f883f7cbbd40b9c4aae884e3c6b4b4fdf922bd303d083dea02130df0f",
"template": null,
"metadata": "{\"ID\":\"US20090075980A1;1466;680892\",\"rsmi\":\"CC[O:10][C:8]([c:7]1[n:6][n:5]([CH2:4][CH2:3][CH2:2][CH3:1])[c:12]([CH2:13][CH2:14][CH2:15][S:16](=[O:17])(=[O:18])[c:19]2[cH:20][cH:21][cH:22][cH:23][cH:24]2)[cH:11]1)=[O:9]>CCO.[Na+].O>[CH3:1][CH2:2][CH2:3][CH2:4][n:5]1[n:6][c:7]([C:8](=[O:9])[OH:10])[cH:11][c:12]1[CH2:13][CH2:14][CH2:15][S:16](=[O:17])(=[O:18])[c:19]1[cH:20][cH:21][cH:22][cH:23][cH:24]1\"}"
},
"children": [
{
"id": "cmisc0b0l04av7qddsu18qjn8",
"routeId": "cmisc0b0j04am7qdd72gj8qdx",
"moleculeId": "zmfsdbnt0ije635uehwl7ln1",
"parentId": "cmisc0b0l04at7qddx82j6qz7",
"reactionStepId": "eeubgg44hhz5hncf4j8chuq6",
"isLeaf": false,
"molecule": {
"id": "zmfsdbnt0ije635uehwl7ln1",
"inchikey": "GPTLQRWFDXLVFW-UHFFFAOYSA-N",
"smiles": "CCCCn1nc(C(=O)OCC)cc1CCCS(=O)(=O)c1ccccc1"
},
"reactionStep": {
"id": "eeubgg44hhz5hncf4j8chuq6",
"reactionHash": "d7c943be13578491f717c6bad84660eac72911c9dae3eef865aa3a85efdbe16b",
"template": null,
"metadata": "{\"ID\":\"US20090075980A1;1465;680891\",\"rsmi\":\"CCO[C:7](=O)[C:8](=[O:9])[O:10][CH2:11][CH3:12].O=[C:14]([CH3:13])[CH2:15][CH2:16][CH2:17][S:18](=[O:19])(=[O:20])[c:21]1[cH:22][cH:23][cH:24][cH:25][cH:26]1.[CH3:1][CH2:2][CH2:3][CH2:4][NH:5][NH2:6]>CC(=O)O.CC(=O)O.CC(C)(C)O.CCO.O=C(O)C(=O)O.[K+].[Na+]>[CH3:1][CH2:2][CH2:3][CH2:4][n:5]1[n:6][c:7]([C:8](=[O:9])[O:10][CH2:11][CH3:12])[cH:13][c:14]1[CH2:15][CH2:16][CH2:17][S:18](=[O:19])(=[O:20])[c:21]1[cH:22][cH:23][cH:24][cH:25][cH:26]1\"}"
},
"children": [
{
"id": "cmisc0b0l04aw7qdda7ope8c5",
"routeId": "cmisc0b0j04am7qdd72gj8qdx",
"moleculeId": "u5wwz8kctweeh199wcz09xvk",
"parentId": "cmisc0b0l04av7qddsu18qjn8",
"reactionStepId": "pdci6whu0j8oeek2olutquyc",
"isLeaf": false,
"molecule": {
"id": "u5wwz8kctweeh199wcz09xvk",
"inchikey": "LBJLEWKUPTYQMS-UHFFFAOYSA-N",
"smiles": "CC(=O)CCCS(=O)(=O)c1ccccc1"
},
"reactionStep": {
"id": "pdci6whu0j8oeek2olutquyc",
"reactionHash": "64df1e7473aa984024d5fe2d541bf4e5d5500e67827238fcce701c6767e58abc",
"template": null,
"metadata": "{\"ID\":\"US20090075980A1;1464;680890\",\"rsmi\":\"CCOC(=O)[CH:4]([C:2]([CH3:1])=[O:3])[CH2:5][CH2:6][S:7](=[O:8])(=[O:9])[c:10]1[cH:11][cH:12][cH:13][cH:14][cH:15]1>CCO.Cl>[CH3:1][C:2](=[O:3])[CH2:4][CH2:5][CH2:6][S:7](=[O:8])(=[O:9])[c:10]1[cH:11][cH:12][cH:13][cH:14][cH:15]1\"}"
},
"children": [
{
"id": "cmisc0b0l04az7qddu258frwj",
"routeId": "cmisc0b0j04am7qdd72gj8qdx",
"moleculeId": "uian4icfruzogd7t72c0g6ok",
"parentId": "cmisc0b0l04aw7qdda7ope8c5",
"reactionStepId": null,
"isLeaf": true,
"molecule": {
"id": "uian4icfruzogd7t72c0g6ok",
"inchikey": "PQFSLTSAOIDRSY-UHFFFAOYSA-N",
"smiles": "CCOC(=O)C(CCS(=O)(=O)c1ccccc1)C(C)=O"
},
"reactionStep": null,
"children": []
}
]
},
{
"id": "cmisc0b0l04ax7qdd86szh985",
"routeId": "cmisc0b0j04am7qdd72gj8qdx",
"moleculeId": "ze3o6kzjuze66ba4mo9ex9mu",
"parentId": "cmisc0b0l04av7qddsu18qjn8",
"reactionStepId": null,
"isLeaf": true,
"molecule": {
"id": "ze3o6kzjuze66ba4mo9ex9mu",
"inchikey": "XKLVLDXNZDIDKQ-UHFFFAOYSA-N",
"smiles": "CCCCNN"
},
"reactionStep": null,
"children": []
},
{
"id": "cmisc0b0l04ay7qdd43m06v98",
"routeId": "cmisc0b0j04am7qdd72gj8qdx",
"moleculeId": "xkkag5bit55pvgpjepliywrf",
"parentId": "cmisc0b0l04av7qddsu18qjn8",
"reactionStepId": null,
"isLeaf": true,
"molecule": {
"id": "xkkag5bit55pvgpjepliywrf",
"inchikey": "WYACBZDAHNBPPB-UHFFFAOYSA-N",
"smiles": "CCOC(=O)C(=O)OCC"
},
"reactionStep": null,
"children": []
}
]
}
]
},
{
"id": "cmisc0b0l04au7qddnl6cbtrx",
"routeId": "cmisc0b0j04am7qdd72gj8qdx",
"moleculeId": "f8e2zb4tye7yqtxjpdjfu06c",
"parentId": "cmisc0b0l04as7qddrrx6sq9v",
"reactionStepId": null,
"isLeaf": true,
"molecule": {
"id": "f8e2zb4tye7yqtxjpdjfu06c",
"inchikey": "QGZKDVFQNNGYKY-UHFFFAOYSA-N",
"smiles": "N"
},
"reactionStep": null,
"children": []
}
]
}
]
}
]
},
{
"id": "cmisc0b0k04ap7qddrjaa7xn7",
"routeId": "cmisc0b0j04am7qdd72gj8qdx",
"moleculeId": "xvxejazz55helk2ndlfvzg5q",
"parentId": "cmisc0b0k04an7qddis89a6mg",
"reactionStepId": null,
"isLeaf": true,
"molecule": {
"id": "xvxejazz55helk2ndlfvzg5q",
"inchikey": "DIRRKLFMHQUJCM-UHFFFAOYSA-N",
"smiles": "Nc1ccccc1B(O)O"
},
"reactionStep": null,
"children": []
}
]
}
}