Integrate with API v2 (#6)

brunokam · ardcore · Marek · web-flow · commit 2257de2eacd6 · 2021-09-16T16:09:11.000+02:00
* Adapt python wrapper to API v2

* Add InvalidTargetStrategy support

* Update setup.py

* Readme update

* Update API docs link

* Improved readme, version bump

* Update README.md

Co-authored-by: Mateusz Bruno-Kamiński <bruno@molecule.one>

* Update README.md

Co-authored-by: Mateusz Bruno-Kamiński <bruno@molecule.one>

* Update README.md

Co-authored-by: Mateusz Bruno-Kamiński <bruno@molecule.one>

* Update README.md

Co-authored-by: Mateusz Bruno-Kamiński <bruno@molecule.one>

Co-authored-by: Szymon Pilkowski <s.pilkowski@molecule.one>
Co-authored-by: Marek <marek@devalchemist.com>
Co-authored-by: Michał Krutul <m.krutul@molecule.one>
diff --git a/README.md b/README.md
@@ -12,25 +12,47 @@ pip install git+https://github.com/molecule-one/m1wrapper-python
 from m1wrapper import MoleculeOneWrapper
 m1wrapper = MoleculeOneWrapper(api_token, 'https://app.molecule.one')
 ```
-- *api_token*: API token you'll need to authorize in our system. You can get
+- *api_token*: API token you'll need to authorize in our system. You can
   generate yours at https://app.molecule.one/dashboard/user/api-tokens
 - *api_base_url* (optional): URI of the batch scoring service. Defaults to Molecule One's public
   server, but you will need to provide custom value if you're using a dedicated solution.
 
-### Running batch scoring request:
+### Getting a list of batch scoring requests:
+```py
+searches = m1wrapper.list_batch_searches()
+```
+
+### Running new batch scoring request:
 ```py
 search = m1wrapper.run_batch_search(
     targets=['cc', 'O=C(Nc1cc(Nc2nc(-c3cnccc3)ccn2)c(cc1)C)c3ccc(cc3)CN3CCN(CC3)C'],
-    parameters={'exploratory_search': False, 'detail_level': 'score'}
+    parameters={'model': 'gat'}
 )
 ```
 - *targets*: list of target compounds in SMILES format
 - *parameters* (optional): additional configuration for your batch
-  scoring request. See [Batch Scoring API](https://github.com/molecule-one/api/blob/master/batch-scoring.md) for more information.
-- *priority* (optional): priority of the batch request.
+  scoring request. See [Batch Scoring API](https://github.com/molecule-one/api/blob/master/api-v2.md) for more information.
+- *detail_level* (optional): [detail level of the batch request](#batch-scoring-detail-level)
+- *priority* (optional): [priority of the batch request](#batch-scoring-priorities)
+- *invalid_target_strategy* (optional): if set to `InvalidTargetStrategy.PASS`, targets that cannot be canonicalized by our SMILES parser won't cause the whole batch request to be rejected. Defaults to `InvalidTargetStrategy.REJECT`.
 - *starting_materials* (optional): list of available compounds in SMILES format
 
-### Batch scoring priorities:
+### Batch scoring detail level
+Detail level determines how much information about each target synthesis you'll get. We define it as a `DetailLevel` enum with two variants:
+- `DetailLevel.SCORE` (default) - useful when you're not interested in full synthesis json/UI preview, but only numerical values
+- `DetailLevel.SYNTHESIS` - when you're also interested in reactions and compounds leading to the target product
+#### Example:
+```py
+from m1wrapper import MoleculeOneWrapper, DetailLevel
+m1wrapper = MoleculeOneWrapper(api_token, 'https://app.molecule.one')
+search = m1wrapper.run_batch_search(
+    targets=['cc', 'O=C(Nc1cc(Nc2nc(-c3cnccc3)ccn2)c(cc1)C)c3ccc(cc3)CN3CCN(CC3)C'],
+    parameters={'model': 'gat', },
+    detail_level=DetailLevel.SCORE
+)
+```
+
+### Batch scoring priorities
 Priorities are defined as integers in a range of 1 to 10. Requests with higher priority will be processed before those with lower priority.
 For convenience, we also define a `Priority` enum with the following variants:
 - `Priority.LOWEST` (1)
@@ -45,8 +67,9 @@ from m1wrapper import MoleculeOneWrapper, Priority
 m1wrapper = MoleculeOneWrapper(api_token, 'https://app.molecule.one')
 search = m1wrapper.run_batch_search(
     targets=['cc', 'O=C(Nc1cc(Nc2nc(-c3cnccc3)ccn2)c(cc1)C)c3ccc(cc3)CN3CCN(CC3)C'],
-    parameters={'exploratory_search': False, 'detail_level': 'score'},
-    priority=Priority.HIGH)
+    parameters={'model': 'gat'},
+    priority=Priority.HIGH
+)
 ```
 
 ### Getting existing scoring request by id:
@@ -71,32 +94,53 @@ Results are made available as soon as they are processed. This method
 provides a way to start working with some of your results without waiting until all targets are processed.
 This usually means implementing some kind of polling/scheduling on your side.
 ```py
-results = search.get_partial_results(precision=5, only=["targetSmiles, "result"])
+results = search.get_partial_results(precision=5, only=["target_smiles", "result"])
 ```
 - *precision* (optional): format the floating point scores returned by the system (certainty, result, price) to the given number of significant digits.
 - *only* (optional): fetch only a subset of values. Defaults to
   all values.
 
+Returns an object of the following shape:
+```python
+    [
+      {
+        'target_smiles': 'Cc1ccc(cc1Nc2nccc(n2)c3cccnc3)NC(=O)c4ccc(cc4)CN5CCN(CC5)C',
+        'result': '7.53000'
+      },
+      ...
+    ]
+```
+#### All values:
+```py
+results = search.get_partial_results(precision=5)
+```
+
 Returns an object of the following shape:
 ```python
     [
       {
-        "targetSmiles": "Cc1ccc(cc1Nc2nccc(n2)c3cccnc3)NC(=O)c4ccc(cc4)CN5CCN(CC5)C",
-        "status": "ok",
-        "result": "7.53",
-        "certainty": "0.581",
-        "price": "5230",
-        "reactionCount": 5,
-        "timedOut": false
+        'target_smiles': 'Cc1ccc(cc1Nc2nccc(n2)c3cccnc3)NC(=O)c4ccc(cc4)CN5CCN(CC5)C',
+        'status': 'ok',
+        'result': '7.53000',
+        'certainty': '0.581',
+        'price': '5230',
+        'reaction_count': 5,
+        'timed_out': False,
+        'started_at': '2021-09-13T14:45:31.012Z',
+        'finished_at': '2021-09-13T14:46:39.199Z',
+        'running_time': 68.187,
+        'url': 'https://app.molecule.one/dashboard/synthesis-plans/batch/b787bf5f-6736-443c-bef1-8f10a37da246/result/0e3c6e13-fce1-46ba-9811-8fe66e0e4122'
       },
-    ...
+      ...
     ]
 ```
+
 See [Batch Scoring API](https://github.com/molecule-one/api/blob/master/batch-scoring.md) for a full explanation of returned fields.
 
 ### Getting complete results:
 ```py
-results = search.get_results(precision=5, only=["targetSmiles, "result"])
+results = search.get_results(precision=5, only=["target_smiles", "result"])
 ```
 If you don't want to implement scheduling on your own, this method
 provides a simple way to wait until all targets are processed (sending periodical checks using
diff --git a/examples/example.py b/examples/example.py
@@ -1,14 +1,20 @@
-from m1wrapper import MoleculeOneWrapper
+from m1wrapper import MoleculeOneWrapper, Priority, DetailLevel
 
 if __name__ == '__main__':
     # get your token at https://app.molecule.one/dashboard/user/api-tokens
     token = 'f4614b1d96124d09ab14fbe6537c9007_4ea55651a3904037b9fe4c4a72d2b85d'
 
     m1wrapper = MoleculeOneWrapper(token)
 
+    searches = m1wrapper.list_batch_searches()
+    print('previous searches:', searches)
+
     search = m1wrapper.run_batch_search(
-        targets=['cc', 'O=C(Nc1cc(Nc2nc(-c3cnccc3)ccn2)c(cc1)C)c3ccc(cc3)CN3CCN(CC3)C'],
-        parameters={'exploratory_search': False, 'detail_level': 'score'}
+        targets=[
+            'cc', 'O=C(Nc1cc(Nc2nc(-c3cnccc3)ccn2)c(cc1)C)c3ccc(cc3)CN3CCN(CC3)C'],
+        parameters={'model': 'gat'},
+        detail_level=DetailLevel.SCORE,
+        priority=Priority.LOW
     )
     print('created search:', search.search_id)
 
@@ -24,7 +30,8 @@
     partial_results = search.get_partial_results()
     print("partial results:", partial_results)
 
-    results = search.get_results(precision=4, only=['targetSmiles', 'price', 'result'])
+    results = search.get_results(
+        precision=4, only=['target_smiles', 'price', 'result'])
     print('results:', results)
 
     m1wrapper.delete_batch_search(search.search_id)
diff --git a/m1wrapper/__init__.py b/m1wrapper/__init__.py
@@ -1 +1,2 @@
-from .m1wrapper import MoleculeOneWrapper, Priority
+from .m1wrapper import MoleculeOneWrapper, Priority, DetailLevel, InvalidTargetStrategy
+from .traverse import traverse_modify
diff --git a/m1wrapper/config.py b/m1wrapper/config.py
@@ -2,6 +2,7 @@
 api_token_version = 'v1'
 api_base_url = 'https://app.molecule.one/'
 api_search_endpoint = 'batch-search'
+api_status_endpoint = 'batch-search-status'
 api_results_endpoint = 'batch-search-result'
 status_check_delay_s = 15
 http_backoff_factor = 5
diff --git a/m1wrapper/errors.py b/m1wrapper/errors.py
@@ -0,0 +1,18 @@
+import requests
+
+def format_error_message(error):
+    if error["message"] and error["errors"]:
+        return f'{error["message"]}: {repr(error["errors"])}'
+    if error["message"]:
+        return f'{error["message"]}'
+    else:
+        return "unknown error"
+
+
+def maybe_handle_error(response):
+    if response.status_code >= 400 and response.status_code < 500:
+        error = format_error_message(response.json())
+        raise requests.exceptions.HTTPError(error)
+    else:
+        response.raise_for_status()
+
diff --git a/m1wrapper/m1wrapper.py b/m1wrapper/m1wrapper.py
@@ -1,8 +1,19 @@
+import requests
+from urllib.parse import urljoin
 from typing import List, Dict
-from enum import IntEnum
+from enum import Enum, IntEnum
 
 from .search import BatchSearch
-from .config import api_token_version, wrapper_version, api_base_url
+from .config import (
+    api_token_version,
+    wrapper_version,
+    api_base_url,
+    api_search_endpoint
+)
+
+from .errors import (
+    maybe_handle_error
+)
 
 class Priority(IntEnum):
     LOWEST = 1,
@@ -11,6 +22,14 @@ class Priority(IntEnum):
     HIGH = 8,
     HIGHEST = 10
 
+class DetailLevel(str, Enum):
+    SCORE = 'score',
+    SYNTHESIS = 'synthesis'
+
+class InvalidTargetStrategy(str, Enum):
+    REJECT = 'reject',
+    PASS = 'pass'
+
 class MoleculeOneWrapper:
     """
     Wrapper for MoleculeOne Batch Scoring REST API
@@ -22,7 +41,7 @@ def __init__(
         api_base_url: str = api_base_url
     ):
         self.api_token = api_token
-        self.api_base_url = f'{api_base_url}/api/v1/'
+        self.api_base_url = f'{api_base_url}/api/v2/'
         self.request_headers = self.__prepare_request_headers()
 
     def __prepare_request_headers(self) -> dict:
@@ -31,29 +50,44 @@ def __prepare_request_headers(self) -> dict:
             'User-Agent': f'api-wrapper-python/{wrapper_version}',
             'Authorization': f'ApiToken-{api_token_version} {self.api_token}'
         }
+    
+    def list_batch_searches(self):
+        response = requests.get(
+            urljoin(self.api_base_url, api_search_endpoint),
+            headers=self.request_headers,
+        )
+        print(response)
+        maybe_handle_error(response)
+        return response.json()
 
     def run_batch_search(
             self,
             targets: List[str],
             parameters: Dict = None,
+            detail_level = DetailLevel.SCORE,
             priority = Priority.NORMAL,
+            invalid_target_strategy = InvalidTargetStrategy.REJECT ,
             starting_materials: List[str] = None,
     ) -> BatchSearch:
         return BatchSearch(
                 self.api_base_url,
                 self.request_headers,
                 targets=targets,
                 parameters=parameters,
+                detail_level=detail_level,
                 priority=int(priority),
+                invalid_target_strategy=invalid_target_strategy,
                 starting_materials=starting_materials
             )
 
     def get_batch_search(self, search_id: str) -> BatchSearch:
-        return BatchSearch.from_id(
+        search = BatchSearch.from_id(
                 self.api_base_url,
                 self.request_headers,
                 search_id
         )
+        data = search.get()
+        return search
 
     def delete_batch_search(self, search_id: str):
         search = BatchSearch.from_id(
diff --git a/m1wrapper/search.py b/m1wrapper/search.py
diff --git a/m1wrapper/traverse.py b/m1wrapper/traverse.py
diff --git a/setup.py b/setup.py

Original file line number	Diff line number	Diff line change
`@@ -1 +1,2 @@`
`1`		`-from .m1wrapper import MoleculeOneWrapper, Priority`
	`1`	`+from .m1wrapper import MoleculeOneWrapper, Priority, DetailLevel, InvalidTargetStrategy`
	`2`	`+from .traverse import traverse_modify`