
Commit 10b98ac

n8mellis and bmunday3 authored
Added new Edge inference API (#47)
* Added new Edge inference API. Also regenerated all Python protobuf/gRPC files based on Protobuf v21.x, which includes the new format using Python stub files (*.pyi).
* Modified README to reflect new methods, updated docstrings for Edge Inference and Edge Job API methods, and added a convenience import for InputSource.

Co-authored-by: bmunday3 <[email protected]>
1 parent 9aacf67 commit 10b98ac
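In short, the edge job methods previously exposed directly on `EdgeClient` now live under a `jobs` namespace, alongside the new `inferences` API (both are shown in the README diff below):

```python
from modzy import EdgeClient

client = EdgeClient('localhost', 55000)

# Before this commit:
#   job = client.submit_text("ed542963de", "1.0.27", {"input.txt": "this is awesome"})
# After this commit, job methods live under the jobs namespace:
job = client.jobs.submit_text("ed542963de", "1.0.27", {"input.txt": "this is awesome"})
```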

40 files changed (+3604 / -4033 lines)

README.md

+91 -10
@@ -213,36 +213,103 @@ To use **`client.models.deploy()`** there are 4 fields that are required:
 
 ## Running Inferences at the Edge
 
-The SDK provides support for running inferences on edge devices through Modzy's Edge Client. The inference workflow is almost identical to the previously outlined workflow:
+The SDK provides support for running inferences on edge devices through Modzy's Edge Client. The inference workflow is almost identical to the previously outlined workflow and provides functionality for interacting with both the Job and Inferences APIs:
 
-### Initialize *Edge* Client
+### Initialize Edge Client
 
 ```python
-from modzy.edge.client import EdgeClient
+from modzy import EdgeClient
 
 # Initialize edge client
 # Use 'localhost' for local inferences, otherwise use the device's full IP address
 client = EdgeClient('localhost', 55000)
 ```
 
-### Submit Inference Job
+### Submit Inference with *Job* API
 
 Modzy Edge supports `text`, `embedded`, and `aws-s3` input types.
 
 ```python
 # Submit a text job to a Sentiment Analysis model deployed on an edge device by providing a model ID, version, and raw text data, then wait for completion
-job = client.submit_text("ed542963de", "1.0.27", {"input.txt": "this is awesome"})
+job = client.jobs.submit_text("ed542963de", "1.0.27", {"input.txt": "this is awesome"})
 # Block until results are ready
-final_job_details = client.block_until_complete(job)
-results = client.get_results(job)
+final_job_details = client.jobs.block_until_complete(job)
+results = client.jobs.get_results(job)
 ```
 
-### Query Details about Edge Jobs
+### Query Details about Inference with *Job* API
 
 ```python
 # Get job details for a particular job
-job_details = client.get_job_details(job)
+job_details = client.jobs.get_job_details(job)
 
 # Get job details for all jobs run on your Modzy Edge instance
-all_job_details = client.get_all_job_details()
+all_job_details = client.jobs.get_all_job_details()
+```
+
+### Submit Inference with *Inference* API
+
+The SDK provides several methods for interacting with Modzy's Inference API:
+
+* **Synchronous**: This convenience method wraps two SDK methods and is optimal for use cases that require real-time or sequential results (i.e., prediction results are needed to inform an action before a new inference is submitted)
+* **Asynchronous**: This method combines two SDK methods and is optimal for submitting large batches of data and querying results at a later time (i.e., when real-time inference is not required)
+* **Streaming**: This convenience method runs multiple synchronous inferences consecutively and allows users to submit iterable objects to be processed sequentially in real time
+
+*Synchronous (image-based model example)*
+
+```python
+from modzy import EdgeClient
+from modzy.edge import InputSource
+
+image_bytes = open("image_path.jpg", "rb").read()
+input_object = InputSource(
+    key="image",  # input filename defined by model author
+    data=image_bytes,
+)
+
+with EdgeClient('localhost', 55000) as client:
+    inference = client.inferences.run("<model-id>", "<model-version>", input_object, explain=False, tags=None)
+    results = inference.result.outputs
+```
+
+*Asynchronous (image-based model example - submit batch of images in folder)*
+
+```python
+import os
+from modzy import EdgeClient
+from modzy.edge import InputSource
+
+# submit inferences
+img_folder = "./images"
+inferences = []
+for img in os.listdir(img_folder):
+    input_object = InputSource(
+        key="image",  # input filename defined by model author
+        data=open(os.path.join(img_folder, img), 'rb').read(),
+    )
+    with EdgeClient('localhost', 55000) as client:
+        inference = client.inferences.perform_inference("<model-id>", "<model-version>", input_object, explain=False, tags=None)
+        inferences.append(inference)
+
+# query results
+with EdgeClient('localhost', 55000) as client:
+    results = [client.inferences.block_until_complete(inference.identifier) for inference in inferences]
+```
+
+*Stream*
+
+```python
+import os
+from modzy import EdgeClient
+from modzy.edge import InputSource
+
+# generate requests iterator to pass to stream method
+img_folder = "./images"
+requests = []
+for img in os.listdir(img_folder):
+    input_object = InputSource(
+        key="image",  # input filename defined by model author
+        data=open(os.path.join(img_folder, img), 'rb').read(),
+    )
+    with EdgeClient('localhost', 55000) as client:
+        requests.append(client.inferences.build_inference_request("<model-id>", "<model-version>", input_object, explain=False, tags=None))
+
+# submit list of inference requests to streaming API
+with EdgeClient('localhost', 55000) as client:
+    streaming_results = client.inferences.stream(requests)
 ```
 
 # SDK Code Examples
@@ -285,6 +352,20 @@ Modzy's SDK is built on top of the [Modzy HTTP/REST API](https://docs.modzy.com/
 |Get job details|client.jobs.get()|[api/jobs/:job-id](https://docs.modzy.com/reference/get-job-details) |
 |Get results|job.get_result()|[api/results/:job-id](https://docs.modzy.com/reference/get-results) |
 |Get the job history|client.jobs.get_history()|[api/jobs/history](https://docs.modzy.com/reference/list-the-job-history) |
+|Submit a Job with Edge Client (Embedded)|EdgeClient.jobs.submit_embedded()|[Python/edge/jobs](https://docs.modzy.com/docs/edgeclientjobssubmit_embedded) |
+|Submit a Job with Edge Client (Text)|EdgeClient.jobs.submit_text()|[Python/edge/jobs](https://docs.modzy.com/docs/edgeclientjobssubmit_text) |
+|Submit a Job with Edge Client (AWS S3)|EdgeClient.jobs.submit_aws_s3()|[Python/edge/jobs](https://docs.modzy.com/docs/edgeclientjobssubmit_aws_s3) |
+|Get job details with Edge Client|EdgeClient.jobs.get_job_details()|[Python/edge/jobs](https://docs.modzy.com/docs/edgeclientjobsget_job_details) |
+|Get all job details with Edge Client|EdgeClient.jobs.get_all_job_details()|[Python/edge/jobs](https://docs.modzy.com/docs/edgeclientjobsget_all_job_details) |
+|Hold until job is complete with Edge Client|EdgeClient.jobs.block_until_complete()|[Python/edge/jobs](https://docs.modzy.com/docs/edgeclientjobsblock_until_complete) |
+|Get results with Edge Client|EdgeClient.jobs.get_results()|[Python/edge/jobs](https://docs.modzy.com/docs/edgeclientjobsget_results) |
+|Build inference request with Edge Client|EdgeClient.inferences.build_inference_request()|[Python/edge/inferences](https://docs.modzy.com/docs/edgeclientinferencesbuild_inference_request) |
+|Perform inference with Edge Client|EdgeClient.inferences.perform_inference()|[Python/edge/inferences](https://docs.modzy.com/docs/edgeclientinferencesperform_inference) |
+|Get inference details with Edge Client|EdgeClient.inferences.get_inference_details()|[Python/edge/inferences](https://docs.modzy.com/docs/edgeclientinferencesget_inference_details) |
+|Run synchronous inferences with Edge Client|EdgeClient.inferences.run()|[Python/edge/inferences](https://docs.modzy.com/docs/edgeclientinferencesrun) |
+|Hold until inference completes with Edge Client|EdgeClient.inferences.block_until_complete()|[Python/edge/inferences](https://docs.modzy.com/docs/edgeclientinferencesblock_until_complete) |
+|Stream inferences with Edge Client|EdgeClient.inferences.stream()|[Python/edge/inferences](https://docs.modzy.com/docs/edgeclientinferencesstream) |
+
 
 # Support
 
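The table above lists `EdgeClient.jobs.submit_embedded()`, which gets no README example in this commit. A minimal sketch by analogy with `submit_text`; the exact parameter shape (a mapping of input filename to raw bytes) is an assumption here, not confirmed by the diff:

```python
from modzy import EdgeClient

client = EdgeClient('localhost', 55000)

# Assumed to mirror submit_text: model ID, version, and a filename-to-bytes mapping
image_bytes = open("image_path.jpg", "rb").read()
job = client.jobs.submit_embedded("<model-id>", "<model-version>", {"image": image_bytes})

final_job_details = client.jobs.block_until_complete(job)
results = client.jobs.get_results(job)
```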
modzy/_util.py

+53 -46
@@ -1,17 +1,20 @@
 # -*- coding: utf-8 -*-
-import json
 import pathlib
 import time
-from .error import NetworkError, InternalServerError
+from base64 import b64encode
+
 from requests.adapters import HTTPAdapter
 from requests.packages.urllib3.util.retry import Retry
-from base64 import b64encode
+
+from .error import InternalServerError, NetworkError
+
 
 def encode_data_uri(bytes_like, mimetype='application/octet-stream'):
     encoded = b64encode(bytes_like).decode('ascii')
     data_uri = 'data:{};base64,{}'.format(mimetype, encoded)
     return data_uri
 
+
 def file_to_bytes(file_like):
     if hasattr(file_like, 'read'):  # File-like object
         if hasattr(file_like, 'seekable') and file_like.seekable():
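As a point of reference for the hunk above, `encode_data_uri` is self-contained and easy to sanity-check; a quick usage sketch:

```python
from modzy._util import encode_data_uri

# base64 of b'hello' is 'aGVsbG8='
uri = encode_data_uri(b'hello', mimetype='text/plain')
print(uri)  # data:text/plain;base64,aGVsbG8=
```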
@@ -35,6 +38,7 @@ def file_to_bytes(file_like):
     with open(path, 'rb') as file:
         return file.read()
 
+
 def file_to_chunks(file_like, chunk_size):
     file = None
     should_close = False
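From the context lines, `file_to_bytes` accepts an open file-like object or a path and returns the file's contents as bytes, while `file_to_chunks` is its generator counterpart. A small usage sketch (the 1 MiB chunk size is arbitrary):

```python
from modzy._util import file_to_bytes, file_to_chunks

# Read an entire file into memory
data = file_to_bytes("image_path.jpg")

# Or stream it in fixed-size chunks
total = sum(len(chunk) for chunk in file_to_chunks("image_path.jpg", 1024 * 1024))
assert total == len(data)
```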
@@ -67,20 +71,24 @@ def file_to_chunks(file_like, chunk_size):
         if should_close:
             file.close()
 
+
 def bytes_to_chunks(byte_array, chunk_size):
     for i in range(0, len(byte_array), chunk_size):
         yield byte_array[i:i + chunk_size]
 
+
 def depth(d):
     if d and isinstance(d, dict):
         return max(depth(v) for k, v in d.items()) + 1
     return 0
 
+
 '''
 Model Deployment (models.deploy()) specific utilities
 '''
-def load_model(client, logger, identifier, version):
 
+
+def load_model(client, logger, identifier, version):
     start = time.time()
     # Before loading the model we need to ensure that it has been pulled.
     percentage = -1
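Both small helpers in this hunk are shown in full above, so their behavior can be illustrated directly:

```python
from modzy._util import bytes_to_chunks, depth

# bytes_to_chunks yields fixed-size slices of a byte string
print(list(bytes_to_chunks(b'abcdefgh', 3)))  # [b'abc', b'def', b'gh']

# depth reports dict nesting depth (0 for empty dicts and non-dicts)
print(depth({'input': {'sources': {'0001': {}}}}))  # 3
```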
@@ -89,9 +97,9 @@ def load_model(client, logger, identifier, version):
             res = client.http.get(f"/models/{identifier}/versions/{version}/container-image")
             new_percentage = res.get("percentage")
         except NetworkError:
-            continue
+            continue
         except InternalServerError:
-            continue
+            continue
 
         if new_percentage != percentage:
             logger.info(f'Loading model at {new_percentage}%')
@@ -112,25 +120,25 @@ def load_model(client, logger, identifier, version):
     try:
         res = client.http.post(f"/models/{identifier}/versions/{version}/load-process")
     except NetworkError:
-        return
+        return
     except InternalServerError:
-        return
+        return
 
-    logger.info(f'Loading container image took [{1000*(time.time()-start)} ms]')
+    logger.info(f'Loading container image took [{1000 * (time.time() - start)} ms]')
 
-def upload_input_example(client, logger, identifier, version, model_data_metadata, input_sample_path):
 
+def upload_input_example(client, logger, identifier, version, model_data_metadata, input_sample_path):
     start = time.time()
 
     input_filename = model_data_metadata['inputs'][0]['name']
     files = {'file': open(input_sample_path, 'rb')}
     params = {'name': input_filename}
     res = client.http.post(f"/models/{identifier}/versions/{version}/testInput", params=params, file_data=files)
 
-    logger.info(f'Uploading sample input took [{1000*(time.time()-start)} ms]')
+    logger.info(f'Uploading sample input took [{1000 * (time.time() - start)} ms]')
 
-def run_model(client, logger, identifier, version):
 
+def run_model(client, logger, identifier, version):
     start = time.time()
     res = client.http.post(f"/models/{identifier}/versions/{version}/run-process")
 
@@ -155,50 +163,49 @@ def run_model(client, logger, identifier, version):
         raise ValueError(f'Sample inference test failed with error {test_output["error"]}. Check model container and try again.')
 
     sample_input = {'input': {'accessKeyID': '<accessKeyID>',
-                              'region': '<region>',
-                              'secretAccessKey': '<secretAccessKey>',
-                              'sources': {'0001': {'input': {'bucket': '<bucket>',
-                                                             'key': '/path/to/s3/input'}}},
-                              'type': 'aws-s3'},
-                    'model': {'identifier': identifier, 'version':version}
+                              'region': '<region>',
+                              'secretAccessKey': '<secretAccessKey>',
+                              'sources': {'0001': {'input': {'bucket': '<bucket>',
+                                                             'key': '/path/to/s3/input'}}},
+                              'type': 'aws-s3'},
+                    'model': {'identifier': identifier, 'version': version}
                     }
-
+
     formatted_sample_output = {'jobIdentifier': '<uuid>',
-                               'total': '<number of inputs>',
-                               'completed': '<total number of completed inputs>',
-                               'failed': '<number of failed inputs>',
-                               'finished': '<true or false>',
-                               'submittedByKey': '<api key>',
-                               'results': {'<input-id>': {'model': None,
-                                                          'userIdentifier': None,
-                                                          'status': test_output['status'],
-                                                          'engine': test_output['engine'],
-                                                          'error': test_output['error'],
-                                                          'startTime': test_output['startTime'],
-                                                          'endTime': test_output['endTime'],
-                                                          'updateTime': test_output['updateTime'],
-                                                          'inputSize': test_output['inputSize'],
-                                                          'accessKey': None,
-                                                          'teamIdentifier': None,
-                                                          'accountIdentifier': None,
-                                                          'timeMeters': None,
-                                                          'datasourceCompletedTime': None,
-                                                          'elapsedTime': test_output['elapsedTime'],
-                                                          'results.json': test_output['results.json']}
-                                           }
-                               }
+                               'total': '<number of inputs>',
+                               'completed': '<total number of completed inputs>',
+                               'failed': '<number of failed inputs>',
+                               'finished': '<true or false>',
+                               'submittedByKey': '<api key>',
+                               'results': {'<input-id>': {'model': None,
+                                                          'userIdentifier': None,
+                                                          'status': test_output['status'],
+                                                          'engine': test_output['engine'],
+                                                          'error': test_output['error'],
+                                                          'startTime': test_output['startTime'],
+                                                          'endTime': test_output['endTime'],
+                                                          'updateTime': test_output['updateTime'],
+                                                          'inputSize': test_output['inputSize'],
+                                                          'accessKey': None,
+                                                          'teamIdentifier': None,
+                                                          'accountIdentifier': None,
+                                                          'timeMeters': None,
+                                                          'datasourceCompletedTime': None,
+                                                          'elapsedTime': test_output['elapsedTime'],
+                                                          'results.json': test_output['results.json']}
+                                           }
+                               }
 
     sample_input_res = client.http.put(f"/models/{identifier}/versions/{version}/sample-input", json_data=sample_input)
     sample_output_res = client.http.put(f"/models/{identifier}/versions/{version}/sample-output", json_data=formatted_sample_output)
 
-    logger.info(f'Inference test took [{1000*(time.time()-start)} ms]')
+    logger.info(f'Inference test took [{1000 * (time.time() - start)} ms]')
 
-def deploy_model(client, logger, identifier, version):
 
+def deploy_model(client, logger, identifier, version):
     start = time.time()
     status = {'status': 'active'}
 
     res = client.http.patch(f"/models/{identifier}/versions/{version}", status)
 
-    logger.info(f'Model Deployment took [{1000*(time.time()-start)} ms]')
-
+    logger.info(f'Model Deployment took [{1000 * (time.time() - start)} ms]')

modzy/edge/__init__.py

+1
@@ -0,0 +1 @@
+from modzy.edge.proto.inferences.api.v1.inferences_pb2 import InputSource
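This one-line module re-exports the generated protobuf message under a short path, which is what the README examples above import. Equivalent usage:

```python
# Before this commit, the full generated-protobuf path was required:
# from modzy.edge.proto.inferences.api.v1.inferences_pb2 import InputSource

# The convenience import added here:
from modzy.edge import InputSource

input_object = InputSource(key="input.txt", data=b"this is awesome")
```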
