
Commit b0a7089

Merge branch 'master' into dcgan_fashiongen_example

2 parents 676d550 + 65cd16b

File tree

176 files changed: +5273, -3005 lines changed


benchmarks/README.md

Lines changed: 4 additions & 4 deletions
@@ -273,16 +273,16 @@ python benchmark-ab.py --url https://torchserve.pytorch.org/mar_files/mnist.mar
 python benchmark-ab.py --url https://torchserve.pytorch.org/mar_files/mnist.mar --content_type application/png --config_properties config.properties --inference_model_url explanations/benchmark --input ../examples/image_classifier/mnist/test_data/0.png
 ```
 
-* KUBEFLOW SERVING PREDICTIONS
+* KSERVE SERVING PREDICTIONS
 
 ```
-python benchmark-ab.py --url https://torchserve.pytorch.org/mar_files/mnist.mar --content_type application/json --config_properties config_kf.properties --inference_model_url v1/models/benchmark:predict --input ../kubernetes/kfserving/kf_request_json/mnist.json
+python benchmark-ab.py --url https://torchserve.pytorch.org/mar_files/mnist.mar --content_type application/json --config_properties config_kf.properties --inference_model_url v1/models/benchmark:predict --input ../kubernetes/kserve/kf_request_json/mnist.json
 ```
 
-* KUBEFLOW SERVING EXPLANATIONS
+* KSERVE SERVING EXPLANATIONS
 
 ```
-python benchmark-ab.py --url https://torchserve.pytorch.org/mar_files/mnist.mar --content_type application/json --config_properties config_kf.properties --inference_model_url v1/models/benchmark:explain --input ../kubernetes/kfserving/kf_request_json/mnist.json
+python benchmark-ab.py --url https://torchserve.pytorch.org/mar_files/mnist.mar --content_type application/json --config_properties config_kf.properties --inference_model_url v1/models/benchmark:explain --input ../kubernetes/kserve/kf_request_json/mnist.json
 ```
 
 * TORCHSERVE SERVING PREDICTIONS WITH DOCKER
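For reference, the `mnist.json` payload used by the two KSERVE commands above follows the KServe v1 inference protocol. A minimal sketch of its shape (the base64 image bytes are elided here; see `kubernetes/kserve/kf_request_json/mnist.json` for the real file):

```
{
  "instances": [
    {
      "data": "<base64-encoded image bytes>"
    }
  ]
}
```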

test/benchmark/README.md renamed to benchmarks/automated/README.md

Lines changed: 38 additions & 36 deletions
@@ -10,17 +10,17 @@ Check out a sample vgg11 model config at the path: `tests/suite/vgg11.yaml`
 -- [AmazonEC2ContainerRegistryFullAccess](https://console.aws.amazon.com/iam/home#policies/arn:aws:iam::aws:policy/AmazonEC2ContainerRegistryFullAccess) <br>
 -- [AmazonEC2FullAccess](https://console.aws.amazon.com/iam/home#policies/arn:aws:iam::aws:policy/AmazonEC2FullAccess) <br>
 -- [AmazonS3FullAccess](https://console.aws.amazon.com/iam/home#policies/arn:aws:iam::aws:policy/AmazonS3FullAccess) <br>
--- [AmazonIAMFullAccess](https://console.aws.amazon.com/iam/home#policies/arn:aws:iam::aws:policy/AmazonIAMFullAccess)
+-- [IAMFullAccess](https://console.aws.amazon.com/iam/home#policies/arn:aws:iam::aws:policy/IAMFullAccess)
 <br> (or at the least `iam:PassRole`).
 
 * [Create](https://docs.aws.amazon.com/cli/latest/reference/ecr/create-repository.html) an ECR repository with the name “torchserve-benchmark” in the us-west-2 region, e.g.
 ```
 aws ecr create-repository --repository-name torchserve-benchmark --region us-west-2
 ```
-If you'd like to use your own repo, edit the __init__.py under `serve/test/benchmark/tests/utils`
+If you'd like to use your own repo, edit the `config.yaml` file at `serve/benchmarks/automated/tests/suite/benchmark/config.yaml`
 * Ensure you have the [docker](https://docs.docker.com/get-docker/) client set up on your system (osx/ec2)
-* Adjust the following global variables to your preference in the file `serve/test/benchmark/tests/utils/__init__.py` <br>
--- IAM_INSTANCE_PROFILE :this role is attached to all ec2 instances created as part of the benchmarking process. Create this as described [here](https://docs.aws.amazon.com/AWSEC2/latest/UserGuide/iam-roles-for-amazon-ec2.html#create-iam-role). Default role name is 'EC2Admin'.<br>
+* Adjust the following global variables to your preference in the file `serve/benchmarks/automated/tests/suite/benchmark/config.yaml` <br>
+-- iam_instance_profile: this role is attached to all ec2 instances created as part of the benchmarking process. Create it as described [here](https://docs.aws.amazon.com/AWSEC2/latest/UserGuide/iam-roles-for-amazon-ec2.html#create-iam-role). The default role name is 'EC2Admin'.<br>
 Use the following commands to create a new role if you don't have one you can use.
 1. Create the trust policy file `ec2-admin-trust-policy.json` and add the following content:
 ```
@@ -50,16 +50,12 @@ aws iam attach-role-policy --policy-arn arn:aws:iam::aws:policy/AmazonEC2FullAcc
 aws iam attach-role-policy --policy-arn arn:aws:iam::aws:policy/AmazonS3FullAccess --role-name EC2Admin
 aws iam attach-role-policy --policy-arn arn:aws:iam::aws:policy/AmazonEC2ContainerRegistryFullAccess --role-name EC2Admin
 ```
--- S3_BUCKET_BENCHMARK_ARTIFACTS :all temporary benchmarking artifacts including server logs will be stored in this bucket: <br>
+-- s3_bucket_benchmark_artifacts: all temporary benchmarking artifacts, including server logs, will be stored in this bucket. Note that this bucket must be in the same account, or the credentials being used must have read and write access to it. <br>
 Use the following command to create a new S3 bucket if you don't have one you can use.
 ```
-aws s3api create-bucket --bucket <torchserve-benchmark> --region us-west-2
-```
--- DEFAULT_DOCKER_DEV_ECR_REPO :docker image used for benchmarking will be pushed to this repo <br>
-Use the following command to create a new ECR repo if you don't have one you can use.
-```
-aws ecr create-repository --bucket torchserve-benchmark --region us-west-2
+aws s3api create-bucket --bucket <torchserve-benchmark> --region us-west-2 --create-bucket-configuration LocationConstraint=us-west-2
 ```
+-- default_docker_dev_ecr_repo: the docker image used for benchmarking will be pushed to this repo <br>
 * If you're running this setup on an EC2 instance, please ensure that the instance's security group settings allow inbound ssh on port 22. Refer to the [docs](https://docs.aws.amazon.com/AWSEC2/latest/UserGuide/security-group-rules.html).
 
 *The following steps assume that the current working directory is serve/.*
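Putting the settings above together, a minimal sketch of the relevant `config.yaml` entries (the role and repo names are the defaults mentioned above; the bucket name is a placeholder, and the shipped file may contain additional keys):

```
iam_instance_profile: EC2Admin
s3_bucket_benchmark_artifacts: s3://<torchserve-benchmark>
default_docker_dev_ecr_repo: torchserve-benchmark
```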
@@ -80,20 +76,23 @@ pip install -r test/benchmark/requirements.txt
 ```
 aws sts get-caller-identity
 ```
-4. For each of the test files under `test/benchmark/tests/`, e.g., test_vgg11.py, set the list of instance types you want to test on:
+4. The automation scripts use the ts-config from the following location: `benchmarks/config.properties`. Make changes to this file in the current local folder to use it across all runs.
+5. The simplest way to run a benchmark is to spin up the ec2 instance type of your choice (it must be a DLAMI) and run the benchmark with `--local-execution`; this will run through the models located in `benchmarks/automated/tests/suite/` and execute benchmarks against them on the current instance.
+Start the benchmark run as follows (run this in a pseudo-shell such as tmux or screen, as this is a long-running script):
 ```
-INSTANCE_TYPES_TO_TEST = ["p3.8xlarge"]
+python benchmarks/automated/run_benchmark.py --local-execution
 ```
-5. The automation scripts uses the ts-config from the following location: `benchmarks/config.properties`. Make changes to this file in the current local folder to use this across all the runs.
-6. Finally, start the benchmark run as follows (run this a pseudo shell such as tmux or screen, as this is a long-running script):
+6. Another method is to execute the above command from your desktop terminal, **without** the argument `--local-execution`. This will cause the instance types mentioned in the `<model>.yaml` files to be spun up. For each of the model config files under `benchmarks/automated/tests/suite/`, e.g., vgg11.yaml, set the list of instance types you want to test on:
 ```
-python test/benchmark/run_benchmark.py
+instance_types:
+  - c4.4xlarge
+  - p3.8xlarge
 ```
-7. To start test for a particual model, modify the `pytest_args` list in run_benchmark.py to include `["-k", "vgg11"]`, if that particular model is vgg11
-8. For generating benchmarking report, modify the argument to function `generate_comprehensive_report()` to point to the s3 bucket uri for the benchmark run. Run the script as:
+Start the benchmark run as follows:
 ```
-python report.py
+python benchmarks/automated/run_benchmark.py
 ```
+
 The final benchmark report will be available in markdown format as `report.md` in the `serve/` folder.
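Step 4 above points at `benchmarks/config.properties`, which is TorchServe's standard server configuration file. An illustrative fragment with common TorchServe settings (not necessarily the shipped contents of that file):

```
inference_address=http://0.0.0.0:8080
management_address=http://0.0.0.0:8081
metrics_address=http://0.0.0.0:8082
```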
 
 **Example report for vgg11 model**
@@ -143,36 +142,39 @@ The final benchmark report will be available in markdown format as `report.md` i
 
 
 ## Features of the automation:
-1. To save time by *not* creating new instances for every benchmark run for local testing, use the '--do-not-terminate' flag. This will automatically create a file called 'instances.yaml' and write instance-related data into the file so that it may be re-used next time.
-```
-python test/benchmark/run_benchmark.py --do-not-terminate
-```
-
-2. To re-use an instance already recorded in `instances.yaml`, use the '--use-instances' flag:
-```
-python test/benchmark/run_benchmark.py --use-instances <full_path_to>/instances.yaml --do-no-terminate
-```
-`Note: Use --do-not-termninate flag to keep re-using the instances, else, it will be terminated`.
 
 3. To run a test containing a specific string, use the `--run-only` flag. Note that the argument is 'string matched', i.e., if the test name contains the supplied argument as a substring, the test will run.
 ```
 # To run mnist test
-python test/benchmark/run_benchmark.py --run-only mnist
+python benchmarks/automated/run_benchmark.py --run-only mnist
 
 # To run fastrcnn test
-python test/benchmark/run_benchmark.py --run-only fastrcnn
+python benchmarks/automated/run_benchmark.py --run-only fastrcnn
 
-# To run bert_neuron and bert
-python test/benchmark/run_benchmark.py --run-only bert
+# To run bert_neuron and bert_cpu
+python benchmarks/automated/run_benchmark.py --run-only bert_cpu
 
 # To run vgg11 test
-python test/benchmark/run_benchmark.py --run-only vgg11
+python benchmarks/automated/run_benchmark.py --run-only vgg11
 
 # To run vgg16 test
-python test/benchmark/run_benchmark.py --run-only vgg16
+python benchmarks/automated/run_benchmark.py --run-only vgg16
+
+# To run multiple:
+python benchmarks/automated/run_benchmark.py --run-only vgg11 vgg16 bert_cpu
 ```
 
 4. You can benchmark a specific branch of the torchserve github repo by specifying the flag `--use-torchserve-branch`, e.g.,
 ```
-python test/benchmark/run_benchmark.py --use-torchserve-branch issue_1115
+python benchmarks/automated/run_benchmark.py --use-torchserve-branch issue_1115
+```
+
+5. Once the docker image is built, you may choose to not have it re-built by passing the argument `--skip-docker-build`, e.g.,
+```
+python benchmarks/automated/run_benchmark.py --skip-docker-build
+```
+
+6. If you do not wish to benchmark on the different instance types specified in the model config `*.yaml` files, you may pass the argument `--local-execution`. In this case, the instance types specified in the model config `*.yaml` files are *ignored*, and all the model benchmarks are performed *sequentially* on the current instance.
+```
+python benchmarks/automated/run_benchmark.py --local-execution
 ```
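Note: as implemented in `run_benchmark.py` (added in this commit, shown below), the script exits early unless `--local-instance-type` accompanies `--local-execution`, so a complete local run typically looks like the following (the instance type here is only an example):

```
python benchmarks/automated/run_benchmark.py --local-execution --local-instance-type c4.4xlarge --run-only vgg11
```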

benchmarks/automated/run_benchmark.py

Lines changed: 220 additions & 0 deletions
@@ -0,0 +1,220 @@
import argparse
import os
import random
import sys
import logging
import re
import uuid

import boto3
import pytest

from invoke import run
from invoke.context import Context

from tests.utils.report import Report
from tests.utils import (
    S3_BUCKET_BENCHMARK_ARTIFACTS,
    DEFAULT_REGION,
    DEFAULT_DOCKER_DEV_ECR_REPO,
    YamlHandler,
    DockerImageHandler,
)

LOGGER = logging.getLogger(__name__)
LOGGER.setLevel(logging.DEBUG)
LOGGER.addHandler(logging.StreamHandler(sys.stdout))


def build_docker_container(torchserve_branch="master", push_image=True, use_local_serve_folder=False):
    LOGGER.info("Setting up docker image to be used")

    docker_dev_image_config_path = os.path.join(
        os.getcwd(), "benchmarks", "automated", "tests", "suite", "docker", "docker.yaml"
    )

    if use_local_serve_folder:
        LOGGER.info("*** Using the local 'serve' folder closure when creating the container image.")

        # Stage a copy of the local 'serve' folder into the docker build context via /tmp
        local_serve_folder = os.getcwd()
        tmp_local_serve_folder = os.path.join("/tmp", "serve")
        serve_folder_in_docker_context = os.path.join(os.getcwd(), "docker", "serve")

        run(f"mkdir -p {tmp_local_serve_folder}")
        run(f"mkdir -p {serve_folder_in_docker_context}")

        run(f"rsync -av --progress {local_serve_folder}/ {tmp_local_serve_folder}/")
        run(f"rsync -av --progress {tmp_local_serve_folder}/ {serve_folder_in_docker_context}/")

        run(f"rm -rf {tmp_local_serve_folder}")

    docker_config = YamlHandler.load_yaml(docker_dev_image_config_path)
    YamlHandler.validate_docker_yaml(docker_config)

    account_id = run("aws sts get-caller-identity --query Account --output text").stdout.strip()

    for processor, config in docker_config.items():
        docker_tag = None
        cuda_version = None
        dockerhub_image = None
        for config_key, config_value in config.items():
            if processor == "gpu" and config_key == "cuda_version":
                cuda_version = config_value
            if config_key == "docker_tag":
                docker_tag = config_value
            if config_key == "dockerhub_image":
                dockerhub_image = config_value

        dockerImageHandler = DockerImageHandler(docker_tag, cuda_version, torchserve_branch)

        if not dockerhub_image:
            dockerImageHandler.build_image(use_local_serve_folder=use_local_serve_folder)
        else:
            # Image is pulled by process_docker_config in __init__.py
            LOGGER.info("*** Note: dockerhub_image specified in docker.yaml. This container image will be used for the benchmark.")
            dockerImageHandler.pull_docker_image(dockerhub_image, docker_tag=docker_tag)

        if push_image:
            dockerImageHandler.push_docker_image_to_ecr(
                account_id, DEFAULT_REGION, f"{DEFAULT_DOCKER_DEV_ECR_REPO}:{docker_tag}"
            )
        else:
            LOGGER.warning("Docker image will not be pushed to the ECR repo in local execution.")


def main():

    parser = argparse.ArgumentParser()

    parser.add_argument(
        "--use-instances",
        action="store",
        help="Supply a .yaml file with test_name, instance_id, and key_filename to re-use already-running instances",
    )
    parser.add_argument(
        "--do-not-terminate",
        action="store_true",
        default=False,
        help="Use with caution: does not terminate instances, instead saves the list to a file in order to re-use",
    )

    parser.add_argument(
        "--run-only", nargs="+", default=None, help="Runs the tests that contain the supplied keyword as a substring"
    )

    parser.add_argument(
        "--use-torchserve-branch",
        default="master",
        help="Specify a specific torchserve branch to build a container to benchmark on; uses 'master' by default",
    )

    parser.add_argument(
        "--use-local-serve-folder",
        action="store_true",
        default=False,
        help="Specify this option if you'd like to build a container image out of your current 'serve' folder",
    )

    parser.add_argument(
        "--skip-docker-build",
        action="store_true",
        default=False,
        help="Use if you already have a docker image built and available locally and have specified it in docker.yaml",
    )

    parser.add_argument(
        "--local-execution",
        action="store_true",
        default=False,
        help="Specify when you want to execute benchmarks on the current instance. Note: this will execute the model benchmarks sequentially, and will ignore instances specified in the model config *.yaml files.",
    )

    parser.add_argument(
        "--local-instance-type",
        default=None,
        help="Specify the ec2 instance type of the current instance on which the benchmark executes; must be a valid ec2 instance type",
    )

    arguments = parser.parse_args()

    # --local-execution and --local-instance-type must be used together
    if arguments.local_instance_type and not arguments.local_execution:
        LOGGER.error("--local-instance-type may only be used with --local-execution")
        sys.exit(1)

    if arguments.local_execution and not arguments.local_instance_type:
        LOGGER.error("--local-instance-type must be specified when using --local-execution")
        sys.exit(1)

    do_not_terminate_string = "" if not arguments.do_not_terminate else "--do-not-terminate"
    local_execution_string = "" if not arguments.local_execution else "--local-execution"
    use_instances_arg_list = ["--use-instances", f"{arguments.use_instances}"] if arguments.use_instances else []
    run_only_test = arguments.run_only

    # Join the --run-only keywords into a single pytest -k expression, e.g. "-k vgg11 or bert_cpu"
    if run_only_test:
        LOGGER.info(f"run_only_test:{run_only_test}")
        LOGGER.info(f"run_only_test type:{type(run_only_test)}")
        run_only_string_list = " or ".join(run_only_test)
        run_only_string = f"-k {run_only_string_list}"
        LOGGER.info(f"Note: running only the tests that have the name '{run_only_string_list}'.")
    else:
        run_only_string = ""

    # Local execution runs tests sequentially; remote execution fans out across 4 workers
    if arguments.local_execution:
        number_of_threads_string = ""
        local_instance_type_list = ["--local-instance-type", arguments.local_instance_type]
    else:
        number_of_threads_string = "-n=4"
        local_instance_type_list = []

    torchserve_branch = arguments.use_torchserve_branch
    use_local_serve_folder = arguments.use_local_serve_folder

    # Build docker containers as specified in docker.yaml
    if not arguments.skip_docker_build:
        push_image = not arguments.local_execution
        build_docker_container(torchserve_branch=torchserve_branch, push_image=push_image, use_local_serve_folder=use_local_serve_folder)
    else:
        LOGGER.warning("Skipping docker build.")

    # Run this script from the root directory 'serve'; it changes directory below as required
    os.chdir(os.path.join(os.getcwd(), "benchmarks", "automated"))

    execution_id = f"ts-benchmark-run-{str(uuid.uuid4())}"

    test_path = os.path.join(os.getcwd(), "tests")
    LOGGER.info(f"Running tests from directory: {test_path}")

    pytest_args = [
        "-s",
        run_only_string,
        "-rA",
        test_path,
        number_of_threads_string,
        "--disable-warnings",
        "-v",
        "--execution-id",
        execution_id,
        do_not_terminate_string,
        local_execution_string,
    ] + local_instance_type_list + use_instances_arg_list

    LOGGER.info("Running pytest")

    pytest.main(pytest_args)

    # Download the benchmark artifacts for this run and generate the report
    s3_results_uri = f"{S3_BUCKET_BENCHMARK_ARTIFACTS}/{execution_id}"

    report = Report()
    report.download_benchmark_results_from_s3(s3_results_uri)
    report.generate_comprehensive_report()


if __name__ == "__main__":
    main()
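As implied by the parsing loop in `build_docker_container()`, the `docker.yaml` it consumes is keyed by processor, with a `docker_tag`, an optional `dockerhub_image`, and, for gpu, a `cuda_version`. A hypothetical sketch (the tags and version are placeholders, not the shipped file):

```
cpu:
  docker_tag: torchserve-benchmark-cpu
  dockerhub_image: null
gpu:
  docker_tag: torchserve-benchmark-gpu
  cuda_version: cu102
  dockerhub_image: null
```

When `dockerhub_image` is set, the script pulls that image instead of building one; otherwise it builds the image from the requested torchserve branch (or from the local `serve` folder when `--use-local-serve-folder` is passed) and, unless running locally, pushes it to the ECR repo.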
