# Copyright (c) Microsoft Corporation. All rights reserved.
# Licensed under the MIT License.
"""
This Python script sets up an environment on AzureML and submits a
script to it to run pytest. It is usually intended to be used as
part of a DevOps pipeline which runs testing on a GitHub repo, but
can also be used from the command line.

Many parameters are set to default values and some are expected to be passed
in from either the DevOps pipeline or the command line.
If calling from the command line, there are some parameters you must pass in
for your job to run.

Args:
    Required:
    --clustername (str): the Azure cluster for this run. It can already exist
                         or it will be created.
    --subid (str): the Azure subscription id

    Optional but suggested; this info will be stored on Azure as
    text information as part of the experiment:
    --pr (str): the GitHub PR number
    --reponame (str): the GitHub repository name
    --branch (str): the branch being run
    It is also possible to put any text string in these.

Example:
    Usually, this script is run by a DevOps pipeline. It can also be
    run from the command line.
    >>> python tests/ci/submit_azureml_pytest.py --clustername 'cluster-d3-v2'
                                                 --subid '12345678-9012-3456-abcd-123456789012'
                                                 --pr '666'
                                                 --reponame 'Recommenders'
                                                 --branch 'staging'
"""
import argparse
import logging

from azureml.core.authentication import AzureCliAuthentication
from azureml.core import Workspace
from azureml.core import Experiment
from azureml.core.runconfig import RunConfiguration
from azureml.core.conda_dependencies import CondaDependencies
from azureml.core.script_run_config import ScriptRunConfig
from azureml.core.compute import ComputeTarget, AmlCompute
from azureml.core.compute_target import ComputeTargetException
from azureml.core.workspace import WorkspaceException
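
# NOTE: the module-level `logger` used by the helper functions below is
# created in the `__main__` block, so these helpers are meant to be driven
# by this script's entry point rather than imported and called on their own.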


def setup_workspace(workspace_name, subscription_id, resource_group, cli_auth,
                    location):
    """
    This sets up an Azure Workspace.
    An existing Azure Workspace is used or a new one is created if needed for
    the pytest run.

    Args:
        workspace_name (str): Centralized location on Azure to work
                              with all the artifacts used by the AzureML
                              service
        subscription_id (str): the Azure subscription id
        resource_group (str): Azure Resource Groups are logical collections of
                              assets associated with a project. Resource
                              groups make it easy to track or delete all
                              resources associated with a project by tracking
                              or deleting the Resource group.
        cli_auth (AzureCliAuthentication): Azure authentication object
        location (str): Azure datacenter location for the workspace,
                        e.g. EastUS

    Returns:
        ws: workspace reference
    """
    logger.debug('setup: workspace_name is {}'.format(workspace_name))
    logger.debug('setup: resource_group is {}'.format(resource_group))
    logger.debug('setup: subid is {}'.format(subscription_id))
    logger.debug('setup: location is {}'.format(location))

    try:
        # use existing workspace if there is one
        ws = Workspace.get(
            name=workspace_name,
            subscription_id=subscription_id,
            resource_group=resource_group,
            auth=cli_auth
        )
    except WorkspaceException:
        # this call might take a minute or two.
        logger.debug('Creating new workspace')
        ws = Workspace.create(
            name=workspace_name,
            subscription_id=subscription_id,
            resource_group=resource_group,
            # create_resource_group=True,
            location=location,
            auth=cli_auth
        )
    return ws
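
# Usage (a minimal sketch built from this script's own defaults; the
# subscription id is a placeholder):
#   cli_auth = AzureCliAuthentication()
#   ws = setup_workspace(workspace_name='RecoWS',
#                        subscription_id='<subscription-id>',
#                        resource_group='recommender',
#                        cli_auth=cli_auth,
#                        location='EastUS')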


def setup_persistent_compute_target(workspace, cluster_name, vm_size,
                                    max_nodes):
    """
    Set up a persistent compute target on AzureML.
    A persistent compute target runs noticeably faster than a
    regular compute target for subsequent runs. The benefit
    is that AzureML manages turning the compute on/off as needed for
    each job so the user does not need to do this.

    Args:
        workspace (Workspace): AzureML workspace holding all the
                               artifacts used by the AzureML service
        cluster_name (str): the Azure cluster for this run. It can
                            already exist or it will be created.
        vm_size (str): Azure VM size, like STANDARD_D3_V2
        max_nodes (int): Number of VMs, max_nodes=4 will
                         autoscale up to 4 VMs

    Returns:
        cpu_cluster : cluster reference
    """
    # setting vm size and num nodes creates a persistent AzureML
    # compute resource
    logger.debug("setup: cluster_name {}".format(cluster_name))
    # https://docs.microsoft.com/en-us/azure/machine-learning/service/how-to-set-up-training-targets

    try:
        cpu_cluster = ComputeTarget(workspace=workspace, name=cluster_name)
        logger.debug('setup: Found existing cluster, use it.')
    except ComputeTargetException:
        logger.debug('setup: create cluster')
        compute_config = AmlCompute.provisioning_configuration(
            vm_size=vm_size,
            max_nodes=max_nodes)
        cpu_cluster = ComputeTarget.create(workspace,
                                           cluster_name,
                                           compute_config)
    cpu_cluster.wait_for_completion(show_output=True)
    return cpu_cluster
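
# Usage (a minimal sketch using this script's default cluster settings):
#   cpu_cluster = setup_persistent_compute_target(workspace=ws,
#                                                 cluster_name='amlcompute',
#                                                 vm_size='STANDARD_D3_V2',
#                                                 max_nodes=4)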


def create_run_config(cpu_cluster, docker_proc_type, conda_env_file):
    """
    AzureML requires the run environment to be set up prior to submission.
    This configures a Docker-based persistent compute. Even though
    it is called persistent compute, AzureML handles startup/shutdown
    of the compute environment.

    Args:
        cpu_cluster (ComputeTarget or str): the compute target (or its name)
                                            for the test run.
                                            In the case of unit tests, any of
                                            the following:
                                            - Reco_cpu_test
                                            - Reco_gpu_test
        docker_proc_type (str): processor type, cpu or gpu
        conda_env_file (str): filename which contains info to
                              set up the conda env

    Return:
        run_amlcompute : AzureML run config
    """
    # runconfig with max_run_duration_seconds did not work, check why:
    # run_amlcompute = RunConfiguration(max_run_duration_seconds=60*30)
    run_amlcompute = RunConfiguration()
    run_amlcompute.target = cpu_cluster
    run_amlcompute.environment.docker.enabled = True
    run_amlcompute.environment.docker.base_image = docker_proc_type

    # Use the conda environment file to build the conda environment inside
    # the Docker image used for execution.
    # user_managed_dependencies=False means AzureML builds the environment
    # from the conda file; True would mean the user manages the environment
    # manually.
    run_amlcompute.environment.python.user_managed_dependencies = False
    run_amlcompute.environment.python.conda_dependencies = CondaDependencies(
        conda_dependencies_file_path=conda_env_file)
    return run_amlcompute
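
# In this script, `docker_proc_type` is one of the AzureML-provided base
# images (DEFAULT_CPU_IMAGE or DEFAULT_GPU_IMAGE), chosen in the `__main__`
# block from the --dockerproc argument.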


def create_experiment(workspace, experiment_name):
    """
    AzureML requires an experiment as a container of trials.
    This will either create a new experiment or use an
    existing one.

    Args:
        workspace (Workspace): AzureML workspace
        experiment_name (str): AzureML experiment name

    Return:
        exp - AzureML experiment
    """
    logger.debug('create: experiment_name {}'.format(experiment_name))
    exp = Experiment(workspace=workspace, name=experiment_name)
    return exp


def submit_experiment_to_azureml(test, test_folder, test_markers, junitxml,
                                 run_config, experiment):
    """
    Submitting the experiment to AzureML actually runs the script.

    Args:
        test (str): pytest script, folder/test
                    such as ./tests/ci/run_pytest.py
        test_folder (str): folder where tests to run are stored,
                           like ./tests/unit
        test_markers (str): test markers used by pytest,
                            "not notebooks and not spark and not gpu"
        junitxml (str): file of output summary of tests run
                        note "--junitxml" is required as part
                        of the string
                        Example: "--junitxml reports/test-unit.xml"
        run_config: environment configuration
        experiment: instance of an Experiment, a collection of
                    trials where each trial is a run.

    Return:
        run : AzureML run or trial
    """
    logger.debug('submit: testfolder {}'.format(test_folder))
    logger.debug('junitxml: {}'.format(junitxml))
    project_folder = "."

    script_run_config = ScriptRunConfig(source_directory=project_folder,
                                        script=test,
                                        run_config=run_config,
                                        arguments=["--testfolder",
                                                   test_folder,
                                                   "--testmarkers",
                                                   test_markers,
                                                   "--xmlname",
                                                   junitxml]
                                        )
    run = experiment.submit(script_run_config)
    # waits for the run (and its post processing) to complete
    run.wait_for_completion(show_output=True, wait_post_processing=True)

    # test logs can also be found on Azure: in the Azure portal, open the
    # workspace, look for the experiment name and then the individual run
    logger.debug('files {}'.format(run.get_file_names()))
    return run
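
# Note: the submitted script (./tests/ci/run_pytest.py by default) is assumed
# to accept the --testfolder, --testmarkers and --xmlname arguments passed
# above; that contract is not enforced here.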


def create_arg_parser():
    """
    Many of the argument defaults are used as arg_parser makes it easy to
    use defaults. The user has many options they can select.
    """
    parser = argparse.ArgumentParser(description='Process some inputs')
    # script to run pytest
    parser.add_argument("--test",
                        action="store",
                        default="./tests/ci/run_pytest.py",
                        help="location of script to run pytest")
    # test folder
    parser.add_argument("--testfolder",
                        action="store",
                        default="./tests/unit",
                        help="folder where tests are stored")
    # pytest test markers
    parser.add_argument("--testmarkers",
                        action="store",
                        default="not notebooks and not spark and not gpu",
                        help="pytest markers indicate tests to run")
    # test summary file
    parser.add_argument("--junitxml",
                        action="store",
                        default="reports/test-unit.xml",
                        help="file for returned test results")
    # max num nodes in Azure cluster
    parser.add_argument("--maxnodes",
                        action="store",
                        default=4,
                        help="specify the maximum number of nodes for the run")
    # Azure resource group
    parser.add_argument("--rg",
                        action="store",
                        default="recommender",
                        help="Azure Resource Group")
    # AzureML workspace name
    parser.add_argument("--wsname",
                        action="store",
                        default="RecoWS",
                        help="AzureML workspace name")
    # AzureML cluster name
    parser.add_argument("--clustername",
                        action="store",
                        default="amlcompute",
                        help="Set name of Azure cluster")
    # Azure VM size
    parser.add_argument("--vmsize",
                        action="store",
                        default="STANDARD_D3_V2",
                        help="Set the size of the VM, e.g. STANDARD_D3_V2")
    # cpu or gpu
    parser.add_argument("--dockerproc",
                        action="store",
                        default="cpu",
                        help="Base image used in docker container")
    # Azure subscription id, when used in a pipeline, it is stored in keyvault
    parser.add_argument("--subid",
                        action="store",
                        default="123456",
                        help="Azure Subscription ID")
    # ./reco.yaml is created in the Azure DevOps pipeline.
    # Not recommended to change this.
    parser.add_argument("--condafile",
                        action="store",
                        default="./reco.yaml",
                        help="file with environment variables")
    # AzureML experiment name
    parser.add_argument("--expname",
                        action="store",
                        default="persistentAML",
                        help="experiment name on Azure")
    # Azure datacenter location
    parser.add_argument("--location",
                        default="EastUS",
                        help="Azure location")
    # github repo, stored in AzureML experiment for info purposes
    parser.add_argument("--reponame",
                        action="store",
                        default="MyGithubRepo",
                        help="GitHub repo being tested")
    # github branch, stored in AzureML experiment for info purposes
    parser.add_argument("--branch",
                        action="store",
                        default="MyGithubBranch",
                        help="Identify the branch the test is run on")
    # github pull request, stored in AzureML experiment for info purposes
    parser.add_argument("--pr",
                        action="store",
                        default="PRTestRun",
                        help="If a pr triggered the test, list it here")

    args = parser.parse_args()
    return args


if __name__ == "__main__":
    logger = logging.getLogger('submit_azureml_pytest.py')
    # logger.setLevel(logging.DEBUG)
    # logging.basicConfig(level=logging.DEBUG)
    args = create_arg_parser()

    if args.dockerproc == "cpu":
        from azureml.core.runconfig import DEFAULT_CPU_IMAGE
        docker_proc_type = DEFAULT_CPU_IMAGE
    else:
        from azureml.core.runconfig import DEFAULT_GPU_IMAGE
        docker_proc_type = DEFAULT_GPU_IMAGE

    cli_auth = AzureCliAuthentication()

    workspace = setup_workspace(workspace_name=args.wsname,
                                subscription_id=args.subid,
                                resource_group=args.rg,
                                cli_auth=cli_auth,
                                location=args.location)

    cpu_cluster = setup_persistent_compute_target(
        workspace=workspace,
        cluster_name=args.clustername,
        vm_size=args.vmsize,
        max_nodes=args.maxnodes)

    run_config = create_run_config(cpu_cluster=cpu_cluster,
                                   docker_proc_type=docker_proc_type,
                                   conda_env_file=args.condafile)

    logger.info('exp: In Azure, look for experiment named {}'.format(
        args.expname))

    # create new or use existing experiment
    experiment = Experiment(workspace=workspace, name=args.expname)
    run = submit_experiment_to_azureml(test=args.test,
                                       test_folder=args.testfolder,
                                       test_markers=args.testmarkers,
                                       junitxml=args.junitxml,
                                       run_config=run_config,
                                       experiment=experiment)

    # add helpful information to experiment on Azure
    run.tag('RepoName', args.reponame)
    run.tag('Branch', args.branch)
    run.tag('PR', args.pr)

    # download files from AzureML
    run.download_files(prefix='reports', output_paths='./reports')
    run.complete()