update cluster creation

2019-06-13 12:14:58 -04:00
parent daf27a76e4
commit de162316d7
29 changed files with 682 additions and 204 deletions
--- a/tutorials/img-classification-part1-training.ipynb
+++ b/tutorials/img-classification-part1-training.ipynb
@@ -126,7 +126,9 @@
      "metadata": {},
      "source": [
        "### Create or Attach existing compute resource\n",
-        "By using Azure Machine Learning Compute, a managed service, data scientists can train machine learning models on clusters of Azure virtual machines. Examples include VMs with GPU support. In this tutorial, you use default Azure Machine Learning Compute as your training environment."
+        "By using Azure Machine Learning Compute, a managed service, data scientists can train machine learning models on clusters of Azure virtual machines. Examples include VMs with GPU support. In this tutorial, you create Azure Machine Learning Compute as your training environment. The code below creates the compute cluster for you if it doesn't already exist in your workspace.\n",
+        "\n",
+        "**Creation of compute takes approximately 5 minutes.** If an AmlCompute with that name is already in your workspace, the code skips the creation process."
      ]
    },
    {
@@ -140,10 +142,38 @@
      },
      "outputs": [],
      "source": [
+        "from azureml.core.compute import AmlCompute\n",
+        "from azureml.core.compute import ComputeTarget\n",
        "import os\n",
        "\n",
-        "cluster_type = os.environ.get(\"AML_COMPUTE_CLUSTER_TYPE\", \"CPU\")\n",
-        "compute_target = ws.get_default_compute_target(cluster_type)"
+        "# choose a name for your cluster\n",
+        "compute_name = os.environ.get(\"AML_COMPUTE_CLUSTER_NAME\", \"cpu-cluster\")\n",
+        "compute_min_nodes = os.environ.get(\"AML_COMPUTE_CLUSTER_MIN_NODES\", 0)\n",
+        "compute_max_nodes = os.environ.get(\"AML_COMPUTE_CLUSTER_MAX_NODES\", 4)\n",
+        "\n",
+        "# This example uses a CPU VM. To use a GPU VM, set the SKU to STANDARD_NC6\n",
+        "vm_size = os.environ.get(\"AML_COMPUTE_CLUSTER_SKU\", \"STANDARD_D2_V2\")\n",
+        "\n",
+        "\n",
+        "if compute_name in ws.compute_targets:\n",
+        "    compute_target = ws.compute_targets[compute_name]\n",
+        "    if compute_target and type(compute_target) is AmlCompute:\n",
+        "        print('found compute target. just use it. ' + compute_name)\n",
+        "else:\n",
+        "    print('creating a new compute target...')\n",
+        "    provisioning_config = AmlCompute.provisioning_configuration(vm_size = vm_size,\n",
+        "                                                                min_nodes = compute_min_nodes, \n",
+        "                                                                max_nodes = compute_max_nodes)\n",
+        "\n",
+        "    # create the cluster\n",
+        "    compute_target = ComputeTarget.create(ws, compute_name, provisioning_config)\n",
+        "    \n",
+        "    # can poll for a minimum number of nodes and for a specific timeout. \n",
+        "    # if no min node count is provided it will use the scale settings for the cluster\n",
+        "    compute_target.wait_for_completion(show_output=True, min_node_count=None, timeout_in_minutes=20)\n",
+        "    \n",
+        "    # For a more detailed view of current AmlCompute status, use get_status()\n",
+        "    print(compute_target.get_status().serialize())"
      ]
    },
    {
@@ -324,8 +354,8 @@
        "# get hold of the current run\n",
        "run = Run.get_context()\n",
        "\n",
-        "print('Train a logistic regression model with regularizaion rate of', args.reg)\n",
-        "clf = LogisticRegression(C=1.0/args.reg, random_state=42)\n",
+        "print('Train a logistic regression model with regularization rate of', args.reg)\n",
+        "clf = LogisticRegression(C=1.0/args.reg, solver=\"liblinear\", multi_class=\"auto\", random_state=42)\n",
        "clf.fit(X_train, y_train)\n",
        "\n",
        "print('Predict the test set')\n",
@@ -386,14 +416,13 @@
      "source": [
        "### Create an estimator\n",
        "\n",
-        "An estimator object is used to submit the run.  Create your estimator by running the following code to define:\n",
+        "An estimator object is used to submit the run. Azure Machine Learning has pre-configured estimators for common machine learning frameworks, as well as a generic Estimator. Create an SKLearn estimator for the scikit-learn model by specifying:\n",
        "\n",
        "* The name of the estimator object, `est`\n",
        "* The directory that contains your scripts. All the files in this directory are uploaded into the cluster nodes for execution. \n",
        "* The compute target.  In this case you will use the AmlCompute you created\n",
        "* The training script name, train.py\n",
        "* Parameters required from the training script \n",
-        "* Python packages needed for training\n",
        "\n",
        "In this tutorial, this target is AmlCompute. All files in the script folder are uploaded into the cluster nodes for execution. The data_folder is set to use the datastore (`ds.path('mnist').as_mount()`)."
      ]
@@ -408,18 +437,17 @@
      },
      "outputs": [],
      "source": [
-        "from azureml.train.estimator import Estimator\n",
+        "from azureml.train.sklearn import SKLearn\n",
        "\n",
        "script_params = {\n",
        "    '--data-folder': ds.path('mnist').as_mount(),\n",
-        "    '--regularization': 0.05\n",
+        "    '--regularization': 0.5\n",
        "}\n",
        "\n",
-        "est = Estimator(source_directory=script_folder,\n",
+        "est = SKLearn(source_directory=script_folder,\n",
        "                script_params=script_params,\n",
        "                compute_target=compute_target,\n",
-        "                entry_script='train.py',\n",
-        "                conda_packages=['scikit-learn'])"
+        "                entry_script='train.py')"
      ]
    },
    {
@@ -646,18 +674,6 @@
      "language": "python",
      "name": "python36"
    },
-    "language_info": {
-      "codemirror_mode": {
-        "name": "ipython",
-        "version": 3
-      },
-      "file_extension": ".py",
-      "mimetype": "text/x-python",
-      "name": "python",
-      "nbconvert_exporter": "python",
-      "pygments_lexer": "ipython3",
-      "version": "3.6.8"
-    },
    "msauthor": "roastala"
  },
  "nbformat": 4,