
Feature: on node user creation #303

Merged: 14 commits, Jan 27, 2018 (changes shown from 12 commits)
11 changes: 10 additions & 1 deletion aztk/models.py
@@ -23,6 +23,13 @@ def __init__(self, name: str = None, script: str = None, run_on=None):
self.run_on = run_on


class UserConfiguration:
def __init__(self, username: str, ssh_key: str = None, password: str = None):
Contributor:
Will this get auto-populated from the user's secrets.yaml?

Member Author:
On the CLI, yeah -- that happens here:
https://github.com/jafreck/aztk/blob/06f85c2538db98e168fed8c38fe9b88524f95e5f/cli/spark/endpoints/cluster/cluster_create.py#L87

For the SDK, no the secrets.yaml file is not used at all.

self.username = username
self.ssh_key = ssh_key
self.password = password


class ClusterConfiguration:
def __init__(
self,
@@ -33,7 +40,8 @@ def __init__(
vm_low_pri_count=None,
vm_size=None,
subnet_id=None,
docker_repo: str=None):
docker_repo: str = None,
user_configuration: UserConfiguration = None):

self.custom_scripts = custom_scripts
self.file_shares = file_shares
@@ -43,6 +51,7 @@ def __init__(
self.vm_low_pri_count = vm_low_pri_count
self.subnet_id = subnet_id
self.docker_repo = docker_repo
self.user_configuration = user_configuration


class RemoteLogin:
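To illustrate the new model, here is a minimal SDK-side sketch. The class and parameter names come from this diff; the values and the `aztk.spark.models` import path are illustrative, and secrets setup is elided:

```python
import aztk.spark

# Attach a user to the cluster configuration so it is created on each node
# at provisioning time, rather than via a separate create_user() call later.
user_conf = aztk.spark.models.UserConfiguration(
    username="spark",
    ssh_key="ssh-rsa AAAA...",  # or password="..." -- one of the two
)

cluster_conf = aztk.spark.models.ClusterConfiguration(
    cluster_id="my-cluster",
    vm_count=2,
    vm_size="standard_d2_v2",
    user_configuration=user_conf,
)
```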
15 changes: 12 additions & 3 deletions aztk/spark/client.py
@@ -10,6 +10,7 @@
from aztk.spark.helpers import job_submission as job_submit_helper
from aztk.spark.helpers import get_log as get_log_helper
from aztk.spark.utils import upload_node_scripts, util
import yaml


class Client(BaseClient):
@@ -21,10 +22,18 @@ def __init__(self, secrets_config):
'''
def create_cluster(self, cluster_conf: models.ClusterConfiguration, wait: bool = False):
try:
if cluster_conf.user_configuration:
user_conf = yaml.dump({'username': cluster_conf.user_configuration.username,
'password': cluster_conf.user_configuration.password,
Contributor:
We may want to omit password until we support encryption.

Member Author:
If we disable password here, that means we would no longer support adding a user with a password at cluster creation time. That's a potentially breaking change, so maybe this PR should wait for or include the encryption feature.

Member Author (@jafreck, Dec 24, 2017):
If the goal is just to not have the password in cleartext in user.yaml, we could also hash it, and create the user using the hash.

That would break ssh'ing outside of AZTK, though.

'ssh-key': cluster_conf.user_configuration.ssh_key,
'cluster_id': cluster_conf.cluster_id})
else:
user_conf = None
zip_resource_files = upload_node_scripts.zip_scripts(self.blob_client,
cluster_conf.cluster_id,
cluster_conf.custom_scripts,
cluster_conf.spark_configuration)
cluster_conf.spark_configuration,
user_conf)

start_task = create_cluster_helper.generate_cluster_start_task(self,
zip_resource_files,
@@ -137,7 +146,7 @@ def get_application_status(self, cluster_id: str, app_name: str):
return task.state._value_
except batch_error.BatchErrorException as e:
raise error.AztkError(helpers.format_batch_exception(e))

'''
job submission
'''
@@ -180,7 +189,7 @@ def submit_job(self, job_configuration):
else:
raise error.AztkError("Jobs do not support both dedicated and low priority nodes." \
" JobConfiguration fields max_dedicated_nodes and max_low_pri_nodes are mutually exclusive values.")

job = self.__submit_job(
job_configuration=job_configuration,
start_task=start_task,
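The client dumps the user configuration to YAML before zipping it into the node scripts. A standalone sketch of that serialization (field names taken from the diff above; values illustrative):

```python
import yaml

user_conf = yaml.dump({
    'username': 'spark',
    'password': None,  # cleartext today -- see the encryption discussion above
    'ssh-key': 'ssh-rsa AAAA...',
    'cluster_id': 'my-cluster',
})
print(user_conf)
# cluster_id: my-cluster
# password: null
# ssh-key: ssh-rsa AAAA...
# username: spark
```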
26 changes: 16 additions & 10 deletions aztk/spark/models.py
@@ -62,6 +62,10 @@ class FileShare(aztk.models.FileShare):
pass


class UserConfiguration(aztk.models.UserConfiguration):
pass


class ClusterConfiguration(aztk.models.ClusterConfiguration):
def __init__(
self,
@@ -72,17 +76,19 @@ def __init__(
vm_low_pri_count=None,
vm_size=None,
subnet_id=None,
docker_repo: str=None,
spark_configuration: SparkConfiguration = None):
docker_repo: str = None,
spark_configuration: SparkConfiguration = None,
user_configuration: UserConfiguration = None):
super().__init__(custom_scripts=custom_scripts,
cluster_id=cluster_id,
vm_count=vm_count,
vm_low_pri_count=vm_low_pri_count,
vm_size=vm_size,
docker_repo=docker_repo,
subnet_id=subnet_id,
file_shares=file_shares
)
cluster_id=cluster_id,
vm_count=vm_count,
vm_low_pri_count=vm_low_pri_count,
vm_size=vm_size,
docker_repo=docker_repo,
subnet_id=subnet_id,
file_shares=file_shares,
user_configuration=user_configuration
)
self.spark_configuration = spark_configuration
self.gpu_enabled = helpers.is_gpu_enabled(vm_size)

6 changes: 5 additions & 1 deletion aztk/spark/utils/upload_node_scripts.py
@@ -101,7 +101,7 @@ def __add_str_to_zip(zipf, payload, zipf_file_path=None):
zipf.writestr(zipf_file_path, payload)
return zipf

def zip_scripts(blob_client, container_id, custom_scripts, spark_configuration):
def zip_scripts(blob_client, container_id, custom_scripts, spark_configuration, user_conf=None):
zipf = __create_zip()
if custom_scripts:
zipf = __add_custom_scripts(zipf, custom_scripts)
@@ -117,8 +117,12 @@ def zip_scripts(blob_client, container_id, custom_scripts, spark_configuration):
for jar in spark_configuration.jars:
zipf = __add_file_to_zip(zipf, jar, 'jars', binary=True)

if user_conf:
zipf = __add_str_to_zip(zipf, user_conf, 'user.yaml')
Contributor:
Why __add_str_to_zip? Isn't this a file?

Member Author:
The user_conf is a byte string that is written to a file in node_scripts called user.yaml. user.yaml is not a file on the client.

__add_str_to_zip() is probably not the best name for what this method does, though.


# add helper file to node_scripts/submit/
zip_file_to_dir(file=os.path.join(constants.ROOT_PATH, 'aztk', 'utils', 'command_builder.py'), directory='', zipf=zipf, binary=False)

zipf.close()

return __upload(blob_client, container_id)
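To clarify the naming discussion above: `zipfile.ZipFile.writestr` (which `__add_str_to_zip` wraps) writes an in-memory string or bytes payload into the archive under a given path, so `user.yaml` never exists as a file on the client. A minimal sketch:

```python
import zipfile

with zipfile.ZipFile('node_scripts.zip', 'w') as zipf:
    # The payload exists only in memory; 'user.yaml' is created inside the
    # archive and later extracted on the node under $DOCKER_WORKING_DIR.
    zipf.writestr('user.yaml', 'username: spark\n')
```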
4 changes: 0 additions & 4 deletions cli/config.py
@@ -224,10 +224,6 @@ def merge(self, uid, username, size, size_low_pri, vm_size, subnet_id, password,
raise aztk.error.AztkError(
"Please supply a value for wait in either the cluster.yaml configuration file or with a parameter (--wait or --no-wait)")

if self.username is not None and self.wait is False:
raise aztk.error.AztkError(
"You cannot create a user '{0}' if wait is set to false. By default, we create a user in the cluster.yaml file. Please either the configure your cluster.yaml file or set the parameter (--wait)".format(self.username))


class SshConfig:

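The check removed above is the crux of this PR: since the user is now created by the node itself during setup, the CLI no longer has to stay attached to add it, so an invocation along the lines of `aztk spark cluster create --id my-cluster --username spark --no-wait` (flag names assumed from the surrounding CLI) becomes valid.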
40 changes: 19 additions & 21 deletions cli/spark/endpoints/cluster/cluster_create.py
@@ -53,13 +53,6 @@ def execute(args: typing.NamedTuple):
password=args.password,
docker_repo=args.docker_repo)

print_cluster_conf(cluster_conf)

spinner = utils.Spinner()

log.info("Please wait while your cluster is being provisioned")
spinner.start()

if cluster_conf.custom_scripts:
custom_scripts = []
for custom_script in cluster_conf.custom_scripts:
@@ -86,6 +79,23 @@
else:
file_shares = None

if cluster_conf.username:
ssh_key, password = utils.get_ssh_key_or_prompt(spark_client.secrets_config.ssh_pub_key,
cluster_conf.username,
cluster_conf.password,
spark_client.secrets_config)
user_conf = aztk.spark.models.UserConfiguration(
username=cluster_conf.username,
password=password,
ssh_key=ssh_key
)
else:
user_conf = None

print_cluster_conf(cluster_conf)
spinner = utils.Spinner()
spinner.start()

# create spark cluster
cluster = spark_client.create_cluster(
aztk.spark.models.ClusterConfiguration(
@@ -97,24 +107,12 @@
custom_scripts=custom_scripts,
file_shares=file_shares,
docker_repo=cluster_conf.docker_repo,
spark_configuration=load_aztk_spark_config()
spark_configuration=load_aztk_spark_config(),
user_configuration=user_conf
),
wait=cluster_conf.wait
)

if cluster_conf.username:
ssh_key = spark_client.secrets_config.ssh_pub_key

ssh_key, password = utils.get_ssh_key_or_prompt(
ssh_key, cluster_conf.username, cluster_conf.password, spark_client.secrets_config)

spark_client.create_user(
cluster_id=cluster_conf.uid,
username=cluster_conf.username,
password=password,
ssh_key=ssh_key
)

spinner.stop()

if cluster_conf.wait:
7 changes: 3 additions & 4 deletions config/cluster.yaml
@@ -24,9 +24,8 @@ docker_repo: aztk/base:spark2.2.0
# - script: <./relative/path/to/other/script.sh or ./relative/path/to/other/script/directory/>
# runOn: <master/worker/all-nodes>

# To add your cluster to a virtual network, provide the full ARM resource id below
# subnet_id: /subscriptions/********-****-****-****-************/resourceGroups/********/providers/Microsoft.Network/virtualNetworks/*******/subnets/******

# wait: <true/false>
wait: true

# To add your cluster to a virtual network, provide the full ARM resource id below
# subnet_id:
wait: false
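Note that the shipped default flips from `wait: true` to `wait: false`, presumably because on-node user creation removes the main reason the CLI previously had to wait for the cluster.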
33 changes: 33 additions & 0 deletions node_scripts/install/create_user.py
@@ -0,0 +1,33 @@
import os
import yaml
import azure.batch.models as batch_models
import azure.batch.models.batch_error as batch_error
from datetime import datetime, timezone, timedelta
'''
Creates a user if the user configuration file at $DOCKER_WORKING_DIR/user.yaml exists
'''

def create_user(batch_client):
path = os.path.join(os.environ['DOCKER_WORKING_DIR'], "user.yaml")

if not os.path.isfile(path):
print("No user to create.")
return

with open(path) as file:
user_conf = yaml.load(file.read())

try:
batch_client.compute_node.add_user(
pool_id=os.environ['AZ_BATCH_POOL_ID'],
node_id=os.environ['AZ_BATCH_NODE_ID'],
user=batch_models.ComputeNodeUser(
name=user_conf['username'],
is_admin=True,
password=user_conf['password'],
ssh_public_key=str(user_conf['ssh-key']),
expiry_time=datetime.now(timezone.utc) + timedelta(days=365)
)
)
except batch_error.BatchErrorException as e:
print(e)
4 changes: 3 additions & 1 deletion node_scripts/install/install.py
@@ -1,11 +1,13 @@
import os
from core import config
from install import pick_master, spark, scripts
from install import pick_master, spark, scripts, create_user


def setup_node():
client = config.batch_client

create_user.create_user(batch_client=client)

spark.setup_conf()

is_master = pick_master.find_master(client)