#!/usr/bin/python
# *****************************************************************************
#
# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements. See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership. The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, either express or implied. See the License for the
# specific language governing permissions and limitations
# under the License.
#
# ******************************************************************************
import logging
import json
import sys
import os
from Crypto.PublicKey import RSA
import dlab.fab
import dlab.actions_lib
import dlab.meta_lib
import traceback
from fabric.api import *
if __name__ == "__main__":
    # Entry point of the notebook provisioning step. It
    #   1. configures file logging from the conf_resource / project_name / request_id
    #      environment variables,
    #   2. builds the `notebook_config` dictionary (names, tags, SSH key, image) from
    #      environment variables and Azure metadata,
    #   3. aborts if the project's edge instance is not in the 'running' state,
    #   4. seeds /root/result.json and runs the common_create_instance script.
    # Every failure path records the error through dlab.fab.append_result and exits
    # with status 1.
    instance_class = 'notebook'
    local_log_filename = "{}_{}_{}.log".format(os.environ['conf_resource'], os.environ['project_name'],
                                               os.environ['request_id'])
    local_log_filepath = "/logs/" + os.environ['conf_resource'] + "/" + local_log_filename
    logging.basicConfig(format='%(levelname)-8s [%(asctime)s] %(message)s',
                        level=logging.DEBUG,
                        filename=local_log_filepath)

    # generating variables dictionary
    try:
        AzureMeta = dlab.meta_lib.AzureMeta()
        AzureActions = dlab.actions_lib.AzureActions()
        notebook_config = dict()
        notebook_config['user_name'] = os.environ['edge_user_name']
        notebook_config['project_name'] = os.environ['project_name']
        notebook_config['project_tag'] = notebook_config['project_name']
        notebook_config['endpoint_name'] = os.environ['endpoint_name']
        notebook_config['endpoint_tag'] = notebook_config['endpoint_name']
        notebook_config['application'] = os.environ['application'].lower()

        print('Generating infrastructure names and tags')
        # exploratory_name is optional; fall back to an empty string when it is not set.
        notebook_config['exploratory_name'] = os.environ.get('exploratory_name', '')
        notebook_config['service_base_name'] = os.environ['conf_service_base_name']
        notebook_config['resource_group_name'] = os.environ['azure_resource_group_name']
        notebook_config['region'] = os.environ['azure_region']
        notebook_config['vpc_name'] = os.environ['azure_vpc_name']
        notebook_config['instance_size'] = os.environ['azure_notebook_instance_size']
        notebook_config['key_name'] = os.environ['conf_key_name']
        notebook_config['instance_name'] = '{}-{}-{}-nb-{}'.format(notebook_config['service_base_name'],
                                                                   notebook_config['project_name'],
                                                                   notebook_config['endpoint_name'],
                                                                   notebook_config['exploratory_name'])
        notebook_config['tags'] = {"Name": notebook_config['instance_name'],
                                   "SBN": notebook_config['service_base_name'],
                                   "User": notebook_config['user_name'],
                                   "project_tag": notebook_config['project_tag'],
                                   "endpoint_tag": notebook_config['endpoint_tag'],
                                   "Exploratory": notebook_config['exploratory_name'],
                                   "product": "dlab"}
        notebook_config['network_interface_name'] = notebook_config['instance_name'] + "-nif"
        notebook_config['security_group_name'] = '{}-{}-{}-nb-sg'.format(notebook_config['service_base_name'],
                                                                         notebook_config['project_name'],
                                                                         notebook_config['endpoint_name'])
        notebook_config['private_subnet_name'] = '{}-{}-{}-subnet'.format(notebook_config['service_base_name'],
                                                                          notebook_config['project_name'],
                                                                          notebook_config['endpoint_name'])

        # Derive the OpenSSH public key from the private key file; the context manager
        # guarantees the file handle is closed even if the key cannot be parsed.
        ssh_key_path = '{}{}.pem'.format(os.environ['conf_key_dir'], os.environ['conf_key_name'])
        with open(ssh_key_path, 'rb') as key_file:
            key = RSA.importKey(key_file.read())
        notebook_config['public_ssh_key'] = key.publickey().exportKey("OpenSSH")

        notebook_config['primary_disk_size'] = '32'
        # 'deeplearning' and 'tensor' applications get Standard_LRS, everything else Premium_LRS.
        notebook_config['instance_storage_account_type'] = (
            'Standard_LRS' if os.environ['application'] in ('deeplearning', 'tensor') else 'Premium_LRS')

        if os.environ['conf_os_family'] == 'debian':
            notebook_config['initial_user'] = 'ubuntu'
            notebook_config['sudo_group'] = 'sudo'
        elif os.environ['conf_os_family'] == 'redhat':
            notebook_config['initial_user'] = 'ec2-user'
            notebook_config['sudo_group'] = 'wheel'

        notebook_config['image_type'] = 'default'
        notebook_config['shared_image_enabled'] = os.environ['conf_shared_image_enabled']
        # The expected image name includes the project name only when shared images are disabled.
        if notebook_config['shared_image_enabled'] == 'false':
            notebook_config['expected_image_name'] = '{0}-{1}-{2}-{3}-notebook-image'.format(
                notebook_config['service_base_name'],
                notebook_config['project_name'],
                notebook_config['endpoint_name'],
                notebook_config['application'])
        else:
            notebook_config['expected_image_name'] = '{0}-{1}-{2}-notebook-image'.format(
                notebook_config['service_base_name'],
                notebook_config['endpoint_name'],
                notebook_config['application'])

        # An explicitly requested image name (set, non-empty and not the literal string 'None')
        # takes precedence over the expected default image name.
        requested_image_name = os.environ.get('notebook_image_name')
        if requested_image_name not in (None, '', 'None'):
            notebook_config['notebook_image_name'] = '{0}-{1}-{2}-{3}-{4}'.format(
                notebook_config['service_base_name'], notebook_config['project_name'],
                notebook_config['endpoint_name'], os.environ['application'],
                os.environ['notebook_image_name']).replace('_', '-')
        else:
            notebook_config['notebook_image_name'] = notebook_config['expected_image_name']

        print('Searching pre-configured images')
        notebook_config['image_name'] = os.environ['azure_{}_image_name'.format(os.environ['conf_os_family'])]
        if AzureMeta.get_image(notebook_config['resource_group_name'], notebook_config['notebook_image_name']):
            notebook_config['image_name'] = notebook_config['notebook_image_name']
            notebook_config['image_type'] = 'pre-configured'
            print('Pre-configured image found. Using: {}'.format(notebook_config['notebook_image_name']))
        else:
            # Publish the fallback image name through the environment as well.
            os.environ['notebook_image_name'] = notebook_config['image_name']
            print('No pre-configured image found. Using default one: {}'.format(notebook_config['image_name']))
    except Exception as err:
        print("Failed to generate variables dictionary.")
        dlab.fab.append_result("Failed to generate variables dictionary.", str(err))
        sys.exit(1)

    # verifying that the edge node of the project is running
    try:
        edge_status = AzureMeta.get_instance_status(notebook_config['resource_group_name'],
                                                    '{0}-{1}-{2}-edge'.format(os.environ['conf_service_base_name'],
                                                                              notebook_config['project_name'],
                                                                              notebook_config['endpoint_name']))
        if edge_status != 'running':
            logging.info('ERROR: Edge node is unavailable! Aborting...')
            print('ERROR: Edge node is unavailable! Aborting...')
            ssn_hostname = AzureMeta.get_private_ip_address(notebook_config['resource_group_name'],
                                                            os.environ['conf_service_base_name'] + '-ssn')
            dlab.fab.put_resource_status('edge', 'Unavailable', os.environ['ssn_dlab_path'],
                                         os.environ['conf_os_user'], ssn_hostname)
            dlab.fab.append_result("Edge node is unavailable")
            # SystemExit is not an Exception subclass, so it passes through the handler below.
            sys.exit(1)
    except Exception as err:
        dlab.fab.append_result("Failed to verify edge status.", str(err))
        sys.exit(1)

    # Seed the result file with the instance name and an empty error field.
    with open('/root/result.json', 'w') as f:
        data = {"notebook_name": notebook_config['instance_name'], "error": ""}
        json.dump(data, f)

    # launching instance for notebook server
    try:
        logging.info('[CREATE NOTEBOOK INSTANCE]')
        print('[CREATE NOTEBOOK INSTANCE]')
        # Adjacent literals (instead of backslash continuations inside one literal) keep
        # the source indentation out of the generated command line.
        params = ("--instance_name {} --instance_size {} --region {} --vpc_name {} --network_interface_name {} "
                  "--security_group_name {} --subnet_name {} --service_base_name {} --resource_group_name {} "
                  "--dlab_ssh_user_name {} --public_ip_name {} --public_key '''{}''' --primary_disk_size {} "
                  "--instance_type {} --project_name {} --instance_storage_account_type {} --image_name {} "
                  "--image_type {} --tags '{}'").format(
            notebook_config['instance_name'], notebook_config['instance_size'], notebook_config['region'],
            notebook_config['vpc_name'], notebook_config['network_interface_name'],
            notebook_config['security_group_name'], notebook_config['private_subnet_name'],
            notebook_config['service_base_name'], notebook_config['resource_group_name'],
            notebook_config['initial_user'], 'None', notebook_config['public_ssh_key'],
            notebook_config['primary_disk_size'], 'notebook', notebook_config['project_name'],
            notebook_config['instance_storage_account_type'], notebook_config['image_name'],
            notebook_config['image_type'], json.dumps(notebook_config['tags']))
        try:
            local("~/scripts/{}.py {}".format('common_create_instance', params))
        except:  # noqa: E722
            # NOTE(review): the catch-all is kept on purpose - presumably fabric's local()
            # aborts with SystemExit on a failed command, which `except Exception` would
            # miss. Confirm against the installed fabric version before narrowing.
            traceback.print_exc()
            # Re-raise with a message so the reason recorded in the result file is not empty.
            raise Exception("common_create_instance script failed; see the traceback in the output")
    except Exception as err:
        # Best-effort cleanup of a possibly half-created instance; a failure here only
        # means there was nothing to remove.
        try:
            AzureActions.remove_instance(notebook_config['resource_group_name'], notebook_config['instance_name'])
        except:  # noqa: E722
            print("The instance hasn't been created.")
        dlab.fab.append_result("Failed to create instance.", str(err))
        sys.exit(1)