infrastructure-provisioning/src/general/scripts/aws/ssn_prepare.py (329 lines of code) (raw):
#!/usr/bin/python3
# *****************************************************************************
#
# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements. See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership. The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, either express or implied. See the License for the
# specific language governing permissions and limitations
# under the License.
#
# ******************************************************************************
import datalab.fab
import datalab.actions_lib
import datalab.meta_lib
from datalab.logger import logging
import json
import os
import sys
import traceback
import subprocess
from fabric import *
def cleanup_aws_resources(tag_name, service_base_name):
try:
params = "--tag_name {} --service_base_name {}".format(tag_name, service_base_name)
subprocess.run("~/scripts/{}.py {}".format('ssn_terminate_aws_resources', params), shell=True, check=True)
except:
traceback.print_exc()
raise Exception
if __name__ == "__main__":
#creating aws config file
try:
logging.info('[CREATE AWS CONFIG FILE]')
if 'aws_access_key' in os.environ and 'aws_secret_access_key' in os.environ:
datalab.actions_lib.create_aws_config_files(generate_full_config=True)
else:
datalab.actions_lib.create_aws_config_files()
except Exception as err:
logging.error('Unable to create configuration')
datalab.fab.append_result("Unable to create configuration", err)
traceback.print_exc()
sys.exit(1)
#deriving variables for ssn node deployment
try:
logging.info('[DERIVING NAMES]')
ssn_conf = dict()
ssn_conf['service_base_name'] = os.environ['conf_service_base_name'] = datalab.fab.replace_multi_symbols(
os.environ['conf_service_base_name'][:20], '-', True)
ssn_conf['role_name'] = '{}-ssn-role'.format(ssn_conf['service_base_name'])
ssn_conf['role_profile_name'] = '{}-ssn-profile'.format(ssn_conf['service_base_name'])
ssn_conf['policy_name'] = '{}-ssn-policy'.format(ssn_conf['service_base_name'])
ssn_conf['tag_name'] = '{}-tag'.format(ssn_conf['service_base_name'])
ssn_conf['tag2_name'] = '{}-secondary-tag'.format(ssn_conf['service_base_name'])
ssn_conf['user_tag'] = "{0}:{0}-ssn-role".format(ssn_conf['service_base_name'])
ssn_conf['instance_name'] = '{}-ssn'.format(ssn_conf['service_base_name'])
ssn_conf['region'] = os.environ['aws_region']
ssn_conf['zone_full'] = os.environ['aws_region'] + os.environ['aws_zone']
ssn_conf['ssn_image_name'] = os.environ['aws_{}_image_name'.format(os.environ['conf_os_family'])]
ssn_conf['ssn_ami_id'] = datalab.meta_lib.get_ami_id(ssn_conf['ssn_image_name'])
ssn_conf['policy_path'] = '/root/files/ssn_policy.json'
ssn_conf['vpc_cidr'] = os.environ['conf_vpc_cidr']
ssn_conf['vpc2_cidr'] = os.environ['conf_vpc2_cidr']
ssn_conf['vpc_name'] = '{}-vpc'.format(ssn_conf['service_base_name'])
ssn_conf['vpc2_name'] = '{}-vpc2'.format(ssn_conf['service_base_name'])
ssn_conf['subnet_name'] = '{}-subnet'.format(ssn_conf['service_base_name'])
ssn_conf['allowed_ip_cidr'] = list()
for cidr in os.environ['conf_allowed_ip_cidr'].split(','):
ssn_conf['allowed_ip_cidr'].append({"CidrIp": cidr.replace(' ','')})
ssn_conf['sg_name'] = '{}-ssn-sg'.format(ssn_conf['service_base_name'])
ssn_conf['network_type'] = os.environ['conf_network_type']
ssn_conf['all_ip_cidr'] = '0.0.0.0/0'
ssn_conf['elastic_ip_name'] = '{0}-ssn-static-ip'.format(ssn_conf['service_base_name'])
ssn_conf['subnet_tag'] = {"Key": ssn_conf['tag_name'], "Value": ssn_conf['subnet_name']}
ssn_conf['allowed_vpc_cidr_ip_ranges'] = list()
except Exception as err:
datalab.fab.append_result("Failed to generate variables dictionary.", str(err))
traceback.print_exc()
sys.exit(1)
#checking sbn for unique value
try:
if datalab.meta_lib.get_instance_by_name(ssn_conf['tag_name'], ssn_conf['instance_name']):
logging.info("Service base name should be unique and less or equal 20 symbols. Please try again.")
sys.exit(1)
except Exception as err:
datalab.fab.append_result("Failed to make predeployment check.", str(err))
logging.error('Error: {0}'.format(err))
traceback.print_exc()
sys.exit(1)
#creating aws vpc
try:
if 'aws_vpc_id' in os.environ and os.environ['aws_vpc_id'] != '':
ssn_conf['aws_vpc_id'] = os.environ['aws_vpc_id']
else:
logging.info('[CREATE VPC AND ROUTE TABLE]')
params = "--vpc {} --region {} --infra_tag_name {} --infra_tag_value {} --vpc_name {}".format(
ssn_conf['vpc_cidr'], ssn_conf['region'], ssn_conf['tag_name'], ssn_conf['service_base_name'],
ssn_conf['vpc_name'])
try:
subprocess.run("~/scripts/{}.py {}".format('ssn_create_vpc', params), shell=True, check=True)
except:
traceback.print_exc()
raise Exception
ssn_conf['aws_vpc_id'] = datalab.meta_lib.get_vpc_by_tag(ssn_conf['tag_name'],
ssn_conf['service_base_name'])
for cidr in datalab.meta_lib.get_vpc_cidr_by_id(ssn_conf['aws_vpc_id']):
ssn_conf['allowed_vpc_cidr_ip_ranges'].append({"CidrIp": cidr})
except Exception as err:
logging.error('Error: {0}'.format(err))
datalab.fab.append_result("Failed to create VPC", str(err))
sys.exit(1)
#creating secondary aws vpc
try:
if os.environ['conf_duo_vpc_enable'] == 'true' and 'aws_vpc2_id' in os.environ \
and os.environ['aws_vpc2_id'] != '':
ssn_conf['aws_vpc2_id'] = os.environ['aws_vpc2_id']
elif os.environ['conf_duo_vpc_enable'] == 'true':
logging.info('[CREATE SECONDARY VPC AND ROUTE TABLE]')
params = "--vpc {} --region {} --infra_tag_name {} --infra_tag_value {} --secondary" \
" --vpc_name {}".format(ssn_conf['vpc2_cidr'], ssn_conf['region'], ssn_conf['tag2_name'],
ssn_conf['service_base_name'], ssn_conf['vpc2_name'])
try:
subprocess.run("~/scripts/{}.py {}".format('ssn_create_vpc', params), shell=True, check=True)
except:
traceback.print_exc()
raise Exception
ssn_conf['aws_vpc2_id'] = datalab.meta_lib.get_vpc_by_tag(ssn_conf['tag2_name'],
ssn_conf['service_base_name'])
except Exception as err:
logging.error('Error: {0}'.format(err))
datalab.fab.append_result("Failed to create secondary VPC", str(err))
cleanup_aws_resources(ssn_conf['tag_name'], ssn_conf['service_base_name'])
sys.exit(1)
#creating subnet
try:
if 'aws_subnet_id' in os.environ and os.environ['aws_subnet_id'] != '':
ssn_conf['aws_subnet_id'] = os.environ['aws_subnet_id']
else:
logging.info('[CREATE SUBNET]')
params = "--vpc_id {0} --username {1} --infra_tag_name {2} --infra_tag_value {3} --prefix {4} " \
"--ssn {5} --zone {6} --subnet_name {7}".format(ssn_conf['aws_vpc_id'], 'ssn',
ssn_conf['tag_name'],
ssn_conf['service_base_name'],
'20', True,
ssn_conf['zone_full'], ssn_conf['subnet_name'])
try:
subprocess.run("~/scripts/{}.py {}".format('common_create_subnet', params), shell=True, check=True)
except:
traceback.print_exc()
raise Exception
ssn_conf['aws_subnet_id'] = datalab.meta_lib.get_subnet_by_tag(ssn_conf['subnet_tag'], True,
ssn_conf['aws_vpc_id'])
datalab.actions_lib.enable_auto_assign_ip(ssn_conf['aws_subnet_id'])
except Exception as err:
logging.error('Error: {0}'.format(err))
datalab.fab.append_result("Failed to create Subnet", str(err))
cleanup_aws_resources(ssn_conf['tag_name'], ssn_conf['service_base_name'])
sys.exit(1)
#creating peering connection
try:
if os.environ['conf_duo_vpc_enable'] == 'true' and ssn_conf['aws_vpc_id'] and ssn_conf['aws_vpc2_id']:
logging.info('[CREATE PEERING CONNECTION]')
ssn_conf['aws_peering_id'] = datalab.actions_lib.create_peering_connection(
ssn_conf['aws_vpc_id'], ssn_conf['aws_vpc2_id'], ssn_conf['service_base_name'])
logging.info('PEERING CONNECTION ID:' + ssn_conf['aws_peering_id'])
datalab.actions_lib.create_route_by_id(ssn_conf['aws_subnet_id'], ssn_conf['aws_vpc_id'],
ssn_conf['aws_peering_id'],
datalab.meta_lib.get_cidr_by_vpc(ssn_conf['aws_vpc2_id']))
except Exception as err:
logging.error('Error: {0}'.format(err))
datalab.fab.append_result("Failed to create peering connection", str(err))
cleanup_aws_resources(ssn_conf['tag_name'], ssn_conf['service_base_name'])
sys.exit(1)
#creating security groups
try:
if 'aws_security_groups_ids' in os.environ and os.environ['aws_security_groups_ids'] != '':
ssn_conf['aws_security_groups_ids'] = os.environ['aws_security_groups_ids']
else:
logging.info('[CREATE SG FOR SSN]')
ssn_conf['ingress_sg_rules_template'] = datalab.meta_lib.format_sg([
{
"PrefixListIds": [],
"FromPort": 80,
"IpRanges": ssn_conf['allowed_ip_cidr'],
"ToPort": 80, "IpProtocol": "tcp", "UserIdGroupPairs": []
},
{
"PrefixListIds": [],
"FromPort": 22,
"IpRanges": ssn_conf['allowed_ip_cidr'],
"ToPort": 22, "IpProtocol": "tcp", "UserIdGroupPairs": []
},
{
"PrefixListIds": [],
"FromPort": 443,
"IpRanges": ssn_conf['allowed_ip_cidr'],
"ToPort": 443, "IpProtocol": "tcp", "UserIdGroupPairs": []
},
{
"PrefixListIds": [],
"FromPort": -1,
"IpRanges": ssn_conf['allowed_ip_cidr'],
"ToPort": -1, "IpProtocol": "icmp", "UserIdGroupPairs": []
},
{
"PrefixListIds": [],
"FromPort": 80,
"IpRanges": ssn_conf['allowed_vpc_cidr_ip_ranges'],
"ToPort": 80, "IpProtocol": "tcp", "UserIdGroupPairs": []
},
{
"PrefixListIds": [],
"FromPort": 443,
"IpRanges": ssn_conf['allowed_vpc_cidr_ip_ranges'],
"ToPort": 443, "IpProtocol": "tcp", "UserIdGroupPairs": []
}
])
egress_sg_rules_template = datalab.meta_lib.format_sg([
{"IpProtocol": "-1", "IpRanges": [{"CidrIp": ssn_conf['all_ip_cidr']}], "UserIdGroupPairs": [],
"PrefixListIds": []}
])
params = "--name {} --vpc_id {} --security_group_rules '{}' --egress '{}' --infra_tag_name {} " \
"--infra_tag_value {} --force {} --ssn {}". \
format(ssn_conf['sg_name'], ssn_conf['aws_vpc_id'],
json.dumps(ssn_conf['ingress_sg_rules_template']), json.dumps(egress_sg_rules_template),
ssn_conf['service_base_name'], ssn_conf['tag_name'], False, True)
try:
subprocess.run("~/scripts/{}.py {}".format('common_create_security_group', params), shell=True, check=True)
except:
traceback.print_exc()
raise Exception
ssn_conf['aws_security_groups_ids'] = datalab.meta_lib.get_security_group_by_name(ssn_conf['sg_name'])
except Exception as err:
logging.error('Error: {0}'.format(err))
datalab.fab.append_result("Failed to create security group for SSN", str(err))
cleanup_aws_resources(ssn_conf['tag_name'], ssn_conf['service_base_name'])
sys.exit(1)
#creating roles
try:
if 'aws_ssn_instance_role' in os.environ and os.environ['aws_ssn_instance_role'] != '':
logging.info('[USING PREDEFINED ROLE]')
ssn_conf['role_name'] = os.environ['aws_ssn_instance_role']
ssn_conf['role_profile_name'] = os.environ['aws_ssn_instance_role']
else:
logging.info('[CREATE ROLES]')
params = "--role_name {} --role_profile_name {} --policy_name {} --policy_file_name {} --region {} " \
"--infra_tag_name {} --infra_tag_value {} --user_tag_value {}". \
format(ssn_conf['role_name'], ssn_conf['role_profile_name'], ssn_conf['policy_name'],
ssn_conf['policy_path'], ssn_conf['region'], ssn_conf['tag_name'],
ssn_conf['service_base_name'], ssn_conf['user_tag'])
if 'aws_permissions_boundary_arn' in os.environ:
params = '{} --permissions_boundary_arn {}'.format(params, os.environ['aws_permissions_boundary_arn'])
try:
subprocess.run("~/scripts/{}.py {}".format('common_create_role_policy', params), shell=True, check=True)
except:
traceback.print_exc()
raise Exception
except Exception as err:
logging.error('Error: {0}'.format(err))
datalab.fab.append_result("Failed to create roles", str(err))
cleanup_aws_resources(ssn_conf['tag_name'], ssn_conf['service_base_name'])
sys.exit(1)
#creating endpoint and rout-table
try:
logging.info('[CREATE ENDPOINT AND ROUTE-TABLE]')
params = "--vpc_id {} --region {} --infra_tag_name {} --infra_tag_value {}".format(
ssn_conf['aws_vpc_id'], ssn_conf['region'], ssn_conf['tag_name'], ssn_conf['service_base_name'])
try:
subprocess.run("~/scripts/{}.py {}".format('ssn_create_endpoint', params), shell=True, check=True)
except:
traceback.print_exc()
raise Exception
except Exception as err:
logging.error('Error: {0}'.format(err))
datalab.fab.append_result("Failed to create endpoint", str(err))
cleanup_aws_resources(ssn_conf['tag_name'], ssn_conf['service_base_name'])
sys.exit(1)
# creating endpoint and rout-table notebook vpc
try:
if os.environ['conf_duo_vpc_enable'] == 'true':
logging.info('[CREATE ENDPOINT AND ROUTE-TABLE FOR NOTEBOOK VPC]')
params = "--vpc_id {} --region {} --infra_tag_name {} --infra_tag_value {}".format(
ssn_conf['aws_vpc2_id'], ssn_conf['aws_region'], ssn_conf['tag2_name'],
ssn_conf['service_base_name'])
try:
subprocess.run("~/scripts/{}.py {}".format('ssn_create_endpoint', params), shell=True, check=True)
except:
traceback.print_exc()
raise Exception
except Exception as err:
logging.error('Error: {0}'.format(err))
datalab.fab.append_result("Failed to create secondary endpoint", str(err))
cleanup_aws_resources(ssn_conf['tag_name'], ssn_conf['service_base_name'])
sys.exit(1)
#creating ssn instance
try:
logging.info('[CREATE SSN INSTANCE]')
params = "--node_name {0} --ami_id {1} --instance_type {2} --key_name {3} --security_group_ids {4} " \
"--subnet_id {5} --iam_profile {6} --infra_tag_name {7} --infra_tag_value {8} --instance_class {9} " \
"--primary_disk_size {10}".\
format(ssn_conf['instance_name'], ssn_conf['ssn_ami_id'], os.environ['aws_ssn_instance_size'],
os.environ['conf_key_name'], ssn_conf['aws_security_groups_ids'], ssn_conf['aws_subnet_id'],
ssn_conf['role_profile_name'], ssn_conf['tag_name'], ssn_conf['instance_name'], 'ssn', '20')
try:
subprocess.run("~/scripts/{}.py {}".format('common_create_instance', params), shell=True, check=True)
except:
traceback.print_exc()
raise Exception
except Exception as err:
logging.error('Error: {0}'.format(err))
datalab.fab.append_result("Failed to create ssn instance", str(err))
cleanup_aws_resources(ssn_conf['tag_name'], ssn_conf['service_base_name'])
sys.exit(1)
#associating elastic ip
try:
if ssn_conf['network_type'] == 'public':
logging.info('[ASSOCIATING ELASTIC IP]')
ssn_conf['ssn_id'] = datalab.meta_lib.get_instance_by_name(ssn_conf['tag_name'], ssn_conf['instance_name'])
try:
ssn_conf['elastic_ip'] = os.environ['ssn_elastic_ip']
except:
ssn_conf['elastic_ip'] = 'None'
params = "--elastic_ip {} --ssn_id {} --infra_tag_name {} --infra_tag_value {}".format(
ssn_conf['elastic_ip'], ssn_conf['ssn_id'], ssn_conf['tag_name'], ssn_conf['elastic_ip_name'])
try:
subprocess.run("~/scripts/{}.py {}".format('ssn_associate_elastic_ip', params), shell=True, check=True)
except:
traceback.print_exc()
raise Exception
except Exception as err:
logging.error('Error: {0}'.format(err))
datalab.fab.append_result("Failed to create elastic ip", str(err))
cleanup_aws_resources(ssn_conf['tag_name'], ssn_conf['service_base_name'])
sys.exit(1)
#creating route53 records
try:
if 'ssn_hosted_zone_id' in os.environ and 'ssn_hosted_zone_name' in os.environ and 'ssn_subdomain' in os.environ:
if ssn_conf['network_type'] == 'private':
ssn_conf['instance_ip'] = datalab.meta_lib.get_instance_ip_address(ssn_conf['tag_name'],
ssn_conf['instance_name']).get('Private')
else:
ssn_conf['instance_ip'] = datalab.meta_lib.get_instance_ip_address(ssn_conf['tag_name'],
ssn_conf['instance_name']).get('Public')
logging.info('[CREATING ROUTE53 RECORD]')
try:
datalab.actions_lib.create_route_53_record(os.environ['ssn_hosted_zone_id'],
os.environ['ssn_hosted_zone_name'],
os.environ['ssn_subdomain'], ssn_conf['instance_ip'])
except:
traceback.print_exc()
raise Exception
except Exception as err:
logging.error('Error: {0}'.format(err))
datalab.fab.append_result("Failed to create route53 record", str(err))
cleanup_aws_resources(ssn_conf['tag_name'], ssn_conf['service_base_name'])
sys.exit(1)