From 07a7be29e3bd898dfdfb8ce39dadf7a663fa2fcf Mon Sep 17 00:00:00 2001 From: lcaggio Date: Thu, 19 Jan 2023 00:33:31 +0100 Subject: [PATCH 1/3] Add shared-vpc support on Data Playground blueprint --- .../data-solutions/data-playground/README.md | 17 +++--- .../data-solutions/data-playground/main.tf | 53 +++++++++++++++---- .../data-solutions/data-playground/outputs.tf | 2 +- .../data-playground/variables.tf | 20 +++---- blueprints/data-solutions/main.tf | 10 ++++ modules/project/service-accounts.tf | 1 + .../data_playground/test_plan.py | 2 +- 7 files changed, 77 insertions(+), 28 deletions(-) create mode 100644 blueprints/data-solutions/main.tf diff --git a/blueprints/data-solutions/data-playground/README.md b/blueprints/data-solutions/data-playground/README.md index ecc12973ad..db7d51fce0 100644 --- a/blueprints/data-solutions/data-playground/README.md +++ b/blueprints/data-solutions/data-playground/README.md @@ -12,12 +12,15 @@ This sample creates several distinct groups of resources: - project - networking - - VPC network with a default subnet and CloudNat - - Firewall rules for [SSH access via IAP](https://cloud.google.com/iap/docs/using-tcp-forwarding) and open communication within the VPC - Vertex AI Workbench notebook configured with a private IP and using a dedicated Service Account - One GCS bucket - One BigQuery dataset +## Virtual Private Cloud (VPC) design +As is often the case in real-world configurations, this blueprint accepts as input an existing Shared-VPC via the network_config variable. Make sure that 'container.googleapis.com', 'notebooks.googleapis.com' and 'servicenetworking.googleapis.com' are enabled in the VPC host project. + +If the network_config variable is not provided, a dedicated VPC (with a default subnet, firewall rules and Cloud NAT) will be created in the project.
+ ## Deploy your enviroment We assume the identiy running the following steps has the following role: @@ -47,12 +50,12 @@ You can now connect to the Vertex AI notbook to perform your data analysy. | name | description | type | required | default | |---|---|:---:|:---:|:---:| -| [prefix](variables.tf#L22) | Prefix used for resource names. | string | ✓ | | -| [project_id](variables.tf#L40) | Project id, references existing project if `project_create` is null. | string | ✓ | | +| [prefix](variables.tf#L32) | Prefix used for resource names. | string | ✓ | | +| [project_id](variables.tf#L50) | Project id, references existing project if `project_create` is null. | string | ✓ | | | [location](variables.tf#L16) | The location where resources will be deployed. | string | | "EU" | -| [project_create](variables.tf#L31) | Provide values if project creation is needed, uses existing project if null. Parent format: folders/folder_id or organizations/org_id. | object({…}) | | null | -| [region](variables.tf#L45) | The region where resources will be deployed. | string | | "europe-west1" | -| [vpc_config](variables.tf#L61) | Parameters to create a VPC. | object({…}) | | {…} | +| [network_config](variables.tf#L22) | Shared VPC network configurations to use. If null networks will be created in projects with preconfigured values. | object({…}) | | null | +| [project_create](variables.tf#L41) | Provide values if project creation is needed, uses existing project if null. Parent format: folders/folder_id or organizations/org_id. | object({…}) | | null | +| [region](variables.tf#L55) | The region where resources will be deployed. 
| string | | "europe-west1" | ## Outputs diff --git a/blueprints/data-solutions/data-playground/main.tf b/blueprints/data-solutions/data-playground/main.tf index ff079d5ebc..e164fc998c 100644 --- a/blueprints/data-solutions/data-playground/main.tf +++ b/blueprints/data-solutions/data-playground/main.tf @@ -17,6 +17,19 @@ ############################################################################### locals { service_encryption_keys = var.service_encryption_keys + shared_vpc_project = try(var.network_config.host_project, null) + + subnet = ( + local.use_shared_vpc + ? var.network_config.subnet_self_link + : values(module.vpc.0.subnet_self_links)[0] + ) + vpc = ( + local.use_shared_vpc + ? var.network_config.network_self_link + : module.vpc.0.self_link + ) + use_shared_vpc = var.network_config != null } module "project" { @@ -27,6 +40,7 @@ module "project" { project_create = var.project_create != null prefix = var.project_create == null ? null : var.prefix services = [ + "aiplatform.googleapis.com", "bigquery.googleapis.com", "bigquerystorage.googleapis.com", "bigqueryreservation.googleapis.com", @@ -42,17 +56,26 @@ module "project" { "storage.googleapis.com", "storage-component.googleapis.com" ] + + shared_vpc_service_config = local.shared_vpc_project == null ? 
null : { + attach = true + host_project = local.shared_vpc_project + } + org_policies = { # "constraints/compute.requireOsLogin" = { # enforce = false # } - # Example of applying a project wide policy, mainly useful for Composer + # Example of applying a project wide policy, mainly useful for Composer 1 } service_encryption_key_ids = { compute = [try(local.service_encryption_keys.compute, null)] bq = [try(local.service_encryption_keys.bq, null)] storage = [try(local.service_encryption_keys.storage, null)] } + service_config = { + disable_on_destroy = false, disable_dependent_services = false + } } ############################################################################### @@ -61,11 +84,12 @@ module "project" { module "vpc" { source = "../../../modules/net-vpc" + count = local.use_shared_vpc ? 0 : 1 project_id = module.project.project_id name = "${var.prefix}-vpc" subnets = [ { - ip_cidr_range = var.vpc_config.ip_cidr_range + ip_cidr_range = "10.0.0.0/20" name = "${var.prefix}-subnet" region = var.region } @@ -74,10 +98,11 @@ module "vpc" { module "vpc-firewall" { source = "../../../modules/net-vpc-firewall" + count = local.use_shared_vpc ? 0 : 1 project_id = module.project.project_id - network = module.vpc.name + network = module.vpc.0.name default_rules_config = { - admin_ranges = [var.vpc_config.ip_cidr_range] + admin_ranges = ["10.0.0.0/20"] } ingress_rules = { #TODO Remove and rely on 'ssh' tag once terraform-provider-google/issues/9273 is fixed @@ -92,12 +117,21 @@ module "vpc-firewall" { module "cloudnat" { source = "../../../modules/net-cloudnat" + count = local.use_shared_vpc ? 0 : 1 project_id = module.project.project_id name = "${var.prefix}-default" region = var.region - router_network = module.vpc.name + router_network = module.vpc.0.name } +resource "google_project_iam_member" "shared_vpc" { + count = local.use_shared_vpc ? 
1 : 0 + project = var.network_config.host_project + role = "roles/compute.networkUser" + member = "serviceAccount:${module.project.service_accounts.robots.notebooks}" +} + + ############################################################################### # Storage # ############################################################################### @@ -121,8 +155,6 @@ module "dataset" { ############################################################################### # Vertex AI Notebook # ############################################################################### -# TODO: Add encryption_key to Vertex AI notebooks as well -# TODO: Add shared VPC support module "service-account-notebook" { source = "../../../modules/iam-service-account" @@ -160,11 +192,14 @@ resource "google_notebooks_instance" "playground" { no_public_ip = true no_proxy_access = false - network = module.vpc.network.id - subnet = module.vpc.subnets[format("%s/%s", var.region, "${var.prefix}-subnet")].id + network = local.vpc + subnet = local.subnet service_account = module.service-account-notebook.email #TODO Uncomment once terraform-provider-google/issues/9273 is fixed # tags = ["ssh"] + depends_on = [ + google_project_iam_member.shared_vpc, + ] } diff --git a/blueprints/data-solutions/data-playground/outputs.tf b/blueprints/data-solutions/data-playground/outputs.tf index 4b80c311c5..35f2efeb12 100644 --- a/blueprints/data-solutions/data-playground/outputs.tf +++ b/blueprints/data-solutions/data-playground/outputs.tf @@ -37,5 +37,5 @@ output "project" { output "vpc" { description = "VPC Network." 
- value = module.vpc.name + value = local.vpc } diff --git a/blueprints/data-solutions/data-playground/variables.tf b/blueprints/data-solutions/data-playground/variables.tf index 1735406733..3bd0ca65b1 100644 --- a/blueprints/data-solutions/data-playground/variables.tf +++ b/blueprints/data-solutions/data-playground/variables.tf @@ -19,6 +19,16 @@ variable "location" { default = "EU" } +variable "network_config" { + description = "Shared VPC network configurations to use. If null networks will be created in projects with preconfigured values." + type = object({ + host_project = string + network_self_link = string + subnet_self_link = string + }) + default = null +} + variable "prefix" { description = "Prefix used for resource names." type = string @@ -57,13 +67,3 @@ variable "service_encryption_keys" { # service encription key }) default = null } - -variable "vpc_config" { - description = "Parameters to create a VPC." - type = object({ - ip_cidr_range = string - }) - default = { - ip_cidr_range = "10.0.0.0/20" - } -} diff --git a/blueprints/data-solutions/main.tf b/blueprints/data-solutions/main.tf new file mode 100644 index 0000000000..333b370926 --- /dev/null +++ b/blueprints/data-solutions/main.tf @@ -0,0 +1,10 @@ +module "test" { + source = "./data-playground" + prefix = "plg-202301" + project_id = "cg1-dev-data-cmn-0" + network_config = { + host_project = "cgg-dev-net-spoke-0" + network_self_link = "https://www.googleapis.com/compute/v1/projects/cgg-dev-net-spoke-0/global/networks/dev-spoke-0" + subnet_self_link = "https://www.googleapis.com/compute/v1/projects/cgg-dev-net-spoke-0/regions/europe-west1/subnetworks/dev-dataplatform-ew1" + } +} diff --git a/modules/project/service-accounts.tf b/modules/project/service-accounts.tf index e1f6cb71a5..abf34cae02 100644 --- a/modules/project/service-accounts.tf +++ b/modules/project/service-accounts.tf @@ -45,6 +45,7 @@ locals { # TODO: jit? 
gke-mcs = "service-%s@gcp-sa-mcsd" monitoring-notifications = "service-%s@gcp-sa-monitoring-notification" + notebooks = "service-%s@gcp-sa-notebooks" pubsub = "service-%s@gcp-sa-pubsub" secretmanager = "service-%s@gcp-sa-secretmanager" sql = "service-%s@gcp-sa-cloud-sql" diff --git a/tests/blueprints/data_solutions/data_playground/test_plan.py b/tests/blueprints/data_solutions/data_playground/test_plan.py index a0c3b5e6fe..daaa57fc96 100644 --- a/tests/blueprints/data_solutions/data_playground/test_plan.py +++ b/tests/blueprints/data_solutions/data_playground/test_plan.py @@ -22,4 +22,4 @@ def test_resources(e2e_plan_runner): "Test that plan works and the numbers of resources is as expected." modules, resources = e2e_plan_runner(FIXTURES_DIR) assert len(modules) == 7 - assert len(resources) == 37 + assert len(resources) == 38 From 6477d0790dcd91bd9473049e7f176444972d300f Mon Sep 17 00:00:00 2001 From: lcaggio Date: Thu, 19 Jan 2023 00:39:55 +0100 Subject: [PATCH 2/3] Remove temp file. --- blueprints/data-solutions/main.tf | 10 ---------- 1 file changed, 10 deletions(-) delete mode 100644 blueprints/data-solutions/main.tf diff --git a/blueprints/data-solutions/main.tf b/blueprints/data-solutions/main.tf deleted file mode 100644 index 333b370926..0000000000 --- a/blueprints/data-solutions/main.tf +++ /dev/null @@ -1,10 +0,0 @@ -module "test" { - source = "./data-playground" - prefix = "plg-202301" - project_id = "cg1-dev-data-cmn-0" - network_config = { - host_project = "cgg-dev-net-spoke-0" - network_self_link = "https://www.googleapis.com/compute/v1/projects/cgg-dev-net-spoke-0/global/networks/dev-spoke-0" - subnet_self_link = "https://www.googleapis.com/compute/v1/projects/cgg-dev-net-spoke-0/regions/europe-west1/subnetworks/dev-dataplatform-ew1" - } -} From 3c88aace1a98b7880e91c61ca6d8904867e49def Mon Sep 17 00:00:00 2001 From: lcaggio Date: Thu, 19 Jan 2023 01:04:11 +0100 Subject: [PATCH 3/3] Fix dataflow shared-vpc support --- 
.../data-solutions/data-playground/main.tf | 20 +++++++++++++++++++ 1 file changed, 20 insertions(+) diff --git a/blueprints/data-solutions/data-playground/main.tf b/blueprints/data-solutions/data-playground/main.tf index e164fc998c..b87e8e7301 100644 --- a/blueprints/data-solutions/data-playground/main.tf +++ b/blueprints/data-solutions/data-playground/main.tf @@ -30,6 +30,26 @@ locals { : module.vpc.0.self_link ) use_shared_vpc = var.network_config != null + + shared_vpc_bindings = { + "roles/compute.networkUser" = [ + "robot-df", "notebooks" + ] + } + + shared_vpc_role_members = { + robot-df = "serviceAccount:${module.project.service_accounts.robots.dataflow}" + notebooks = "serviceAccount:${module.project.service_accounts.robots.notebooks}" + } + + # reassemble in a format suitable for for_each + shared_vpc_bindings_map = { + for binding in flatten([ + for role, members in local.shared_vpc_bindings : [ + for member in members : { role = role, member = member } + ] + ]) : "${binding.role}-${binding.member}" => binding + } } module "project" {