Skip to content

Commit

Permalink
Adding gke-ml-dev cluster to the dev environment.
Browse files Browse the repository at this point in the history
  • Loading branch information
arueth committed Mar 6, 2024
1 parent 9f9cad4 commit 5db975f
Show file tree
Hide file tree
Showing 6 changed files with 179 additions and 4 deletions.
2 changes: 1 addition & 1 deletion ml-platform/02_gke/backend.tf
Original file line number Diff line number Diff line change
Expand Up @@ -15,6 +15,6 @@
terraform {
backend "gcs" {
prefix = "02_gke"
bucket = "YOUR_STATE_BUCKET"
bucket = "rueth-prod-mlp"
}
}
3 changes: 2 additions & 1 deletion ml-platform/02_gke/main.tf
Original file line number Diff line number Diff line change
Expand Up @@ -61,6 +61,7 @@ module "gke" {
depends_on = [google_gke_hub_feature.configmanagement_acm_feature]
env = each.key
}

module "reservation" {
for_each = local.parsed_project_id
source = "./modules/vm-reservations"
Expand All @@ -69,6 +70,7 @@ module "reservation" {
project_id = each.value
depends_on = [module.gke]
}

module "node_pool-reserved" {
for_each = local.parsed_project_id
source = "./modules/node-pools"
Expand Down Expand Up @@ -101,7 +103,6 @@ module "node_pool-spot" {
region = var.subnet_01_region
taints = var.spot_taints
resource_type = "spot"

}

module "cloud-nat" {
Expand Down
76 changes: 76 additions & 0 deletions ml-platform/02_gke/project.tf
Original file line number Diff line number Diff line change
@@ -0,0 +1,76 @@
# Copyright 2024 Google LLC
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

# Enable the Anthos API (anthos.googleapis.com) once per entry in
# local.parsed_project_id; each.value is used as the target project ID.
resource "google_project_service" "anthos_googleapis_com" {
  for_each = local.parsed_project_id

  service = "anthos.googleapis.com"
  project = each.value

  # Leave the API enabled when this resource is destroyed.
  disable_on_destroy         = false
  disable_dependent_services = true
}

# Enable the Anthos Config Management API (anthosconfigmanagement.googleapis.com)
# once per entry in local.parsed_project_id; each.value is used as the target
# project ID.
resource "google_project_service" "anthosconfigmanagement_googleapis_com" {
  for_each = local.parsed_project_id

  service = "anthosconfigmanagement.googleapis.com"
  project = each.value

  # Leave the API enabled when this resource is destroyed.
  disable_on_destroy         = false
  disable_dependent_services = true
}

# Enable the Cloud Resource Manager API (cloudresourcemanager.googleapis.com)
# once per entry in local.parsed_project_id; each.value is used as the target
# project ID.
resource "google_project_service" "cloudresourcemanager_googleapis_com" {
  for_each = local.parsed_project_id

  disable_dependent_services = true
  # Leave the API enabled when this resource is destroyed.
  disable_on_destroy = false
  # Fixed: was `each.valuecd` (stray characters), which is not a valid
  # attribute of the `each` object and fails validation.
  project = each.value
  service = "cloudresourcemanager.googleapis.com"
}

# Enable the Compute Engine API (compute.googleapis.com) once per entry in
# local.parsed_project_id; each.value is used as the target project ID.
resource "google_project_service" "compute_googleapis_com" {
  for_each = local.parsed_project_id

  service = "compute.googleapis.com"
  project = each.value

  # Leave the API enabled when this resource is destroyed.
  disable_on_destroy         = false
  disable_dependent_services = true
}

# Enable the Kubernetes Engine API (container.googleapis.com) once per entry in
# local.parsed_project_id; each.value is used as the target project ID.
resource "google_project_service" "container_googleapis_com" {
  for_each = local.parsed_project_id

  service = "container.googleapis.com"
  project = each.value

  # Leave the API enabled when this resource is destroyed.
  disable_on_destroy         = false
  disable_dependent_services = true
}

# Enable the GKE Hub API (gkehub.googleapis.com) once per entry in
# local.parsed_project_id; each.value is used as the target project ID.
resource "google_project_service" "gkehub_googleapis_com" {
  for_each = local.parsed_project_id

  service = "gkehub.googleapis.com"
  project = each.value

  # Leave the API enabled when this resource is destroyed.
  disable_on_destroy         = false
  disable_dependent_services = true
}

# Enable the IAM API (iam.googleapis.com) once per entry in
# local.parsed_project_id; each.value is used as the target project ID.
resource "google_project_service" "iam_googleapis_com" {
  for_each = local.parsed_project_id

  service = "iam.googleapis.com"
  project = each.value

  # Leave the API enabled when this resource is destroyed.
  disable_on_destroy         = false
  disable_dependent_services = true
}
2 changes: 1 addition & 1 deletion ml-platform/03_configsync/backend.tf
Original file line number Diff line number Diff line change
Expand Up @@ -15,6 +15,6 @@
terraform {
backend "gcs" {
prefix = "03_config_sync_prerequisite"
bucket = "YOUR_STATE_BUCKET"
bucket = "rueth-prod-mlp"
}
}
99 changes: 99 additions & 0 deletions ml-platform/03_configsync/log
Original file line number Diff line number Diff line change
@@ -0,0 +1,99 @@
Download repo is mlp-config-sync-10d10ecf218aeee3c446
ls -lrt before going into download repo is total 52
drwxr-xr-x 3 user user 4096 Mar 6 15:32 templates
-rw-r--r-- 1 user user 1036 Mar 6 15:32 providers.tf
-rwxr-xr-x 1 user user 3150 Mar 6 15:32 create_cluster_yamls.sh
-rw-r--r-- 1 user user 4215 Mar 6 16:45 main.tf
-rw-r--r-- 1 user user 697 Mar 6 16:56 outputs.tf
-rw-r--r-- 1 user user 11518 Mar 6 17:03 README.md
-rw-r--r-- 1 user user 1416 Mar 6 18:19 variables.tf
-rw-r--r-- 1 user user 685 Mar 6 18:40 backend.tf
-rw-r--r-- 1 user user 308 Mar 6 20:46 terraform.tfvars
-rw-r--r-- 1 user user 54 Mar 6 20:46 log
ls -lrt in download repo is total 52
drwxr-xr-x 3 user user 4096 Mar 6 15:32 templates
-rw-r--r-- 1 user user 1036 Mar 6 15:32 providers.tf
-rwxr-xr-x 1 user user 3150 Mar 6 15:32 create_cluster_yamls.sh
-rw-r--r-- 1 user user 4215 Mar 6 16:45 main.tf
-rw-r--r-- 1 user user 697 Mar 6 16:56 outputs.tf
-rw-r--r-- 1 user user 11518 Mar 6 17:03 README.md
-rw-r--r-- 1 user user 1416 Mar 6 18:19 variables.tf
-rw-r--r-- 1 user user 685 Mar 6 18:40 backend.tf
-rw-r--r-- 1 user user 308 Mar 6 20:46 terraform.tfvars
-rw-r--r-- 1 user user 647 Mar 6 20:46 log
not copying files
In directory /home/user/development/ai-on-gke/ml-platform/03_configsync
level0 total 52
drwxr-xr-x 3 user user 4096 Mar 6 15:32 templates
-rw-r--r-- 1 user user 1036 Mar 6 15:32 providers.tf
-rwxr-xr-x 1 user user 3150 Mar 6 15:32 create_cluster_yamls.sh
-rw-r--r-- 1 user user 4215 Mar 6 16:45 main.tf
-rw-r--r-- 1 user user 697 Mar 6 16:56 outputs.tf
-rw-r--r-- 1 user user 11518 Mar 6 17:03 README.md
-rw-r--r-- 1 user user 1416 Mar 6 18:19 variables.tf
-rw-r--r-- 1 user user 685 Mar 6 18:40 backend.tf
-rw-r--r-- 1 user user 308 Mar 6 20:46 terraform.tfvars
-rw-r--r-- 1 user user 1315 Mar 6 20:46 log
level1 total 28
drwxr-xr-x 2 user user 4096 Mar 6 15:32 06_operating_teams
drwxr-xr-x 2 user user 4096 Mar 6 15:32 05_setup_teams
drwxr-xr-x 2 user user 4096 Mar 6 15:32 04_setup_clusters
drwxr-xr-x 3 user user 4096 Mar 6 16:57 01_gcp_project
-rw-r--r-- 1 user user 3888 Mar 6 17:01 README.md
drwxr-xr-x 4 user user 4096 Mar 6 18:07 02_gke
drwxr-xr-x 4 user user 4096 Mar 6 20:46 03_configsync
level2 total 120
-rw-r--r-- 1 user user 2832 Feb 5 16:20 Makefile
-rw-r--r-- 1 user user 11357 Feb 5 16:20 LICENSE
drwxr-xr-x 2 user user 4096 Feb 5 16:20 best-practices
drwxr-xr-x 3 user user 4096 Feb 5 16:20 gke-a100-jax
drwxr-xr-x 4 user user 4096 Feb 5 16:20 dcgm-on-gke
-rw-r--r-- 1 user user 1068 Feb 5 16:20 contributing.md
drwxr-xr-x 2 user user 4096 Feb 5 16:20 gke-dws-examples
drwxr-xr-x 3 user user 4096 Feb 5 16:20 gke-online-serving-single-gpu
drwxr-xr-x 4 user user 4096 Feb 5 16:20 gke-tpu-examples
drwxr-xr-x 3 user user 4096 Feb 5 16:20 jobset
drwxr-xr-x 2 user user 4096 Feb 5 16:20 indexed-job
-rw-r--r-- 1 user user 5838 Feb 5 16:20 tutorial.md
drwxr-xr-x 4 user user 4096 Feb 5 16:20 training-single-gpu
drwxr-xr-x 4 user user 4096 Feb 5 16:20 saxml-on-gke
-rw-r--r-- 1 user user 5505 Feb 21 20:11 README.md
drwxr-xr-x 5 user user 4096 Feb 21 20:11 applications
drwxr-xr-x 9 user user 4096 Feb 21 20:11 gke-batch-refarch
lrwxrwxrwx 1 user user 20 Feb 21 20:11 jupyter-on-gke -> applications/jupyter
lrwxrwxrwx 1 user user 16 Feb 21 20:11 ray-on-gke -> applications/ray
drwxr-xr-x 6 user user 4096 Feb 21 20:11 tutorials
drwxr-xr-x 4 user user 4096 Feb 27 19:13 gke-disk-image-builder
drwxr-xr-x 8 user user 4096 Feb 27 19:13 tpu-provisioner
drwxr-xr-x 6 user user 4096 Mar 6 15:32 benchmarks
-rw-r--r-- 1 user user 6624 Mar 6 15:32 cloudbuild.yaml
drwxr-xr-x 4 user user 4096 Mar 6 15:32 infrastructure
drwxr-xr-x 8 user user 4096 Mar 6 15:32 ml-platform
drwxr-xr-x 15 user user 4096 Mar 6 15:32 modules
level3 total 80
drwxr-xr-x 6 user user 4096 Jun 1 2023 anthos-service-mesh-samples
drwxr-xr-x 4 user user 4096 Jun 1 2023 bank-of-anthos-hybrid
drwxr-xr-x 13 user user 4096 Jun 1 2023 consumer-edge-core
drwxr-xr-x 4 user user 4096 Jun 1 2023 development-workstation
drwxr-xr-x 11 user user 4096 Jun 1 2023 gcp-solutions-content
drwxr-xr-x 3 user user 4096 Jun 13 2023 arueth-platform-patterns
drwxr-xr-x 8 user user 4096 Jun 21 2023 golden-path
drwxr-xr-x 2 user user 4096 Jun 21 2023 scratch
drwxr-xr-x 2 user user 4096 Jul 11 2023 documentation
drwxr-xr-x 10 user user 4096 Jul 11 2023 magic-modules
drwxr-xr-x 3 user user 4096 Jan 12 22:26 tmp
drwxr-xr-x 4 user user 4096 Jan 24 20:52 saxml
drwxr-xr-x 17 user user 4096 Jan 30 17:09 terraform-example-foundation
drwxr-xr-x 3 user user 4096 Feb 5 22:20 gem-saxml
drwxr-xr-x 5 user user 4096 Feb 16 17:27 ai-on-google-cloud
drwxr-xr-x 2 user user 4096 Feb 22 17:52 workspace
drwxr-xr-x 22 user user 4096 Feb 27 20:58 ai-on-gke-fork
drwxr-xr-x 14 user user 4096 Feb 29 22:25 anthos-bare-metal-ref-arch
drwxr-xr-x 12 user user 4096 Mar 6 15:31 bank-of-anthos
drwxr-xr-x 22 user user 4096 Mar 6 15:32 ai-on-gke
level4 total 16
drwxr-xr-x 5 user user 4096 Jul 11 2023 go
drwxr-xr-x 4 user user 4096 Jan 18 19:34 java
drwxr-xr-x 22 user user 4096 Feb 22 17:52 development
drwxr-xr-x 4 user user 4096 Mar 6 19:04 bin
env is dev
1 change: 0 additions & 1 deletion ml-platform/03_configsync/variables.tf
Original file line number Diff line number Diff line change
Expand Up @@ -15,7 +15,6 @@
variable "lookup_state_bucket" {
description = "GCS bucket to look up TF state from previous steps."
type = string
default = "YOUR_STATE_BUCKET"
}

variable "configsync_repo_name" {
Expand Down

0 comments on commit 5db975f

Please sign in to comment.