Merge pull request #60 from repping/master

repping · web-flow · commit d804bdc4a19c · 2022-12-30T13:55:55.000+01:00
updated vault aws_health.sh script
diff --git a/iam.tf b/iam.tf
@@ -254,39 +254,41 @@ resource "aws_iam_role_policy" "lambda" {
   role   = aws_iam_role.lambda[0].id
 }
 
+data "aws_partition" "current" {}
+
+data "aws_caller_identity" "current" {}
+
 data "aws_iam_policy_document" "lambda" {
   count  = var.vault_enable_cloudwatch ? 1 : 0
   statement {
     effect  = "Allow"
     actions = [
-      "logs:CreateLogGroup",
-      "logs:CreateLogStream",
-      "logs:PutLogEvents",
-      "logs:DescribeLogGroups"
+      "cloudwatch:PutMetricData"
     ]
     resources = [
-      # TODO should be --> Resource: !Sub "arn:${AWS::Partition}:logs:${AWS::Region}:${AWS::AccountId}:log-group:*"
-      "*"
+    "*"
     ]
   }
   statement {
     effect  = "Allow"
     actions = [
-      "logs:PutLogEvents"
+      "logs:CreateLogGroup",
+      "logs:CreateLogStream",
+      "logs:PutLogEvents",
+      "logs:DescribeLogGroups"
     ]
     resources = [
-      # TODO should be --> Resource: !Sub "arn:${AWS::Partition}:logs:${AWS::Region}:${AWS::AccountId}:log-group:*:log-stream:*"
-      "*"
+      "arn:${data.aws_partition.current.partition}:logs:${data.aws_region.default.name}:${data.aws_caller_identity.current.id}:log-group:*",
+      "arn:${data.aws_partition.current.partition}:logs:${data.aws_region.default.name}:${data.aws_caller_identity.current.id}:log-group:*:log-stream:*"
     ]
   }
   statement {
     effect  = "Allow"
     actions = [
-      "ec2:DescribeInstances",
-      "ec2:DescribeImages"
+      "logs:PutLogEvents"
     ]
     resources = [
-      "*"
+      "arn:${data.aws_partition.current.partition}:logs:${data.aws_region.default.name}:${data.aws_caller_identity.current.id}:log-group:*:log-stream:*",
     ]
   }
   statement {
@@ -296,7 +298,6 @@ data "aws_iam_policy_document" "lambda" {
       "ec2:DescribeImages"
     ]
     resources = [
-      # TODO should be --> Resource: !Sub "arn:${AWS::Partition}:ec2:${AWS::Region}:${AWS::AccountId}:instance/*"
       "*"
     ]
   }
@@ -308,8 +309,7 @@ data "aws_iam_policy_document" "lambda" {
       "cloudwatch:PutMetricAlarm"
     ]
     resources = [
-      # TODO should be --> Resource:  !Sub "arn:${AWS::Partition}:cloudwatch:${AWS::Region}:${AWS::AccountId}:alarm:AutoAlarm-*"
-      "*"
+      "arn:${data.aws_partition.current.partition}:cloudwatch:${data.aws_region.default.name}:${data.aws_caller_identity.current.id}:alarm:AutoAlarm-*"
     ]
   }
   statement {
@@ -318,7 +318,7 @@ data "aws_iam_policy_document" "lambda" {
       "cloudwatch:DescribeAlarms"
     ]
     resources = [
-      "*"
+    "*"
     ]
   }
   statement {
@@ -327,8 +327,7 @@ data "aws_iam_policy_document" "lambda" {
       "ec2:CreateTags"
     ]
     resources = [
-      # TODO should be --> Resource: !Sub "arn:${AWS::Partition}:ec2:${AWS::Region}:${AWS::AccountId}:instance/*"
-      "*"
+      "arn:${data.aws_partition.current.partition}:ec2:${data.aws_region.default.name}:${data.aws_caller_identity.current.id}:instance/*"
     ]
   }
 }
diff --git a/user_data_vault.sh.tpl b/user_data_vault.sh.tpl
@@ -200,26 +200,24 @@ usermod -G vault ec2-user
 
 # Place an AWS EC2 health check script.
 cat << EOF >> /usr/local/bin/aws_health.sh
-#!/bin/sh
-
-# This script checks that status of Vault and reports that status to the ASG.
-# If Vault fails, the instance is replaced.
-
-# Tell Vault how to connect.
-export VAULT_ADDR=https://$${my_ipaddress}:8200
-export VAULT_CACERT="${vault_data_path}/tls/vault_ca.crt"
-
-# Get the status of Vault and report to AWS ASG.
-# TODO: This check is not sufficient; 0 is returned in many cases.
-if vault status > /dev/null 2>&1 ; then
-  aws --region $${my_region} autoscaling set-instance-health --instance-id $${my_instance_id} --health-status Healthy
-else
-  # Randominze the moment when to set the instance to unhealthy. This helps gradually replacing unhealthy instances.
-  # For example; a cluster that is configured as a replication secondary has all followers set to unhealthy, risking
-  # loosing quorum.
-  sleep $((RANDOM % 60))
-  aws --region $${my_region} autoscaling set-instance-health --instance-id $${my_instance_id} --health-status Unhealthy
-fi
+#!/bin/bash
+
+# Vault health endpoint of this instance and the curl timeout in seconds.
+VAULT_STATUS_URL="https://$${my_ipaddress}:8200/v1/sys/health"
+TIMEOUT=5
+
+# Query the health endpoint and keep only the HTTP status code (-k: TLS certificate is not verified).
+response=\$(curl -k -m "\$TIMEOUT" -s -o /dev/null -w "%%{http_code}" "\$VAULT_STATUS_URL")
+
+# Vault answers 200 (active), 429 (standby), 472 (DR secondary) or 473 (performance standby) when usable.
+case "\$response" in
+  200|429|472|473)
+    aws --region $${my_region} autoscaling set-instance-health --instance-id $${my_instance_id} --health-status Healthy
+  ;;
+  *)
+    aws --region $${my_region} autoscaling set-instance-health --instance-id $${my_instance_id} --health-status Unhealthy
+  ;;
+esac
 EOF
 
 # Make the AWS EC2 health check script executable.

Original file line number	Diff line number	Diff line change
`@@ -254,39 +254,41 @@ resource "aws_iam_role_policy" "lambda" {`
`254`	`254`	`role = aws_iam_role.lambda[0].id`
`255`	`255`	`}`
`256`	`256`
	`257`	`+data "aws_partition" "current" {}`
	`258`	`+`
	`259`	`+data "aws_caller_identity" "current" {}`
	`260`	`+`
`257`	`261`	`data "aws_iam_policy_document" "lambda" {`
`258`	`262`	`count = var.vault_enable_cloudwatch ? 1 : 0`
`259`	`263`	`statement {`
`260`	`264`	`effect = "Allow"`
`261`	`265`	`actions = [`
`262`		`- "logs:CreateLogGroup",`
`263`		`- "logs:CreateLogStream",`
`264`		`- "logs:PutLogEvents",`
`265`		`- "logs:DescribeLogGroups"`
	`266`	`+ "cloudwatch:PutMetricData"`
`266`	`267`	`]`
`267`	`268`	`resources = [`
`268`		`- # TODO should be --> Resource: !Sub "arn:${AWS::Partition}:logs:${AWS::Region}:${AWS::AccountId}:log-group:*"`
`269`		`- "*"`
	`269`	`+ "*"`
`270`	`270`	`]`
`271`	`271`	`}`
`272`	`272`	`statement {`
`273`	`273`	`effect = "Allow"`
`274`	`274`	`actions = [`
`275`		`- "logs:PutLogEvents"`
	`275`	`+ "logs:CreateLogGroup",`
	`276`	`+ "logs:CreateLogStream",`
	`277`	`+ "logs:PutLogEvents",`
	`278`	`+ "logs:DescribeLogGroups"`
`276`	`279`	`]`
`277`	`280`	`resources = [`
`278`		`- # TODO should be --> Resource: !Sub "arn:${AWS::Partition}:logs:${AWS::Region}:${AWS::AccountId}:log-group:*:log-stream:*"`
`279`		`- "*"`
	`281`	`+ "arn:${data.aws_partition.current.partition}:logs:${data.aws_region.default.name}:${data.aws_caller_identity.current.id}:log-group:*",`
	`282`	`+ "arn:${data.aws_partition.current.partition}:logs:${data.aws_region.default.name}:${data.aws_caller_identity.current.id}:log-group:*:log-stream:*"`
`280`	`283`	`]`
`281`	`284`	`}`
`282`	`285`	`statement {`
`283`	`286`	`effect = "Allow"`
`284`	`287`	`actions = [`
`285`		`- "ec2:DescribeInstances",`
`286`		`- "ec2:DescribeImages"`
	`288`	`+ "logs:PutLogEvents"`
`287`	`289`	`]`
`288`	`290`	`resources = [`
`289`		`- "*"`
	`291`	`+ "arn:${data.aws_partition.current.partition}:logs:${data.aws_region.default.name}:${data.aws_caller_identity.current.id}:log-group:*:log-stream:*",`
`290`	`292`	`]`
`291`	`293`	`}`
`292`	`294`	`statement {`
`@@ -296,7 +298,6 @@ data "aws_iam_policy_document" "lambda" {`
`296`	`298`	`"ec2:DescribeImages"`
`297`	`299`	`]`
`298`	`300`	`resources = [`
`299`		`- # TODO should be --> Resource: !Sub "arn:${AWS::Partition}:ec2:${AWS::Region}:${AWS::AccountId}:instance/*"`
`300`	`301`	`"*"`
`301`	`302`	`]`
`302`	`303`	`}`
`@@ -308,8 +309,7 @@ data "aws_iam_policy_document" "lambda" {`
`308`	`309`	`"cloudwatch:PutMetricAlarm"`
`309`	`310`	`]`
`310`	`311`	`resources = [`
`311`		`- # TODO should be --> Resource: !Sub "arn:${AWS::Partition}:cloudwatch:${AWS::Region}:${AWS::AccountId}:alarm:AutoAlarm-*"`
`312`		`- "*"`
	`312`	`+ "arn:${data.aws_partition.current.partition}:cloudwatch:${data.aws_region.default.name}:${data.aws_caller_identity.current.id}:alarm:AutoAlarm-*"`
`313`	`313`	`]`
`314`	`314`	`}`
`315`	`315`	`statement {`
`@@ -318,7 +318,7 @@ data "aws_iam_policy_document" "lambda" {`
`318`	`318`	`"cloudwatch:DescribeAlarms"`
`319`	`319`	`]`
`320`	`320`	`resources = [`
`321`		`- "*"`
	`321`	`+ "*"`
`322`	`322`	`]`
`323`	`323`	`}`
`324`	`324`	`statement {`
`@@ -327,8 +327,7 @@ data "aws_iam_policy_document" "lambda" {`
`327`	`327`	`"ec2:CreateTags"`
`328`	`328`	`]`
`329`	`329`	`resources = [`
`330`		`- # TODO should be --> Resource: !Sub "arn:${AWS::Partition}:ec2:${AWS::Region}:${AWS::AccountId}:instance/*"`
`331`		`- "*"`
	`330`	`+ "arn:${data.aws_partition.current.partition}:ec2:${data.aws_region.default.name}:${data.aws_caller_identity.current.id}:instance/*"`
`332`	`331`	`]`
`333`	`332`	`}`
`334`	`333`	`}`