cipulan · February 7, 2025 08:49 · cipulan · Feb 6, 2025
diff --git a/monitor-termination.service b/monitor-termination.service
 # Runs /opt/monitor_termination.sh as a long-lived service.
 [Unit]
 Description=Monitor AWS Spot Termination Event
 # The monitor needs a working network path to the metadata endpoint and the
 # AWS API, so wait for the network to be online rather than merely configured.
 Wants=network-online.target
 After=network-online.target

 [Service]
 ExecStart=/opt/monitor_termination.sh
 # The script exits 0 after it has handled a termination notice; restart only
 # on failure so that a completed run is not relaunched and repeated.
 Restart=on-failure
 # Space restarts out so a transient failure does not exhaust the start limit.
 RestartSec=5
 User=root

 [Install]
 WantedBy=multi-user.target
diff --git a/monitor_termination.sh b/monitor_termination.sh
 #!/bin/bash

 LOG_FILE="/var/log/spot_termination_monitor.log"
 AWS_REGION="ap-southeast-3"

 # Get the instance ID from metadata
 # A session token is requested first and sent when available (IMDSv2); when no
 # token is returned the plain request is used. -f keeps HTTP error bodies out
 # of INSTANCE_ID and --max-time bounds each call. The lookup is retried a few
 # times because the metadata service may not answer immediately at boot.
 INSTANCE_ID=""
 for _imds_attempt in 1 2 3 4 5 6; do
     _imds_auth=()
     _imds_token=$(/usr/bin/curl -s -f --max-time 5 -X PUT \
         -H "X-aws-ec2-metadata-token-ttl-seconds: 60" \
         http://169.254.169.254/latest/api/token)
     if [ -n "$_imds_token" ]; then
         _imds_auth=(-H "X-aws-ec2-metadata-token: $_imds_token")
     fi
     INSTANCE_ID=$(/usr/bin/curl -s -f --max-time 5 "${_imds_auth[@]}" \
         http://169.254.169.254/latest/meta-data/instance-id)
     if [ -n "$INSTANCE_ID" ]; then
         break
     fi
     sleep 5
 done
 unset _imds_attempt _imds_auth _imds_token

 # Without an instance ID the health update cannot target this instance, so
 # stop with a non-zero status instead of monitoring with an empty ID.
 if [ -z "$INSTANCE_ID" ]; then
     echo "$(date '+%Y-%m-%d %H:%M:%S') - Unable to read instance ID from instance metadata" | tee -a "$LOG_FILE" >&2
     exit 1
 fi

 # Write a timestamped message to stdout and append it to $LOG_FILE.
 # Arguments: $1 - message text
 log() {
    local stamp
    stamp=$(date '+%Y-%m-%d %H:%M:%S')
    printf '%s - %s\n' "$stamp" "$1" | tee -a "$LOG_FILE"
 }

 # Function to check termination event
 #
 # Requests the spot/termination-time metadata entry and prints the HTTP
 # status code of the response on stdout.
 # A session token is requested first and sent when one is returned (IMDSv2);
 # otherwise the request is made without it. Both calls are bounded by
 # --max-time so an unresponsive endpoint cannot stall the polling loop.
 # Outputs: the HTTP status code as reported by curl's %{http_code}
 #          (curl documents 000 when no response was received).
 check_termination_event() {
    local imds_base="http://169.254.169.254/latest"
    local token status
    local -a auth_header=()

    token=$(/usr/bin/curl -s -f --max-time 2 -X PUT \
        -H "X-aws-ec2-metadata-token-ttl-seconds: 60" \
        "$imds_base/api/token")
    if [ -n "$token" ]; then
        auth_header=(-H "X-aws-ec2-metadata-token: $token")
    fi

    status=$(/usr/bin/curl -s -o /dev/null -w "%{http_code}" --max-time 5 \
        "${auth_header[@]}" "$imds_base/meta-data/spot/termination-time")
    echo "$status"
 }

 # Report this instance as Unhealthy through the Auto Scaling API.
 # Globals: INSTANCE_ID (read), AWS_REGION (read)
 # Returns: the exit status of the aws command
 set_instance_unhealthy() {
    local -a health_args=(
        --instance-id "$INSTANCE_ID"
        --health-status Unhealthy
        --region "$AWS_REGION"
    )

    log "Setting instance $INSTANCE_ID to Unhealthy in region $AWS_REGION..."
    /usr/bin/aws autoscaling set-instance-health "${health_args[@]}"
 }

 log "Monitoring for Spot Instance termination events..."

 # Poll every 30 seconds. When the termination-time entry answers with HTTP
 # 200, mark the instance Unhealthy and exit 0 once that call has succeeded.
 while true; do
    STATUS_CODE=$(check_termination_event)

    # Compare as a string: an empty or non-numeric status would make an
    # integer test print an error instead of simply not matching.
    if [ "$STATUS_CODE" = "200" ]; then
        log "Termination event detected! Marking instance as Unhealthy..."
        if set_instance_unhealthy; then
            exit 0
        fi
        # The health update failed; keep running so it is attempted again
        # instead of exiting as if the work were done.
        log "Failed to mark instance $INSTANCE_ID as Unhealthy. Retrying in 30 seconds..."
    else
        log "No termination event detected. Checking again in 30 seconds..."
    fi

    sleep 30
 done
	# Runs /opt/monitor_termination.sh as a long-lived service.
	[Unit]
	Description=Monitor AWS Spot Termination Event
	# The monitor needs a working network path to the metadata endpoint and the
	# AWS API, so wait for the network to be online rather than merely configured.
	Wants=network-online.target
	After=network-online.target

	[Service]
	ExecStart=/opt/monitor_termination.sh
	# The script exits 0 after it has handled a termination notice; restart only
	# on failure so that a completed run is not relaunched and repeated.
	Restart=on-failure
	# Space restarts out so a transient failure does not exhaust the start limit.
	RestartSec=5
	User=root

	[Install]
	WantedBy=multi-user.target
	#!/bin/bash

	LOG_FILE="/var/log/spot_termination_monitor.log"
	AWS_REGION="ap-southeast-3"

	# Get the instance ID from metadata
	# A session token is requested first and sent when available (IMDSv2); when no
	# token is returned the plain request is used. -f keeps HTTP error bodies out
	# of INSTANCE_ID and --max-time bounds each call. The lookup is retried a few
	# times because the metadata service may not answer immediately at boot.
	INSTANCE_ID=""
	for _imds_attempt in 1 2 3 4 5 6; do
	    _imds_auth=()
	    _imds_token=$(/usr/bin/curl -s -f --max-time 5 -X PUT \
	        -H "X-aws-ec2-metadata-token-ttl-seconds: 60" \
	        http://169.254.169.254/latest/api/token)
	    if [ -n "$_imds_token" ]; then
	        _imds_auth=(-H "X-aws-ec2-metadata-token: $_imds_token")
	    fi
	    INSTANCE_ID=$(/usr/bin/curl -s -f --max-time 5 "${_imds_auth[@]}" \
	        http://169.254.169.254/latest/meta-data/instance-id)
	    if [ -n "$INSTANCE_ID" ]; then
	        break
	    fi
	    sleep 5
	done
	unset _imds_attempt _imds_auth _imds_token

	# Without an instance ID the health update cannot target this instance, so
	# stop with a non-zero status instead of monitoring with an empty ID.
	if [ -z "$INSTANCE_ID" ]; then
	    echo "$(date '+%Y-%m-%d %H:%M:%S') - Unable to read instance ID from instance metadata" | tee -a "$LOG_FILE" >&2
	    exit 1
	fi

	# Write a timestamped message to stdout and append it to $LOG_FILE.
	# Arguments: $1 - message text
	log() {
	    # The pipe must be a real pipe: written as "\|" it is passed to echo as
	    # a literal argument, so tee never runs and the log file stays empty.
	    echo "$(date '+%Y-%m-%d %H:%M:%S') - $1" | tee -a "$LOG_FILE"
	}

	# Function to check termination event
	#
	# Requests the spot/termination-time metadata entry and prints the HTTP
	# status code of the response on stdout.
	# A session token is requested first and sent when one is returned (IMDSv2);
	# otherwise the request is made without it. Both calls are bounded by
	# --max-time so an unresponsive endpoint cannot stall the polling loop.
	# Outputs: the HTTP status code as reported by curl's %{http_code}
	#          (curl documents 000 when no response was received).
	check_termination_event() {
	    local imds_base="http://169.254.169.254/latest"
	    local token status
	    local -a auth_header=()

	    token=$(/usr/bin/curl -s -f --max-time 2 -X PUT \
	        -H "X-aws-ec2-metadata-token-ttl-seconds: 60" \
	        "$imds_base/api/token")
	    if [ -n "$token" ]; then
	        auth_header=(-H "X-aws-ec2-metadata-token: $token")
	    fi

	    status=$(/usr/bin/curl -s -o /dev/null -w "%{http_code}" --max-time 5 \
	        "${auth_header[@]}" "$imds_base/meta-data/spot/termination-time")
	    echo "$status"
	}

	# Report this instance as Unhealthy through the Auto Scaling API.
	# Globals: INSTANCE_ID (read), AWS_REGION (read)
	# Returns: the exit status of the aws command
	set_instance_unhealthy() {
	    local -a health_args=(
	        --instance-id "$INSTANCE_ID"
	        --health-status Unhealthy
	        --region "$AWS_REGION"
	    )

	    log "Setting instance $INSTANCE_ID to Unhealthy in region $AWS_REGION..."
	    /usr/bin/aws autoscaling set-instance-health "${health_args[@]}"
	}

	log "Monitoring for Spot Instance termination events..."

	# Poll every 30 seconds. When the termination-time entry answers with HTTP
	# 200, mark the instance Unhealthy and exit 0 once that call has succeeded.
	while true; do
	    STATUS_CODE=$(check_termination_event)

	    # Compare as a string: an empty or non-numeric status would make an
	    # integer test print an error instead of simply not matching.
	    if [ "$STATUS_CODE" = "200" ]; then
	        log "Termination event detected! Marking instance as Unhealthy..."
	        if set_instance_unhealthy; then
	            exit 0
	        fi
	        # The health update failed; keep running so it is attempted again
	        # instead of exiting as if the work were done.
	        log "Failed to mark instance $INSTANCE_ID as Unhealthy. Retrying in 30 seconds..."
	    else
	        log "No termination event detected. Checking again in 30 seconds..."
	    fi

	    sleep 30
	done