Skip to content

Commit

Permalink
Improvement] ecs/cluster - ECS Stop Container Timeout, Avoid ECS API …
Browse files Browse the repository at this point in the history
…request limits, ...
  • Loading branch information
andreaswittig authored May 16, 2019
1 parent 0fe0ce0 commit 585f3d3
Showing 1 changed file with 11 additions and 37 deletions.
48 changes: 11 additions & 37 deletions ecs/cluster.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -50,6 +50,7 @@ Metadata:
- MinSize
- DesiredCapacity
- DrainingTimeoutInSeconds
- StopContainerTimeoutInSeconds
- Label:
default: 'Cluster Scaling Parameters'
Parameters:
Expand Down Expand Up @@ -165,6 +166,13 @@ Parameters:
ConstraintDescription: 'Must be in the range [60-86400]'
MinValue: 60
MaxValue: 86400 # 24 hours
StopContainerTimeoutInSeconds:
Description: 'Time in seconds the ECS agent waits before killing a stopped container (see ECS_CONTAINER_STOP_TIMEOUT).'
Type: Number
Default: 30
ConstraintDescription: 'Must be in the range [30-3600]'
MinValue: 30
MaxValue: 3600
ContainerMaxCPU:
Description: 'The maximum number of cpu reservation per container that you plan to run on this cluster. A container instance has 1,024 CPU units for every CPU core.'
Type: Number
Expand Down Expand Up @@ -801,6 +809,7 @@ Resources:
#!/bin/bash -ex
trap '/opt/aws/bin/cfn-signal -e 1 --stack ${AWS::StackName} --resource AutoScalingGroup --region ${AWS::Region}' ERR
echo "ECS_CLUSTER=${Cluster}" >> /etc/ecs/ecs.config
echo "ECS_CONTAINER_STOP_TIMEOUT=${StopContainerTimeoutInSeconds}s" >> /etc/ecs/ecs.config
yum install -y aws-cfn-bootstrap
/opt/aws/bin/cfn-init -v --stack ${AWS::StackName} --resource LaunchConfiguration --region ${AWS::Region}
/opt/aws/bin/cfn-signal -e 0 --stack ${AWS::StackName} --resource AutoScalingGroup --region ${AWS::Region}
Expand Down Expand Up @@ -984,7 +993,8 @@ Resources:
ComparisonOperator: GreaterThanOrEqualToThreshold
Statistic: Maximum # special rule because we scale on reservations and not utilization
Period: 60
EvaluationPeriods: 1
EvaluationPeriods: 15
DatapointsToAlarm: 15
Threshold: !Ref ContainerExcessThreshold
AlarmActions:
- !Ref ScaleDownPolicy
Expand Down Expand Up @@ -1057,35 +1067,6 @@ Resources:
AlarmActions:
- {'Fn::ImportValue': !Sub '${ParentAlertStack}-TopicARN'}
# scaling based on SchedulableContainers is described in detail here: http://garbe.io/blog/2017/04/12/a-better-solution-to-ecs-autoscaling/
SchedulableContainersRule:
Type: 'AWS::Events::Rule'
Properties:
EventPattern:
source:
- 'aws.ecs'
'detail-type':
- 'ECS Container Instance State Change'
State: ENABLED
Targets:
- Arn: !GetAtt 'SchedulableContainersLambdaV2.Arn'
Id: lambda
SchedulableContainersRuleFailedInvocationsTooHighAlarm:
Condition: HasAlertTopic
Type: 'AWS::CloudWatch::Alarm'
Properties:
AlarmDescription: 'Invocations failed permanently'
Namespace: 'AWS/Events'
MetricName: FailedInvocations
Statistic: Sum
Period: 60
EvaluationPeriods: 1
ComparisonOperator: GreaterThanThreshold
Threshold: 0
AlarmActions:
- {'Fn::ImportValue': !Sub '${ParentAlertStack}-TopicARN'}
Dimensions:
- Name: RuleName
Value: !Ref SchedulableContainersRule
SchedulableContainersCron:
Type: 'AWS::Events::Rule'
Properties:
Expand Down Expand Up @@ -1142,13 +1123,6 @@ Resources:
- Effect: Allow
Action: 'cloudwatch:PutMetricData'
Resource: '*'
SchedulableContainersLambdaPermission:
Type: 'AWS::Lambda::Permission'
Properties:
Action: 'lambda:InvokeFunction'
FunctionName: !Ref SchedulableContainersLambdaV2
Principal: 'events.amazonaws.com'
SourceArn: !GetAtt 'SchedulableContainersRule.Arn'
SchedulableContainersLambdaPermission2:
Type: 'AWS::Lambda::Permission'
Properties:
Expand Down

0 comments on commit 585f3d3

Please sign in to comment.