AWS EMR CF模板BOOTSTRAP_FAILURE,消息:在主实例上

时间:2018-11-02 17:25:59

标签: amazon-web-services etl amazon-cloudformation amazon-emr

我正在尝试使用cloudformation模板启动emr集群。

当我创建堆栈时-创建IAM角色,策略,安全组,EC2实例时没有任何错误,但是当模板到达主节点上发生引导过程的时刻,即引导节点失败并终止。

仅供参考-我已经指定了管理员策略来排除权限问题,但是那不起作用,并且由于某些奇怪的原因,未在s3存储桶-s3:// emrfm / logs中生成日志,以查看引导失败的地方。

{
"Description": "CloudFormation template for creating an EMR cluster with Spark and an auto-scaling policy.",
"Outputs": {
    "IPAddress": {
        "Description": "IP address of EMR cluster MasterNode",
        "Value": {
            "Fn::GetAtt": [
                "emrfmlabcluster",
                "MasterPublicDNS"
            ]
        }
    },
    "EmrRoleArn": {
        "Description": "ARN of EMR role",
        "Value": {
            "Fn::GetAtt": [
                "EmrRole",
                "Arn"
            ]
        }
    },
    "EmrEc2RoleArn": {
        "Description": "ARN of EMR EC2 role",
        "Value": {
            "Fn::GetAtt": [
                "EmrEc2Role",
                "Arn"
            ]
        }
    },
    "EmrRoleName": {
        "Description": "Name of EMR role",
        "Value": {
            "Ref": "EmrRole"
        }
    },
    "EmrEc2RoleName": {
        "Description": "Name of EMR EC2 role",
        "Value": {
            "Ref": "EmrEc2Role"
        }
    },
    "EmrEc2ProfileName": {
        "Description": "Name of EMR EC2 instance profile",
        "Value": {
            "Ref": "EmrEc2InstanceProfile"
        }
    },
    "MasterSG": {
        "Description": "ID of master security group for EMR cluster",
        "Value": {
            "Fn::GetAtt": [
                "MasterSecurityGroup",
                "GroupId"
            ]
        }
    }
},
"Parameters": {
    "MaxCapacity": {
        "Default": "4",
        "Description": "Maximum number of core instances",
        "Type": "Number"
    },
    "AllowedCidrIngress": {
        "Default": "0.0.0.0/0",
        "ConstraintDescription": "Must be a valid CIDR range",
        "Type": "String",
        "AllowedPattern": "(\\d{1,3})\\.(\\d{1,3})\\.(\\d{1,3})\\.(\\d{1,3})/(\\d{1,3})"
    },
    "MinCapacity": {
        "Default": "2",
        "Description": "Minimum number of core instances",
        "Type": "Number"
    },
    "CoreInstanceCount": {
        "Default": "2",
        "Description": "Number of core instances",
        "Type": "Number"
    },
    "CoreInstanceType": {
        "Default": "m4.large",
        "Description": "Instance Type of the core node",
        "Type": "String"
    },
    "EMRClusterName": {
        "Default": "emrfmlabcluster",
        "Description": "Cluster name for the EMR",
        "Type": "String"
    },
    "EMRLogDir": {
        "Description": "Log Dir for the EMR cluster",
        "Type": "String"
    },
    "KeyName": {
        "Description": "Name of an existing EC2 KeyPair to enable SSH to the instances",
        "Type": "AWS::EC2::KeyPair::KeyName"
    },
    "ProjectTag": {
        "Default": "emrfmlabcluster",
        "Description": "Tag for cost allocation",
        "Type": "String"
    },
    "MasterInstanceType": {
        "Default": "m4.large",
        "Description": "Instance Type of the master node",
        "Type": "String"
    },
    "Subnet": {
        "Description": "Subnet ID for creating the EMR cluster",
        "Type": "AWS::EC2::Subnet::Id"
    },
    "VPC": {
        "Description": "VPC ID for creating the EMR cluster",
        "Type": "AWS::EC2::VPC::Id"
    },
    "emrReleaseLabel": {
        "Default": "emr-5.18.0",
        "Description": "Release label for the EMR cluster",
        "Type": "String"
    }
},
"Resources": {
    "emrfmlabcluster": {
        "Properties": {
            "Applications": [
                {
                    "Name": "Hadoop"
                },
                {
                    "Name": "Hive"
                },
                {
                    "Name": "Spark"
                }
            ],
            "Instances": {
                "AdditionalMasterSecurityGroups": [
                    {
                        "Fn::GetAtt": [
                            "MasterSecurityGroup",
                            "GroupId"
                        ]
                    }
                ],
                "CoreInstanceGroup": {
                    "EbsConfiguration": {
                        "EbsBlockDeviceConfigs": [
                            {
                                "VolumeSpecification": {
                                    "SizeInGB": "50",
                                    "VolumeType": "gp2"
                                },
                                "VolumesPerInstance": "1"
                            }
                        ],
                        "EbsOptimized": "true"
                    },
                    "InstanceCount": {
                        "Ref": "CoreInstanceCount"
                    },
                    "InstanceType": {
                        "Ref": "CoreInstanceType"
                    },
                    "Market": "ON_DEMAND",
                    "Name": "Core Instance",
                    "AutoScalingPolicy": {
                        "Constraints": {
                            "MinCapacity": {
                                "Ref": "MinCapacity"
                            },
                            "MaxCapacity": {
                                "Ref": "MaxCapacity"
                            }
                        },
                        "Rules": [
                            {
                                "Name": "Scale-out",
                                "Description": "Scale-out policy",
                                "Action": {
                                    "SimpleScalingPolicyConfiguration": {
                                        "AdjustmentType": "CHANGE_IN_CAPACITY",
                                        "ScalingAdjustment": 1,
                                        "CoolDown": 300
                                    }
                                },
                                "Trigger": {
                                    "CloudWatchAlarmDefinition": {
                                        "Dimensions": [
                                            {
                                                "Key": "JobFlowId",
                                                "Value": "${emr:clusterid}"
                                            }
                                        ],
                                        "EvaluationPeriods": 1,
                                        "Namespace": "AWS/ElasticMapReduce",
                                        "Period": 300,
                                        "ComparisonOperator": "LESS_THAN",
                                        "Statistic": "AVERAGE",
                                        "Threshold": 15,
                                        "Unit": "PERCENT",
                                        "MetricName": "YARNMemoryAvailablePercentage"
                                    }
                                }
                            },
                            {
                                "Name": "Scale-in",
                                "Description": "Scale-in policy",
                                "Action": {
                                    "SimpleScalingPolicyConfiguration": {
                                        "AdjustmentType": "CHANGE_IN_CAPACITY",
                                        "ScalingAdjustment": -1,
                                        "CoolDown": 300
                                    }
                                },
                                "Trigger": {
                                    "CloudWatchAlarmDefinition": {
                                        "Dimensions": [
                                            {
                                                "Key": "JobFlowId",
                                                "Value": "${emr:clusterid}"
                                            }
                                        ],
                                        "EvaluationPeriods": 1,
                                        "Namespace": "AWS/ElasticMapReduce",
                                        "Period": 300,
                                        "ComparisonOperator": "GREATER_THAN",
                                        "Statistic": "AVERAGE",
                                        "Threshold": 75,
                                        "Unit": "PERCENT",
                                        "MetricName": "YARNMemoryAvailablePercentage"
                                    }
                                }
                            }
                        ]
                    }
                },
                "Ec2KeyName": {
                    "Ref": "KeyName"
                },
                "Ec2SubnetId": {
                    "Ref": "Subnet"
                },
                "MasterInstanceGroup": {
                    "InstanceCount": "1",
                    "InstanceType": {
                        "Ref": "MasterInstanceType"
                    },
                    "Market": "ON_DEMAND",
                    "Name": "Master Instance"
                },
                "TerminationProtected": "false"
            },
            "JobFlowRole": {
                "Ref": "EmrEc2InstanceProfile"
            },
            "EbsRootVolumeSize": "50",
            "LogUri": {
                "Ref": "EMRLogDir"
            },
            "Name": {
                "Ref": "EMRClusterName"
            },
            "ReleaseLabel": {
                "Ref": "emrReleaseLabel"
            },
            "ServiceRole": {
                "Ref": "EmrRole"
            },
            "AutoScalingRole": {
                "Ref": "AutoScalingRole"
            },
            "Tags": [
                {
                    "Key": "Name",
                    "Value": "emrfmlabcluster"
                },
                {
                    "Key": "Project",
                    "Value": {
                        "Ref": "ProjectTag"
                    }
                }
            ],
            "VisibleToAllUsers": "true"
        },
        "Type": "AWS::EMR::Cluster"
    },
    "MasterSecurityGroup": {
        "Type": "AWS::EC2::SecurityGroup",
        "Properties": {
            "GroupDescription": "Allow full access to EMR master",
            "VpcId": {
                "Ref": "VPC"
            },
            "SecurityGroupIngress": [
                {
                    "IpProtocol": "tcp",
                    "FromPort": "0",
                    "ToPort": "65535",
                    "CidrIp": {
                        "Ref": "AllowedCidrIngress"
                    }
                }
            ]
        }
    },
    "AutoScalingRole": {
        "Type": "AWS::IAM::Role",
        "Properties": {
            "AssumeRolePolicyDocument": {
                "Version": "2012-10-17",
                "Statement": [
                    {
                        "Effect": "Allow",
                        "Principal": {
                            "Service": [
                                "elasticmapreduce.amazonaws.com",
                                "application-autoscaling.amazonaws.com"
                            ]
                        },
                        "Action": [
                            "sts:AssumeRole"
                        ]
                    }
                ]
            },
            "ManagedPolicyArns": [
                "arn:aws:iam::aws:policy/service-role/AmazonElasticMapReduceforAutoScalingRole",
                "arn:aws:iam::aws:policy/AdministratorAccess"
            ],
            "Path": "/"
        }
    },
    "EmrRole": {
        "Type": "AWS::IAM::Role",
        "Properties": {
            "AssumeRolePolicyDocument": {
                "Version": "2012-10-17",
                "Statement": [
                    {
                        "Effect": "Allow",
                        "Principal": {
                            "Service": [
                                "elasticmapreduce.amazonaws.com",
                                "datapipeline.amazonaws.com"
                            ]
                        },
                        "Action": [
                            "sts:AssumeRole"
                        ]
                    }
                ]
            },
            "ManagedPolicyArns": [
                "arn:aws:iam::aws:policy/service-role/AmazonElasticMapReduceRole",
                "arn:aws:iam::aws:policy/AmazonS3FullAccess",
                "arn:aws:iam::aws:policy/AdministratorAccess",
                "arn:aws:iam::aws:policy/service-role/AWSDataPipelineRole"
            ],
            "Path": "/"
        }
    },
    "EmrKmsRolePolicies": {
        "Type": "AWS::IAM::Policy",
        "Properties": {
            "PolicyName": "EMRKmsETL",
            "PolicyDocument": {
                "Version": "2012-10-17",
                "Statement": [
                    {
                        "Effect": "Allow",
                        "Action": "kms:GenerateDataKey",
                        "Resource": "*"
                    },
                    {
                        "Effect": "Allow",
                        "Action": "kms:Decrypt",
                        "Resource": "*"
                    }
                ]
            },
            "Roles": [
                {
                    "Ref": "EmrRole"
                }
            ]
        }
    },
    "EmrEc2Role": {
        "Type": "AWS::IAM::Role",
        "Properties": {
            "AssumeRolePolicyDocument": {
                "Version": "2012-10-17",
                "Statement": [
                    {
                        "Effect": "Allow",
                        "Principal": {
                            "Service": [
                                "ec2.amazonaws.com"
                            ]
                        },
                        "Action": [
                            "sts:AssumeRole"
                        ]
                    }
                ]
            },
            "ManagedPolicyArns": [
                "arn:aws:iam::aws:policy/service-role/AmazonElasticMapReduceforEC2Role",
                "arn:aws:iam::aws:policy/AmazonS3FullAccess",
                "arn:aws:iam::aws:policy/AdministratorAccess",
                "arn:aws:iam::aws:policy/service-role/AmazonEC2RoleforDataPipelineRole"
            ],
            "Path": "/"
        }
    },
    "EmrEc2InstanceProfile": {
        "Type": "AWS::IAM::InstanceProfile",
        "Properties": {
            "Path": "/",
            "Roles": [
                {
                    "Ref": "EmrEc2Role"
                }
            ]
        }
    },
    "EmrEc2KmsRolePolicies": {
        "Type": "AWS::IAM::Policy",
        "Properties": {
            "PolicyName": "EMREc2KmsETL",
            "PolicyDocument": {
                "Version": "2012-10-17",
                "Statement": [
                    {
                        "Effect": "Allow",
                        "Action": "kms:GenerateDataKey",
                        "Resource": "*"
                    },
                    {
                        "Effect": "Allow",
                        "Action": "kms:Decrypt",
                        "Resource": "*"
                    }
                ]
            },
            "Roles": [
                {
                    "Ref": "EmrEc2Role"
                }
            ]
        }
    }
}

}

0 个答案:

没有答案