[{"data":1,"prerenderedAt":52},["ShallowReactive",2],{"workflow-manage-emr-job-cdk":3},{"id":4,"title":5,"cleanup":6,"contributors":10,"deploy":12,"description":15,"diagram":16,"extension":17,"framework":18,"gitHub":19,"introBox":28,"level":32,"meta":33,"resources":34,"s3URL":40,"services":41,"simplicity":43,"stem":44,"testing":45,"type":49,"usecase":50,"videoId":27,"__hash__":51},"workflows\u002Fworkflows\u002Fmanage-emr-job-cdk.json","Manage an Amazon EMR Job",{"headline":7,"text":8},"Cleanup",[9],"1. Delete the stack: \u003Ccode>cdk destroy\u003C\u002Fcode>.",[11],"content\u002Fcontributors\u002Faditi-agarwal.json",{"text":13},[14],"\u003Ccode>cdk deploy\u003C\u002Fcode>","Automate Amazon EMR job using Step Functions. Create cluster, add steps, execute synchronously, and terminate cluster. Minimal code for data processing.","\u002Fassets\u002Fimages\u002Fworkflows\u002Fmanage-emr-job-cdk.png","json","AWS CDK",{"template":20,"payloads":25},{"repoURL":21,"templateDir":22,"templateFile":23,"ASL":24},"https:\u002F\u002Fgithub.com\u002Faws-samples\u002Fstep-functions-workflows-collection\u002Ftree\u002Fmain\u002Fmanage-emr-job-cdk\u002F","manage-emr-job-cdk","manage_emr_job\u002Fmanage_emr_job_stack.py","statemachine\u002Fstatemachine.asl.json",[26],{"headline":27,"payloadURL":27},"",{"headline":29,"text":30},"How it works",[31],"This workflow demonstrates automating an Amazon EMR job using AWS Step Functions. The workflow creates an Amazon EMR cluster, adds multiple steps, runs them, and then terminates the cluster. The Amazon EMR task is executed synchronously, and the state machine waits for its success or failure. After the two steps are completed on the EMR cluster, it is terminated, enabling users to process and analyze data with minimal code. \nThe AWS Cloud Development Kit (CDK) code generates all the necessary resources for running this workflow, including Identity and Access Management (IAM) roles and policies, a Simple Storage Service (S3) bucket for storing EMR logs, and the State Machine for managing the EMR job.","100",{},{"headline":35,"bullets":36},"Additional resources",[37],{"text":38,"link":39},"ETL on Amazon EMR Workshop","https:\u002F\u002Fcatalog.us-east-1.prod.workshops.aws\u002Fworkshops\u002Fc86bd131-f6bf-4e8f-b798-58fd450d3c44\u002Fen-US",null,[42],"sfn","1 - Fundamental","workflows\u002Fmanage-emr-job-cdk",{"headline":46,"text":47},"Testing",[48],"See the GitHub repository for detailed testing instructions.","Standard","Data Processing","rvtPaylKXY4HvrgAvJwiu9CV2xtHOaFFFcKQPj5X8Ck",1778846889243]