set -e
# Point this host's Kerberos client and sparkmagic configuration at an EMR
# cluster, and fetch the sample notebook.
#
# Inputs (expanded in place below): EMRCluster (cluster id), EMRDNSName
# (cluster master DNS name), S3Bucket (bucket name patched into the notebook).
# NOTE(review): these placeholders look like they may be filled in by an outer
# template before the shell runs - confirm. For that reason this script adds no
# new brace-style expansions of its own and uses plain $name for its variables.
#
# Writes /tmp/emrclusterid, /tmp/emrmasterdnsname, /tmp/krb5.conf,
# /etc/krb5.conf, and two files under /home/ec2-user/SageMaker.

sagemaker_dir=/home/ec2-user/SageMaker
sparkmagic_dir=$sagemaker_dir/.sparkmagic
sparkmagic_config=$sparkmagic_dir/config.json
notebook=$sagemaker_dir/Covid19-Pandas-Spark.ipynb
krb5_staging=/tmp/krb5.conf

# Record the cluster id and master DNS name in files under /tmp.
# Quoted so the values are written verbatim (no word-splitting or globbing).
printf '%s\n' "${EMRCluster}" > /tmp/emrclusterid
printf '%s\n' "${EMRDNSName}" > /tmp/emrmasterdnsname

# Stage the Kerberos client configuration. Truncate (>) rather than append (>>)
# so a re-run, or a leftover file, cannot produce duplicated sections.
# The delimiter is quoted: the body is literal text with nothing to expand.
cat << 'EOF' > "$krb5_staging"
[libdefaults]
    default_realm = EC2.INTERNAL
    dns_lookup_realm = false
    dns_lookup_kdc = false
    rdns = true
    ticket_lifetime = 24h
    forwardable = true
    udp_preference_limit = 1000000
    default_tkt_enctypes = aes256-cts-hmac-sha1-96 aes128-cts-hmac-sha1-96 des3-cbc-sha1
    default_tgs_enctypes = aes256-cts-hmac-sha1-96 aes128-cts-hmac-sha1-96 des3-cbc-sha1
    permitted_enctypes = aes256-cts-hmac-sha1-96 aes128-cts-hmac-sha1-96 des3-cbc-sha1

[realms]

    EC2.INTERNAL = {
        kdc = localhost:88
        admin_server = localhost:749
        default_domain = ec2.internal
    }

[domain_realm]
    .ec2.internal = EC2.INTERNAL
     ec2.internal = EC2.INTERNAL

[logging]
    kdc = FILE:/var/log/kerberos/krb5kdc.log
    admin_server = FILE:/var/log/kerberos/kadmin.log
    default = FILE:/var/log/kerberos/krb5lib.log
EOF

cp "$krb5_staging" /etc/krb5.conf

# wget -O does not create parent directories; make sure the target exists so
# the download cannot fail on a host where it has not been created yet.
mkdir -p "$sparkmagic_dir"

wget -O "$sparkmagic_config" https://raw.githubusercontent.com/jupyter-incubator/sparkmagic/master/sparkmagic/example_config.json

wget -O "$notebook" https://aws-ml-blog.s3.amazonaws.com/artifacts/Secure-Data-Analytics-with-SageMaker-Notebook-Instance-and-Kerberized-EMR-Cluster/Covid19-Pandas-Spark.ipynb

# Replace every "localhost" in the sparkmagic config with the EMR master DNS
# name, then rewrite each line-ending None" to Kerberos".
sed -i -e "s/localhost/${EMRDNSName}/g" "$sparkmagic_config"
sed -i -e 's/None"$/Kerberos"/g' "$sparkmagic_config"
# Replace "localhost" in the installed krb5.conf (the kdc and admin_server
# entries written above) with the EMR master DNS name. The staged copy in /tmp
# keeps the "localhost" placeholders.
sed -i -e "s/localhost/${EMRDNSName}/g" /etc/krb5.conf
# Substitute the real bucket name for the "mybucket" placeholder in the notebook.
sed -i -e "s/mybucket/${S3Bucket}/g" "$notebook"

