#!/bin/bash # This script is used as internalCustomStartupScript to setup the VM of the Azure Scale Set. # This setup is for Debian 8 VM only, and involves: # - setting up Docker and Docker-Compose # - setting up ProActive Node service with PNP # - starting the ProActive Node service # If you require additional configuration, you can add your own script as userCustomStartupScript # Be sure the two variables below are OK, depending on your context # The URL from where to retrieve the JRE tarball JRE_TARBALL_URL="https://s3.amazonaws.com/ci-materials/Latest_jre/jre-8u382b05-linux-x64.tar.gz" # This repo hosts the required additional jar files for the various script engines ADDITIONAL_JARS_REPO_URL="https://github.com/gheon/proactive-node-additional-jar.git" set -x set -e # Prerequisites: Install Docker and Docker Compose, add 'activeeon' user to docker group # wait for other apt to terminate while ps -aux | grep apt | grep -v grep >/dev/null 2>&1; do sleep 1; done # workaround for ubuntu images with invalid apt key for archive.ubuntu rm -rf /var/lib/apt/lists/* rm -rf /var/cache/apt/archive/partial/* apt-get update apt-get install -y \ apt-transport-https \ ca-certificates \ curl \ gnupg \ software-properties-common curl -fsSL https://download.docker.com/linux/$(. /etc/os-release; echo "$ID")/gpg | apt-key add - add-apt-repository \ "deb [arch=amd64] https://download.docker.com/linux/$(. /etc/os-release; echo "$ID") \ $(lsb_release -cs) \ stable" apt-get update apt-get install -y docker-ce groupadd -f docker usermod -aG docker activeeon curl -L https://github.com/docker/compose/releases/download/1.17.0/docker-compose-`uname -s`-`uname -m` -o /usr/local/bin/docker-compose chmod +x /usr/local/bin/docker-compose ############################### # Downloads and install ProActive Node as a Systemd service ############################### mkdir -p /opt/proactive mkdir -p /tmp/node cd /tmp/node # Install dependencies apt-get update if ! apt-get install -y wget curl jq; then sleep 10 apt-get update if ! apt-get install -y wget curl jq; then >&2 echo "Fatal error: Unable to run apt-get" exit 4 fi fi # Install Java 8 # [MODIFY] modify if needed the URL to get the JRE wget --no-clobber $JRE_TARBALL_URL tar zxf jre-8u382b05-linux-x64.tar.gz ln -s /tmp/node/jre1.8.0_382b05 /tmp/node/java # making Java 8 available system-wide update-alternatives --install /usr/bin/java java /tmp/node/java/bin/java 1 update-alternatives --set java /tmp/node/java/bin/java # Configure Python apt-get install -y python3 python3-pip pip3 install py4j # pip3 install numpy apt-get install -y python3-numpy # Retrieve NS config from CustomData if [ -f /var/lib/waagent/CustomData ]; then JSONCONFIG=$(base64 -d /var/lib/waagent/CustomData) elif [ -f /var/lib/cloud/instance/user-data.txt ]; then JSONCONFIG=$(cat /var/lib/cloud/instance/user-data.txt) elif [ -f /var/lib/waagent/ovf-env.xml ]; then JSONCONFIG=$(grep -oP '\K.*?(?=)' /var/lib/waagent/ovf-env.xml | base64 -d) else JSONCONFIG="" echo "Custom data not found in the system, aborting" exit 1 fi echo $JSONCONFIG export RMURL=`echo $JSONCONFIG | jq '.rmurl' -r` export CREDVALUE=`echo $JSONCONFIG | jq '.credentials' -r` export NODESOURCENAME=`echo $JSONCONFIG | jq '.nodesourcename' -r` export STORAGEACCOUNT=`echo $JSONCONFIG | jq '.storageaccount' -r` export SASKEY=`echo $JSONCONFIG | jq '.saskey' -r` export USERCUSTOMSCRIPTURL=`echo $JSONCONFIG | jq '.usercustomscripturl' -r` export EXTERNALSTORAGEACCOUNT=`echo $JSONCONFIG | jq '.externalstorageaccount' -r` export JVMPARAMETERS=`echo $JSONCONFIG | jq '.jvmparameters' -r` export NODEPRECOMMAND=`echo $JSONCONFIG | jq '.nodeprecommand' -r | sed -e 's/\\\\n/\n/g'` ############################### # Bash function used by the VM to send debug messages to the dedicated Azure Queue ############################### function debug { DEBUGCONTENT=`echo $1 | base64 -w 0` DEBUGMESSAGE="$DEBUGCONTENT" curl -X POST -d "$DEBUGMESSAGE" "https://$STORAGEACCOUNT.queue.core.windows.net/debug/messages?$SASKEY" } # debug debug "$HOSTNAME INFO: CustomData read properly (as I can write this message)" # Override custom script if specified if [ ! -z "$USERCUSTOMSCRIPTURL" ]; then curl -X GET "$USERCUSTOMSCRIPTURL" > user_custom_script.sh chmod +x user_custom_script.sh ./user_custom_script.sh >> user_script_stdout 2>>user_script_stderr if [ $? -ne 0 ]; then debug "$HOSTNAME FATAL: User custom script exited with error: $?" fi fi # Getting node.jar curl -X GET "https://$STORAGEACCOUNT.blob.core.windows.net/nodefiles/node.jar?$SASKEY" > node.jar # Change ownership to /tmp/node chown -R activeeon:activeeon /tmp/node # debug NOW=`date` debug "$HOSTNAME INFO: Start filling the Table on $NOW" start_time=$(date +%s) # Max time to try de delete msg from queue timeout_minutes=30 isValidMessage="false" while [[ "$isValidMessage" == "false" ]]; do # Read Azure Queue to get node name Deletion is performed on NS Side when nodes are properly registered msg=$(curl "https://$STORAGEACCOUNT.queue.core.windows.net/nodeconfig/messages?visibilitytimeout=300&$SASKEY") JSONMSG=`echo $msg | grep -oP '\K[^<]+' | base64 -d` msgId=`echo $msg | grep -oP '\K[^<]+'` popReceipt=`echo $msg | grep -oP '\K[^<]+'` # Encode popReceipt query param popReceipt=$(echo $popReceipt | jq -R -r @uri) dequeueCount=`echo $msg | grep -oP '\K[^<]+'` NODEBASENAME=`echo $JSONMSG | jq '.nodebasename' -r` NODEINSTANCES=`echo $JSONMSG | jq '.nodeinstances' -r` if [ -z "$NODEBASENAME" ]; then echo "$HOSTNAME ERROR: Unable to retrieve node configuration from 'nodeconfig' queue message $msg" # Check if 30 minutes have passed current_time=$(date +%s) elapsed_time=$((current_time - start_time)) if [ "$elapsed_time" -ge $((timeout_minutes * 60)) ]; then echo "Timeout of $timeout_minutes minutes reached for azure queue deletion." exit 5 fi echo "Retrying..." sleep 10 continue #halt #sleep 9999 #exit -1 fi # Try to delete message from queue URL="https://${STORAGEACCOUNT}.queue.core.windows.net/nodeconfig/messages/${msgId}?popreceipt=${popReceipt}&${SASKEY}" delete_response=$(curl -w "%{http_code}" -X DELETE $URL) echo "$delete_response" http_code=$(tail -n1 <<< "$delete_response") if [[ $http_code -ne 204 ]]; then echo "$HOSTNAME WARN: Could not delete Azure message from queue" fi if [[ "$dequeueCount" == "1" ]]; then isValidMessage="true" fi done # Retrieve instance metadata INSTANCE_NAME=$(curl -H Metadata:true "http://169.254.169.254/metadata/instance/compute?api-version=2017-12-01" | jq .name | sed 's/"//g') INSTANCE_ID=$(echo -n "$INSTANCE_NAME" | rev | cut -d'_' -f1 | rev) # Update Azure Table ENTITY="{'PartitionKey':'$HOSTNAME','RowKey':'$NODEBASENAME', 'NodesCount':'$NODEINSTANCES', 'InstanceId': '$INSTANCE_ID'}" curl -H "Content-Type: application/json" -d "$ENTITY" -X POST "https://$STORAGEACCOUNT.table.core.windows.net/nodesperhost?$SASKEY" if [ $? -ne 0 ]; then debug "$HOSTNAME FATAL: Unable to register the host into 'nodesperhost' table" exit 3 fi NOW=`date` debug "$HOSTNAME INFO: Terminated to fill the Table on $NOW" # Generate the ExecStartPre commands if they were provided by the user EXECSTARTPRE='' if [ ! -z "$NODEPRECOMMAND" ]; then while read -r line; do EXECSTARTPRE=$EXECSTARTPRE`echo "ExecStartPre=$line"`$'\n' done <<< "$NODEPRECOMMAND" fi ############################### # Generate proactive-node systemd service unit file ############################### cat > /etc/systemd/system/proactive-node.service <