Builder job for deploying Openstack for testing
[releng/builder.git] / jjb / integration / include-raw-integration-start-cluster-run-test.sh
index 19054f13334b4345a32190145bc092c23fcff22a..4bc956436ad5a7e2efd0ccb2377039901f989366 100644 (file)
@@ -1,65 +1,36 @@
-echo "#########################################################"
-echo "##  include-raw-integration-start-cluster-run-test.sh  ##"
-echo "#########################################################"
-# Expects $BUNDLEFOLDER to be set earlier in Jenkins job.
-set -x
-
-  if [ -z ${BUNDLEFOLDER} ] || [ -f ${BUNDLEFOLDER} ]; then
-    echo "Location of ODL BUNDLEFOLDER:$BUNDLEFOLDER is not defined"
-    exit 1
-  fi
-
-# populate $(CONTROLLERIPS)
-
-  declare CONTROLLERIPS=($(cat slave_addresses.txt | grep CONTROLLER | awk -F = '{print $2}'))
-  declare -p CONTROLLERIPS
-
-# Creates a script to run controller inside a dynamic jenkins slave
-
-cat > ${WORKSPACE}/run-startandtest-controller-script.sh <<EOF
-set -x
-cd /tmp
-cd ${BUNDLEFOLDER}
-echo "BUNDLE: $BUNDLEFOLDER"
-echo "Checking status of controller..."
-    bash bin/status
-    bash bin/start &
-set +x
-EOF
-
+#@IgnoreInspection BashAddShebang
+# Activate robotframework virtualenv
+# ${ROBOT_VENV} comes from the include-raw-integration-install-robotframework.sh
+# script.
+source ${ROBOT_VENV}/bin/activate
 
+echo "#################################################"
+echo "##         Verify Cluster is UP                ##"
+echo "#################################################"
 
-cat > ${WORKSPACE}/run-verify-controller-isup-script.sh <<EOF
-set -x
-cd /tmp
-cd ${BUNDLEFOLDER}
-echo "BUNDLE: $BUNDLEFOLDER"
-echo "Checking status of controller..."
- bash bin/status
- echo "Waiting for controller to come up..."
- COUNT="0"
+cat > ${WORKSPACE}/verify-cluster-is-up.sh <<EOF
 
+CONTROLLERID="member-\$1"
+ODL_SYSTEM_IP_PATH=\$2
 
+echo "Waiting for controller to come up..."
+COUNT="0"
 while true; do
     RESP="\$( curl --user admin:admin -sL -w "%{http_code} %{url_effective}\\n" http://localhost:8181/restconf/modules -o /dev/null )"
     echo \$RESP
-    if [[ \$RESP == *"200"* ]]; then
+    SHARD="\$( curl --user admin:admin -sL -w "%{http_code} %{url_effective}\\n" http://localhost:8181/jolokia/read/org.opendaylight.controller:Category=Shards,name=\$CONTROLLERID-shard-inventory-config,type=DistributedConfigDatastore)"
+    echo \$SHARD
+    if ([[ \$RESP == *"200"* ]] && [[ \$SHARD  == *'"status":200'* ]]); then
         echo Controller is UP
-    SHARD="\$( curl --user admin:admin -sL -w "%{http_code} %{url_effective}\\n" http://localhost:8181/jolokia/read/org.opendaylight.controller:Category=Shards,name=member-0-shard-inventory-config,type=DistributedConfigDatastore)"
-      echo \$SHARD
-      if [[ \$SHARD  == *'"status":200'* ]]
-       then
         break
-      fi
-      break
-
     elif (( "\$COUNT" > "600" )); then
         echo Timeout Controller DOWN
-        echo "Dumping Karaf log..."
-        ls
-        pwd
-        cd data/log
-        cat karaf.log
+        echo "Dumping first 500K bytes of karaf log..."
+        head --bytes=500K "/tmp/${BUNDLEFOLDER}/data/log/karaf.log"
+        echo "Dumping last 500K bytes of karaf log..."
+        tail --bytes=500K "/tmp/${BUNDLEFOLDER}/data/log/karaf.log"
+        echo "Listing all open ports on controller system"
+        netstat -natu
         exit 1
     else
         COUNT=\$(( \${COUNT} + 5 ))
@@ -68,71 +39,103 @@ while true; do
     fi
 done
 
-cd /tmp/${BUNDLEFOLDER}/bin/
+echo "Listing all open ports on controller system.."
+netstat -natu
+
+function exit_on_log_file_message {
+    echo "looking for \"\$1\" in log file"
+    if grep --quiet "\$1" "/tmp/${BUNDLEFOLDER}/data/log/karaf.log"; then
+        echo ABORTING: found "\$1"
+        echo "Dumping first 500K bytes of karaf log..."
+        head --bytes=500K "/tmp/${BUNDLEFOLDER}/data/log/karaf.log"
+        echo "Dumping last 500K bytes of karaf log..."
+        tail --bytes=500K "/tmp/${BUNDLEFOLDER}/data/log/karaf.log"
+        exit 1
+    fi
+}
 
-echo "Checking OSGi bundles..."
-sshpass -p karaf ./client -u karaf 'bundle:list'
+exit_on_log_file_message 'BindException: Address already in use'
+exit_on_log_file_message 'server is unhealthy'
 
 EOF
 
-
-for  i in "${!CONTROLLERIPS[@]}"
+for i in `seq 1 ${NUM_ODL_SYSTEM}`
 do
- echo "Copying HERE docs to ${CONTROLLERIPS[$i]} which is node $i "
- scp ${WORKSPACE}/run-startandtest-controller-script.sh \
-${CONTROLLERIPS[$i]}:/tmp
-
- scp ${WORKSPACE}/run-verify-controller-isup-script.sh \
-${CONTROLLERIPS[$i]}:/tmp
+    CONTROLLERIP=ODL_SYSTEM_${i}_IP
+    echo "Verifying member-${i} with IP address ${!CONTROLLERIP} is UP"
+    scp ${WORKSPACE}/verify-cluster-is-up.sh ${!CONTROLLERIP}:/tmp
+    ssh ${!CONTROLLERIP} "bash /tmp/verify-cluster-is-up.sh ${i} ${!CONTROLLERIP}"
 done
 
-for  i in "${!CONTROLLERIPS[@]}"
+if [ ${NUM_OPENSTACK_SYSTEM} -gt 0 ]; then
+   echo "Exiting without running tests to deploy openstack for testing"
+   exit
+fi
+
+if [ ${CONTROLLERSCOPE} == 'all' ]; then
+    COOLDOWN_PERIOD="180"
+else
+    COOLDOWN_PERIOD="60"
+fi
+echo "Cool down for ${COOLDOWN_PERIOD} seconds :)..."
+sleep ${COOLDOWN_PERIOD}
+
+echo "Generating controller variables..."
+for i in `seq 1 ${NUM_ODL_SYSTEM}`
 do
- echo "Starting ${CONTROLLERIPS[$i]} on node $i "
- ssh ${CONTROLLERIPS[$i]} "bash /tmp/run-startandtest-controller-script.sh $i"&
+    CONTROLLERIP=ODL_SYSTEM_${i}_IP
+    odl_variables=${odl_variables}" -v ${CONTROLLERIP}:${!CONTROLLERIP}"
 done
 
-for  i in "${!CONTROLLERIPS[@]}"
+echo "Generating mininet variables..."
+for i in `seq 1 ${NUM_TOOLS_SYSTEM}`
 do
- echo "Running sanity tests on ${CONTROLLERIPS[$i]} on node $i "
- ssh ${CONTROLLERIPS[$i]} "bash /tmp/run-verify-controller-isup-script.sh $i"
+    MININETIP=TOOLS_SYSTEM_${i}_IP
+    tools_variables=${tools_variables}" -v ${MININETIP}:${!MININETIP}"
 done
 
-echo "Cool down for 1 min :)..."
-sleep 60
+echo "Locating test plan to use..."
+testplan_filepath="${WORKSPACE}/test/csit/testplans/${STREAMTESTPLAN}"
+if [ ! -f "${testplan_filepath}" ]; then
+    testplan_filepath="${WORKSPACE}/test/csit/testplans/${TESTPLAN}"
+fi
 
 echo "Changing the testplan path..."
-cat ${WORKSPACE}/test/csit/testplans/${TESTPLAN} | sed "s:integration:${WORKSPACE}:" > testplan.txt
+cat "${testplan_filepath}" | sed "s:integration:${WORKSPACE}:" > testplan.txt
 cat testplan.txt
 
-SUITES=$( egrep -v '(^[[:space:]]*#|^[[:space:]]*$)' testplan.txt | tr '\012' ' ' )
+SUITES=`egrep -v '(^[[:space:]]*#|^[[:space:]]*$)' testplan.txt | tr '\012' ' '`
 
 echo "Starting Robot test suites ${SUITES} ..."
+pybot -N ${TESTPLAN} -c critical -e exclude -v BUNDLEFOLDER:${BUNDLEFOLDER} \
+-v WORKSPACE:/tmp -v BUNDLE_URL:${ACTUALBUNDLEURL} -v JAVA_HOME:${JAVA_HOME} \
+-v NEXUSURL_PREFIX:${NEXUSURL_PREFIX} -v JDKVERSION:${JDKVERSION} -v ODL_STREAM:${DISTROSTREAM} \
+-v CONTROLLER:${ODL_SYSTEM_IP} -v CONTROLLER1:${ODL_SYSTEM_2_IP} -v CONTROLLER2:${ODL_SYSTEM_3_IP} -v ODL_SYSTEM_IP:${ODL_SYSTEM_IP} \
+${odl_variables} -v NUM_ODL_SYSTEM:${NUM_ODL_SYSTEM} -v CONTROLLER_USER:${USER} -v ODL_SYSTEM_USER:${USER} -v \
+TOOLS_SYSTEM_IP:${TOOLS_SYSTEM_IP} ${tools_variables} -v NUM_TOOLS_SYSTEM:${NUM_TOOLS_SYSTEM} -v TOOLS_SYSTEM_USER:${USER} \
+-v MININET:${TOOLS_SYSTEM_IP} -v MININET1:${TOOLS_SYSTEM_2_IP} -v MININET2:${TOOLS_SYSTEM_3_IP} -v MININET_USER:${USER} \
+-v USER_HOME:${HOME} ${TESTOPTIONS} ${SUITES} || true
+# FIXME: Sort (at least -v) options alphabetically.
+
+set +e  # We do not want to create red dot just because something went wrong while fetching logs.
+for i in `seq 1 ${NUM_ODL_SYSTEM}`
+do
+    CONTROLLERIP=ODL_SYSTEM_${i}_IP
+    echo "dumping first 500K bytes of karaf log..." > "odl${i}_karaf.log"
+    ssh "${!CONTROLLERIP}" head --bytes=500K "/tmp/${BUNDLEFOLDER}/data/log/karaf.log" >> "odl${i}_karaf.log"
+    echo "dumping last 500K bytes of karaf log..." >> "odl${i}_karaf.log"
+    ssh "${!CONTROLLERIP}" tail --bytes=500K "/tmp/${BUNDLEFOLDER}/data/log/karaf.log" >> "odl${i}_karaf.log"
+    echo "killing karaf process..."
+    ssh "${!CONTROLLERIP}" bash -c 'ps axf | grep karaf | grep -v grep | awk '"'"'{print "kill -9 " $1}'"'"' | sh'
+done
+sleep 5
+for i in `seq 1 ${NUM_ODL_SYSTEM}`
+do
+    CONTROLLERIP=ODL_SYSTEM_${i}_IP
+    ssh "${!CONTROLLERIP}" xz -9ekvv "/tmp/${BUNDLEFOLDER}/data/log/karaf.log"
+    scp "${!CONTROLLERIP}:/tmp/${BUNDLEFOLDER}/data/log/karaf.log.xz" "odl${i}_karaf.log.xz"
+done
+true  # perhaps Jenkins is testing last exit code
 
+# vim: ts=4 sw=4 sts=4 et ft=sh :
 
-pybot -N ${TESTPLAN} -c critical -e exclude -v BUNDLEFOLDER:${BUNDLEFOLDER} -v WORKSPACE:/tmp \
--v NEXUSURL_PREFIX:${NEXUSURL_PREFIX} -v CONTROLLER:${CONTROLLER0} -v CONTROLLER1:${CONTROLLER1} -v CONTROLLER2:${CONTROLLER2} \
--v MININET:${MININET0} -v MININET_USER:${USER} -v USER_HOME:${HOME} ${TESTOPTIONS} ${SUITES} || true
-# the "|| true" is there to swallow a non-zero error code, as we do not want a failed critical test case to stop this script (run with -xe by Jenkins) from gathering karaf.log
-
-
-#
-echo "######  Fetching controller0-karaf.log ############"
-scp $CONTROLLER0:/tmp/$BUNDLEFOLDER/data/log/karaf.log \
-controller0-karaf.log
-# cat karaf.log
-#
-echo "######  Fetching controller1-karaf.log ############"
-scp $CONTROLLER1:/tmp/$BUNDLEFOLDER/data/log/karaf.log \
-controller1-karaf.log
-# cat controller1-karaf.log
-
-echo "######  Fetching controller2-karaf.log ############"
-scp $CONTROLLER2:/tmp/$BUNDLEFOLDER/data/log/karaf.log \
-controller2-karaf.log
-# cat controller2-karaf.log
-
-## vim: ts=4 sw=4 sts=4 et ft=sh :
-echo "############################################################"
-echo "## END include-raw-integration-start-cluster-run-test.sh  ##"
-echo "############################################################"