adding more sleep time for -all- jobs
[releng/builder.git] / jjb / integration / include-raw-integration-start-cluster-run-test.sh
#@IgnoreInspection BashAddShebang
# Activate the Robot Framework virtualenv so the tools installed in it are
# used by the rest of this script.
# ${ROBOT_VENV} comes from the include-raw-integration-install-robotframework.sh
# script.
source "${ROBOT_VENV}/bin/activate"
6
echo "#################################################"
echo "##         Verify Cluster is UP                ##"
echo "#################################################"

#######################################
# Write the health-check script that is meant to be copied to, and run on,
# each controller node.
#
# The generated script takes the cluster member index as its first argument
# (a second argument is accepted but unused). Every 5 seconds it queries the
# local RESTCONF and Jolokia endpoints until the RESTCONF answer contains
# "200" and the shard answer contains '"status":200'. It exits 1 once its
# wait counter exceeds 600, and also exits 1 when karaf.log contains one of
# the known fatal messages.
#
# Globals:   BUNDLEFOLDER (read; its value is baked into the generated file)
# Arguments: $1 - path of the script file to create
#######################################
write_verify_cluster_script() {
    # The here-document delimiter is deliberately unquoted: ${BUNDLEFOLDER} is
    # expanded now, while every backslash-escaped dollar sign is written out
    # literally so that it is evaluated when the generated script runs.
    cat > "$1" <<EOF

CONTROLLERID="member-\$1"
# Second argument: accepted for compatibility with the caller, not used below.
ODL_SYSTEM_IP_PATH=\$2
KARAF_LOG="/tmp/${BUNDLEFOLDER}/data/log/karaf.log"

# Print the head and the tail of the karaf log to help diagnose a failure.
function dump_karaf_log {
    echo "Dumping first 500K bytes of karaf log..."
    head --bytes=500K "\$KARAF_LOG"
    echo "Dumping last 500K bytes of karaf log..."
    tail --bytes=500K "\$KARAF_LOG"
}

echo "Waiting for controller to come up..."
COUNT="0"
while true; do
    RESP="\$( curl --user admin:admin -sL -w "%{http_code} %{url_effective}\\n" http://localhost:8181/restconf/modules -o /dev/null )"
    echo "\$RESP"
    SHARD="\$( curl --user admin:admin -sL -w "%{http_code} %{url_effective}\\n" http://localhost:8181/jolokia/read/org.opendaylight.controller:Category=Shards,name=\$CONTROLLERID-shard-inventory-config,type=DistributedConfigDatastore)"
    echo "\$SHARD"
    if [[ \$RESP == *"200"* && \$SHARD == *'"status":200'* ]]; then
        echo Controller is UP
        break
    elif (( COUNT > 600 )); then
        echo Timeout Controller DOWN
        dump_karaf_log
        echo "Listing all open ports on controller system"
        netstat -natu
        exit 1
    else
        COUNT=\$(( COUNT + 5 ))
        sleep 5
        echo waiting \$COUNT secs...
    fi
done

echo "Listing all open ports on controller system.."
netstat -natu

# Abort with exit status 1 when the given literal text occurs in the karaf log.
function exit_on_log_file_message {
    echo "looking for \"\$1\" in log file"
    if grep --quiet --fixed-strings -- "\$1" "\$KARAF_LOG"; then
        echo ABORTING: found "\$1"
        dump_karaf_log
        exit 1
    fi
}

exit_on_log_file_message 'BindException: Address already in use'
exit_on_log_file_message 'server is unhealthy'

EOF
}

write_verify_cluster_script "${WORKSPACE}/verify-cluster-is-up.sh"
61
# Copy the health-check script to every controller and run it there, passing
# the member index and the controller address.
# The address of member <i> is read from the variable ODL_SYSTEM_<i>_IP, whose
# name is built in CONTROLLERIP and dereferenced with ${!CONTROLLERIP}.
for (( i = 1; i <= ${NUM_ODL_SYSTEM:-0}; i++ ))
do
    CONTROLLERIP=ODL_SYSTEM_${i}_IP
    # With an empty address ssh would take the command string as the host
    # name, so stop here with a message that names the missing variable.
    if [[ -z "${!CONTROLLERIP}" ]]; then
        echo "ERROR: ${CONTROLLERIP} is not set; cannot verify member-${i}" >&2
        exit 1
    fi
    echo "Verifying member-${i} with IP address ${!CONTROLLERIP} is UP"
    scp "${WORKSPACE}/verify-cluster-is-up.sh" "${!CONTROLLERIP}:/tmp"
    ssh "${!CONTROLLERIP}" "bash /tmp/verify-cluster-is-up.sh ${i} ${!CONTROLLERIP}"
done
69
# Pause before the tests start: 180 seconds when CONTROLLERSCOPE is 'all',
# 60 seconds otherwise (including when CONTROLLERSCOPE is empty or unset).
# [[ ]] with a quoted expansion is used because an empty value makes the
# unquoted single-bracket test fail with "unary operator expected".
if [[ "${CONTROLLERSCOPE}" == 'all' ]]; then
    COOLDOWN_PERIOD="180"
else
    COOLDOWN_PERIOD="60"
fi
echo "Cool down for ${COOLDOWN_PERIOD} seconds :)..."
sleep "${COOLDOWN_PERIOD}"
77
#######################################
# Print the entries of a testplan file on a single line.
# Lines whose first non-blank character is '#' and lines that are empty or
# all whitespace are dropped; each remaining line is followed by one space.
# Arguments: $1 - path of the testplan file
# Outputs:   the space-separated entries on stdout
#######################################
testplan_suites() {
    # grep -E replaces the obsolescent egrep; tr turns each newline (octal 012)
    # into a space so the result can be word-split on a command line.
    grep -E -v '(^[[:space:]]*#|^[[:space:]]*$)' -- "$1" | tr '\012' ' '
}

echo "Changing the testplan path..."
# Replace the first "integration" on each line with the workspace path.
# sed reads the file itself, so a missing testplan makes this command fail
# instead of silently producing an empty testplan.txt.
sed "s:integration:${WORKSPACE}:" "${WORKSPACE}/test/csit/testplans/${TESTPLAN}" > testplan.txt
cat testplan.txt

SUITES="$(testplan_suites testplan.txt)"
83
#######################################
# Build the " -v NAME:VALUE" command-line fragment for a numbered family of
# <PREFIX>_<n>_IP variables, for n = 1..COUNT.
# Globals:   <PREFIX>_<n>_IP (read through indirect expansion)
# Arguments: $1 - variable name prefix, e.g. ODL_SYSTEM
#            $2 - how many numbered variables to include; empty counts as 0
# Outputs:   the fragment on stdout; every entry starts with a space and
#            nothing is printed when COUNT is 0
#######################################
robot_ip_variables() {
    local prefix="$1"
    local count="${2:-0}"
    local i ip_var
    local result=""
    for (( i = 1; i <= count; i++ )); do
        ip_var="${prefix}_${i}_IP"
        result+=" -v ${ip_var}:${!ip_var}"
    done
    printf '%s' "${result}"
}

echo "Generating controller variables..."
# Appended to any existing value, as before.
odl_variables="${odl_variables}$(robot_ip_variables ODL_SYSTEM "${NUM_ODL_SYSTEM}")"

echo "Generating mininet variables..."
tools_variables="${tools_variables}$(robot_ip_variables TOOLS_SYSTEM "${NUM_TOOLS_SYSTEM}")"
97
echo "Starting Robot test suites ${SUITES} ..."
# Build the pybot command line as an array so that every single-valued
# variable stays one argument even when it is empty (an empty TESTPLAN must
# not let -N swallow the following -c).
# ${odl_variables}, ${tools_variables}, ${TESTOPTIONS} and ${SUITES} each hold
# several space-separated arguments and are left unquoted on purpose so that
# they are word-split.
robot_args=(
    -N "${TESTPLAN}" -c critical -e exclude
    -v "BUNDLEFOLDER:${BUNDLEFOLDER}" -v WORKSPACE:/tmp -v "BUNDLE_URL:${ACTUALBUNDLEURL}"
    -v "NEXUSURL_PREFIX:${NEXUSURL_PREFIX}"
    -v "CONTROLLER:${ODL_SYSTEM_IP}" -v "CONTROLLER1:${ODL_SYSTEM_2_IP}" -v "CONTROLLER2:${ODL_SYSTEM_3_IP}"
    -v "ODL_SYSTEM_IP:${ODL_SYSTEM_IP}"
    ${odl_variables}
    -v "NUM_ODL_SYSTEM:${NUM_ODL_SYSTEM}" -v "CONTROLLER_USER:${USER}" -v "ODL_SYSTEM_USER:${USER}"
    -v "TOOLS_SYSTEM_IP:${TOOLS_SYSTEM_IP}"
    ${tools_variables}
    -v "NUM_TOOLS_SYSTEM:${NUM_TOOLS_SYSTEM}" -v "TOOLS_SYSTEM_USER:${USER}"
    -v "MININET:${TOOLS_SYSTEM_IP}" -v "MININET1:${TOOLS_SYSTEM_2_IP}" -v "MININET2:${TOOLS_SYSTEM_3_IP}"
    -v "MININET_USER:${USER}"
    -v "USER_HOME:${HOME}"
    ${TESTOPTIONS} ${SUITES}
)
# The exit status of pybot is deliberately ignored; presumably this keeps a
# non-zero status from stopping the script before the steps that follow.
pybot "${robot_args[@]}" || true
106
set +e  # We do not want to create red dot just because something went wrong while fetching logs.

# Remote pipeline that finds every process whose "ps axf" line mentions karaf
# and feeds a "kill -9 <pid>" line per match to sh.
# It is sent to ssh as ONE argument: ssh joins its command arguments with
# spaces before handing them to the remote shell, so the former
# "bash -c '<pipeline>'" form reached the remote side as "bash -c ps axf | ...",
# which runs a bare "ps" with "axf" as \$0 instead of "ps axf".
kill_karaf_cmd='ps axf | grep karaf | grep -v grep | awk '"'"'{print "kill -9 " $1}'"'"' | sh'

# First pass: save the head and tail of each controller's karaf log locally,
# then kill the karaf processes on that controller.
for (( i = 1; i <= ${NUM_ODL_SYSTEM:-0}; i++ ))
do
    CONTROLLERIP=ODL_SYSTEM_${i}_IP
    echo "dumping first 500K bytes of karaf log..." > "odl${i}_karaf.log"
    ssh "${!CONTROLLERIP}" head --bytes=500K "/tmp/${BUNDLEFOLDER}/data/log/karaf.log" >> "odl${i}_karaf.log"
    echo "dumping last 500K bytes of karaf log..." >> "odl${i}_karaf.log"
    ssh "${!CONTROLLERIP}" tail --bytes=500K "/tmp/${BUNDLEFOLDER}/data/log/karaf.log" >> "odl${i}_karaf.log"
    echo "killing karaf process..."
    ssh "${!CONTROLLERIP}" "${kill_karaf_cmd}"
done
sleep 5
# Second pass: compress the full log on each controller (xz -k keeps the
# original file) and fetch the compressed copy.
for (( i = 1; i <= ${NUM_ODL_SYSTEM:-0}; i++ ))
do
    CONTROLLERIP=ODL_SYSTEM_${i}_IP
    ssh "${!CONTROLLERIP}" xz -9ekvv "/tmp/${BUNDLEFOLDER}/data/log/karaf.log"
    scp "${!CONTROLLERIP}:/tmp/${BUNDLEFOLDER}/data/log/karaf.log.xz" "odl${i}_karaf.log.xz"
done
true  # perhaps Jenkins is testing last exit code
126
# vim: ts=4 sw=4 sts=4 et ft=sh :
128