Enable java thread dumps for netvirt csit
[releng/builder.git] / jjb / integration / include-raw-integration-deploy-controller-run-test.sh
1 #@IgnoreInspection BashAddShebang
# Activate the Robot Framework virtualenv.
# ${ROBOT_VENV} comes from the include-raw-integration-install-robotframework.sh
# script.
source "${ROBOT_VENV}/bin/activate"

# Value later substituted for JAVA_MAX_MEM in the controller's bin/setenv.
CONTROLLERMEM="2048m"

# Paths of the cluster configuration files; they are only dumped (by the
# generated configuration script) when HAProxy/cluster mode is enabled.
if [[ "${ENABLE_HAPROXY_FOR_NEUTRON}" == "yes" ]]; then
    echo "Configure cluster"
    AKKACONF="/tmp/${BUNDLEFOLDER}/configuration/initial/akka.conf"
    MODULESCONF="/tmp/${BUNDLEFOLDER}/configuration/initial/modules.conf"
    MODULESHARDSCONF="/tmp/${BUNDLEFOLDER}/configuration/initial/module-shards.conf"
fi

# The "all" scope prepends the compatible-with-all feature and uses a bigger
# heap and a longer cool down. The variable is quoted so that an empty or
# unset CONTROLLERSCOPE selects the else branch instead of raising a test
# syntax error.
if [[ "${CONTROLLERSCOPE}" == 'all' ]]; then
    ACTUALFEATURES="odl-integration-compatible-with-all,${CONTROLLERFEATURES}"
    CONTROLLERMEM="3072m"
    COOLDOWN_PERIOD="180"
else
    ACTUALFEATURES="${CONTROLLERFEATURES}"
    COOLDOWN_PERIOD="60"
fi
24
# Some versions of jenkins job builder result in feature list containing spaces
# and ending in newline. Remove all that.
#
# strip_feature_whitespace STRING
#   Prints STRING with every space, newline and carriage return removed.
#   printf is used instead of echo so that values such as "-n" or ones
#   containing backslashes are passed through untouched.
strip_feature_whitespace() {
    printf '%s' "$1" | tr -d '\n \r'
}
ACTUALFEATURES=$(strip_feature_whitespace "${ACTUALFEATURES}")
28
# If a scriptplan exists for this test plan, rewrite its paths to point into
# the workspace and source every script it lists, in order.
scriptplan_filepath="${WORKSPACE}/test/csit/scriptplans/${TESTPLAN}"
if [[ -f "${scriptplan_filepath}" ]]; then
    echo "scriptplan exists!!!"
    echo "Changing the scriptplan path..."
    # Only the first "integration" on each line is replaced by the workspace path.
    sed "s:integration:${WORKSPACE}:" "${scriptplan_filepath}" > scriptplan.txt
    cat scriptplan.txt
    # Comment and blank lines are skipped. The command substitution is left
    # unquoted on purpose: entries are whitespace separated script paths.
    for line in $( grep -Ev '(^[[:space:]]*#|^[[:space:]]*$)' scriptplan.txt ); do
        echo "Executing ${line}..."
        source "${line}"
    done
fi
39
# Generate the configuration script that is later copied to, and executed on,
# each controller node.
#
# The here-document delimiter is unquoted: plain ${VAR} references are
# expanded now, while the script is being generated, whereas escaped ones
# (\${VAR}, \$1, \`...\`) are written literally and evaluated on the
# controller.
#
# sed is called with "-i -e" rather than "-ie": GNU sed reads "-ie" as
# "-i" with backup suffix "e" and would leave stray copies such as
# "org.apache.karaf.features.cfge" or "bin/setenve" behind.
cat > "${WORKSPACE}/configuration-script.sh" <<EOF

echo "Changing to /tmp"
cd /tmp

echo "Downloading the distribution..."
wget --progress=dot:mega '${ACTUAL_BUNDLE_URL}'

echo "Extracting the new controller..."
unzip -q ${BUNDLE}

echo "Configuring the startup features..."
FEATURESCONF=/tmp/${BUNDLEFOLDER}/etc/org.apache.karaf.features.cfg
CUSTOMPROP=/tmp/${BUNDLEFOLDER}/etc/custom.properties
sed -i -e "s/\(featuresBoot=\|featuresBoot =\)/featuresBoot = ${ACTUALFEATURES},/g" \${FEATURESCONF}
sed -i -e "s%mvn:org.opendaylight.integration/features-integration-index/${BUNDLEVERSION}/xml/features%mvn:org.opendaylight.integration/features-integration-index/${BUNDLEVERSION}/xml/features,mvn:org.opendaylight.integration/features-integration-test/${BUNDLEVERSION}/xml/features,mvn:org.apache.karaf.decanter/apache-karaf-decanter/1.0.0/xml/features%g" \${FEATURESCONF}
cat \${FEATURESCONF}

if [ "${ODL_ENABLE_L3_FWD}" == "yes" ]; then
    echo "Enable the l3.fwd in custom.properties..."
    echo "ovsdb.l3.fwd.enabled=yes" >> \${CUSTOMPROP}
fi
cat \${CUSTOMPROP}

echo "Configuring the log..."
LOGCONF=/tmp/${BUNDLEFOLDER}/etc/org.ops4j.pax.logging.cfg
sed -i -e 's/log4j.appender.out.maxBackupIndex=10/log4j.appender.out.maxBackupIndex=1/g' \${LOGCONF}
# FIXME: Make log size limit configurable from build parameter.
sed -i -e 's/log4j.appender.out.maxFileSize=1MB/log4j.appender.out.maxFileSize=30GB/g' \${LOGCONF}
echo "log4j.logger.org.opendaylight.yangtools.yang.parser.repo.YangTextSchemaContextResolver = WARN" >> \${LOGCONF}
cat \${LOGCONF}

echo "Configure java home and max memory..."
MEMCONF=/tmp/${BUNDLEFOLDER}/bin/setenv
sed -i -e 's%^# export JAVA_HOME%export JAVA_HOME="\${JAVA_HOME:-${JAVA_HOME}}"%g' \${MEMCONF}
sed -i -e 's/JAVA_MAX_MEM="2048m"/JAVA_MAX_MEM="${CONTROLLERMEM}"/g' \${MEMCONF}
cat \${MEMCONF}

echo "Listing all open ports on controller system..."
netstat -pnatu

echo "Set Java version"
sudo /usr/sbin/alternatives --install /usr/bin/java java ${JAVA_HOME}/bin/java 1
sudo /usr/sbin/alternatives --set java ${JAVA_HOME}/bin/java
echo "JDK default version..."
java -version

echo "Set JAVA_HOME"
export JAVA_HOME="${JAVA_HOME}"
# Did you know that in HERE documents, single quote is an ordinary character, but backticks are still executing?
JAVA_RESOLVED=\`readlink -e "\${JAVA_HOME}/bin/java"\`
echo "Java binary pointed at by JAVA_HOME: \${JAVA_RESOLVED}"

if [ "${ENABLE_HAPROXY_FOR_NEUTRON}" == "yes" ]; then

    # Copy shard file if exists
    if [ -f /tmp/custom_shard_config.txt ]; then
        echo "Custom shard config exists!!!"
        echo "Copying the shard config..."
        cp /tmp/custom_shard_config.txt /tmp/${BUNDLEFOLDER}/bin/
    fi

    echo "Configuring cluster"
    /tmp/${BUNDLEFOLDER}/bin/configure_cluster.sh \$1 \$2

    echo "Dump akka.conf"
    cat ${AKKACONF}

    echo "Dump modules.conf"
    cat ${MODULESCONF}

    echo "Dump module-shards.conf"
    cat ${MODULESHARDSCONF}
fi

EOF
116
# Create the startup script to be run on controller.
# ${BUNDLEFOLDER} is expanded while the script is generated; the script
# exports KARAF_REDIRECT pointing at karaf_console.log and then runs the
# distribution's bin/start.
# The redirect target is quoted so that a workspace path containing spaces
# does not produce an "ambiguous redirect" error.
cat > "${WORKSPACE}/startup-script.sh" <<EOF

echo "Redirecting karaf console output to karaf_console.log"
export KARAF_REDIRECT="/tmp/${BUNDLEFOLDER}/data/log/karaf_console.log"

echo "Starting controller..."
/tmp/${BUNDLEFOLDER}/bin/start

EOF
127
# Generate the post-startup script that is run on each controller.
#
# The generated script polls RESTCONF (and, in HAProxy/cluster mode, the
# inventory config shard of member \$1 through Jolokia) every 5 seconds until
# the controller answers, giving up once the counter exceeds 600 seconds.
# It then aborts if karaf.log contains known fatal messages.
#
# ${VAR} is expanded at generation time; \$VAR / \$1 are evaluated on the
# controller.
cat > "${WORKSPACE}/post-startup-script.sh" <<EOF

# Print the first and the last 500K bytes of karaf.log.
function dump_karaf_log {
    echo "Dumping first 500K bytes of karaf log..."
    head --bytes=500K "/tmp/${BUNDLEFOLDER}/data/log/karaf.log"
    echo "Dumping last 500K bytes of karaf log..."
    tail --bytes=500K "/tmp/${BUNDLEFOLDER}/data/log/karaf.log"
}

echo "Waiting for controller to come up..."
COUNT="0"
while true; do
    RESP="\$( curl --user admin:admin -sL -w "%{http_code} %{url_effective}\\n" http://localhost:8181/restconf/modules -o /dev/null )"
    echo "\$RESP"
    if [ "${ENABLE_HAPROXY_FOR_NEUTRON}" == "yes" ]; then
        SHARD="\$( curl --user admin:admin -sL -w "%{http_code} %{url_effective}\\n" http://localhost:8181/jolokia/read/org.opendaylight.controller:Category=Shards,name=member-\$1-shard-inventory-config,type=DistributedConfigDatastore)"
        echo "\$SHARD"
    fi
    if [[ \$RESP == *"200"* ]] && { [[ "${ENABLE_HAPROXY_FOR_NEUTRON}" != "yes" ]] || [[ \$SHARD == *'"status":200'* ]]; }; then
        echo Controller is UP
        break
    elif (( COUNT > 600 )); then
        echo Timeout Controller DOWN
        dump_karaf_log
        echo "Listing all open ports on controller system"
        netstat -pnatu
        exit 1
    else
        COUNT=\$(( COUNT + 5 ))
        sleep 5
        echo waiting \$COUNT secs...
    fi
done

echo "Listing all open ports on controller system..."
netstat -pnatu

# Abort with a log dump when the message given as first argument is found in karaf.log.
function exit_on_log_file_message {
    echo "looking for \"\$1\" in log file"
    if grep --quiet "\$1" "/tmp/${BUNDLEFOLDER}/data/log/karaf.log"; then
        echo ABORTING: found "\$1"
        dump_karaf_log
        exit 1
    fi
}

exit_on_log_file_message 'BindException: Address already in use'
exit_on_log_file_message 'server is unhealthy'

EOF
177
# Distribute and run the configuration script, one OpenStack site at a time.
# Controllers are split evenly between sites: site i owns
# ODL_SYSTEM_<(i-1)*NUM_ODLS_PER_SITE + 1> .. ODL_SYSTEM_<i*NUM_ODLS_PER_SITE>.

# Default to a single site when the job does not define (or leaves empty)
# the number of sites.
: "${NUM_OPENSTACK_SITES:=1}"
NUM_ODLS_PER_SITE=$((NUM_ODL_SYSTEM / NUM_OPENSTACK_SITES))
for ((i = 1; i <= NUM_OPENSTACK_SITES; i++)); do
    # Get full list of ODL nodes for this site
    odl_node_list=
    for ((j = 1; j <= NUM_ODLS_PER_SITE; j++)); do
        # odl_ip holds the NAME of the variable; ${!odl_ip} reads its value.
        odl_ip=ODL_SYSTEM_$(((i - 1) * NUM_ODLS_PER_SITE + j))_IP
        odl_node_list="${odl_node_list} ${!odl_ip}"
    done

    for ((j = 1; j <= NUM_ODLS_PER_SITE; j++)); do
        odl_ip=ODL_SYSTEM_$(((i - 1) * NUM_ODLS_PER_SITE + j))_IP
        # Copy over the config script to controller and execute it (parameters are used only for cluster)
        echo "Execute the configuration script on controller ${!odl_ip} for index $j with node list ${odl_node_list}"
        scp "${WORKSPACE}/configuration-script.sh" "${!odl_ip}:/tmp"
        # The node list is passed as one single-quoted argument (\$2 of the script).
        ssh "${!odl_ip}" "bash /tmp/configuration-script.sh ${j} '${odl_node_list}'"
    done
done
199
# Prefer a stream specific config plan and fall back to the generic one.
echo "Locating config plan to use..."
configplan_filepath="${WORKSPACE}/test/csit/configplans/${STREAMTESTPLAN}"
if [[ ! -f "${configplan_filepath}" ]]; then
    configplan_filepath="${WORKSPACE}/test/csit/configplans/${TESTPLAN}"
fi

# If a config plan was found, rewrite its paths to point into the workspace
# and source every script it lists, in order.
if [[ -f "${configplan_filepath}" ]]; then
    echo "configplan exists!!!"
    echo "Changing the configplan path..."
    # Only the first "integration" on each line is replaced by the workspace path.
    sed "s:integration:${WORKSPACE}:" "${configplan_filepath}" > configplan.txt
    cat configplan.txt
    # Comment and blank lines are skipped. The command substitution is left
    # unquoted on purpose: entries are whitespace separated script paths.
    for line in $( grep -Ev '(^[[:space:]]*#|^[[:space:]]*$)' configplan.txt ); do
        echo "Executing ${line}..."
        source "${line}"
    done
fi
216
# Copy over the startup script to controller and execute it.
# An arithmetic loop is used instead of `seq`: with an empty NUM_ODL_SYSTEM
# `seq 1 ""` prints "1" and would contact a controller with an empty address.
for ((i = 1; i <= NUM_ODL_SYSTEM; i++)); do
    # CONTROLLERIP holds the NAME of the variable; ${!CONTROLLERIP} reads its value.
    CONTROLLERIP=ODL_SYSTEM_${i}_IP
    echo "Execute the startup script on controller ${!CONTROLLERIP}"
    scp "${WORKSPACE}/startup-script.sh" "${!CONTROLLERIP}:/tmp"
    ssh "${!CONTROLLERIP}" "bash /tmp/startup-script.sh"
done
225
# Run the post-startup script on every controller. Its argument is the index
# of the controller inside its own site (1..controllers-per-site), which the
# script uses to build the shard member name; the index therefore restarts
# at 1 each time a site boundary is crossed.
odls_per_site=$(( NUM_ODL_SYSTEM / ${NUM_OPENSTACK_SITES:-1} ))
seed_index=1
for ((i = 1; i <= NUM_ODL_SYSTEM; i++)); do
    # CONTROLLERIP holds the NAME of the variable; ${!CONTROLLERIP} reads its value.
    CONTROLLERIP=ODL_SYSTEM_${i}_IP
    echo "Execute the post startup script on controller ${!CONTROLLERIP}"
    scp "${WORKSPACE}/post-startup-script.sh" "${!CONTROLLERIP}:/tmp"
    ssh "${!CONTROLLERIP}" "bash /tmp/post-startup-script.sh ${seed_index}"
    seed_index=$(( seed_index + 1 ))
    if (( i % odls_per_site == 0 )); then
        seed_index=1
    fi
done
237
echo "Cool down for ${COOLDOWN_PERIOD} seconds :)..."
sleep "${COOLDOWN_PERIOD}"

# Collect one "-v ODL_SYSTEM_<i>_IP:<address>" option per controller into
# odl_variables and save a thread dump of each karaf JVM before the tests.
echo "Generating controller variables..."
for ((i = 1; i <= NUM_ODL_SYSTEM; i++)); do
    # CONTROLLERIP holds the NAME of the variable; ${!CONTROLLERIP} reads its value.
    CONTROLLERIP=ODL_SYSTEM_${i}_IP
    odl_variables=${odl_variables}" -v ${CONTROLLERIP}:${!CONTROLLERIP}"
    echo "Lets's take the karaf thread dump"
    # Second column of `ps aux` is the PID; the grep pattern is expanded
    # locally before the command is sent to the controller.
    KARAF_PID=$(ssh "${!CONTROLLERIP}" "ps aux | grep ${KARAF_ARTIFACT} | grep -v grep | tr -s ' ' | cut -f2 -d' '")
    # A failing jstack must not fail the job.
    ssh "${!CONTROLLERIP}" "jstack $KARAF_PID" > "${WORKSPACE}/karaf_${i}_threads_before.log" || true
done
250
# When OpenStack systems are part of the job, stop here: the tests are not
# run by this script in that case. An unset or empty NUM_OPENSTACK_SYSTEM
# counts as 0 instead of triggering a test syntax error.
if (( ${NUM_OPENSTACK_SYSTEM:-0} > 0 )); then
   echo "Exiting without running tests to deploy openstack for testing"
   exit
fi
255
# Collect one "-v TOOLS_SYSTEM_<i>_IP:<address>" option per tools system.
# An arithmetic loop is used instead of `seq`: with an empty
# NUM_TOOLS_SYSTEM `seq 1 ""` prints "1" and would add a bogus entry.
echo "Generating mininet variables..."
for ((i = 1; i <= NUM_TOOLS_SYSTEM; i++)); do
    # MININETIP holds the NAME of the variable; ${!MININETIP} reads its value.
    MININETIP=TOOLS_SYSTEM_${i}_IP
    tools_variables=${tools_variables}" -v ${MININETIP}:${!MININETIP}"
done
262
# list_plan_entries FILE
#   Prints the entries of plan FILE (every line that is neither blank nor a
#   comment) on a single line, each entry followed by one space.
list_plan_entries() {
    grep -Ev '(^[[:space:]]*#|^[[:space:]]*$)' "$1" | tr '\012' ' '
}

# Prefer a stream specific test plan and fall back to the generic one.
echo "Locating test plan to use..."
testplan_filepath="${WORKSPACE}/test/csit/testplans/${STREAMTESTPLAN}"
if [[ ! -f "${testplan_filepath}" ]]; then
    testplan_filepath="${WORKSPACE}/test/csit/testplans/${TESTPLAN}"
fi

echo "Changing the testplan path..."
# Only the first "integration" on each line is replaced by the workspace path.
sed "s:integration:${WORKSPACE}:" "${testplan_filepath}" > testplan.txt
cat testplan.txt
SUITES=$( list_plan_entries testplan.txt )
273
echo "Starting Robot test suites ${SUITES} ..."
# Robot variables are collected in an array so that every "-v NAME:value"
# pair stays a single argument even when a value is empty or contains
# whitespace.
# FIXME: Sort (at least -v) options alphabetically.
robot_variables=(
    -v "BUNDLEFOLDER:${BUNDLEFOLDER}"
    -v "WORKSPACE:/tmp"
    -v "JAVA_HOME:${JAVA_HOME}"
    -v "BUNDLE_URL:${ACTUAL_BUNDLE_URL}"
    -v "NEXUSURL_PREFIX:${NEXUSURL_PREFIX}"
    -v "CONTROLLER:${ODL_SYSTEM_IP}"
    -v "ODL_SYSTEM_IP:${ODL_SYSTEM_IP}"
    -v "ODL_SYSTEM_1_IP:${ODL_SYSTEM_IP}"
    -v "CONTROLLER_USER:${USER}"
    -v "ODL_SYSTEM_USER:${USER}"
    -v "TOOLS_SYSTEM_IP:${TOOLS_SYSTEM_IP}"
    -v "TOOLS_SYSTEM_2_IP:${TOOLS_SYSTEM_2_IP}"
    -v "TOOLS_SYSTEM_3_IP:${TOOLS_SYSTEM_3_IP}"
    -v "TOOLS_SYSTEM_4_IP:${TOOLS_SYSTEM_4_IP}"
    -v "TOOLS_SYSTEM_5_IP:${TOOLS_SYSTEM_5_IP}"
    -v "TOOLS_SYSTEM_6_IP:${TOOLS_SYSTEM_6_IP}"
    -v "TOOLS_SYSTEM_USER:${USER}"
    -v "JDKVERSION:${JDKVERSION}"
    -v "ODL_STREAM:${DISTROSTREAM}"
    -v "NUM_ODL_SYSTEM:${NUM_ODL_SYSTEM}"
    -v "MININET:${TOOLS_SYSTEM_IP}"
    -v "MININET1:${TOOLS_SYSTEM_2_IP}"
    -v "MININET2:${TOOLS_SYSTEM_3_IP}"
    -v "MININET3:${TOOLS_SYSTEM_4_IP}"
    -v "MININET4:${TOOLS_SYSTEM_5_IP}"
    -v "MININET5:${TOOLS_SYSTEM_6_IP}"
    -v "MININET_USER:${USER}"
    -v "USER_HOME:${HOME}"
)
# TESTOPTIONS and SUITES are deliberately unquoted: each holds a whitespace
# separated list that must be split into individual arguments.
# Test failures must not stop the script; logs are collected afterwards.
pybot -N "${TESTPLAN}" --removekeywords wuks -c critical -e exclude \
    "${robot_variables[@]}" ${TESTOPTIONS} ${SUITES} || true
286
# We do not want to create red dot just because something went wrong while fetching logs.
# This is switched off once, before the first log-related command, rather
# than in the middle of the loop below.
set +e

echo "Examining the files in data/log and checking filesize"
ssh "${ODL_SYSTEM_IP}" "ls -altr /tmp/${BUNDLEFOLDER}/data/log/"
ssh "${ODL_SYSTEM_IP}" "du -hs /tmp/${BUNDLEFOLDER}/data/log/*"

for ((i = 1; i <= NUM_ODL_SYSTEM; i++)); do
    # CONTROLLERIP holds the NAME of the variable; ${!CONTROLLERIP} reads its value.
    CONTROLLERIP=ODL_SYSTEM_${i}_IP
    echo "Lets's take the karaf thread dump again..."
    # Second column of `ps aux` is the PID; the grep pattern is expanded
    # locally before the command is sent to the controller.
    KARAF_PID=$(ssh "${!CONTROLLERIP}" "ps aux | grep ${KARAF_ARTIFACT} | grep -v grep | tr -s ' ' | cut -f2 -d' '")
    ssh "${!CONTROLLERIP}" "jstack $KARAF_PID" > "${WORKSPACE}/karaf_${i}_threads_after.log" || true
    echo "Killing ODL"
    # The pipeline is sent as ONE string. ssh joins its arguments with spaces
    # before handing them to the remote shell, so the former
    # `bash -c '<pipeline>'` form ended up running `bash -c ps` with "axf"
    # as $0, i.e. plain `ps` without the intended options.
    ssh "${!CONTROLLERIP}" "ps axf | grep karaf | grep -v grep | awk '{print \"kill -9 \" \$1}' | sh"
done
301
# Wait 5 seconds after the kill commands issued above before touching the logs.
sleep 5
# Compress karaf.log on every controller and copy it, together with the
# console log, into the current directory as odl<i>_*.
for ((i = 1; i <= NUM_ODL_SYSTEM; i++)); do
    # CONTROLLERIP holds the NAME of the variable; ${!CONTROLLERIP} reads its value.
    CONTROLLERIP=ODL_SYSTEM_${i}_IP
    echo "Compressing karaf.log ${i}"
    ssh "${!CONTROLLERIP}" gzip --best "/tmp/${BUNDLEFOLDER}/data/log/karaf.log"
    echo "Fetching compressed karaf.log ${i}"
    scp "${!CONTROLLERIP}:/tmp/${BUNDLEFOLDER}/data/log/karaf.log.gz" "odl${i}_karaf.log.gz"
    # TODO: Should we compress the output log file as well?
    scp "${!CONTROLLERIP}:/tmp/${BUNDLEFOLDER}/data/log/karaf_console.log" "odl${i}_karaf_console.log"
done

true  # perhaps Jenkins is testing last exit code
315
316 # vim: ts=4 sw=4 sts=4 et ft=sh :