#!/bin/bash
#set -x # uncomment for bash script debugging
### ============================================================================
### Licensed under the Apache License, Version 2.0 (the "License");
### you may not use this file except in compliance with the License.
### You may obtain a copy of the License at
###
### http://www.apache.org/licenses/LICENSE-2.0
###
### Unless required by applicable law or agreed to in writing, software
### distributed under the License is distributed on an "AS IS" BASIS,
### WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
### See the License for the specific language governing permissions and
### limitations under the License.
### ============LICENSE_END=====================================================
###
### checkdocs.sh
###
### AUTHOR(S):
### Thomas Kulik, Deutsche Telekom AG, 2020 - 2021
###
### DESCRIPTION:
### Retrieves a full list of ONAP repos from gerrit inluding their state.
### Clones all active repos of the ONAP master branch plus other requested ONAP
### branches. Then the script does some docs related analyses depending on the
### clone results. It creates logfiles containing filtered results. In addition
### a table.csv is created which can be used to import it in a spreadsheed.
### Also a zip-file is created which contains all the results.
###
### IMPORTANT:
### - in the output, repo names are shown in square brackets for readability
### e.g [aai/aai-common]/docs/release-notes.rst
### - in the table.csv file you see data for the requested branch if available.
### if not available, data is retrieved from the master branch. it will be
### denoted in round brackets, e.g. (3) (tox.ini)
###
### REQUIREMENTS:
### curl
### jq
###
###
### SOME HELPING COMMANDS TO PROCESS LOG FILES:
### create repo list
### curl -s https://git.onap.org/ | grep "^
1)print}' | jq -c '.[] | {id, state}' | sed -r 's:%2F:/:g' | sed -r 's:["{}]::g' | sed -r 's:id\:::' | sed -r 's:,state\::|:' | sed '/All-Projects/d' | sed '/All-Users/d'
### SHORT: curl -s 'https://gerrit.onap.org/r/projects/?d' | awk '{if(NR>1)print}' | jq -c '.[] | {id, state}' | sed -r 's:%2F:/:g; s:["{}]::g; s:id\:::; s:,state\::|:; /All-Projects/d; /All-Users/d'
###
script_version="1.10 (2021-06-10)"
# save command for the restart with logging enabled
command=$0
arguments=$@
fullcommand="${command} ${arguments}"
###
### functions
###
# print usage
function usage() {
echo " "
echo " checkdocs.sh Version ${script_version}"
echo " "
echo " USAGE: "
echo " ./checkdocs.sh "
echo " "
echo " ARGUMENTS: "
echo " -u|--user username "
echo " linux foundation username used to clone ONAP repositories"
echo " "
echo " -b|--branches branch1,branch2,branch3 "
echo " list of branches to be cloned. master is automatically "
echo " added to the list. do not add manually! "
echo " "
echo " -d|--dev "
echo " development-mode - limits number of repos to be cloned "
echo " "
}
# draw a simple line
function drawline {
echo "*******************************************************************************"
}
# remove lockfile in case script is interrupted
trap InterruptedScript SIGINT SIGTERM SIGHUP SIGKILL SIGSTOP
function InterruptedScript {
echo " "
echo "Script was interrupted."
if [ -f $lockfile ] ; then
rm $lockfile
fi
exit 0
}
# function to parse wiki (project) lifecycle state information
# call: getwikilifecyclestate "projectname"
# result: $return_from_getwikilifecyclestate
# because bash supports only returning numeric values a variable $return_from_getwikilifecyclestate is used
function getwikilifecyclestate {
local requested=$1
local wikiline=""
local wikirepo=""
local wikistate=""
return_from_getwikilifecyclestate=""
for wikiline in "${wikiplsarray[@]}"
do
wikirepo=$(echo $wikiline | awk -F ";" '{print $1}');
wikistate=$(echo $wikiline | awk -F ";" '{print $2}');
#echo "DBUG: getwikilifecyclestate wikiline = \"${wikiline}\"";
#echo "DBUG: getwikilifecyclestate wikirepo = \"${wikirepo}\""
#echo "DBUG: getwikilifecyclestate wikistate = \"${wikistate}\""
if [[ ${wikirepo} == ${requested} ]]; then
return_from_getwikilifecyclestate=${wikistate}
#echo "DBUG: getwikilifecyclestate wikirepo = \"${wikirepo}\""
#echo "DBUG: getwikilifecyclestate requested = \"${requested}\""
#echo "DBUG: return_from_getwikilifecyclestate = \"${return_from_getwikilifecyclestate}\"";
return 0;
fi
done
#echo "DBUG: getwikilifecyclestate requested \"${requested}\" NOT FOUND in list"
return_from_getwikilifecyclestate=""
}
# function to parse release partizipation information
# call: getrpinfo "projectname"
# result: $return_from_getrpinfo
# because bash supports only returning numeric values a variable $return_from_getrpinfo is used
function getrpinfo {
local requested=$1
# clean up first
local rpdetails=""
local rpline=""
local rprepo=""
local rpproject=""
local current_branch_starting_letter=""
return_from_getrpinfo=""
# finds first matching line in the array using grep (currently every line shows the same partizipation for the project (NOT repository!) )
# this is much faster then looping line by line
rpline=$(IFS=$'\n'; echo "${rparray[*]}" | grep -m 1 ";${requested};");
rpline=$(echo ${rpline} | tr -d '^M')
rprepo=$(echo ${rpline} | awk -F ";" '{print $1}');
rpproject=$(echo ${rpline} | awk -F ";" '{print $2}');
# concatenate details to do an easy grep later on to find out if or if not the project/repo has partizipated to a release
rpdetails=$(echo ${rpline} | awk -F ";" '{print "-" $3 "-" $4 "-" $5 "-" $6 "-" $7 "-" $8 "-" $9 "-" $10 "-" $11 "-" $12 "-"}');
# result will be e.g. "-g" and this avoids false positives with the "m" release
# (because "m" is also used to indicate the maintenance release, e.g. "gm")
current_branch_starting_letter="-${branch:0:1}"
#echo "DBUG: getrpinfo ****************************";
#echo "DBUG: getrpinfo requested = \"${requested}\"";
#echo "DBUG: getrpinfo rpproject = \"${rpproject}\"";
#echo "DBUG: getrpinfo rpdetails = \"${rpdetails}\"";
#echo "DBUG: current branch = \"${branch}\"";
#echo "DBUG: starting_letter = \"${current_branch_starting_letter}\"";
# check
if [[ ${rpproject} = ${requested} ]] && [[ "${rpdetails}" == *"${current_branch_starting_letter}"* ]]; then
return_from_getrpinfo="project partizipated"
#echo "DBUG: getrpinfo return = \"${return_from_getrpinfo}\"";
return 0;
fi
#echo "DBUG: getrpinfo requested \"${requested}\" NOT FOUND in list"
return_from_getrpinfo=""
}
###
### arguments handling
###
PARAMS=""
while (( "$#" )); do
case "$1" in
-d|--dev)
devmode="TRUE"
shift
;;
-b|--branches)
if [ -n "$2" ] && [ ${2:0:1} != "-" ]; then
branches_csv=$2
shift 2
else
echo "Error: Argument for $1 is missing" >&2
usage
exit 1
fi
;;
-u|--user)
if [ -n "$2" ] && [ ${2:0:1} != "-" ]; then
lfusername=$2
shift 2
else
echo "Error: Argument for $1 is missing" >&2
usage
exit 1
fi
;;
-*|--*=) # unsupported flags
echo "Error: Unsupported argument $1" >&2
usage
exit 1
;;
*) # preserve positional arguments
PARAMS="$PARAMS $1"
shift
;;
esac
done
# set positional arguments in their proper place
eval set -- "$PARAMS"
# old: declare -a branches=("master" "frankfurt" "guilin")
if [[ $branches_csv == "" || $lfusername == "" ]]; then
usage
exit -1
fi
# master branch is automatically added and must not part of the user arguments
if [[ $branches_csv == *"master"* ]]; then
usage
exit -1
fi
# clone master first, then the other branches
branches_csv="master,${branches_csv}"
# create the branches array by readinging in the values from the variable
IFS=',' read -r -a branches <<< "${branches_csv}"
#echo "DBUG: devmode = \"${devmode}\""
#echo "DBUG: branches_csv = \"${branches_csv}\""
#echo "DBUG: lfusername = \"${lfusername}\""
#echo "DBUG: branches = \"${branches[@]}\""
# restart script with logging enabled
lockfile="checkdocs-runtime-lockfile"
if [ ! -f $lockfile ] ; then
touch $lockfile
echo "Restarting script with logging enabled."
${fullcommand} 2>&1 | tee checkdocs.log
rm $lockfile
exit
fi
echo " "
echo "checkdocs.sh Version ${script_version}"
echo " "
#
# read in wiki (project) lifecycle state
# always use the lastest available file (derived from date in filename e.g. wiki_lifecycle_state_210409.txt)
# format is ;;
#
wikiplsfile=$(ls | sed -nr '/wiki_lifecycle_state_[0-9]{6}.txt/Ip' | tail -1);
if [[ $wikiplsfile == "" ]]; then
echo "ERROR: wiki_lifecycle_state_yymmdd.txt missing"
exit -1
fi
echo "Using \"${wikiplsfile}\" as the source for wiki (project) lifecycle state information."
readarray -t wikiplsarray < ./${wikiplsfile};
#
# read in release_partizipation_YYMMDD.csv file
# always use the latest available file (derived from date in filename e.g. release_partizipation_210409.csv)
# format is: $1=repository;$2=project;$3=g;$4=gm;$5=h;$6=hm;$7=i;$8=im;$9=j;$10=jm;$11=k;$12=km;;;;
# example: "g" = project partizipated to the (g)uilin release
# "gm" = project partizipated to the (g)uilin (m)aintenance release
# file may contain windows control charaters at end of line (^M)
#
rpfile=$(ls | sed -nr '/release_partizipation_[0-9]{6}.csv/Ip' | tail -1);
if [[ $rpfile == "" ]]; then
echo "ERROR: release_partizipation_yymmdd.csv missing"
exit -1
fi
echo "Using \"${rpfile}\" as the source for release partizipation information."
readarray -t rparray < ./${rpfile};
# remove first line
rparray=("${rparray[@]:1}")
# printf '%s\n' "${rparray[@]}"
#
# curl must be installed
#
if ! command -v curl &> /dev/null
then
echo "ERROR: curl command could not be found"
exit -1
fi
today=$(date '+%Y-%m-%d');
repolist="gerrit-repos-master-"$today".txt";
unique=$(date +%s)
echo "Retrieving a full list of ONAP repositories (master) from gerrit.onap.org."
#
# retrieve the full repolist from gerrit
# workaround because of the (wrong?) response of gerrit.onap.org which makes jq command fail
# "| awk '{if(NR>1)print}'" filters the first line of the response so that jq will work again (thx marek)
#
curl -s 'https://gerrit.onap.org/r/projects/?d' | awk '{if(NR>1)print}' | jq -c '.[] | {id, state}' | sed -r 's:%2F:/:g; s:["{}]::g; s:id\:::; s:,state\::|:; /All-Projects/d; /All-Users/d' >./$repolist
# process the created repolist and try to clone the projects from the mirror
source="git://cloud.onap.org/mirror"
echo "Using \"${source}\" as the source and username \"${lfusername}\" for cloning the repositories."
echo "Start cloning of repositories ..."
for branch in "${branches[@]}"
do
echo " "
echo "###"
echo "### ${branch}"
echo "###"
echo " "
branch_upper=$(echo "${branch}" | tr '[:lower:]' '[:upper:]')
mkdir $branch
cp $repolist $branch
cd $branch
devcounter=0
# process repolist
while read line
do
if [[ $devmode == "TRUE" ]]; then
devcounter=$((devcounter+1))
fi
if [[ $devcounter -lt "50" ]]; then
if [[ $devmode == "TRUE" ]]; then
echo "INFO: devmode! counter=${devcounter}"
fi
drawline
reponame=$(echo $line | awk -F "|" '{print $1}');
repostate=$(echo $line | awk -F "|" '{print $2}');
echo $reponame
echo $repostate
if [[ $repostate == "ACTIVE" ]] || [[ $repostate == "READ_ONLY" ]]; then
echo "Cloning \"${branch}\" branch of \"${repostate}\" project ${reponame}..."
# previously used: git clone --branch ${branch} --recurse-submodules ssh://${lfusername}@gerrit.onap.org:29418/$reponame ./$reponame
# clone script Jess: git clone "git://cloud.onap.org/mirror/${i}" "${LOCALNAME}"
git clone --branch ${branch} --recurse-submodules ${source}/${reponame} ./${reponame}
gitexitcode=$?
if [[ ! ${gitexitcode} == "0" ]]; then
errormsg=$(tail -1 ../checkdocs.log)
else
errormsg="cloned"
fi
# repoclone.log format: $1=gitexitcode|$2=reponame|$3=repostate|$4=errormsg
echo "${gitexitcode}|${reponame}|${repostate}|${errormsg}" | tee -a ${branch}_repoclone.log
#elif [[ $repostate == "READ_ONLY" ]]; then
#echo "-|${reponame}|${repostate}|ignored" | tee -a ${branch}_repoclone.log
else
echo "-|${reponame}|unknown repo state \"${repostate}\"|-" | tee -a ${branch}_repoclone.log
fi
# examine repo
if [[ ${gitexitcode} == "0" ]]; then
printf "\ndocs directories:\n"
find ./$reponame -type d -name docs | sed -r 's:./::' | sed -r s:${reponame}:[${reponame}]: | tee -a ${branch}_docs.log
printf "\nrst files:\n"
find ./$reponame -type f -name *.rst | sed -r 's:./::' | sed -r s:${reponame}:[${reponame}]: | tee -a ${branch}_rstfiles.log
printf "\nrelease notes rst:\n"
find ./$reponame -type f | grep '.*release.*note.*.rst' | sed -r 's:./::' | sed -r s:${reponame}:[${reponame}]: | tee -a ${branch}_releasenotes.log
printf "\ntox.ini files:\n"
find ./$reponame -type f -name tox.ini | sed -r 's:./::' | sed -r s:${reponame}:[${reponame}]: | tee -a ${branch}_toxini.log
printf "\nconf.py files:\n"
find ./$reponame -type f -name conf.py | sed -r 's:./::' | sed -r s:${reponame}:[${reponame}]: | tee -a ${branch}_confpy.log
printf "\nindex.rst files (all):\n"
find ./$reponame -type f -name index.rst | sed -r 's:./::' | sed -r s:${reponame}:[${reponame}]: | tee -a ${branch}_indexrst_all.log
printf "\nindex.rst files (docs root directory):\n"
find ./$reponame -type f -name index.rst | sed -r 's:./::' | sed -r s:${reponame}:[${reponame}]: | grep ']/docs/index.rst' | tee -a ${branch}_indexrst_docs_root.log
printf "\nINFO.yaml files:\n"
find ./$reponame -type f -name INFO.yaml | sed -r 's:./::' | sed -r s:${reponame}:[${reponame}]: | tee -a ${branch}_infoyaml.log
fi
# end defcounter loop
fi
gitexitcode=""
done <${repolist}
# get (first) title for a rst file
drawline
python3 ../getrsttitle.py ${branch}_rstfiles.log | tee ${branch}_rstfiles_titles.log
drawline
python3 ../getrsttitle.py ${branch}_indexrst_docs_root.log | tee ${branch}_indexrst_docs_root_titles.log
# examine repos
drawline
find . -type f -name values.yaml -print -exec grep "image:" {} \; | sed -r 's:^ +::' | tee ${branch}_dockerimagesfull.log
drawline
ls --format single-column -d */ | sed 's:/$::' | tee ${branch}_directories.log
drawline
cat ${branch}_dockerimagesfull.log | grep image | sed -r 's:image\:::' | sed -r 's:^ +::' | sed '/^[[:space:]]*$/d' >${branch}_dockerimages.log
drawline
ls --format single-column -d oom/kubernetes/*/ | tee ${branch}_oomkubernetes.log
drawline
# examine docs
readarray -t docs_array < ./${branch}_docs.log;
for line in "${docs_array[@]}"
do
echo $line | tee -a ${branch}_docsconfig.log
# remove [ and ] which are distinguish the project name in the output
line=$(echo $line | sed -r 's:\[:: ; s:\]::')
if [ -f ./${line}/conf.py ] ; then
echo " conf.py ..... found" | tee -a ${branch}_docsconfig.log
else
echo " conf.py ..... NOT FOUND" | tee -a ${branch}_docsconfig.log
fi
if [ -f ./${line}/index.rst ] ; then
echo " index.rst ... found" | tee -a ${branch}_docsconfig.log
else
echo " index.rst ... NOT FOUND" | tee -a ${branch}_docsconfig.log
fi
if [ -f ./${line}/tox.ini ] ; then
echo " tox.ini ..... found" | tee -a ${branch}_docsconfig.log
else
echo " tox.ini ..... NOT FOUND" | tee -a ${branch}_docsconfig.log
fi
echo " " | tee -a ${branch}_docsconfig.log
done
unset docs_array
drawline
###
### build a csv table that combines results
###
#
# csv column #1: project name
#
readarray -t array < ./${repolist};
i=0
csv[i]="project"
((i++))
for line in "${array[@]}"
do
reponame=$(echo $line | awk -F "|" '{print $1}');
project=$(echo $reponame | sed 's:/.*$::')
#echo "DBUG: reponame=${reponame}"
#echo "DBUG: project=${project}"
#echo "DBUG: i=${i}"
csv[i]=${project}
((i++))
done
unset array
unset i
unset reponame
unset project
#
# csv column #2: repo name
#
readarray -t array < ./${repolist};
i=0
csv[i]="${csv[i]},MASTER repo name"
((i++))
for line in "${array[@]}"
do
reponame=$(echo $line | awk -F "|" '{print $1}');
csv[i]="${csv[i]},${reponame}"
((i++))
done
unset array
unset i
unset reponame
#
# csv column #3: repo state
#
readarray -t array < ./${repolist};
i=0
csv[i]="${csv[i]},MASTER repo state"
((i++))
for line in "${array[@]}"
do
repostate=$(echo $line | awk -F "|" '{print $2}');
csv[i]="${csv[i]},${repostate}"
((i++))
done
unset array
unset i
unset repostate
#
# csv column #4: clone message
#
readarray -t array < ./${branch}_repoclone.log;
i=0
csv[i]="${csv[i]},${branch_upper} clone message"
((i++))
for line in "${array[@]}"
do
# repoclone.log format: $1=gitexitcode|$2=reponame|$3=repostate|$4=errormsg
errormsg=$(echo $line | awk -F "|" '{print $4}');
csv[i]="${csv[i]},${errormsg}"
((i++))
done
unset array
unset i
unset errormsg
#
# csv column #5: latest branch
#
readarray -t array < ./${repolist};
i=0
csv[i]="${csv[i]},latest branch"
((i++))
for line in "${array[@]}"
do
reponame=$(echo $line | awk -F "|" '{print $1}');
latestbranch=$(git ls-remote -q --heads "${source}/${reponame}" | sed 's/^.*heads\///' | sed -nr '/^master$|^amsterdam$|^beijing$|^casablanca$|^dublin$|^elalto$|^frankfurt$|^guilin$|^honolulu$|^istanbul$/Ip' | tail -2 | head -1);
#echo "DBUG: reponame=${reponame}"
#echo "DBUG: latestbranch=${latestbranch}"
echo "latest available branch for repo \"${reponame}\" is \"${latestbranch}\""
csv[i]="${csv[i]},${latestbranch}"
((i++))
done
unset array
unset i
unset reponame
unset latestbranch
#
# csv column #6: INFO.yaml LC state (project lifecycle state based on INFO.yaml / per repo)
# csv column #7: WIKI LC state (project lifecycle state based on ONAP Dev Wiki / per project)
# csv column #8: LC state match shows a "match" if both LC states match
#
readarray -t array < ./${repolist};
i=0
csv[i]="${csv[i]},INFO.yaml LC state,WIKI LC state,LC state match"
((i++))
for line in "${array[@]}"
do
reponame=$(echo $line | awk -F "|" '{print $1}');
project=$(echo $reponame | sed 's:/.*$::')
if [ -f ./${reponame}/INFO.yaml ] ; then
# check if repo/branch has a INFO.yaml
lifecycleproject=$(grep '^project: ' ./${reponame}/INFO.yaml | awk -F ":" '{print $2}' | sed 's:^ ::' | sed "s:'::g" | tr '[:upper:]' '[:lower:]' | sed 's/\r$//')
lifecyclestate=$(grep '^lifecycle_state: ' ./${reponame}/INFO.yaml | awk -F ":" '{print $2}' | sed 's:^ ::' | sed "s:'::g" | tr '[:upper:]' '[:lower:]' | sed 's/\r$//')
elif [ ${branch} != "master" ] && [ -f ../master/${reponame}/INFO.yaml ] ; then
# IF current branch is not master AND if info.yaml not found in the current repo/branch THAN use INFO.yaml of repo/master if available
#echo "DBUG: branch=${branch} - checking master for INFO.yaml"
lifecycleproject=$(grep '^project: ' ../master/${reponame}/INFO.yaml | awk -F ":" '{print $2}' | sed 's:^ ::' | sed "s:'::g" | tr '[:upper:]' '[:lower:]' | sed 's/\r$//')
lifecyclestate=$(grep '^lifecycle_state: ' ../master/${reponame}/INFO.yaml | awk -F ":" '{print $2}' | sed 's:^ ::' | sed "s:'::g" | tr '[:upper:]' '[:lower:]' | sed 's/\r$//')
lifecyclestate="(${lifecyclestate})"
else
lifecyclestate="INFO.yaml not found"
fi
getwikilifecyclestate ${project}
# returns value in ${return_from_getwikilifecyclestate}
#echo "DBUG: working dir is ...";pwd
#echo "DBUG: lifecycleproject=${lifecycleproject}"
#echo "DBUG: lifecyclestate=${lifecyclestate}"
#echo "DBUG: wikilifecyclestate=${return_from_getwikilifecyclestate}"
#check if YAML.info LC state is not empty _AND_ if WIKI LC state is not empty _AND_ if YAML.info LC state contains WIKI LC state
if [[ ${lifecyclestate} != "" ]] && [[ ${return_from_getwikilifecyclestate} != "" ]] && [[ ${lifecyclestate} == *"${return_from_getwikilifecyclestate}"* ]]; then
lcstatesmatch="match"
else
lcstatesmatch=""
fi
csv[i]="${csv[i]},${lifecyclestate},${return_from_getwikilifecyclestate},${lcstatesmatch}"
((i++))
done
unset array
unset i
unset reponame
unset project
unset lifecycleproject
unset lifecyclestate
unset lcstatesmatch
#
# csv column #9: RELEASE component (yes|maybe|unknown)
# to be filled with values of the planned release config file maintained by
# the onap release manager
# NOR FUNCTIONAL YET
# repoclone.log format: $1=gitexitcode|$2=reponame|$3=repostate|$4=errormsg
readarray -t array < ./${branch}_repoclone.log;
i=0
csv[i]="${csv[i]},${branch_upper} component"
((i++))
for line in "${array[@]}"
do
# repoclone.log format: $1=gitexitcode|$2=reponame|$3=repostate|$4=errormsg
gitexitcode=$(echo $line | awk -F "|" '{print $1}');
reponame=$(echo $line | awk -F "|" '{print $2}');
repostate=$(echo $line | awk -F "|" '{print $3}');
errormsg=$(echo $line | awk -F "|" '{print $4}');
#if [[ ${repostate} == "ACTIVE" && ${gitexitcode} == "0" ]]; then
# releasecomponent="yes"
#elif [ ${repostate} == "ACTIVE" ]; then
##elif [[ ${repostate} == "ACTIVE" && ${gitexitcode} == "128" ]]; then
# releasecomponent="maybe"
#elif [[ ${repostate} == "READ_ONLY" && ${gitexitcode} == "0" ]]; then
# releasecomponent="yes"
#elif [ ${repostate} == "READ_ONLY" ]; then
# releasecomponent="maybe"
#else
# releasecomponent="unknown"
#fi
# not functional yet!
releasecomponent=""
csv[i]="${csv[i]},${releasecomponent}"
((i++))
done
unset array
unset i
unset gitexitcode
unset reponame
unset repostate
unset errormsg
unset releasecomponent
#
# csv column #10: RELEASE partizipation
#
# repoclone.log format: $1=gitexitcode|$2=reponame|$3=repostate|$4=errormsg
readarray -t array < ./${branch}_repoclone.log;
i=0
csv[i]="${csv[i]},${branch_upper} partizipation"
((i++))
echo "INFO: determine release partizipation for project ..."
for line in "${array[@]}"
do
# repoclone.log format: $1=gitexitcode|$2=reponame|$3=repostate|$4=errormsg
gitexitcode=$(echo $line | awk -F "|" '{print $1}');
reponame=$(echo $line | awk -F "|" '{print $2}');
repostate=$(echo $line | awk -F "|" '{print $3}');
errormsg=$(echo $line | awk -F "|" '{print $4}');
projectname=$(echo $reponame | sed 's:/.*$::')
if [[ $branch == "master" ]]; then
return_from_getrpinfo="";
else
#echo "DBUG: calling getrpinfo for projectname ${projectname}"
getrpinfo ${projectname}
fi
csv[i]="${csv[i]},${return_from_getrpinfo}"
((i++))
done
unset array
unset i
unset gitexitcode
unset reponame
unset repostate
unset errormsg
unset projectname
unset return_from_getrpinfo
#
# csv column #11: docs (at repo root directory only; no recursive search!)
# csv column #12: conf.py
# csv column #13: tox.ini
# csv column #14: index.rst
# csv column #15: first title in index.rst
#
# columns are filled with values from requested branch.
# if data is not available values from master branch are used.
# to identify master branch values, data is put into round brackets "(...)"
#
readarray -t array < ./${repolist};
i=0
csv[$i]="${csv[i]},docs,conf.py,tox.ini,index.rst,first title in index.rst"
((i++))
for line in "${array[@]}"
do
line=$(echo $line | sed 's:|.*$::')
#echo "DBUG: line=${line}"
#echo "DBUG: i=${i}"
# docs
if [ -d ./${line}/docs ] ; then
docs="docs"
elif [ -d ../master/${line}/docs ] ; then
docs="(docs)"
else
docs="-"
fi
# conf.py
if [ -f ./${line}/docs/conf.py ] ; then
docs="${docs},conf.py"
elif [ -f ../master/${line}/docs/conf.py ] ; then
docs="${docs},(conf.py)"
else
docs="${docs},-"
fi
# tox.ini (check docs dir and also check project root dir)
if [ -f ./${line}/docs/tox.ini ] || [ -f ./${line}/tox.ini ]; then
docs="${docs},tox.ini"
# tox.ini @ branch/docs dir
if [ -f ./${line}/docs/tox.ini ] ; then
docs="${docs} @docs"
fi
# tox.ini @ branch/project root dir
if [ -f ./${line}/tox.ini ] ; then
docs="${docs} @root"
fi
elif [ -f ../master/${line}/docs/tox.ini ] || [ -f ../master/${line}/tox.ini ]; then
docs="${docs},(tox.ini"
# tox.ini @ master/docs dir
if [ -f ../master/${line}/docs/tox.ini ] ; then
docs="${docs} @docs"
fi
# tox.ini @ master/project root dir
if [ -f ../master/${line}/tox.ini ] ; then
docs="${docs} @root"
fi
# just add a round bracket at the end of the value
docs="${docs})"
else
# no tox.ini found in docs or root dir
docs="${docs},-"
fi
# index.rst, first title in index.rst
indexrsttitle=""
if [ -f ./${line}/docs/index.rst ] ; then
indexrsttitle=$(cat ${branch}_indexrst_docs_root_titles.log | grep -F '['${line}']/docs/index.rst,' | awk -F "," '{print $4}');
docs="${docs},index.rst,${indexrsttitle}"
elif [ -f ../master/${line}/docs/index.rst ] ; then
indexrsttitle=$(cat ../master/master_indexrst_docs_root_titles.log | grep -F '['${line}']/docs/index.rst,' | awk -F "," '{print $4}');
docs="${docs},(index.rst),(${indexrsttitle})"
else
docs="${docs},-,-"
fi
#echo "DBUG: docs=${docs}"
line="${csv[i]},${docs}"
csv[$i]=${line}
((i++))
done
unset array
unset i
unset docs
#
# csv column #16: index.html@RTD accessibility check
# csv column #17: index.html url
#
readarray -t array < ./${branch}_repoclone.log;
i=0
csv[i]="${csv[i]},index.html@RTD,index.html url"
((i++))
for line in "${array[@]}"
do
# repoclone.log format: $1=gitexitcode|$2=reponame|$3=repostate|$4=errormsg
gitexitcode=$(echo $line | awk -F "|" '{print $1}');
reponame=$(echo $line | awk -F "|" '{print $2}');
repostate=$(echo $line | awk -F "|" '{print $3}');
errormsg=$(echo $line | awk -F "|" '{print $4}');
url=""
curl_result=""
# this script works only with release "frankfurt" and later because
# earlier releases are using submodule structure for documentation files
if echo "$branch" | grep -q '^[abcde]'; then
curl_result="unsupported release"
url="-"
else
# we are working on "frankfurt" branch or later ...
if [[ ${repostate} == "ACTIVE" ]] || [[ ${repostate} == "READ_ONLY" ]]; then
# OPTIONAL: USE ALSO GITEXITCODE AS A FILTER CRITERIA ???
# url base
# important! only doc project needs a different url base
if [[ ${reponame} == "doc" ]]; then
url_start="https://docs.onap.org"
else
url_start="https://docs.onap.org/projects/onap"
fi
url_lang="en"
url_branch=${branch}
# "master" branch documentation is available as "latest" in RTD
if [[ ${url_branch} == "master" ]]; then
url_branch="latest"
fi
# replace all / characters in repo name with - charachter
url_repo=$(echo ${reponame} | sed -r 's/\//-/g')
url_file="index.html"
# build the full url
if [[ ${reponame} == "doc" ]]; then
# build the full url for the doc project
url="${url_start}/${url_lang}/${url_branch}/${url_file}"
else
# build the full url for the other projects
url="${url_start}-${url_repo}/${url_lang}/${url_branch}/${url_file}"
fi
#echo "DBUG: url=$url"
# test accessibility of url
curl --head --silent --fail "${url}?${unique}" >/dev/null
curl_result=$?
# convert numeric results to text
if [ "${curl_result}" = "0" ]; then
curl_result="accessible"
elif [ "${curl_result}" = "22" ]; then
curl_result="does not exist"
else
curl_result="ERROR:${curl_result}"
fi
# url does not exist for this branch.
# in case the requested url is not already for "master" branch,
# we try to access the url of the master branch and denote the
# result by using round brackets (result)
if [[ ${curl_result} == "does not exist" && ! $branch == "master" ]]; then
# build the full (master/latest) url
url="${url_start}-${url_repo}/${url_lang}/latest/${url_file}"
#echo "DBUG: url=$url"
# test accessibility of url in "master branch" (latest)
curl --head --silent --fail "${url}?${unique}" >/dev/null
curl_result=$?
# denote result as a value from "master" branch (latest)
url="(${url})"
# convert numeric results to text
if [ "${curl_result}" = "0" ]; then
curl_result="(accessible)"
elif [ "${curl_result}" = "22" ]; then
curl_result="(does not exist)"
else
curl_result="(ERROR:${curl_result})"
fi
fi
else
# repostate IS NOT ACTIVE OR READ_ONLY - no curl test required
curl_result="-"
url="-"
fi
fi
echo "$url ... $curl_result"
csv[i]="${csv[i]},${curl_result},${url}"
#echo "DBUG: csv line=${csv[i]}"
((i++))
done
#
# csv column #18: release notes
#
readarray -t array < ../${repolist};
i=0
csv[i]="${csv[i]},release notes"
((i++))
for line in "${array[@]}"
do
line=$(echo $line | sed 's:|.*$::')
#echo "DBUG: line=\"${line}\""
#echo "DBUG: i=${i}"
relnote=""
# put repo name in square brackets for increased grep hit rate
# escape minus and bracket characters to avoid problems with the grep command
#repo_grepable=$(echo ${line} | sed -r s:${line}:[${line}]: | sed -r 's/-/\\-/g' | sed -r 's/\[/\\[/g' | sed -r 's/\]/\\]/g')
#echo "DBUG: repo_grepable=\"${repo_grepable}\""
# check if repo dir exists in this branch
if [ -d ./${line} ] ; then
# if yes, check if repo name appears in the branch releasenotes.log
relnote=$(find "./${line}" -type f | grep '.*release.*note.*.rst' | wc -l);
#echo "DBUG: relnote=${relnote}"
# repo dir DOES NOT exist in this branch - so check if repo dir exists in MASTER branch
elif [ -d ../master/${line} ] ; then
# if yes, check if repo name appears in the MASTER releasenotes.log
# count release notes files in MASTER branch (in repo root and its subdirectories)
relnote=$(find "../master/${line}" -type f | grep 'release.*note.*.rst' | wc -l);
#echo "DBUG: relnote=${relnote}"
# put results in round brackets to show that this is MASTER data
relnote=$(echo ${relnote} | sed -r s:${relnote}:\(${relnote}\):)
else
relnote="-"
fi
#echo "DBUG: relnote=${relnote}"
line="${csv[i]},${relnote}"
csv[i]=${line}
((i++))
done
unset array
unset i
unset relnote
unset repo_grepable
#
# build the table.csv file
#
for i in "${csv[@]}"
do
echo "$i" | tee -a ./${branch}_table.csv
done
#
# create data package for this branch and zip it
#
datadir=${branch}_data
mkdir $datadir
cp $repolist $datadir
cp ../$wikiplsfile $datadir
cp ../$rpfile $datadir
cp ${branch}_table.csv $datadir
cp ${branch}_*.log $datadir
zip -r ${datadir}.zip $datadir
# return from the branch directory
cd ..
# return and work on the next requested branch ... or exit
done
|