#!/bin/bash
#
# File: check-index-errors
# Version: 0.95b
#
# Check whether the index.html file in a volume has some common errors
# (c) 2020-2025 by Manfred Jeusfeld. This script is made available under the
# Creative Commons Attribution-ShareAlike CC-BY-SA 4.0 license.
#
# The BASH script is part of the scripts used for CEUR-WS.org. No warrantee whatsoever. No support.
#
# Note that this script is updated on a regular basis, in particular to cover changes with
# the layout for index files ceur-ws.org/Vol-XXX/index.html.
#
# Call this script in the directory that contains the index.html file that you want to check.
#
# Manfred 2020-03-20 (2026-03-15)
#

# The checks operate on ./index.html only; without it there is nothing to do.
if [[ ! -f index.html ]]; then
  printf '%s\n' "No file index.html in this directory. Call this script in the directory that contains your submissions files."
  exit 1
fi

# When an index.html.orig sits next to index.html, the rules for edited index
# files apply: hand all arguments over to check-index-errors-after, unless the
# first argument is "pre". The exit status of that script is not propagated;
# this script always leaves with status 0 afterwards.
if [[ "$1" != "pre" && -f index.html.orig ]]; then
  printf '%s\n' "Using check-index-errors-after for rules holding for edited index.html files ... "
  check-index-errors-after "$@"
  exit 0
fi

# Version banner followed by one empty line.
printf '%s\n' "check-index-errors V0.95b (2026-05-05) CC-BY-SA 4.0" ""

# Distinguish regular index files from "semantified" ones: an index file that
# contains the string "foaf:" is treated as semantic.
if grep -q "foaf:" index.html; then
  indexformat=semantic
else
  indexformat=regular
fi

# A1: title of the template workshop is still present.
if grep -q "Workshop on Publishing Papers" index.html; then
  printf '%s\n' \
    " " \
    " ==========> ERROR (A1) in index.html!!!!" \
    "String 'Workshop on Publishing Papers' found in index.html"
fi

# A2: the string 'OPub' is still present.
if grep -q "OPub" index.html; then
  printf '%s\n' \
    " " \
    " ==========> ERROR (A2) in index.html!!!!" \
    "String 'OPub' found in index.html"
fi

# A3: placeholder names left over from the Vol-XXX template.
if grep -qE "Coeditor|Carlos Nombre|Anne Foé" index.html; then
  printf '%s\n' \
    " " \
    " ==========> ERROR (A3) in index.html!!!!" \
    "String 'Coeditor' or 'Carlos Nombre' or 'Anne Foé' left over from template Vol-XXX found in index.html"
fi

# NOTE(review): check A4 starts at this point, but its grep pattern and body
# are garbled/truncated in this copy of the script. The opening fragment is
# kept verbatim below, as a comment, so that everything above parses; restore
# the complete A4 statement before re-enabling it.
# if grep -q "

" index.html; then echo " "; echo " ==========> ERROR (A4) in index.html!!!!"; echo "

# NOTE(review): the line below is the tail of a command substitution whose
# beginning is missing from this copy of the script (presumably the
# assignment of AUTHORS -- confirm against the complete file). It is kept
# verbatim, but as a comment, because it cannot be parsed without its head.
# /,/<\/li>/!p' index.html | grep 'class="CEURAUTHOR"' | sed -e 's/.*class="CEURAUTHOR">//' -e 's/<\/span>.*//' | sed 's/^[ \t]*//;s/[ \t]*$//')

# ---------------------------------------------------------------------------
# A41: report every editor whose name occurs more than once in AUTHORS.
#   Reads:  EDITORS and AUTHORS, both expected to hold one name per line and
#           to be set earlier in the script (not visible in this excerpt).
#   Writes: EDITOR_OVERLAP_ERROR ("no"/"yes"), COUNT (occurrences of the
#           editor processed last).
# ---------------------------------------------------------------------------
EDITOR_OVERLAP_ERROR="no"
if [[ -n "$EDITORS" ]]; then
  while IFS= read -r editor; do
    # Blank lines in the editor list carry no name to look up.
    [[ -n "$editor" ]] || continue

    # Count the lines of AUTHORS that are exactly the editor name (-F fixed
    # string, -x whole line). The "--" ends option parsing, so a name that
    # starts with "-" is searched for instead of being read as grep options;
    # printf is used because echo would swallow values such as "-n".
    COUNT=$(printf '%s\n' "$AUTHORS" | grep -Fxc -- "$editor")
    if [[ "$COUNT" -gt 1 ]]; then
      EDITOR_OVERLAP_ERROR="yes"
      echo " Editor '$editor' is an author of $COUNT research papers."
    fi
  done <<< "$EDITORS"
fi

if [[ "$EDITOR_OVERLAP_ERROR" == "no" ]]; then
  echo "ok"
else
  echo " ==========> ERROR (A41) in index.html!!!!"
fi
echo " "

# ---------------------------------------------------------------------------
# A42: minimum number of papers. NRWORDS is the number of lines of index.html
# that contain the word CEURTITLE (grep -c counts lines, not occurrences).
# ---------------------------------------------------------------------------
echo "(*) Checking minimum number of papers ..."
NRWORDS=$(grep -wc CEURTITLE index.html)
if [[ "$NRWORDS" -ge 6 ]]; then
  echo "ok"
else
  # The A42 error banner is disabled in the original script; only the
  # explanatory line is printed.
  # echo " ==========> ERROR (A42) in index.html!!!!";
  echo "The index.html file lists $NRWORDS papers with a CEURTITLE. Minimum is 6."
fi
echo " "

# ---------------------------------------------------------------------------
# 2026-05-05: Check for balance between Editor and Author ORCIDs (A43).
# Each count is the number of lines that contain the respective class name
# together with the string "itemid".
# ---------------------------------------------------------------------------
echo "(*) Checking ORCID coverage balance ..."
EDITOR_ORCIDS=$(grep "CEURVOLEDITOR" index.html | grep -c "itemid")
AUTHOR_ORCIDS=$(grep "CEURAUTHOR" index.html | grep -c "itemid")
if [[ "$EDITOR_ORCIDS" -gt "$AUTHOR_ORCIDS" ]]; then
  echo " "
  echo " ==========> ERROR (A43) in index.html!!!!"
  echo " There are more ORCIDs for editors ($EDITOR_ORCIDS) than for authors ($AUTHOR_ORCIDS)."
  echo " We suggest that at least as many authors are semantified as editors."
  # Message fixed: the hint previously read "pick the date from there".
  echo " Most paper PDFs have ORCIDs for authors. So pick the data from there!"
  echo " "
else
  echo "ok"
fi
echo " "