#!/bin/sh
-# Copyright 2023 Paul Hänsch
+# Copyright 2023, 2024 Paul Hänsch
#
# Permission to use, copy, modify, and/or distribute this software for any
# purpose with or without fee is hereby granted, provided that the above
[ "${PATH_INFO%\[search\]}" = "$PATH_INFO" ] && return 1
. "$_EXEC/cgilite/storage.sh"
+. "$_EXEC/cgilite/db23.sh"
I="$_DATA/index"
+tags="$( GET q | awk '
+ BEGIN { # Field separator FS should include punctuation, including Unicode Block U+2000 - U+206F
+ if ( length("¡") == 1 ) # Utf-8 aware AWK
+ FS = "([] \\t\\n\\r!\"'\''()*+,./:;<=>?\\\\^_`{|}~[-]|%[0-9A-Fa-f]{2}|'"$(printf '[\342\200\200-\342\201\257]')"')+";
+ else # UTF-8 Hack
+ FS = "([] \\t\\n\\r!\"'\''()*+,./:;<=>?\\\\^_`{|}~[-]|%[0-9A-Fa-f]{2}|'"$(printf '\342\200[\200-\277]|\342\201[\201-\257]')"')+";
+ fi
+ }
+ { for (n = 1; n <= NF; n++) if ($n ~ /#[[:alnum:]_]+/) {
+ sub(/^#/,"",$n)
+ printf "%s ", toupper($n);
+ }
+ }
+')"
+
+ntags="$( GET q | awk '
+ BEGIN { # Field separator FS should include punctuation, including Unicode Block U+2000 - U+206F
+ if ( length("¡") == 1 ) # Utf-8 aware AWK
+ FS = "([] \\t\\n\\r\"#'\''()*+,./:;<=>?\\\\^_`{|}~[-]|%[0-9A-Fa-f]{2}|'"$(printf '[\342\200\200-\342\201\257]')"')+";
+ else # UTF-8 Hack
+ FS = "([] \\t\\n\\r\"#'\''()*+,./:;<=>?\\\\^_`{|}~[-]|%[0-9A-Fa-f]{2}|'"$(printf '\342\200[\200-\277]|\342\201[\201-\257]')"')+";
+ fi
+ }
+ { for (n = 1; n <= NF; n++) if ($n ~ /![[:alnum:]_]+/) {
+ sub(/^!/,"",$n)
+ printf "%s ", toupper($n);
+ }
+ }
+')"
+
words="$( GET q | awk '
BEGIN { # Field separator FS should include punctuation, including Unicode Block U+2000 - U+206F
if ( length("¡") == 1 ) # Utf-8 aware AWK
- FS = "([] \\t\\n\\r!\"#'\''()*+,./:;<=>?\\\\^_`{|}~[-]|%[0-9A-Fa-f]{2}|'"$(printf '[\342\200\200-\342\201\257]')"')+";
+ FS = "([] \\t\\n\\r\"#'\''()*+,./:;<=>?\\\\^_`{|}~[-]|%[0-9A-Fa-f]{2}|'"$(printf '[\342\200\200-\342\201\257]')"')+";
else # UTF-8 Hack
- FS = "([] \\t\\n\\r!\"#'\''()*+,./:;<=>?\\\\^_`{|}~[-]|%[0-9A-Fa-f]{2}|'"$(printf '\342\200[\200-\277]|\342\201[\201-\257]')"')+";
+ FS = "([] \\t\\n\\r\"#'\''()*+,./:;<=>?\\\\^_`{|}~[-]|%[0-9A-Fa-f]{2}|'"$(printf '\342\200[\200-\277]|\342\201[\201-\257]')"')+";
fi
}
- { for (n = 1; n <= NF; n++) printf "%s ", tolower($n); }
+ { for (n = 1; n <= NF; n++) if ($n !~ /![[:alnum:]_]+/) {
+ sub(/!/," ",$n)
+ printf "%s ", tolower($n);
+ }
+ }
')"
+searchteaser() {
+ local file="$1" words db3_data
+ local w l nc nl hits mhits cont mcont
+ shift 1; words="$*"
+
+ for w in ${words}; do
+ grep -hiwnF "$w" "$file"
+ done \
+ | sort -t: -k1 -n \
+ | { nc=-1 hits=0 mhits=0
+ while read -r l; do
+ nl="$nc" nc="${l%%:*}"
+ if [ $nc -eq $nl ]; then
+ hits=$((hits + 1))
+ elif [ $nc -eq $((nl + 1 )) ]; then
+ hits=$((hits + 1))
+ cont="${cont}${BR}${l#*:}"
+ elif [ $hits -gt $mhits ]; then
+ mhits="$hits" mcont="$cont"
+ hits=1 cont="${l#*:}"
+ else
+ hits=1 cont="${l#*:}"
+ fi
+ done
+
+ [ $hits -gt $mhits ] \
+ && STRING "$cont" \
+ || STRING "$mcont"
+ }
+}
+
for w in ${words}; do
[ ! -f "$I/$w" ] && continue
while read date doc freq num total; do
P="$_DATA/pages$(UNSTRING "$doc")"
d="$(stat -c %Y -- "$P/#index.flag" 2>&-)"
- [ "$d" -le "$date" ] 2>&- || continue
+ [ "$d" -le "$date" -a -f "$P/#page.md" ] 2>&- || continue
printf '%s %f\n' "$doc" "$freq"
done <"$I/$w"
[ "${page%/:*/}" = "${page%/:${LANGUAGE}/}" ] || continue
fi
acl_read "$page" || continue
- printf '%s\n' "$page"
+ has_tags "$page" $tags || continue
+ has_tag "$page" $ntags && continue
+ printf '%s %s\n' "$doc" "$(searchteaser "$(mdfile "$page")" $words)"
done \
| theme_search "${words% }"