diff options
author | Louie S <louie@example.com> | 2024-01-16 09:31:12 -0500 |
---|---|---|
committer | Louie S <louie@example.com> | 2024-01-16 09:31:12 -0500 |
commit | 2d1e8a273dc45fc10f4d5628e406ab970b720381 (patch) | |
tree | 82ed5d081bf690a16b69e4382695392ab351ba32 /src/index-terms.sh | |
parent | 10a6815096b5101618d22c518dcc72331831d231 (diff) |
Diffstat (limited to 'src/index-terms.sh')
-rwxr-xr-x | src/index-terms.sh | 37 |
1 files changed, 37 insertions, 0 deletions
diff --git a/src/index-terms.sh b/src/index-terms.sh new file mode 100755 index 0000000..a7cd014 --- /dev/null +++ b/src/index-terms.sh @@ -0,0 +1,37 @@ +#!/usr/bin/env sh + +# shellcheck source=./lib/create_table +. "$(dirname "$0")"/lib/create_table +# shellcheck source=./lib/insert +. "$(dirname "$0")"/lib/insert + +TYPE="$1" +shift +CATEGORY="$1" # should refer to how the href is "Reference-manual_$CATEGORY" +shift +DB_PATH="$1" +shift + +insert_index_terms() { + # Get each term from an index page and insert + while [ -n "$1" ]; do + while read -r line; do + if echo "$line" | pup -p 'a' | grep -Eoq "Reference-manual_$CATEGORY"; then + insert_term "$line" + fi + done < "$1" + + shift + done +} + +insert_term() { + LINK="$1" + NAME="$(echo "$LINK" | pup -p 'a text{}' | sed 's/\"\"//g' | tr -d \\n)" + PAGE_PATH="$(echo "$LINK" | pup -p 'a attr{href}')" + + insert "$DB_PATH" "$NAME" "$TYPE" "$PAGE_PATH" +} + +create_table "$DB_PATH" +insert_index_terms "$@" |