summaryrefslogtreecommitdiff
path: root/src/index-terms.sh
diff options
context:
space:
mode:
authorLouie Shprung <lshprung@scu.edu>2023-06-09 11:26:54 -0700
committerLouie Shprung <lshprung@scu.edu>2023-06-09 11:26:54 -0700
commita4784bbacc356d381ff833e1c181b75c30f776c6 (patch)
tree431af41591d4407546548f2f01c76b0bc5af5bd7 /src/index-terms.sh
parente397123c70d2ad564753f8aad1e1ac82276234f0 (diff)
Clean up, base more on dash-docset-template, dumb down entry types for name-index (consider all of these directives)
Diffstat (limited to 'src/index-terms.sh')
-rwxr-xr-xsrc/index-terms.sh33
1 files changed, 33 insertions, 0 deletions
diff --git a/src/index-terms.sh b/src/index-terms.sh
new file mode 100755
index 0000000..f74af03
--- /dev/null
+++ b/src/index-terms.sh
@@ -0,0 +1,33 @@
+#!/usr/bin/env sh
+
+# shellcheck source=./lib/create_table
+. "$(dirname "$0")"/lib/create_table
+# shellcheck source=./lib/insert
+. "$(dirname "$0")"/lib/insert
+
+TYPE="$1"
+shift
+DB_PATH="$1"
+shift
+
+insert_index_terms() {
+ # Get each term from an index page and insert
+ while [ -n "$1" ]; do
+ grep -Eo "<a href.*</a>:" "$1" | while read -r line; do
+ insert_term "$line"
+ done
+
+ shift
+ done
+}
+
+insert_term() {
+ LINK="$1"
+ NAME="$(echo "$LINK" | pup -p 'a text{}' | sed 's/\"\"//g' | tr -d \\n)"
+ PAGE_PATH="$(echo "$LINK" | pup -p 'a attr{href}')"
+
+ insert "$DB_PATH" "$NAME" "$TYPE" "$PAGE_PATH"
+}
+
+create_table "$DB_PATH"
+insert_index_terms "$@"