From 3c530aafe415db3515465e8b0662373065afd925 Mon Sep 17 00:00:00 2001 From: Louie Shprung Date: Sun, 26 Mar 2023 13:58:50 -0700 Subject: Index terms --- src/index-page.sh | 61 +++++++++++++++++++++++++++++++++++++++++++++ src/index-terms.sh | 38 ++++++++++++++++++++++++++++ src/index.sh | 70 ---------------------------------------------------- src/lib/create_table | 6 +++++ src/lib/insert | 9 +++++++ 5 files changed, 114 insertions(+), 70 deletions(-) create mode 100755 src/index-page.sh create mode 100755 src/index-terms.sh delete mode 100755 src/index.sh create mode 100644 src/lib/create_table create mode 100644 src/lib/insert (limited to 'src') diff --git a/src/index-page.sh b/src/index-page.sh new file mode 100755 index 0000000..e26cdf8 --- /dev/null +++ b/src/index-page.sh @@ -0,0 +1,61 @@ +#!/usr/bin/env sh + +# shellcheck source=./lib/create_table +. "$(dirname "$0")"/lib/create_table +# shellcheck source=./lib/insert +. "$(dirname "$0")"/lib/insert + +DB_PATH="$1" +shift + +get_title() { + FILE="$1" + + pup -p -f "$FILE" 'title text{}' | \ + sed 's/(Lexical Analysis With Flex.*)//' | \ + tr -d \\n | \ + sed 's/\"/\"\"/g' +} + +get_type() { + PAGE_NAME="$1" + + case "$PAGE_NAME" in + option-*) + echo "Option" + ;; + *) + echo "Guide" + esac +} + +insert_pages() { + # Get title and insert into table for each html file + while [ -n "$1" ]; do + unset PAGE_NAME + unset PAGE_TYPE + PAGE_NAME="$(get_title "$1")" + + # determine type + case "$PAGE_NAME" in + option-*) + PAGE_TYPE="Option" + PAGE_NAME="$(echo "$PAGE_NAME" | sed 's/^option-//')" + ;; + unnamed-* | deleteme* | ERASEME*) + shift + continue + ;; + *) + PAGE_TYPE="Guide" + esac + + if [ -n "$PAGE_NAME" ]; then + insert "$DB_PATH" "$PAGE_NAME" "$PAGE_TYPE" "$(basename "$1")" + fi + shift + done +} + +create_table "$DB_PATH" +insert_pages "$@" diff --git a/src/index-terms.sh b/src/index-terms.sh new file mode 100755 index 0000000..8ac3163 --- /dev/null +++ b/src/index-terms.sh @@ -0,0 +1,38 @@ +#!/usr/bin/env sh + +# shellcheck source=./lib/create_table +. "$(dirname "$0")"/lib/create_table +# shellcheck source=./lib/insert +. "$(dirname "$0")"/lib/insert + +TYPE="$1" +shift +DB_PATH="$1" +shift + +insert_index_terms() { + # Get each term from an index page and insert + while [ -n "$1" ]; do + grep -Eo ":" "$1" | while read -r line; do + insert_term "$line" + done + + shift + done +} + +insert_term() { + LINK="$1" + NAME="$(echo "$LINK" | pup -p 'a text{}' | sed 's/\"\"//g' | tr -d \\n)" + PAGE_PATH="$(echo "$LINK" | pup -p 'a attr{href}')" + + # DEBUG + #echo "$NAME" + #echo "$PAGE_PATH" + #echo + + insert "$DB_PATH" "$NAME" "$TYPE" "$PAGE_PATH" +} + +create_table "$DB_PATH" +insert_index_terms "$@" diff --git a/src/index.sh b/src/index.sh deleted file mode 100755 index 5aca876..0000000 --- a/src/index.sh +++ /dev/null @@ -1,70 +0,0 @@ -#!/usr/bin/env sh - -DB_PATH="$1" -shift - -create_table() { - sqlite3 "$DB_PATH" "CREATE TABLE IF NOT EXISTS searchIndex(id INTEGER PRIMARY KEY, name TEXT, type TEXT, path TEXT);" - sqlite3 "$DB_PATH" "CREATE UNIQUE INDEX IF NOT EXISTS anchor ON searchIndex (name, type, path);" -} - - -get_title() { - FILE="$1" - - pup -p -f "$FILE" 'title text{}' | \ - sed 's/(Lexical Analysis With Flex.*)//' | \ - tr -d \\n | \ - sed 's/\"/\"\"/g' -} - -get_type() { - PAGE_NAME="$1" - - case "$PAGE_NAME" in - option-*) - echo "Option" - ;; - *) - echo "Guide" - esac -} - -insert() { - NAME="$1" - TYPE="$2" - PAGE_PATH="$3" - - sqlite3 "$DB_PATH" "INSERT INTO searchIndex(name, type, path) VALUES (\"$NAME\",\"$TYPE\",\"$PAGE_PATH\");" -} - -insert_pages() { - # Get title and insert into table for each html file - while [ -n "$1" ]; do - unset PAGE_NAME - unset PAGE_TYPE - PAGE_NAME="$(get_title "$1")" - - # determine type - case "$PAGE_NAME" in - option-*) - PAGE_TYPE="Option" - PAGE_NAME="$(echo "$PAGE_NAME" | sed 's/^option-//')" - ;; - unnamed-* | deleteme* | ERASEME*) - shift - continue - ;; - *) - PAGE_TYPE="Guide" - esac - - if [ -n "$PAGE_NAME" ]; then - insert "$PAGE_NAME" "$PAGE_TYPE" "$(basename "$1")" - fi - shift - done -} - -create_table -insert_pages "$@" diff --git a/src/lib/create_table b/src/lib/create_table new file mode 100644 index 0000000..cdeb477 --- /dev/null +++ b/src/lib/create_table @@ -0,0 +1,6 @@ +create_table() { + DB_PATH="$1" + + sqlite3 "$DB_PATH" "CREATE TABLE IF NOT EXISTS searchIndex(id INTEGER PRIMARY KEY, name TEXT, type TEXT, path TEXT);" + sqlite3 "$DB_PATH" "CREATE UNIQUE INDEX IF NOT EXISTS anchor ON searchIndex (name, type, path);" +} diff --git a/src/lib/insert b/src/lib/insert new file mode 100644 index 0000000..2e4dd8c --- /dev/null +++ b/src/lib/insert @@ -0,0 +1,9 @@ +insert() { + DB_PATH="$1" + NAME="$2" + TYPE="$3" + PAGE_PATH="$4" + + sqlite3 "$DB_PATH" "INSERT INTO searchIndex(name, type, path) VALUES (\"$NAME\",\"$TYPE\",\"$PAGE_PATH\");" +} + -- cgit