blob: dc14178760d6a35c9e3d72a606917cefac2f057d (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
|
#!/usr/bin/env sh
# Reads index pages and records every linked index entry found in them
# through the insert helper.
#
# Usage: <this-script> TYPE INDEX_ENTRY_CLASS DB_PATH [INDEX_PAGE...]
#   TYPE               value passed unchanged to insert for every entry
#   INDEX_ENTRY_CLASS  text matched after "class=" to recognise an entry line;
#                      it is interpolated into an extended regular expression
#   DB_PATH            database path handed to create_table and insert
#   INDEX_PAGE...      files to scan for entries
#
# The helper scripts are resolved relative to this script's own location
# (the parent directory of wherever "$0" lives), not the caller's working
# directory.
# shellcheck source=../create_table.sh
. "$(dirname "$0")"/../create_table.sh
# shellcheck source=../insert.sh
. "$(dirname "$0")"/../insert.sh
# Peel the three fixed arguments off one at a time so that, afterwards, "$@"
# holds only the index page paths.
TYPE="$1"
shift
INDEX_ENTRY_CLASS="$1"
shift
DB_PATH="$1"
shift
# Scan each index page given as an argument and pass every matching index
# entry to insert_term.
# Globals:   INDEX_ENTRY_CLASS (read) - text expected right after "class=";
#            it becomes part of an extended regular expression
# Arguments: $@ - paths of the index pages to scan; empty arguments are skipped
# Outputs:   whatever grep and insert_term write
insert_index_terms() {
  # Loop on the argument count rather than on "$1" being non-empty: an empty
  # argument must not end the loop and silently drop the pages listed after it.
  while [ "$#" -gt 0 ]; do
    if [ -n "$1" ]; then
      # -o prints only the matched text, which runs from the class attribute
      # through the last closing </a> on the line. "--" keeps a page path
      # that begins with "-" from being parsed as a grep option.
      grep -Eo -- "class=${INDEX_ENTRY_CLASS}.*<a href.*</a>" "$1" |
        while IFS= read -r line; do
          insert_term "$line"
        done
    fi
    shift
  done
}
# Pull the link text and link target out of one index entry and record them
# with insert.
# Globals:   DB_PATH, TYPE (read); LINK, NAME, PAGE_PATH (written - POSIX sh
#            has no function-local variables)
# Arguments: $1 - HTML fragment containing an <a href=...> element
# Outputs:   whatever insert writes
insert_term() {
  LINK="$1"
  # printf instead of echo: the fragment is arbitrary HTML, and some sh
  # implementations' echo interprets backslash sequences in its arguments.
  # Every double quote in the link text is doubled (presumably so the name
  # survives quoting inside insert - confirm against insert.sh), then the
  # newlines are removed so the name is a single line.
  NAME="$(printf '%s\n' "$LINK" | pup -p 'a text{}' | sed 's/"/""/g' | tr -d '\n')"
  PAGE_PATH="$(printf '%s\n' "$LINK" | pup -p 'a attr{href}')"
  insert "$DB_PATH" "$NAME" "$TYPE" "$PAGE_PATH"
}
# create_table comes from one of the helper files sourced at the top
# (presumably create_table.sh); it is given the database path before any
# entry is inserted.
create_table "$DB_PATH"
# TYPE, INDEX_ENTRY_CLASS and DB_PATH were shifted off earlier, so "$@" now
# holds only the index page paths.
insert_index_terms "$@"
|