summaryrefslogtreecommitdiff
path: root/src/index_terms.sh
blob: a2b39fb44317da027db9325ee997fb63f9503ba3 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
#!/usr/bin/env sh

# shellcheck source=./lib/create_table
. "$(dirname "$0")"/lib/create_table
# shellcheck source=./lib/insert
. "$(dirname "$0")"/lib/insert
# shellcheck source=./lib/get_type
. "$(dirname "$0")"/lib/get_type

DB_PATH="$1"
shift

insert_index_terms() {
	# Get each term from an index page and insert
	while [ -n "$1" ]; do
		grep -Eoi "^[a-zA-Z_ ]{45}<STRONG><A HREF=\"[^\"]*\">[^<]*</A></STRONG>" "$1" | while read -r line; do
			insert_term "$line"
		done

		shift
	done
}

insert_term() {
	LINK="$1"
	#NAME="$(echo "$LINK" | pup -p 'a text{}' | sed 's/\"\"//g' | tr -d \\n)"
	NAME="$(echo "$LINK" | cut -d ' ' -f 1)"
	PAGE_PATH="$(echo "$LINK" | pup -p 'a attr{href}')"

	TYPE=$(get_type "$PAGE_PATH")
	if [ -z "$TYPE" ]; then
		TYPE="Guide"
	fi

	insert "$DB_PATH" "$NAME" "$TYPE" "man/$PAGE_PATH"
}

create_table "$DB_PATH"
insert_index_terms "$@"