From 20aa42ad2c7740d64247e900e02638317b650209 Mon Sep 17 00:00:00 2001 From: Louie Shprung Date: Tue, 22 Nov 2022 21:45:29 -0800 Subject: Rewrite in POSIX shell --- src/index.rb | 40 ------------------------------------ src/index.sh | 66 ++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ 2 files changed, 66 insertions(+), 40 deletions(-) delete mode 100755 src/index.rb create mode 100755 src/index.sh (limited to 'src') diff --git a/src/index.rb b/src/index.rb deleted file mode 100755 index 81b042a..0000000 --- a/src/index.rb +++ /dev/null @@ -1,40 +0,0 @@ -require 'pathname' - -puts %Q[ - CREATE TABLE searchIndex(id INTEGER PRIMARY KEY, name TEXT, type TEXT, path TEXT); - CREATE UNIQUE INDEX anchor ON searchIndex (name, type, path); -] - -INSERT_SQL = %Q[ - INSERT INTO searchIndex(name, type, path) VALUES ('%s','%s','%s'); -] - -PATTERN = %r[(.*)\(Autoconf\)(.*)] - -BUILTIN_PATTERN = /The node you are looking for is at.*Limitations-of-.*\.html/ -MACRO_PATTERN = /The node you are looking for is at/ - -def quote(s) - s.gsub(/&/, '&').gsub(/'/, "\\'").gsub(/</, '<') -end - -ARGV.each do |arg| - Pathname.glob(arg) do |path| - macro_match = path.each_line.lazy.map { |line| MACRO_PATTERN.match(line) }.find { |m| m } - builtin_match = path.each_line.lazy.map { |line| BUILTIN_PATTERN.match(line) }.find { |m| m } - if builtin_match - type = "Builtin" - elsif macro_match - type = "Macro" - else - type = "Guide" - end - - match = path.each_line.lazy.map { |line| PATTERN.match(line) }.find { |m| m } - if match - printf INSERT_SQL, quote(match[1]), type, path.basename - else - $stderr.puts "%{path.basename}: no title found" - end - end -end diff --git a/src/index.sh b/src/index.sh new file mode 100755 index 0000000..e81a0f7 --- /dev/null +++ b/src/index.sh @@ -0,0 +1,66 @@ +#!/usr/bin/env sh + +DB_PATH="$1" +shift + +get_title() { + FILE="$1" + + PATTERN=".*\(Autoconf\).*" + + #Find pattern in file + grep -Eo "$PATTERN" "$FILE" | + #Remove tag + sed 's/<[^>]*>//g' | \ + #Remove '(automake)' + sed 's/(Autoconf)//g' | \ + #Remove trailing space + sed 's/[ ]*$//g' | \ + #Replace '&' with '&' + sed 's/&/&/g' | \ + #Replace '<' with '<' + sed 's/</