From 0972186c855b59bfed9d7a676bf98d24740d4950 Mon Sep 17 00:00:00 2001
From: nate smith
Date: Fri, 2 Feb 2024 12:12:03 -0800
Subject: [PATCH] script for title extraction

---
 ingest.sh | 34 ++++++++++++++++++++++++++++++++++
 1 file changed, 34 insertions(+)
 create mode 100755 ingest.sh

diff --git a/ingest.sh b/ingest.sh
new file mode 100755
index 0000000..e1dceba
--- /dev/null
+++ b/ingest.sh
@@ -0,0 +1,34 @@
+#!/bin/bash
+#
+# Print a "book,title" line for each Project Gutenberg plain-text file named
+# on standard input (one file name per line, relative to the files directory).
+#
+# Usage: ingest.sh [files_dir] < book_list
+#
+# The title is the text that follows "*** START OF THE PROJECT GUTENBERG EBOOK "
+# on the first marker line of the file, with the closing "***" and surrounding
+# whitespace (including a DOS carriage return) removed. A book with no marker
+# line, or one that cannot be read, still gets a line with an empty title.
+# Titles are written verbatim; no CSV quoting is applied.
+
+# Directory holding the plain-text files; the first argument overrides it.
+p="${1:-/home/vilmibm/pg_plaintext/files/}"
+
+# IFS= and -r keep each file name exactly as written; the || clause picks up a
+# final line that has no trailing newline.
+while IFS= read -r book || [[ -n "$book" ]]; do
+  [[ -n "$book" ]] || continue  # a blank line names no file
+
+  # -F: match the marker literally (as a basic regex only the leading "*" is
+  # literal, so lines lacking the asterisks matched too). -m 1: stop at the
+  # first marker so the title is always a single line.
+  title=$(
+    grep -F -m 1 -- '*** START OF THE PROJECT GUTENBERG' "${p%/}/${book}" |
+      sed -e 's/^\*\*\* START OF THE PROJECT GUTENBERG EBOOK //' \
+        -e 's/\*\*\*//' \
+        -e 's/^[[:space:]]*//' \
+        -e 's/[[:space:]]*$//'
+  )
+
+  printf '%s,%s\n' "$book" "$title"
+done