sbrl/plaintext-convert.sh

## plaintext-convert.sh
#!/bin/bash
set -o errexit
set -o nounset
##############

# This program converts a plain-text list of URLs to the
# bookmark-archiver HTML format.
#
# Requirements: curl, xidel
# Usage:
#     ./plaintext-convert.sh [{filename}]
#
# The filename is optional. If given, that file is read; otherwise
# stdin is used.
#
# Every URL found in the input is fetched once to look up its page
# title. One <dt> entry per URL is written to stdout; progress and
# error messages go to stderr.
#
# Examples:
#     ./plaintext-convert.sh <path/to/file >list.html
#     ./plaintext-convert.sh urls.txt >urls.html
#

##############

# Escape the characters that are special in HTML so that arbitrary
# text can be placed between tags.
#   $1 - raw text
# Prints the escaped text, followed by a newline, to stdout.
html_escape() {
  # sed is used instead of ${var//pat/repl} because the treatment of
  # '&' in a bash replacement string depends on the bash version.
  printf '%s\n' "$1" | sed -e 's/&/\&amp;/g' -e 's/</\&lt;/g' \
    -e 's/>/\&gt;/g' -e 's/"/\&quot;/g'
}

# Download a page and print the text of its <title> element(s).
#   $1 - URL to fetch
# Prints the title on a single line (empty if none was found).
# Always returns 0: a failed download or parse yields an empty title
# so that the caller can fall back to the URL.
fetch_title() {
  local title
  # --location follows redirects so the title comes from the final page.
  # stdin is detached so curl cannot consume the caller's URL stream.
  # The pipeline status is ignored on purpose (best-effort lookup).
  title=$(curl --location -Ss "$1" </dev/null |
    xidel --data - --css "title" --quiet) || true
  # Keep every bookmark entry on one output line.
  title=${title//[$'\t\r\n']/ }
  printf '%s\n' "$title"
}

# Read URLs from the given file (or stdin) and print one bookmark
# entry per URL.
#   $1 - optional path of the input file
# Returns non-zero if a file was named but cannot be read.
main() {
  local input=${1:-/dev/stdin}
  local stamp url title

  if [[ -n "${1:-}" && ! -r "$input" ]]; then
    printf '[error] Cannot read %s\n' "$input" >&2
    return 1
  fi

  # Each entry gets a distinct, increasing add_date starting just
  # after the current time.
  stamp=$(date +%s)

  # A URL ends at whitespace, a double quote, a backslash or an asterisk.
  grep -E --only-matching 'https?://[^[:space:]"\*]*' <"$input" |
    while read -r url; do
      stamp=$((stamp + 1))
      printf '%s\n' "[info] Processing $url" >&2
      title=$(fetch_title "$url")
      if [[ -z "$title" ]]; then
        title=$url
      fi
      # The URL is written verbatim: the pattern above never matches a
      # double quote, so it cannot end the href attribute early. The
      # title is remote, untrusted text and is therefore escaped.
      printf '<dt><a href="%s" add_date="%s">%s</a></dt>\n' \
        "$url" "$stamp" "$(html_escape "$title")"
    done

  printf '%s\n' "[info] Completed" >&2
}

main "$@"
	#!/bin/bash
	set -o errexit
	set -o nounset
	##############

	# This program converts a plain-text list of URLs to the
	# bookmark-archiver HTML format.
	#
	# Requirements: curl, xidel
	# Usage:
	#     ./plaintext-convert.sh [{filename}]
	#
	# The filename is optional. If given, that file is read; otherwise
	# stdin is used.
	#
	# Every URL found in the input is fetched once to look up its page
	# title. One <dt> entry per URL is written to stdout; progress and
	# error messages go to stderr.
	#
	# Examples:
	#     ./plaintext-convert.sh <path/to/file >list.html
	#     ./plaintext-convert.sh urls.txt >urls.html
	#

	##############

	# Escape the characters that are special in HTML so that arbitrary
	# text can be placed between tags.
	#   $1 - raw text
	# Prints the escaped text, followed by a newline, to stdout.
	html_escape() {
	  # sed is used instead of ${var//pat/repl} because the treatment of
	  # '&' in a bash replacement string depends on the bash version.
	  printf '%s\n' "$1" | sed -e 's/&/\&amp;/g' -e 's/</\&lt;/g' \
	    -e 's/>/\&gt;/g' -e 's/"/\&quot;/g'
	}

	# Download a page and print the text of its <title> element(s).
	#   $1 - URL to fetch
	# Prints the title on a single line (empty if none was found).
	# Always returns 0: a failed download or parse yields an empty title
	# so that the caller can fall back to the URL.
	fetch_title() {
	  local title
	  # --location follows redirects so the title comes from the final page.
	  # stdin is detached so curl cannot consume the caller's URL stream.
	  # The pipeline status is ignored on purpose (best-effort lookup).
	  title=$(curl --location -Ss "$1" </dev/null |
	    xidel --data - --css "title" --quiet) || true
	  # Keep every bookmark entry on one output line.
	  title=${title//[$'\t\r\n']/ }
	  printf '%s\n' "$title"
	}

	# Read URLs from the given file (or stdin) and print one bookmark
	# entry per URL.
	#   $1 - optional path of the input file
	# Returns non-zero if a file was named but cannot be read.
	main() {
	  local input=${1:-/dev/stdin}
	  local stamp url title

	  if [[ -n "${1:-}" && ! -r "$input" ]]; then
	    printf '[error] Cannot read %s\n' "$input" >&2
	    return 1
	  fi

	  # Each entry gets a distinct, increasing add_date starting just
	  # after the current time.
	  stamp=$(date +%s)

	  # A URL ends at whitespace, a double quote or a backslash.
	  grep -E --only-matching 'https?://[^[:space:]"\\]*' <"$input" |
	    while read -r url; do
	      stamp=$((stamp + 1))
	      printf '%s\n' "[info] Processing $url" >&2
	      title=$(fetch_title "$url")
	      if [[ -z "$title" ]]; then
	        title=$url
	      fi
	      # The URL is written verbatim: the pattern above never matches a
	      # double quote, so it cannot end the href attribute early. The
	      # title is remote, untrusted text and is therefore escaped.
	      printf '<dt><a href="%s" add_date="%s">%s</a></dt>\n' \
	        "$url" "$stamp" "$(html_escape "$title")"
	    done

	  printf '%s\n' "[info] Completed" >&2
	}

	main "$@"