citadel

My dotfiles, scripts and nix configs
git clone git://jb55.com/citadel
Log | Files | Refs | README | LICENSE

commit a55d489ed6174270e95fb7fc5818f0c928057667
parent 2eddfc5d2548487b45c590e4654a3aa19f82db1c
Author: William Casarin <jb55@jb55.com>
Date:   Sat,  6 Feb 2021 10:12:49 -0800

plainweb: pretend to be chrome

Some websites don't like curl

Signed-off-by: William Casarin <jb55@jb55.com>

Diffstat:
Mbin/plainweb | 4+++-
1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/bin/plainweb b/bin/plainweb @@ -1,5 +1,7 @@ #!/usr/bin/env bash +USER_AGENT="User-Agent: Mozilla/5.0 (Macintosh; Intel Mac OS X 10_10_3) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/44.0.2403.89 Safari/537.36" + if [ -z "$1" ]; then printf "usage: plainweb <url>\n" exit 1 @@ -9,7 +11,7 @@ HURL="/tmp/$(sha256sum <<<"$1" | awk '{print $1}').txt" OUT=${2:-$HURL} if [ ! -f "$HURL" ]; then - curl -sL "$1" | pandoc -f html -t plain - -o "$HURL" + curl -H "$USER_AGENT" -sL "$1" | sed 's,googletagmanager.com,google.com,g' | pandoc -f html -t plain - -o "$HURL" fi exec lessr "$HURL"