From daa1a95792692ed70701f9a7c7233e22fa694719 Mon Sep 17 00:00:00 2001 From: JustAnotherArchivist Date: Tue, 18 Feb 2020 16:53:41 +0000 Subject: [PATCH] Proper URL decoding --- social-media-extract-profile-link | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/social-media-extract-profile-link b/social-media-extract-profile-link index 0896f44..f8b14b7 100755 --- a/social-media-extract-profile-link +++ b/social-media-extract-profile-link @@ -25,7 +25,7 @@ function fetch_n_extract { elif grep -qF 'id="pagelet_loggedout_sign_up"' <<< "${page}" then # Profile overview only - grep -Po ']*\s)?id\s*=\s*"header-links".*?' | grep -Po 'href="/redirect\?([^"]*&(amp;)?)?q=\K[^&"]+' | sed 's,%3A,:,g; s,%2F,/,g; s,%25,%,g' + fetch "${u}" | tr -d '\n' | grep -Po ']*\s)?id\s*=\s*"header-links".*?' | grep -Po 'href="/redirect\?([^"]*&(amp;)?)?q=\K[^&"]+' | python3 -c 'import sys, urllib.parse; sys.stdout.write(urllib.parse.unquote(sys.stdin.read()))' fi }