Browse Source

Automatically fix capitalisation of Facebook and Twitter usernames

master
JustAnotherArchivist 5 years ago
parent
commit
0168d50f62
3 changed files with 23 additions and 4 deletions
  1. +0
    -2
      facebook-user-capitalisation
  2. +13
    -1
      snscrape-facebook-user
  3. +10
    -1
      snscrape-twitter-user

+ 0
- 2
facebook-user-capitalisation View File

@@ -1,2 +0,0 @@
#!/bin/bash
# Fetch the profile page for the username given as $1 and print the path
# component that follows https://www.facebook.com/ in its og:url meta tag.
# Prints nothing (and grep returns non-zero) when no such tag is found.
page_url="https://www.facebook.com/${1}/"
curl -s "${page_url}" \
  | grep -Po '<meta property="og:url" content="https://www\.facebook\.com/\K[^"/]+'

+ 13
- 1
snscrape-facebook-user View File

@@ -1,2 +1,14 @@
#!/bin/bash
# Scrape the Facebook user given as $1 into the file "facebook-@<user>".
# The profile URL is written first, followed by the cleaned snscrape output.
user="$1"
{
  echo "https://www.facebook.com/${user}/"
  # perl: drop the __xts__[0], __tn__ and eid query parameters, then any
  #       dangling "?" or "&" left at the end of the line.
  # awk:  for lines containing "?type=", also emit the part before it.
  # awk:  keep only the first occurrence of each line.
  snscrape -v facebook-user "${user}" \
    | perl -pe 's,[?&]\K__xts__%5B0%5D=[^&]+?(&|$),,; s,[?&]\K__tn__=[^&]+?(&|$),,; s,[?&]\Keid=[^&]+?(&|$),,; s,[?&]$,,;' \
    | awk '{print} /\?type=/ {print substr($0, 1, index($0, "?type=") - 1)}' \
    | awk '!seen[$0]++'
} > "facebook-@${user}"
# Scrape a Facebook user's posts into "facebook-@<user>", using the username
# spelling found in snscrape's own output instead of the one typed by the caller.
#
# Arguments: $1 - Facebook username (any capitalisation)
# Outputs:   file "facebook-@<user>" in the current directory;
#            notices and errors go to stderr
# Exit code: 0 on success, 1 if the username could not be resolved,
#            2 if no username was given
origUser="$1"
if [[ -z "${origUser}" ]]; then
  echo "Usage: ${0##*/} USERNAME" >&2
  exit 2
fi

# Take the first path component of the first result URL as the username.
# head -n 1 guards against a multi-line result ending up in the file name.
user="$(snscrape --max-results 1 facebook-user "${origUser}" | grep -Po '^https?://www\.facebook\.com/\K[^/]+' | head -n 1)"
if [[ -z "${user}" ]]; then
  # Report the failure instead of ending silently with status 0.
  echo "Could not determine the username for ${origUser}; nothing scraped" >&2
  exit 1
fi

if [[ "${user}" != "${origUser}" ]]; then
  echo "Username fix: ${origUser} -> ${user}" >&2
fi

{
  echo "https://www.facebook.com/${user}/"
  # perl: drop the __xts__[0], __tn__ and eid query parameters, then any
  #       dangling "?" or "&" left at the end of the line.
  # awk:  for lines containing "?type=", also emit the part before it.
  # awk:  keep only the first occurrence of each line.
  snscrape -v facebook-user "${user}" \
    | perl -pe 's,[?&]\K__xts__%5B0%5D=[^&]+?(&|$),,; s,[?&]\K__tn__=[^&]+?(&|$),,; s,[?&]\Keid=[^&]+?(&|$),,; s,[?&]$,,;' \
    | awk '{print} /\?type=/ {print substr($0, 1, index($0, "?type=") - 1)}' \
    | awk '!seen[$0]++'
} > "facebook-@${user}"

+ 10
- 1
snscrape-twitter-user View File

@@ -1,2 +1,11 @@
#!/bin/bash
# Scrape the Twitter user given as $1 into the file "twitter-@<user>".
# The profile URL is written first, followed by the snscrape output.
user="$1"
{
  echo "https://twitter.com/${user}"
  snscrape -v twitter-user "${user}"
} > "twitter-@${user}"
# Scrape a Twitter user's tweets into "twitter-@<user>", using the username
# spelling found in snscrape's own output instead of the one typed by the caller.
#
# Arguments: $1 - Twitter username (any capitalisation)
# Outputs:   file "twitter-@<user>" in the current directory;
#            notices and errors go to stderr
# Exit code: 0 on success, 1 if the username could not be resolved,
#            2 if no username was given
origUser="$1"
if [[ -z "${origUser}" ]]; then
  echo "Usage: ${0##*/} USERNAME" >&2
  exit 2
fi

# Take the first path component of the first result URL as the username.
# head -n 1 guards against a multi-line result ending up in the file name.
user="$(snscrape --max-results 1 twitter-user "${origUser}" | grep -Po '^https?://twitter\.com/\K[^/]+' | head -n 1)"
if [[ -z "${user}" ]]; then
  # Report the failure instead of ending silently with status 0.
  echo "Could not determine the username for ${origUser}; nothing scraped" >&2
  exit 1
fi

if [[ "${user}" != "${origUser}" ]]; then
  echo "Username fix: ${origUser} -> ${user}" >&2
fi

{
  echo "https://twitter.com/${user}"
  snscrape -v twitter-user "${user}"
} > "twitter-@${user}"

Loading…
Cancel
Save