Browse Source

Add support for facebook.com/pg/something

master
JustAnotherArchivist 4 years ago
parent
commit
c3b0e5543e
2 changed files with 2 additions and 2 deletions
  1. +1
    -1
      social-media-normalise
  2. +1
    -1
      website-extract-social-media

+ 1
- 1
social-media-normalise View File

@@ -11,7 +11,7 @@ do
prefix=""
fi

-if [[ "${url}" =~ ^https?://((www|m|[a-z][a-z]-[a-z][a-z]).)?facebook.com/([^/]+/?(\?|$)|pages/[^/]+/[0-9]+/?(\?|$)|profile\.php\?id=[0-9]+(&|$)) ]]
+if [[ "${url}" =~ ^https?://((www|m|[a-z][a-z]-[a-z][a-z]).)?facebook.com/([^/]+/?(\?|$)|pages/[^/]+/[0-9]+/?(\?|$)|pg/[^/]+([/?]|$)|profile\.php\?id=[0-9]+(&|$)) ]]
then
if [[ "${url}" == *profile.php* ]]
then


+ 1
- 1
website-extract-social-media View File

@@ -7,7 +7,7 @@ function fetch_n_extract {
tee \
>(
# Facebook
-grep -Poi 'facebook\.com/(pages/[^/ <"'"'"']+/|groups/)?[^/ <"'"'"']+' | \
+grep -Poi 'facebook\.com/(pages/[^/ <"'"'"']+/|groups/|pg/)?[^/ <"'"'"']+' | \
sed 's,^,https://www.,' | \
grep -vi -e '^https://www\.facebook\.com/2008$' -e '^https://www\.facebook\.com/tr\?' -e '^https://www\.facebook\.com/plugins$' | \
grep -Pvi '^https://www\.facebook\.com/sharer(\.php\?|\?|$)'


Loading…
Cancel
Save