Browse Source

Ignore /intent on Twitter

master
JustAnotherArchivist 4 years ago
parent
commit
c56736bc4a
1 changed file with 1 addition and 1 deletion
  1. +1
    -1
      website-extract-social-media

+ 1
- 1
website-extract-social-media View File

@@ -32,7 +32,7 @@ function fetch_n_extract {
# Twitter
grep -Poi 'twitter\.com/(hashtag/)?[^/ <"'"'"']+' | \
sed 's,^,https://,' | \
grep -vi -e '^https://twitter\.com/home\?' -e '^https://twitter\.com/widgets\.js$' -e '^https://twitter\.com/share\?' | \
grep -vi -e '^https://twitter\.com/home\?' -e '^https://twitter\.com/widgets\.js$' -e '^https://twitter\.com/share\?' -e '^https://twitter\.com/intent$' | \
sed 's,\([?&]\)ref_src=[^&]\+&\?,\1,; s,?$,,'
) \
>(


Loading…
Cancel
Save