You signed in with another tab or window. Reload to refresh your session. You signed out in another tab or window. Reload to refresh your session. You switched accounts on another tab or window. Reload to refresh your session. Dismiss alert
# Host: run likes_extract.js in a node container and save each entry's
# fullText (as printed by jq) to full_text.txt.
# No -t here: stdout feeds a pipe, and a pseudo-TTY would merge the
# container's stderr into that stream and rewrite line endings.
# The :? expansion aborts the command if TWITTER_DATA is unset or empty
# instead of silently mounting the host's /data.
docker run --rm -i \
  -v "${TWITTER_DATA:?TWITTER_DATA must be set}/data:/opt/local" \
  -v "$(pwd):/opt/bin" \
  node node /opt/bin/likes_extract.js \
  | jq '.[].fullText' >full_text.txt

# Host: open an interactive shell in a python container with the current
# directory mounted at /opt/local.
docker run --rm -it -v "$(pwd):/opt/local" python bash

# Inside that container's shell: install the dependency, then feed the
# saved text to url_extract.py on stdin and page through the result.
pip install urlextract
cd /opt/local
./url_extract.py <full_text.txt | more
url_extract.py
#!/usr/local/bin/python
"""Print every input line together with the list of URLs found in it.

Input is read through ``fileinput``: from the files named on the command
line or, when none are given, from standard input.
"""
from urlextract import URLExtract
import fileinput

# One extractor is built up front and reused for every line.
extractor = URLExtract()

for line in fileinput.input():
    urls = extractor.find_urls(line)
    # ``line`` still carries its trailing newline, so the URL list is
    # printed on the following output line.
    print(line, urls)