Browse Source

update scrape script to accept args

fix-broken-scrape
Jørgen Lien Sellæg 6 years ago
parent
commit
ef763d6768
  1. 61
      scrape.sh

61
scrape.sh

@ -1,7 +1,5 @@
#!/bin/bash #!/bin/bash
readonly ARGS="$@"
function usage { function usage {
cat <<- EOF cat <<- EOF
./scrape.sh [options] ./scrape.sh [options]
@ -13,24 +11,42 @@ function usage {
OPTIONS: OPTIONS:
-e --event Facebook event id. Scrape a single Facebook -e --event Facebook event id. Scrape a single Facebook
event. event.
-h --help -? print usage
--events List of Facebook event ids. See examples for
format.
-p --page Facebook page id. Scrape all events of a -p --page Facebook page id. Scrape all events of a
specific facebook page. specific facebook page.
-a --pages Array of Facebook page ids. This is a space --pages List of Facebook page ids. See examples for
seperated list of page ids. format.
-h --help -? print usage NOTE:
Events and pages needs to be public. Private events or pages are not yet
supported.
EXAMPLES: EXAMPLES:
Scrape events of a facebook page with id 133713371337 EOF
./scrape.sh --page 133713371337 }
./scrape.sh -p 133713371337
Scrape a facebook event with id 420420420420 event_ids="";
./scrape.sh --event 420420420420 pages_ids="";
./scrape.sh -e 420420420420
Scrape a facebook event with id 123 and all events from page 1323 function scrape_event {
./scrape.sh --event 123 --page 1323 local event_id;
EOF event_id="$1"
if [ "" == "${event_ids}" ]; then
event_ids="${event_id}"
else
event_ids="${event_ids},${event_id}"
fi
}
function scrape_page {
local page_id;
page_id="$1"
if [ "" == "${pages_ids}" ]; then
pages_ids="${page_id}"
else
pages_ids="${pages_ids},${page_id}"
fi
} }
function parse_args { function parse_args {
@ -41,14 +57,13 @@ function parse_args {
while [[ $# -gt 0 ]]; do while [[ $# -gt 0 ]]; do
key="$1" key="$1"
case $key in case $key in
-e|--event) -e|--event|--events)
shift shift
local event_id; scrape_event "$1"
event_id=$1
;; ;;
-p|--page) -p|--page|--pages)
;; shift
-a|--pages) scrape_page "$1"
;; ;;
*) *)
usage usage
@ -88,6 +103,10 @@ function check_dependencies {
return 0; return 0;
} }
#######################################
# Hand the collected ids over to the Node scraper.
# Globals:
#   event_ids (read) - comma separated event ids built by scrape_event
#   pages_ids (read) - comma separated page ids built by scrape_page
# Arguments:
#   None
# Returns:
#   Does not return on success: exec replaces this shell with node.
#######################################
function scrape {
  # The accumulator filled by scrape_page is named pages_ids (plural
  # "pages"); expanding page_ids here always produced an empty value, so
  # requested pages were silently dropped. The flag name passed to
  # scrape.js is kept as --page_ids.
  exec node scrape.js --event_ids="${event_ids}" --page_ids="${pages_ids}"
}
check_dependencies \ check_dependencies \
&& parse_args "${ARGS}" \ && parse_args "$@" \
&& scrape && scrape

Loading…
Cancel
Save