-
Notifications
You must be signed in to change notification settings - Fork 21
/
Copy pathget_posts.py
35 lines (24 loc) · 1.24 KB
/
get_posts.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
from fb_scrapper import scrape_groups_pages
# To use our application you can use scrape_groups_pages or use one of our predefined functions
# Declare your group or page id here
#group_id = "canoeandkayak"
# Choose which scraping function you want to call
# This function is currently not properly working and will scrape all comments
def scrape_posts_last_es(group_id):
scrape_groups_pages(group_id, 0, False, True)
#def scrape_comments_from_last_scrape(group_id):
#scrape_groups_pages(group_id, 1, True, False)
# Scrape since the last time stamp for the id in the shelve file
def scrape_posts_from_last_scrape(group_id):
scrape_groups_pages(group_id, 1, False, False)
# You must have Kafka running on localhost:9092 or change the port in fb_posts_realtime.py
# Also be advised this may be buggy (we are still in the process of writing tests for it).
def scrape_posts_from_last_scrape_kafka(group_id):
scrape_groups_pages(group_id, 1, True, False)
def scrape_all_posts(group_id):
scrape_groups_pages(group_id, 0, False, False)
#def scrape_all_comments(group_id):
#scrape_groups_pages(group_id, 0, True, False)
#scrape_all_posts("paddlesoft")
#scrape_all_comments("paddlesoft")
#scrape_comments_from_last_scrape("176485839144245")