MCPcopy Index your code
hub / github.com/geekcomputers/Python / tweeter_scrapper

Function tweeter_scrapper

twitter_post_scraper.py:9–35  ·  view source on GitHub ↗
()

Source from the content-addressed store, hash-verified

7
8
def tweeter_scrapper():
    """Scrape a Twitter profile page and print its cleaned tweet texts.

    Reads a Twitter handle from standard input, downloads
    ``https://twitter.com/<handle>``, extracts the text of every
    ``div.tweet`` element, removes whatever ``re_text`` and ``re_text_1``
    match, strips non-breaking-space and zero-width-non-joiner residue,
    and prints the resulting list.

    ``re_text`` and ``re_text_1`` are defined outside this function; they
    are passed to ``re.sub`` as patterns (presumably URL / media-link
    regexes -- confirm against the module-level definitions).

    Returns:
        None. The cleaned tweets are printed as a single list.

    Raises:
        requests.exceptions.RequestException: If the HTTP request fails or
            does not complete within the timeout.
    """
    base_tweeter_url = "https://twitter.com/{}"

    tweeter_id = input()

    # Without a timeout, requests waits forever on a stalled connection.
    response = requests.get(base_tweeter_url.format(tweeter_id), timeout=10)
    soup = BeautifulSoup(response.content, "lxml")

    list_of_dirty_tweets = []
    for tweet in soup.find_all("div", {"class": "tweet"}):
        # find() returns None when the child is absent; skip such tweets
        # instead of letting one malformed element abort the whole scrape.
        content = tweet.find("div", {"class": "content"})
        if content is None:
            continue
        text_container = content.find(
            "div", {"class": "js-tweet-text-container"}
        )
        if text_container is None:
            continue
        message = text_container.text.replace("\n", " ").strip()
        list_of_dirty_tweets.append(message)

    clear_list_of_tweets = []
    for dirty_tweet in list_of_dirty_tweets:
        dirty_tweet = re.sub(re_text, "", dirty_tweet, flags=re.MULTILINE)
        dirty_tweet = re.sub(re_text_1, "", dirty_tweet, flags=re.MULTILINE)
        # Remove the truncation marker (NBSP + ellipsis) before bare NBSPs,
        # otherwise the ellipsis would be left behind.
        dirty_tweet = dirty_tweet.replace("\xa0…", "")
        dirty_tweet = dirty_tweet.replace("\xa0", "")
        dirty_tweet = dirty_tweet.replace("\u200c", "")
        clear_list_of_tweets.append(dirty_tweet)

    print(clear_list_of_tweets)
36
37
38if __name__ == "__main__":

Callers 1

Calls 3

sub · Method · 0.80
get · Method · 0.45
append · Method · 0.45

Tested by

no test coverage detected