Spaces:

ravi6389
/

twitter_sentiment

Build error

twitter_sentiment / twitter_crawl.py

Upload folder using huggingface_hub

ebc8f37 verified about 1 year ago

1.45 kB

	import scrapy

	class TwitterSpider(scrapy.Spider):
	    """Spider that prints tweet text found on Twitter search result pages.

	    Crawling starts from the URLs in ``start_urls``. Every response is
	    handled the same way: the text matched by ``.tweet-text`` is printed
	    and, when a ``.next-page`` link is present, that page is requested too.
	    """

	    name = "twitter_spider"
	    start_urls = [
	        "https://twitter.com/search?q=Scrapy",
	    ]

	    def start_requests(self):
	        """Yield one request per entry in ``start_urls``, handled by ``parse``."""
	        for url in self.start_urls:
	            yield scrapy.Request(url, callback=self.parse)

	    def parse(self, response):
	        """Callback for the start URLs.

	        Prints the tweets on ``response`` and yields a request for the next
	        results page when one is linked.
	        """
	        yield from self._print_tweets_and_follow(response)

	    def parse_page(self, response):
	        """Callback for follow-up result pages; processed exactly like ``parse``."""
	        yield from self._print_tweets_and_follow(response)

	    def _print_tweets_and_follow(self, response):
	        """Print tweet text from ``response`` and yield the next-page request.

	        Single implementation shared by ``parse`` and ``parse_page`` so the
	        selectors and pagination logic live in one place.
	        """
	        # NOTE(review): assumes tweets appear under `.tweet-text` in the
	        # downloaded HTML -- confirm against the live page markup.
	        for tweet in response.css('.tweet-text::text').getall():
	            print(tweet)

	        # `.get()` returns None when no next-page link matches, which ends
	        # the pagination chain.
	        next_page = response.css('.next-page::attr(href)').get()
	        if next_page:
	            # The href may be relative, so resolve it against the current URL.
	            yield scrapy.Request(response.urljoin(next_page), callback=self.parse_page)