Skip to content

Commit

Permalink
integrate with scrapy-redis havanagrawal#2
Browse files Browse the repository at this point in the history
  • Loading branch information
paulbroek committed Jan 5, 2023
1 parent 8d4028a commit e9243cc
Showing 1 changed file with 4 additions and 3 deletions.
7 changes: 4 additions & 3 deletions GoodreadsScraper/settings.py
Original file line number Diff line number Diff line change
Expand Up @@ -23,11 +23,8 @@
# Obey robots.txt rules: the crawler honours each site's robots.txt exclusions.
ROBOTSTXT_OBEY = True

# Host name / address of the Postgres server. The active value is the local
# loopback address; the commented-out lines are alternative hosts and ports
# kept for reference. No POSTGRES_PORT is assigned in this section.
# NOTE(review): the code that reads POSTGRES_HOST is not visible here --
# confirm which port it falls back to when POSTGRES_PORT is unset.
# POSTGRES_HOST = "77.249.149.174"
# POSTGRES_HOST = "postgres-goodreads-master"
POSTGRES_HOST = "127.0.0.1"
# POSTGRES_PORT = 5432
# POSTGRES_PORT = 5439

# scrapy-redis settings
# User-Agent string for outgoing requests. The value names the scrapy-redis
# project rather than this scraper.
# NOTE(review): presumably copied from the scrapy-redis example settings --
# consider a string that identifies this crawler instead.
USER_AGENT = 'scrapy-redis (+https://github.com/rolando/scrapy-redis)'
Expand All @@ -38,6 +35,10 @@
# SCHEDULER_QUEUE_CLASS = "scrapy_redis.queue.SpiderPriorityQueue"
# SCHEDULER_QUEUE_CLASS = "scrapy_redis.queue.SpiderQueue"
# SCHEDULER_QUEUE_CLASS = "scrapy_redis.queue.SpiderStack"
# Extra keyword arguments that scrapy-redis forwards to the redis client
# constructor. Keys must therefore be client argument names ("host", "port"),
# not Scrapy setting names: "REDIS_HOST" / "REDIS_PORT" are only recognised as
# top-level settings and would be rejected by the client as unexpected
# keyword arguments.
# NOTE(review): the server address is hard-coded; consider loading it from the
# environment before deploying.
REDIS_PARAMS = {
    "host": "81.169.252.73",
    "port": 6382,
}

# update postgres when author item is scraped. Caution: very slow if query is
# not optimized
Expand Down

0 comments on commit e9243cc

Please sign in to comment.