Skip to content

Commit

Permalink
Temporarily enabled crawling all 6 pages from soaring.de to capture as many ads as possible before they are gone
Browse files Browse the repository at this point in the history
  • Loading branch information
lwitkowski committed Jul 30, 2024
1 parent e231645 commit e2f7c1c
Showing 1 changed file with 9 additions and 1 deletion.
10 changes: 9 additions & 1 deletion backend/spiders/SoaringDeSpider.py
Original file line number Diff line number Diff line change
Expand Up @@ -14,7 +14,15 @@ class SoaringDeSpider(scrapy.Spider):
name = "segelflug_de_kleinanzeigen" # fixme, possibly needs db rows update
logger = logging.getLogger(name)

start_urls = [GLIDER_OFFERS_URL, ENGINE_OFFERS_URL]
# Seed URLs for the crawl. Temporary measure: besides the bare glider-offers
# URL (presumably result page 1 -- confirm), result pages 2-6 are requested
# explicitly via the "iPage" query parameter so that as many ads as possible
# are captured before they are gone. The engine-offers listing is still
# seeded with a single URL.
# NOTE(review): the page count is hard-coded to 6; revert to the single
# glider URL (or add real pagination) once the extra pages are not needed.
start_urls = [
GLIDER_OFFERS_URL,
GLIDER_OFFERS_URL + "&iPage=2",
GLIDER_OFFERS_URL + "&iPage=3",
GLIDER_OFFERS_URL + "&iPage=4",
GLIDER_OFFERS_URL + "&iPage=5",
GLIDER_OFFERS_URL + "&iPage=6",
ENGINE_OFFERS_URL
]

AD_SELECTOR = ".listing-thumb"

Expand Down

0 comments on commit e2f7c1c

Please sign in to comment.