From d1e98fac1768dfa638e1f5bac4806a622944deb4 Mon Sep 17 00:00:00 2001 From: prahul11 Date: Mon, 9 Oct 2023 14:35:09 +0530 Subject: [PATCH] print command removed --- .../naukri_gulf_search/spiders/naukri_gulf_search_spider.py | 3 ++- .../naukri_india_search/spiders/naukri_india_search_spider.py | 2 +- 2 files changed, 3 insertions(+), 2 deletions(-) diff --git a/server scraper/naukri_gulf_search/naukri_gulf_search/spiders/naukri_gulf_search_spider.py b/server scraper/naukri_gulf_search/naukri_gulf_search/spiders/naukri_gulf_search_spider.py index f3b9404..8e45045 100644 --- a/server scraper/naukri_gulf_search/naukri_gulf_search/spiders/naukri_gulf_search_spider.py +++ b/server scraper/naukri_gulf_search/naukri_gulf_search/spiders/naukri_gulf_search_spider.py @@ -69,6 +69,7 @@ class NaukriGulfSearchSpiderSpider(scrapy.Spider): def parse(self, response): # status_code = response.status + print(self.crawler.stats.inc_value('urls_crawled')) total_pages = response.meta.get('total_pages') start_page = response.meta.get('start_page') base_url = response.meta.get('base_url') @@ -96,7 +97,7 @@ class NaukriGulfSearchSpiderSpider(scrapy.Spider): except: pass yield parsed_item - print(f"Processed{url} : {start_page}/{total_page_num}/{total_pages}") + # print(f"Processed {url} : {start_page}/{total_page_num}/{total_pages}") total_pages = total_pages-1 start_page = start_page+1 else: diff --git a/server scraper/naukri_india_search/naukri_india_search/spiders/naukri_india_search_spider.py b/server scraper/naukri_india_search/naukri_india_search/spiders/naukri_india_search_spider.py index 5ea3557..8fa6da9 100644 --- a/server scraper/naukri_india_search/naukri_india_search/spiders/naukri_india_search_spider.py +++ b/server scraper/naukri_india_search/naukri_india_search/spiders/naukri_india_search_spider.py @@ -4,7 +4,7 @@ import logging import json import math -input_file_path = "static_data/_industry_urls.csv" +input_file_path = "_industry_urls.csv" headers = { "authority": "www.naukri.com", "accept": "application/json",