diff --git a/naukri/jobdata_india.py b/naukri/jobdata_india.py index 8d24ea2..cba60e0 100644 --- a/naukri/jobdata_india.py +++ b/naukri/jobdata_india.py @@ -16,7 +16,7 @@ error_file = "data_naukri/jobdata_error_india.csv" stats_file = "data_naukri/stats.txt" skip=0 class NaukriJobDetailScraper: - + base_url = "https://www.naukri.com/jobapi/v4/job/{}" headers = { 'authority': 'www.naukri.com', @@ -124,6 +124,8 @@ class NaukriJobDetailScraper: time.sleep(0.5) try: response = requests.get(url, headers=self.headers, timeout=self.timeout, proxies=self.proxies) + if response.status_code == 403: + requests.get(url, headers=self.headers, timeout=self.timeout) print(f"{response.status_code} for {url}") @@ -172,7 +174,7 @@ def main(): duration_hours = (end_time - start_time) / 3600 print(f"Jobdata program took {duration_hours:.2f} hours to run.") with open(stats_file, "a") as stat: - stat.write(f"Jobdata program took {duration_hours:.2f} hours to run.\n") + stat.write(f"Jobdata program took {duration_hours:.2f} hours to run.\n") if __name__ == "__main__":