Update wuzzuf_scraper.py

wuzzuf_scraper.py (CHANGED, +17 -3)
@@ -29,9 +29,23 @@ def Wuzzuf_scrapping(job_type , job_num):
 
     for i in range(int(pages_num) ):
         link_new = link1 +'&start='+str(i)
-
-
-
+        try:
+            data = requests.get(link_new)
+            data.raise_for_status()  # Check for HTTP errors
+            soup = BeautifulSoup(data.content, 'html.parser')
+            Title = soup.find_all('h2', {'class': 'css-m604qf'})
+
+            for x in range(len(Title)):
+                title.append(Title[x].find('a').text.strip())
+                loc = soup.find_all('span', {'class': 'css-5wys0k'})[x].text.split(',')
+                location.append(loc[0].strip())
+                country.append(loc[-1].strip())
+                links.append('https://wuzzuf.net' + Title[x].find('a').attrs['href'])
+
+        except requests.exceptions.RequestException as e:
+            # print(f"Request failed: {e}")
+            continue  # Skip to the next page if there's an error
+
 
     # to get the info about jobs
 
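For context, the pattern this commit introduces (requests.get() followed by raise_for_status() inside a try/except on requests.exceptions.RequestException, with continue on failure) can be sketched on its own. The snippet below is a minimal, hypothetical illustration rather than part of the commit: fetch_page, the timeout argument, and the example query URL are assumptions made for the sketch; the CSS class name is copied from the diff and may change if Wuzzuf updates its markup.

import requests
from bs4 import BeautifulSoup

def fetch_page(url):
    """Fetch one results page and parse it, or return None on any request failure.

    raise_for_status() turns HTTP 4xx/5xx responses into exceptions, and
    RequestException also covers timeouts and connection errors, so one
    bad page is skipped instead of aborting the whole scrape.
    """
    try:
        data = requests.get(url, timeout=10)  # timeout is an extra safeguard, not in the commit
        data.raise_for_status()
        return BeautifulSoup(data.content, 'html.parser')
    except requests.exceptions.RequestException:
        return None

# Hypothetical usage over a few paginated result URLs:
base = 'https://wuzzuf.net/search/jobs/?q=python'  # illustrative query, not from the commit
for i in range(3):
    soup = fetch_page(base + '&start=' + str(i))
    if soup is None:
        continue  # same effect as the commit's `continue` on a failed page
    print(len(soup.find_all('h2', {'class': 'css-m604qf'})), 'job cards on page', i)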