import time
import urllib.request
import os
from random import randint
from selenium.webdriver.common.by import By
from selenium.webdriver.support.ui import WebDriverWait
from selenium.webdriver.support import expected_conditions as EC
from commands.driver_instance import create_url_headers, tab_handler
from commands.exec_path import imgList
from commands.universal import contains_works, save_Search, continue_Search
from ai.classifying_ai import img_classifier

def getOrderedZerochanImages(driver, exec_path, user_search, num_pics, num_pages, n_likes, filters, imageControl):
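    """Download images for `user_search` from zerochan.net.

    Collects up to num_pics images per result page across num_pages pages,
    saves them into exec_path.folder_path and returns the list of saved file
    paths. n_likes is the like-count threshold an image must exceed; when
    imageControl is truthy the previously saved search is resumed instead of
    a new one being started.
    """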
    global image_locations, image_names, ai_mode
    image_names = imgList(mode=1)
    image_locations = []

    ai_mode = 1  # run every download through the image classifier
    # filters is rebuilt here so that n_likes always takes effect
    filters = {'likes': n_likes if n_likes else 0}
    searchLimit = {'pagecount': num_pages, 'imagecount': num_pics}
    user_search = user_search.replace(" ", "+").capitalize()
    link = "https://www.zerochan.net/" + user_search

    # Start a fresh search, or resume the previously saved one
    if imageControl:
        continue_Search(driver, link, mode=2)
    else:
        driver.get(link)

    if driver.current_url == "https://www.zerochan.net/":
        print("You tried to continue a search, but there was no previous search to continue from!")
        # Fall back to a default tag so the run can still proceed
        driver.get(driver.current_url + 'angry')

    
    # If the search resolved to a parent tag page, follow its first child tag link
    is_valid_search(driver)
    if not contains_works(driver, '//*[@id="thumbs2"]'):
        print("No works found...")
        return []

    curr_page = driver.current_url
    while len(image_locations) < num_pics * num_pages:
        search_image(driver, exec_path, filters, searchLimit=searchLimit)
        hit_like_limit = bool(image_locations) and image_locations[-1] == -1
        page_stalled = curr_page == driver.current_url and len(image_locations) < num_pics * num_pages
        if hit_like_limit or page_stalled:
            if hit_like_limit:
                # Drop the -1 sentinel appended when an image fell below the like threshold
                image_locations.pop()
            print("Reached end of search results")
            break
        curr_page = driver.current_url
    driver.quit()

    return image_locations

def search_image(driver, exec_path, filters, searchLimit):
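    """Crawl result pages and download the thumbnails that pass the filters.

    Walks up to searchLimit['pagecount'] pages, downloading at most
    searchLimit['imagecount'] images per page into exec_path.folder_path.
    Saved file paths are appended to the module-level image_locations list;
    a -1 sentinel marks the point where the like threshold was reached.
    """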
    filter_link = "https://www.zerochan.net/register"

    # The main image searcher
    for _ in range(searchLimit["pagecount"]):
        temp_img_len = len(image_locations)  # images collected before this page
        save_Search(driver=driver, mode=2)   # record the current search so it can be resumed later
        # Wait up to 11 s for the thumbnail grid to render
        WebDriverWait(driver, timeout=11).until(EC.presence_of_element_located((By.XPATH, "//*[@id='thumbs2']")))
        images = driver.find_elements(By.XPATH, "//*[@id='thumbs2']//li")
        # A trailing -1 sentinel means the like threshold was reached on the previous page
        if image_locations and image_locations[-1] == -1:
            break

        for image in images:
            tempImg = image.find_element(By.XPATH, ".//a").get_attribute("href")
            # Stop once either the overall quota or this page's quota is reached
            if (len(image_locations) >= searchLimit['imagecount'] * searchLimit['pagecount']
                    or len(image_locations) - temp_img_len >= searchLimit['imagecount']):
                break
            try:
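                # The first <a> under <p> usually holds the full-size download URL;
                # fall back to the second link when the extension is not an image type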
                tempDLLink = image.find_elements(By.XPATH, ".//p//a")[0].get_attribute("href")
                if tempDLLink.split(".")[-1] not in ["jpg","png","jpeg"]:
                    tempDLLink = image.find_elements(By.XPATH, ".//p//a")[1].get_attribute("href")
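                # Build a file name from the URL: keep only the extension dot and
                # strip any non-ASCII characters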
                tempDLAttr = tempDLLink.split("/")[-1]
                counts = tempDLAttr.count(".")-1
                tempDLAttr = tempDLAttr.replace(".", " ", counts).encode("ascii", "ignore").decode("ascii")

                # Skip thumbnails that only link to the registration page and files already downloaded
                if tempImg == filter_link or tempDLAttr in image_names:
                    print("\nImage already exists, moving to another image...")
                    continue

                # Sleep for a random 0.0-1.9 s between images to avoid hammering the site
                rand_time = randint(0, 1) + randint(0, 9) / 10
                time.sleep(rand_time)
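                # Download only when the thumbnail's like counter exceeds the configured threshold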
                if int(image.find_element(By.XPATH, './/*[@class="fav"]').get_property("text"))>filters["likes"]:
                    urllib.request.install_opener(create_url_headers(tempImg=tempImg))
                    urllib.request.urlretrieve(
                        tempDLLink, f"./{exec_path.folder_path}/{tempDLAttr}"
                    )
                    image_locations.append(f"./{exec_path.folder_path}/{tempDLAttr}")
                    image_names.append(f"{tempDLAttr}")
                    print(f"\n{tempDLLink}")
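                    # Let the image classifier veto the download; rejected files are deleted again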
                    if ai_mode:
                        if img_classifier(image_locations[-1]):
                            print("AI Mode: I approve this image")
                        else:
                            os.remove(image_locations[-1])
                            image_locations.pop()
                            image_names.pop()
                            print("AI Mode: Skipping this image")

                else:
                    # First image below the like threshold: leave a -1 sentinel and stop (ordered results)
                    image_locations.append(-1)
                    break

            # Stale elements, failed downloads, etc.: close any stray tab and move on
            except Exception:
                if len(driver.window_handles) > 1:
                    print("I ran into an error, closing the tab and moving on...")
                    driver = tab_handler(driver=driver)
                time.sleep(randint(1, 3) + randint(0, 9) / 10)
                continue

            
        # Advance to the next results page; stop when there is none
        if not valid_page(driver):
            break

def valid_page(driver):
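    """Follow the last pagination link, assumed to point to the next results page.

    Returns True when the navigation succeeds and False when no pagination
    link is left, which ends the crawl.
    """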
    try:
        next_page = driver.find_elements(By.XPATH, "//*[@class='pagination']//a")[-1].get_attribute("href")
        driver.get(next_page)
        return True
    except Exception:
        return False
    
def is_valid_search(driver):
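    """If the search resolved to a parent tag page, follow its first child tag link.

    Does nothing when the page has no 'children' section.
    """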
    try:
        child_link = driver.find_element(By.XPATH, "//*[@id='children']//a").get_attribute("href")
        if child_link:
            driver.get(child_link)
    except Exception:
        pass