WatsonTang98
/

baseline_null

Model card Files Files and versions Community

baseline_null / script.py

WatsonTang98

Upload script.py

f4f33f0 verified 8 months ago

raw

history blame

13.1 kB

	### This is an example of the script that will be run in the test environment.
	### Some parts of the code are compulsory and you should NOT CHANGE THEM.
	### They are between '''---compulsory---''' comments.
	### You can change the rest of the code to define and test your solution.
	### However, you should not change the signature of the provided function.
	### The script saves a "submission.parquet" file in the current directory.
	### The actual logic of the solution is implemented in the `handcrafted_solution.py` file.
	### The `handcrafted_solution.py` file is a placeholder for your solution.
	### You should implement the logic of your solution in that file.
	### You can use any additional files and subdirectories to organize your code.

	'''---compulsory---'''
	# import subprocess
	# from pathlib import Path
	# def install_package_from_local_file(package_name, folder='packages'):
	# """
	# Installs a package from a local .whl file or a directory containing .whl files using pip.

	# Parameters:
	# path_to_file_or_directory (str): The path to the .whl file or the directory containing .whl files.
	# """
	# try:
	# pth = str(Path(folder) / package_name)
	# subprocess.check_call([subprocess.sys.executable, "-m", "pip", "install",
	# "--no-index", # Do not use package index
	# "--find-links", pth, # Look for packages in the specified directory or at the file
	# package_name]) # Specify the package to install
	# print(f"Package installed successfully from {pth}")
	# except subprocess.CalledProcessError as e:
	# print(f"Failed to install package from {pth}. Error: {e}")

	# install_package_from_local_file('hoho')

	import hoho; hoho.setup() # YOU MUST CALL hoho.setup() BEFORE ANYTHING ELSE
	# import subprocess
	# import importlib
	# from pathlib import Path
	# import subprocess


	# ### The function below is useful for installing additional python wheels.
	# def install_package_from_local_file(package_name, folder='packages'):
	# """
	# Installs a package from a local .whl file or a directory containing .whl files using pip.

	# Parameters:
	# path_to_file_or_directory (str): The path to the .whl file or the directory containing .whl files.
	# """
	# try:
	# pth = str(Path(folder) / package_name)
	# subprocess.check_call([subprocess.sys.executable, "-m", "pip", "install",
	# "--no-index", # Do not use package index
	# "--find-links", pth, # Look for packages in the specified directory or at the file
	# package_name]) # Specify the package to install
	# print(f"Package installed successfully from {pth}")
	# except subprocess.CalledProcessError as e:
	# print(f"Failed to install package from {pth}. Error: {e}")


	# pip download webdataset -d packages/webdataset --platform manylinux1_x86_64 --python-version 38 --only-binary=:all:
	# install_package_from_local_file('webdataset')
	# install_package_from_local_file('tqdm')

	### Here you can import any library or module you want.
	### The code below is used to read and parse the input dataset.
	### Please, do not modify it.

	import webdataset as wds
	from tqdm import tqdm
	from typing import Dict
	import pandas as pd
	from transformers import AutoTokenizer
	import os
	import time
	import io
	from PIL import Image as PImage
	import numpy as np

	from hoho.read_write_colmap import read_cameras_binary, read_images_binary, read_points3D_binary
	from hoho import proc, Sample

	def convert_entry_to_human_readable(entry):
	# Decode one raw dataset entry (a mapping of field name -> value) into a new dict.
	# Fields that are not handled by any branch below are left out of the result.
	out = {}
	# Fields copied into the result unchanged.
	already_good = ['__key__', 'wf_vertices', 'wf_edges', 'edge_semantics', 'mesh_vertices', 'mesh_faces', 'face_semantics', 'K', 'R', 't']
	for k, v in entry.items():
	if k in already_good:
	out[k] = v
	continue
	# The next three fields hold bytes that are wrapped in a BytesIO and parsed
	# by the matching hoho.read_write_colmap reader.
	if k == 'points3d':
	out[k] = read_points3D_binary(fid=io.BytesIO(v))
	if k == 'cameras':
	out[k] = read_cameras_binary(fid=io.BytesIO(v))
	if k == 'images':
	out[k] = read_images_binary(fid=io.BytesIO(v))
	# Each element is opened as a PIL image and converted to RGB.
	if k in ['ade20k', 'gestalt']:
	out[k] = [PImage.open(io.BytesIO(x)).convert('RGB') for x in v]
	# Depth images are opened as PIL images without any mode conversion.
	if k == 'depthcm':
	out[k] = [PImage.open(io.BytesIO(x)) for x in entry['depthcm']]
	return out

	'''---end of compulsory---'''

	### The part below is used to define and test your solution.
	import subprocess
	import sys
	import os

	import numpy as np
	# Set MKL-related environment variables for this process and any child processes.
	# These assignments run after numpy has already been imported above.
	# NOTE(review): presumably a workaround for an MKL threading-layer conflict — confirm.
	os.environ['MKL_THREADING_LAYER'] = 'GNU'
	os.environ['MKL_SERVICE_FORCE_INTEL'] = '1'

	def uninstall_package(package_name):
	    """
	    Remove a package by running ``pip uninstall -y`` under the current interpreter.

	    A failing pip invocation is reported on stdout instead of being raised.

	    Parameters:
	    package_name (str): The name of the package to remove.
	    """
	    pip_command = [sys.executable, "-m", "pip", "uninstall", "-y", package_name]
	    try:
	        subprocess.check_call(pip_command)
	    except subprocess.CalledProcessError as err:
	        print(f"Failed to uninstall package {package_name}. Error: {err}")
	    else:
	        print(f"Package {package_name} uninstalled successfully")

	# def download_packages(packages, folder='packages/torch'):
	# """
	# Downloads packages as .whl files into the specified folder using pip.

	# Parameters:
	# packages (list): List of packages to download with versions.
	# folder (str): The folder where the .whl files will be saved.
	# """
	# Path(folder).mkdir(parents=True, exist_ok=True)
	# try:
	# subprocess.check_call([sys.executable, "-m", "pip", "download",
	# "--platform", "manylinux1_x86_64",
	# "--python-version", "38",
	# "--only-binary=:all:",
	# "-d", folder] + packages)
	# print(f"Packages downloaded successfully into {folder}")
	# except subprocess.CalledProcessError as e:
	# print(f"Failed to download packages. Error: {e}")

	def download_packages(packages, folder):
	    """
	    Download packages into a folder using ``pip download``.

	    pip is additionally pointed at https://download.pytorch.org/whl/cu121 as a
	    ``--find-links`` location. A failing pip invocation is reported on stdout
	    instead of being raised.

	    Parameters:
	    packages (list): Requirement specifiers to download, e.g. ['torch==2.1.0'].
	    folder (str): Destination directory; created if it does not exist.
	    """
	    # exist_ok=True replaces the separate existence check, which could race
	    # with another process creating the same directory.
	    os.makedirs(folder, exist_ok=True)

	    # Run pip through the current interpreter, like the other helpers in this
	    # file: it targets the right environment and cannot fail with an uncaught
	    # FileNotFoundError when no "pip" executable is on PATH.
	    pip_command = [
	        sys.executable, '-m', 'pip', 'download',
	        '--dest', folder,
	        '-f', 'https://download.pytorch.org/whl/cu121',
	    ] + list(packages)

	    try:
	        subprocess.check_call(pip_command)
	    except subprocess.CalledProcessError as e:
	        print(f"Failed to download packages. Error: {e}")
	    else:
	        print(f"Packages downloaded successfully to {folder}")

	# Set CUDA environment variables at import time, pointing at /usr/local/cuda-12.1.
	# PATH is read with direct indexing, so this raises KeyError if PATH is unset;
	# LD_LIBRARY_PATH falls back to an empty string when unset.
	# Note that setup_environment() later re-points CUDA_HOME to /usr/local/cuda and
	# prepends that toolkit's directories in front of the ones added here.
	os.environ['CUDA_HOME'] = '/usr/local/cuda-12.1'
	os.environ['PATH'] = os.environ['CUDA_HOME'] + '/bin:' + os.environ['PATH']
	os.environ['LD_LIBRARY_PATH'] = os.environ['CUDA_HOME'] + '/lib64:' + os.environ.get('LD_LIBRARY_PATH', '')

	def install_package_from_local_file(package_name, folder='packages'):
	    """
	    Install a package with pip from local files only (``--no-index``).

	    pip searches ``<folder>/<package_name>`` (passed as ``--find-links``) for a
	    distribution of ``package_name``. A failing pip invocation is reported on
	    stdout instead of being raised.

	    Parameters:
	    package_name (str): The name of the package to install.
	    folder (str): The folder that holds the per-package directories of .whl files.
	    """
	    pth = str(Path(folder) / package_name)
	    pip_command = [
	        sys.executable, "-m", "pip", "install",
	        "--no-index",          # never consult a package index
	        "--find-links", pth,   # look for distributions here instead
	        package_name,
	    ]
	    try:
	        subprocess.check_call(pip_command)
	    except subprocess.CalledProcessError as err:
	        print(f"Failed to install package from {pth}. Error: {err}")
	    else:
	        print(f"Package installed successfully from {pth}")

	def install_which():
	    """
	    Install the ``which`` utility through ``sudo apt-get install -y``.

	    On a failing apt-get invocation the error is printed and the process
	    exits with status 1.
	    """
	    apt_command = ['sudo', 'apt-get', 'install', '-y', 'which']
	    try:
	        subprocess.check_call(apt_command)
	    except subprocess.CalledProcessError as err:
	        print(f"An error occurred while installing which: {err}")
	        sys.exit(1)
	    else:
	        print("Which installed successfully.")

	def _prepend_env_path(variable, entry):
	    """Put *entry* at the front of the path-list environment variable *variable*."""
	    existing = os.environ.get(variable, '')
	    # Only add a separator when there is something to separate from: a dangling
	    # separator creates an empty entry, which path lookups treat as the current
	    # directory.
	    os.environ[variable] = f"{entry}{os.pathsep}{existing}" if existing else entry


	def setup_environment():
	    """
	    Point the process environment at /usr/local/cuda and build ``pc_util``.

	    Steps:
	    1. Set CUDA_HOME, prepend the toolkit's ``bin`` to PATH and ``lib64`` to
	       LD_LIBRARY_PATH, and set LIBRARY_PATH to ``lib64``.
	    2. Verify that ``cuda.h`` exists under ``$CUDA_HOME/include``.
	    3. If a ``pc_util`` directory exists in the current working directory, run
	       ``setup.py install`` inside it with the current interpreter.

	    Raises:
	    EnvironmentError: If ``cuda.h`` is not found in the CUDA include directory.
	    subprocess.CalledProcessError: If the ``pc_util`` build fails.
	    """
	    # NOTE: the wheel download/installation steps (torch, scikit-learn, open3d,
	    # easydict, ninja, ...) were commented out in the original script and are
	    # not performed here.

	    cuda_home = '/usr/local/cuda'
	    cuda_lib_dir = cuda_home + '/lib64'
	    os.environ['CUDA_HOME'] = cuda_home
	    # PATH may legitimately be unset; the helper tolerates that instead of
	    # raising KeyError.
	    _prepend_env_path('PATH', cuda_home + '/bin')
	    _prepend_env_path('LD_LIBRARY_PATH', cuda_lib_dir)
	    os.environ['LIBRARY_PATH'] = cuda_lib_dir

	    # Verify CUDA headers are accessible before attempting to compile anything.
	    cuda_include_path = os.path.join(cuda_home, 'include')
	    if not os.path.exists(os.path.join(cuda_include_path, 'cuda.h')):
	        raise EnvironmentError(f"CUDA headers not found in {cuda_include_path}. Please check your CUDA installation.")

	    pc_util_path = os.path.join(os.getcwd(), 'pc_util')
	    if os.path.isdir(pc_util_path):
	        # cwd= runs the build inside pc_util without changing this process's own
	        # working directory, so a failed build cannot leave us stranded there.
	        subprocess.check_call([sys.executable, "setup.py", "install"], cwd=pc_util_path)

	def setup_cuda_environment():
	    """
	    Expose the CUDA toolkit under /usr/local/cuda through the process environment.

	    ``/usr/local/cuda/bin`` is prepended to PATH and ``/usr/local/cuda/lib64``
	    to LD_LIBRARY_PATH; LIBRARY_PATH is set to ``/usr/local/cuda/lib64``.
	    Existing PATH / LD_LIBRARY_PATH entries are kept: replacing PATH outright
	    would drop every system directory from the executable search path.
	    """
	    cuda_bin = '/usr/local/cuda/bin'
	    cuda_lib = '/usr/local/cuda/lib64'

	    for variable, entry in (('PATH', cuda_bin), ('LD_LIBRARY_PATH', cuda_lib)):
	        existing = os.environ.get(variable, '')
	        # No separator when the variable is unset/empty, to avoid an empty
	        # (current-directory) entry in the search path.
	        os.environ[variable] = f"{entry}{os.pathsep}{existing}" if existing else entry

	    os.environ['LIBRARY_PATH'] = cuda_lib

	# usr_local_contents = os.listdir('/usr/local')
	# # print("Items under /usr/local:")
	# for item in usr_local_contents:
	# print(item)

	from pathlib import Path
	def save_submission(submission, path):
	    """
	    Write the submission to a parquet file and report the location on stdout.

	    Only the "__key__", "wf_vertices" and "wf_edges" columns are kept.

	    Parameters:
	    submission (List[Dict[]]): The submission records to save.
	    path (str): The path of the parquet file to write.
	    """
	    kept_columns = ["__key__", "wf_vertices", "wf_edges"]
	    pd.DataFrame(submission, columns=kept_columns).to_parquet(path)
	    print(f"Submission saved to {path}")

	if __name__ == "__main__":
	    from concurrent.futures import ProcessPoolExecutor

	    # setup_cuda_environment()
	    setup_environment()

	    # Imported only after setup_environment(), preserving the original order
	    # (presumably the solution needs the prepared environment — confirm).
	    from handcrafted_solution import predict

	    print ("------------ Loading dataset------------ ")
	    params = hoho.get_params()
	    dataset = hoho.get_dataset(decode=None, split='all', dataset_type='webdataset')

	    print('------------ Now you can do your solution ---------------')
	    solution = []
	    with ProcessPoolExecutor(max_workers=1) as pool:
	        # Queue one prediction task per sample on the single worker process.
	        pending = [
	            pool.submit(predict, sample, visualize=False)
	            for sample in tqdm(dataset)
	        ]

	        # Collect the predictions in submission order.
	        for done_count, future in enumerate(tqdm(pending)):
	            key, pred_vertices, pred_edges = future.result()
	            record = {
	                '__key__': key,
	                'wf_vertices': pred_vertices.tolist(),
	                'wf_edges': pred_edges,
	            }
	            solution.append(record)
	            if done_count % 100 == 0:
	                # Progress report only; the incremental save below is disabled.
	                print(f"Processed {done_count} samples")
	                # save_submission(solution, Path(params['output_path']) / "submission.parquet")

	    print('------------ Saving results ---------------')
	    save_submission(solution, Path(params['output_path']) / "submission.parquet")
	    print("------------ Done ------------ ")