# FaceLift — configs/gslrm.yaml
# Provenance: wlyu-adobe, "Initial commit" (bd9eb72)
---
# =============================================================================
# General Configuration
# =============================================================================
profile: false  # enable performance profiling instrumentation
debug: false    # enable debug mode (verbose diagnostics)
# =============================================================================
# Model Configuration
# =============================================================================
# NOTE(review): original indentation was lost; nesting below is reconstructed
# from the section comments. Confirm `upsampler` and the behavior flags sit
# directly under `model` (not under `gaussians`) against the loading code.
model:
  class_name: gslrm.model.gslrm.GSLRM
  # Image processing settings
  image_tokenizer:
    image_size: 512
    patch_size: 8
    in_channels: 9  # 3 RGB + 3 direction + 3 Reference
  # Transformer architecture
  transformer:
    d: 1024
    d_head: 64
    n_layer: 24
  # Gaussian splatting configuration
  gaussians:
    n_gaussians: 2  # 12288
    sh_degree: 0
  upsampler:
    upsample_factor: 1
  # Model behavior flags
  add_refsrc_marker: false
  hard_pixelalign: true
  use_custom_plucker: true
  clip_xyz: true
# =============================================================================
# Training Configuration
# =============================================================================
# NOTE(review): original indentation was lost; nesting below is reconstructed
# from the section comments. Confirm `wandb` belongs under `logging` (not
# directly under `training`) against the config loader.
training:
  # Training runtime settings
  runtime:
    use_tf32: true
    use_amp: true
    amp_dtype: "bf16"
    torch_compile: false
    grad_accum_steps: 1
    grad_clip_norm: 1.0
    grad_checkpoint_every: 1
  # Dataset configuration
  dataset:
    dataset_path: "data_sample/gslrm/data_gslrm_train.txt"
    # View configuration
    maximize_view_overlap: true
    num_views: 8
    num_input_views: 6  # In training, we set it as 4. In inference, we set it as 6.
    target_has_input: true
    # Data preprocessing
    normalize_distance_to: 0.0
    remove_alpha: false
    background_color: "white"
  # Data loader settings
  dataloader:
    batch_size_per_gpu: 2
    num_workers: 4
    num_threads: 32
    prefetch_factor: 32
  # Loss function weights
  losses:
    l2_loss_weight: 1.0
    lpips_loss_weight: 0.0
    perceptual_loss_weight: 0.5
    ssim_loss_weight: 0.0
    pixelalign_loss_weight: 0.0
    masked_pixelalign_loss: true
    pointsdist_loss_weight: 0.0
    warmup_pointsdist: false
    distill_loss_weight: 0.0
  # Optimizer configuration (AdamW)
  optimizer:
    lr: 0.0001
    beta1: 0.9
    beta2: 0.95
    weight_decay: 0.05
    reset_lr: false
    reset_weight_decay: false
    reset_training_state: true
  # Training schedule
  schedule:
    num_epochs: 100000  # dataset epochs
    early_stop_after_epochs: 100000  # 40
    max_fwdbwd_passes: 20000  # forward/backward pass steps
    warmup: 500  # parameter update steps
    l2_warmup_steps: 500
  # Checkpointing
  checkpointing:
    resume_ckpt: "checkpoints/gslrm/stage_2"
    checkpoint_every: 5000  # forward/backward pass steps
    checkpoint_dir: "checkpoints/gslrm/stage_3"
  # Logging and monitoring
  logging:
    print_every: 20  # forward/backward pass steps
    vis_every: 250  # forward/backward pass steps
    # Weights & Biases configuration
    wandb:
      project: "facelift_gslrm"
      exp_name: "stage_3"
      group: "facelift"
      job_type: "train"
      log_every: 50  # forward/backward pass steps
      offline: false
# =============================================================================
# Inference Configuration
# =============================================================================
inference:
  enabled: false
  output_dir: "outputs/inference/gslrm/stage_3"
# =============================================================================
# Validation Configuration
# =============================================================================
validation:
  enabled: true
  val_every: 5000  # forward/backward pass steps between validation runs
  output_dir: "outputs/validation/gslrm/stage_3"
  dataset_path: "data_sample/gslrm/data_gslrm_val.txt"