# Source: Hugging Face Space yslan/worldmem (Running on Zero)
# File: worldmem/configurations/huggingface.yaml
# Last commit: "update" by xizaoqu (0cb2a53, 26 days ago), 1.46 kB

	n_tokens: 3
	pose_cond_dim: 5
	use_plucker: true
	focal_length: 0.35
	customized_validation: true
	condition_similar_length: 8
	log_video: true
	relative_embedding: true
	cond_only_on_qk: true
	add_pose_embed: false
	use_domain_adapter: false
	use_reference_attention: true
	add_frame_timestep_embedder: true
	is_interactive: true
	diffusion:
	sampling_timesteps: 20
	beta_schedule: sigmoid
	objective: pred_v
	use_fused_snr: True
	cum_snr_decay: 0.96
	clip_noise: 20.
	ddim_sampling_eta: 0.0
	stabilization_level: 15
	schedule_fn_kwargs: {}
	use_snr: False
	use_cum_snr: False
	snr_clip: 5.0
	timesteps: 1000
	# architecture
	architecture:
	network_size: 64
	attn_heads: 4
	attn_dim_head: 64
	dim_mults: [1, 2, 4, 8]
	resolution: ${dataset.resolution}
	attn_resolutions: [16, 32, 64, 128]
	use_init_temporal_attn: True
	use_linear_attn: True
	time_emb_type: rotary

	weight_decay: 2e-3
	warmup_steps: 10000
	optimizer_beta: [0.9, 0.99]
	action_cond_dim: 25
	n_frames: 8
	frame_skip: 1
	frame_stack: 1
	uncertainty_scale: 1
	guidance_scale: 0.0
	chunk_size: 1 # -1 for full trajectory diffusion, number to specify diffusion chunk size
	scheduling_matrix: autoregressive
	noise_level: random_all
	causal: True
	x_shape: [3, 360, 640]
	context_frames: 1
	diffusion_path: yslan/worldmem_checkpoints/diffusion_only.ckpt
	vae_path: yslan/worldmem_checkpoints/vae_only.ckpt
	pose_predictor_path: yslan/worldmem_checkpoints/pose_prediction_model_only.ckpt