Spaces:

radames
/

Text2Human-API

Runtime error

App Files Files Community

Text2Human-API / Text2Human /configs /sample_from_pose.yml

radames

missing

ca3f1b4 over 3 years ago

raw

history blame

2.47 kB

	# Top-level run settings for the sample_from_pose configuration.
	name: sample_from_pose
	use_tb_logger: true
	# Null is spelled out rather than written as `~`; the parsed value is the same.
	set_CUDA_VISIBLE_DEVICES: null
	# NOTE(review): pins device index 3; presumably fails on hosts exposing
	# fewer than four GPUs — confirm against the deployment target.
	gpu_ids: [3]

	# dataset configs
	# Loader sizing followed by dataset locations. Every path here is relative
	# (starts with ./) — presumably resolved against the working directory;
	# confirm against the loader.
	batch_size: 4
	num_workers: 4
	pose_dir: ./datasets/densepose
	# NOTE(review): unlike shape_ann_path, this value has no file extension —
	# presumably a directory or a path prefix; confirm against the loader.
	texture_ann_file: ./datasets/texture_ann/test
	shape_ann_path: ./datasets/shape_ann/test_ann_file.txt
	downsample_factor: 2

	# NOTE(review): presumably the name of the model class the consumer
	# instantiates — confirm.
	model_type: SampleFromPoseModel
	# network configs
	# These three keys carry no bot_/top_/segm_ prefix. The bottom-level section
	# defines bot_n_embed and bot_codebook_spatial_size while the top-level
	# section defines neither, so presumably these serve the top level — confirm.
	embed_dim: 256
	n_embed: 1024
	codebook_spatial_size: 2

	# bottom level vqgan
	# All keys in this section share the bot_ prefix. Compared with the top_
	# section, the values differ only in bot_ch_mult (four entries instead of
	# five) and bot_attn_resolutions ([64] instead of [32]); the bot_ section
	# additionally defines its own codebook keys.
	bot_n_embed: 512
	bot_codebook_spatial_size: 2
	bot_double_z: false
	bot_z_channels: 256
	bot_resolution: 512
	bot_in_channels: 3
	bot_out_ch: 3
	bot_ch: 128
	bot_ch_mult: [1, 1, 2, 4]
	bot_num_res_blocks: 2
	bot_attn_resolutions: [64]
	bot_dropout: 0.0
	# Relative path to the bottom-level checkpoint file.
	bot_vae_path: ./pretrained_models/vqvae_bottom.pth

	# top level vqgan
	# All keys in this section share the top_ prefix. Compared with the bot_
	# section, the values differ only in top_ch_mult (five entries instead of
	# four) and top_attn_resolutions ([32] instead of [64]). No top_-prefixed
	# codebook keys are defined here.
	top_double_z: false
	top_z_channels: 256
	top_resolution: 512
	top_in_channels: 3
	top_out_ch: 3
	top_ch: 128
	top_ch_mult: [1, 1, 2, 2, 4]
	top_num_res_blocks: 2
	top_attn_resolutions: [32]
	top_dropout: 0.0
	# Relative path to the top-level checkpoint file.
	top_vae_path: ./pretrained_models/vqvae_top.pth

	# unet configs
	# NOTE(review): every key in this section is named index_pred_*, so it
	# presumably configures the index-prediction network — confirm.
	index_pred_encoder_in_channels: 256
	index_pred_fc_in_channels: 64
	index_pred_fc_in_index: 4
	index_pred_fc_channels: 64
	index_pred_fc_num_convs: 1
	# Booleans are lowercase, matching bot_double_z / top_double_z / segm_double_z.
	index_pred_fc_concat_input: false
	index_pred_fc_dropout_ratio: 0.1
	# NOTE(review): equals bot_n_embed (512) — presumably one class per
	# bottom-level codebook entry; confirm.
	index_pred_fc_num_classes: 512
	index_pred_fc_align_corners: false
	pretrained_index_network: ./pretrained_models/index_pred_net.pth

	# segmentation tokenization
	# All keys in this section share the segm_ prefix. Three values agree at 24
	# (segm_in_channels, segm_out_ch, segm_num_segm_classes) and two agree at 32
	# (segm_z_channels, segm_embed_dim).
	segm_double_z: false
	segm_z_channels: 32
	segm_resolution: 512
	segm_in_channels: 24
	segm_out_ch: 24
	segm_ch: 64
	segm_ch_mult: [1, 1, 2, 2, 4]
	segm_num_res_blocks: 1
	segm_attn_resolutions: [16]
	segm_dropout: 0.0
	segm_num_segm_classes: 24
	# Same value as segm_codebook_size in the sampler section (1024).
	segm_n_embed: 1024
	segm_embed_dim: 32
	# Relative path to the segmentation tokenizer checkpoint file.
	segm_token_path: ./pretrained_models/parsing_token.pth

	# sampler configs
	# NOTE(review): 18432 = 1024 x 18 — presumably n_embed x
	# texture_codebook_size; confirm against the sampler code.
	codebook_size: 18432
	# Same value as segm_n_embed in the segmentation section (1024).
	segm_codebook_size: 1024
	texture_codebook_size: 18
	bert_n_emb: 512
	bert_n_layers: 24
	bert_n_head: 8
	# 512 is the product of the two latent_shape entries on the next line.
	block_size: 512 # 32 x 16
	latent_shape: [32, 16]
	# All three dropout probabilities are zero in this configuration.
	embd_pdrop: 0.0
	resid_pdrop: 0.0
	attn_pdrop: 0.0
	# NOTE(review): equals texture_codebook_size (18) and is distinct from
	# bert_n_head (8) — presumably a count of output heads rather than
	# attention heads; confirm.
	num_head: 18
	pretrained_sampler: ./pretrained_models/sampler.pth

	# shape network configs
	shape_embedder_dim: 8
	shape_embedder_out_dim: 128
	# Fifteen entries. NOTE(review): presumably the number of classes for each
	# of fifteen shape attributes — confirm.
	shape_attr_class_num: [2, 4, 6, 5, 4, 3, 5, 5, 3, 2, 2, 2, 2, 2, 2]
	shape_encoder_in_channels: 1
	shape_fc_in_channels: 64
	shape_fc_in_index: 4
	shape_fc_channels: 64
	shape_fc_num_convs: 1
	# Booleans are lowercase, matching bot_double_z / top_double_z / segm_double_z.
	shape_fc_concat_input: false
	shape_fc_dropout_ratio: 0.1
	# Same value as segm_num_segm_classes (24).
	shape_fc_num_classes: 24
	shape_fc_align_corners: false
	pretrained_parsing_gen: ./pretrained_models/parsing_gen.pth

	# NOTE(review): presumably seeds the random number generators so sampling
	# is reproducible — confirm against the consumer.
	manual_seed: 2021
	# NOTE(review): presumably the number of sampling iterations; 256 is half of
	# block_size (512) — confirm whether that relationship is intended.
	sample_steps: 256