Spaces:

wsntxxn
/

MM-StoryAgent

Running on L4

MM-StoryAgent / configs /mm_story_agent.yaml

Xu Xuenan

Initial commit

a121edc 7 months ago

1.69 kB

	story_dir: generated_stories/20240808_1130
	audio_sample_rate: &audio_sample_rate 16000
	audio_codec: mp3 # [mp3, aac, ...]


	story_setting:
	story_topic: "Time Management: A child learning how to manage their time effectively."
	main_role: "(no main role specified)"
	scene: "(no scene specified)"

	story_gen_config:
	max_conv_turns: 3
	num_outline: 4
	temperature: 0.5

	caption_config:
	font: resources/font/msyh.ttf
	# bg_color: LightGrey
	fontsize: 32
	color: white
	# stroke_color: white
	# stroke_width: 0.5
	max_single_caption_length: 50

	sound_generation:
	call_cfg:
	guidance_scale: 3.5
	seed: 0
	ddim_steps: 200
	n_candidate_per_text: 3
	revise_cfg:
	num_turns: 3
	sample_rate: *audio_sample_rate


	speech_generation:
	call_cfg:
	voice: longyuan
	sample_rate: *audio_sample_rate


	image_generation:
	revise_cfg:
	num_turns: 3
	obj_cfg:
	model_name: stabilityai/stable-diffusion-xl-base-1.0
	id_length: 2
	height: 512
	width: 1024
	call_cfg:
	seed: 112536
	guidance_scale: 10.0
	style_name: "Storybook" # ['(No style)', 'Japanese Anime', 'Digital/Oil Painting', 'Pixar/Disney Character',
	# 'Photographic', 'Comic book', 'Line art', 'Black and White Film Noir', 'Isometric Rooms']

	music_generation:
	revise_cfg:
	num_turns: 3
	call_cfg:
	duration: 60.0

	slideshow_effect:
	fade_duration: 0.8
	slide_duration: 0.4
	zoom_speed: 0.5
	move_ratio: 0.9

	sound_volume: 0.6
	music_volume: 0.5
	bg_speech_ratio: 0.6

	fps: 8