From 76ab53f521133f81329db5f6835e642a93962176 Mon Sep 17 00:00:00 2001 From: Chris Kennedy Date: Sat, 7 Dec 2024 05:13:25 -0800 Subject: [PATCH] adjust defaults --- scripts/broadcast_personality.sh | 8 ++++---- src/args.rs | 23 +++++++---------------- 2 files changed, 11 insertions(+), 20 deletions(-) diff --git a/scripts/broadcast_personality.sh b/scripts/broadcast_personality.sh index cc878b2..df713cf 100755 --- a/scripts/broadcast_personality.sh +++ b/scripts/broadcast_personality.sh @@ -34,8 +34,8 @@ USE_API=1 CHAT_FORMAT=chatml #CHAT_FORMAT=llama2 #CHAT_FORMAT=vicuna -MAX_TOKENS=16000 -TEMPERATURE=0.8 +MAX_TOKENS=8000 +TEMPERATURE=1.0 CONTEXT_SIZE=32000 QUANTIZED=0 KEEP_HISTORY=1 @@ -54,7 +54,7 @@ TWITCH_CHAT_HISTORY=32 TWITCH_MAX_TOKENS_CHAT=500 TWITCH_MAX_TOKENS_LLM=$MAX_TOKENS ## Stable Diffusion Settings -SD_TEXT_MIN=300 +SD_TEXT_MIN=500 #SD_WIDTH=512 SD_WIDTH=768 #SD_WIDTH=860 @@ -66,7 +66,7 @@ SD_API=1 SD_MODEL=turbo SD_CUSTOM_MODEL="sd_xl_turbo_1.0_fp16.safetensors" SD_INTERMEDIARY_IMAGES=0 -SD_N_STEPS=14 +SD_N_STEPS=20 ALIGNMENT=center SUBTITLES=0 # === END OF CONFIGURATION === diff --git a/src/args.rs b/src/args.rs index 7c02695..0c04322 100644 --- a/src/args.rs +++ b/src/args.rs @@ -201,7 +201,7 @@ pub struct Args { #[clap( long, env = "MIMIC3_VOICE", - default_value = "en_US/vctk_low#p303", + default_value = "en_US/ljspeech_low", help = "MIMIC3_VOICE voice model via text string to use for mimic3 tts. Use en_US/vctk_low#p326 for a male voice, default is female." )] pub mimic3_voice: String, @@ -457,7 +457,7 @@ pub struct Args { #[clap( long, env = "POLL_INTERVAL", - default_value_t = 60_000, + default_value_t = 1_000, help = "POLL Interval in ms." 
)] pub poll_interval: u64, @@ -480,15 +480,6 @@ pub struct Args { )] pub loglevel: String, - /// Break Line Length - line length for breaking lines from LLM messages - #[clap( - long, - env = "BREAK_LINE_LENGTH", - default_value_t = 300, - help = "Break Line Length - line length for breaking lines from LLM messages." - )] - pub break_line_length: usize, - /// SD Image - create an SD image from the LLM messages #[clap( long, @@ -511,7 +502,7 @@ pub struct Args { #[clap( long, env = "SD_MAX_LENGTH", - default_value_t = 200, + default_value_t = 300, help = "SD Max Length in tokens for SD Image hardsub text segments. example: 77 tokens is avg 77 * 4 == 308 chars." )] pub sd_max_length: usize, @@ -520,7 +511,7 @@ pub struct Args { #[clap( long, env = "SD_PARAGRAPH_MIN", - default_value_t = 60, + default_value_t = 300, help = "SD Min Length for text segments generating Images. Will force past this value before segmenting text." )] pub sd_text_min: usize, @@ -584,7 +575,7 @@ pub struct Args { pub sd_height: usize, /// sd width - #[clap(long, env = "SD_WIDTH", default_value_t = 512, help = "SD Width.")] + #[clap(long, env = "SD_WIDTH", default_value_t = 768, help = "SD Width.")] pub sd_width: usize, /// sd scaled height @@ -618,7 +609,7 @@ pub struct Args { #[clap( long, env = "SD_CUSTOM_MODEL", - default_value = "sd_xl_turbo_1.0.safetensors", + default_value = "sd_xl_turbo_1.0_fp16.safetensors", help = "Custom Stable Diffusion Model. for automatic 111111 API usage, the name must exist as a model locally or remotely." )] pub sd_custom_model: String, @@ -685,7 +676,7 @@ pub struct Args { #[clap( long, env = "SUBTITLE_POSITION", - default_value = "center", + default_value = "top", help = "Subtitle position." )] pub subtitle_position: String,