From b36202f3fb7399881760b0355a269ead4599e79c Mon Sep 17 00:00:00 2001 From: Allan <53341442+Guohanzhong@users.noreply.github.com> Date: Fri, 9 Aug 2024 13:35:34 +0800 Subject: [PATCH 1/2] Update inference_v2.yaml Fix the bug in Moore codebase (in training, moore codebase use the scaled linear as schedule) --- configs/inference/inference_v2.yaml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/configs/inference/inference_v2.yaml b/configs/inference/inference_v2.yaml index a501c42..34c0b4f 100644 --- a/configs/inference/inference_v2.yaml +++ b/configs/inference/inference_v2.yaml @@ -25,7 +25,7 @@ unet_additional_kwargs: noise_scheduler_kwargs: beta_start: 0.00085 beta_end: 0.012 - beta_schedule: "linear" + beta_schedule: "scaled_linear" clip_sample: false steps_offset: 1 ### Zero-SNR params @@ -33,4 +33,4 @@ noise_scheduler_kwargs: rescale_betas_zero_snr: True timestep_spacing: "trailing" -sampler: DDIM \ No newline at end of file +sampler: DDIM From 24720d437e0177922ae193754fcde2c90e1e6d82 Mon Sep 17 00:00:00 2001 From: Allan <53341442+Guohanzhong@users.noreply.github.com> Date: Fri, 9 Aug 2024 13:39:23 +0800 Subject: [PATCH 2/2] Update README.md updates results after fixing the bug --- README.md | 22 ++++++++++++++++++++++ 1 file changed, 22 insertions(+) diff --git a/README.md b/README.md index 9d37317..50b41c7 100644 --- a/README.md +++ b/README.md @@ -129,6 +129,28 @@ Terminal Technology Department, Alipay, Ant Group. +### Audio-driven results after fixing the bug in the inference schedule + +Left: after fixing the bug; Right: before fixing the bug. +Fixing the bug removes the background noise. +
| + + | ++ + | +