add example

This commit is contained in:
xinshengwang
2025-10-28 03:13:09 +08:00
parent f650704efc
commit ae27aa6583
9 changed files with 109 additions and 0 deletions

1
.gitignore vendored
View File

@@ -3,6 +3,7 @@ __pycache__/
*.py[codz]
*$py.class
pretrained_models/
outputs/
# C extensions
*.so

Binary file not shown.

Binary file not shown.

11
example/infer_dialogue.sh Normal file
View File

@@ -0,0 +1,11 @@
export PYTHONPATH="$(cd "$(dirname "${BASH_SOURCE[0]}")"/.. && pwd)"
echo "PYTHONPATH set to: $PYTHONPATH"
# Note: To infer Chinese dialects, set model_dir to "pretrained_models/SoulX-Podcast-1.7B-dialect
model_dir=pretrained_models/SoulX-Podcast-1.7B
input_file=example/podcast_script/script_mandarin.json
python cli/podcast.py \
--json_path ${input_file} \
--model_path ${model_dir} \
--output_path outputs/mandarin.wav

View File

@@ -0,0 +1,18 @@
{
"speakers": {
"S1": {
"prompt_audio": "example/audios/female_mandarin.wav",
"prompt_text": "喜欢攀岩、徒步、滑雪的语言爱好者,以及过两天要带着全部家当去景德镇做陶瓷的白日梦想家。"
},
"S2": {
"prompt_audio": "example/audios/male_mandarin.wav",
"prompt_text": "呃,还有一个就是要跟大家纠正一点,就是我们在看电影的时候,尤其是游戏玩家,看电影的时候,在看到那个到西北那边的这个陕北民谣,嗯,这个可能在想,哎,是不是他是受到了黑神话的启发?"
}
},
"text": [
["S1", "Hey, sorry for snapping earlier. That was totally unprofessional of me. Lets get back to recapping the match."],
["S2", "Yeah, no worries. Honestly, that was such an awesome match. Youve gotta admit, Ali, even though your substitute didnt win, it was almost legendary."],
["S1", "Totally, one for the record books. Sam and Max were only supposed to have four bouts, but things got a little messy right from the start."],
["S2", "Oh yeah, someone ran onto the field shouting something—I couldnt hear a word. Honestly, I was just glad when the guards finally dragged them out. I just wanted to get back to the joust, but it really threw everything off, and it even got the crowd all hyped up, which was kinda surprising."]
]
}

View File

@@ -0,0 +1,21 @@
{
"speakers": {
"S1": {
"prompt_audio": "example/audios/female_mandarin.wav",
"prompt_text": "喜欢攀岩、徒步、滑雪的语言爱好者,以及过两天要带着全部家当去景德镇做陶瓷的白日梦想家。",
"dialect_prompt": "<|Henan|>哎哟俺哩个乖乖!叻老师这生活咋恁得劲咧!又是攀岩又是烧瓷,赶明儿怕不是要踩着雪板往窑洞里钻?"
},
"S2": {
"prompt_audio": "example/audios/male_mandarin.wav",
"prompt_text": "听到叻四老师关于自己身份的介绍,大家其实可以想象一下 叻四老师的生活有如此的丰富的状态。",
"dialect_prompt": "<|Henan|>哎哟俺哩个乖乖!叻老师这生活咋恁得劲咧!又是攀岩又是烧瓷,赶明儿怕不是要踩着雪板往窑洞里钻?"
}
},
"text": [
["S1", "<|Henan|>哎,大家好啊,欢迎收听咱这一期嘞《瞎聊呗,就这么说》,我是恁嘞老朋友,燕子。"],
["S2", "<|Henan|>大家好,我是老张。燕子啊,今儿瞅瞅你这个劲儿,咋着,是有啥可得劲嘞事儿想跟咱唠唠?"],
["S1", "<|Henan|>哎哟,老张,你咋恁懂我嘞!我跟你说啊,最近我刷手机,老是刷住些可逗嘞方言视频,特别是咱河南话,咦~我哩个乖乖,一听我都憋不住笑,咋说嘞,得劲儿哩很,跟回到家一样。"],
["S2", "<|Henan|>你这回可算说到根儿上了!河南话,咱往大处说说,中原官话,它真嘞是有一股劲儿搁里头。它可不光是说话,它脊梁骨后头藏嘞,是咱一整套、鲜鲜活活嘞过法儿,一种活人嘞道理。"],
["S1", "<|Henan|>活人嘞道理?哎,这你这一说,我嘞兴致“腾”一下就上来啦!觉住咱这嗑儿,一下儿从搞笑视频蹿到文化顶上了。那你赶紧给我白话白话,这里头到底有啥道道儿?我特别想知道——为啥一提起咱河南人,好些人脑子里“蹦”出来嘞头一个词儿,就是实在?这个实在,骨子里到底是啥嘞? "]
]
}

View File

@@ -0,0 +1,18 @@
{
"speakers": {
"S1": {
"prompt_audio": "example/audios/female_mandarin.wav",
"prompt_text": "喜欢攀岩、徒步、滑雪的语言爱好者,以及过两天要带着全部家当去景德镇做陶瓷的白日梦想家。"
},
"S2": {
"prompt_audio": "example/audios/male_mandarin.wav",
"prompt_text": "呃,还有一个就是要跟大家纠正一点,就是我们在看电影的时候,尤其是游戏玩家,看电影的时候,在看到那个到西北那边的这个陕北民谣,嗯,这个可能在想,哎,是不是他是受到了黑神话的启发?"
}
},
"text": [
["S1", "哈喽AI时代的冲浪先锋们欢迎收听《AI生活进行时》。啊一个充满了未来感然后还有一点点<|laughter|>神经质的播客节目,我是主持人小希。"],
["S2", "哎,大家好呀!我是能唠,爱唠,天天都想唠的唠嗑!"],
["S1", "最近活得特别赛博朋克哈以前老是觉得AI是科幻片儿里的<|sigh|> 现在现在连我妈都用AI写广场舞文案了。"],
["S2", "这个例子很生动啊。是的特别是生成式AI哈感觉都要炸了那我们今天就聊聊AI是怎么走进我们的生活的哈"]
]
}

View File

@@ -0,0 +1,20 @@
{
"speakers": {
"S1": {
"prompt_audio": "example/audios/female_mandarin.wav",
"prompt_text": "喜欢攀岩、徒步、滑雪的语言爱好者,以及过两天要带着全部家当去景德镇做陶瓷的白日梦想家。",
"dialect_prompt": "<|Sichuan|>哪个晓得耍耍哒哒的,倒把生科院的门门儿敲开啰!现在天天泡实验室,跟那些瓶瓶罐罐打交道,硬是闻到福尔马林的味道都比屋头泡菜坛子亲切喽!"
},
"S2": {
"prompt_audio": "example/audios/male_mandarin.wav",
"prompt_text": "呃,还有一个就是要跟大家纠正一点,就是我们在看电影的时候,尤其是游戏玩家,看电影的时候,在看到那个到西北那边的这个陕北民谣,嗯,这个可能在想,哎,是不是他是受到了黑神话的启发?",
"dialect_prompt": "<|Sichuan|>哎哟喂,这个搞反了噻!黑神话里头唱曲子的王二浪早八百年就在黄土高坡吼秦腔喽,游戏组专门跑切录的原汤原水,听得人汗毛儿都立起来!"
}
},
"text": [
["S1", "<|Sichuan|>各位《巴适得板》的听众些,大家好噻!我是你们主持人晶晶。今儿天气硬是巴适,不晓得大家是在赶路嘛,还是茶都泡起咯,准备跟我们好生摆一哈龙门阵喃?"],
["S2", "<|Sichuan|>晶晶好哦,大家安逸噻!我是李老倌。你刚开口就川味十足,摆龙门阵几个字一甩出来,我鼻子头都闻到茶香跟火锅香咯!"],
["S1", "<|Sichuan|>就是得嘛!李老倌,我前些天带个外地朋友切人民公园鹤鸣茶社坐了一哈。他硬是搞不醒豁,为啥子我们一堆人围到杯茶就可以吹一下午壳子,从隔壁子王嬢嬢娃儿耍朋友,扯到美国大选,中间还掺几盘斗地主。他说我们四川人简直是把摸鱼刻进骨子里头咯!"],
["S2", "<|Sichuan|>你那个朋友说得倒是有点儿趣,但他莫看到精髓噻。摆龙门阵哪是摸鱼嘛,这是我们川渝人特有的交际方式,更是一种活法。外省人天天说的松弛感,根根儿就在这龙门阵里头。今天我们就要好生摆一哈,为啥子四川人活得这么舒坦。就先从茶馆这个老窝子说起,看它咋个成了我们四川人的魂儿!"]
]
}

View File

@@ -0,0 +1,20 @@
{
"speakers": {
"S1": {
"prompt_audio": "example/audios/female_mandarin.wav",
"prompt_text": "喜欢攀岩、徒步、滑雪的语言爱好者,以及过两天要带着全部家当去景德镇做陶瓷的白日梦想家。",
"dialect_prompt": "<|Yue|>真係冇讲错啊!佢哋制作认真到连背景音乐嘅呼吸声都执到最啱拍子,出亲街访仲要自带三个后备电池,呢种专业精神边度搵啊?我哋成日话学嘢就要学佢哋咁龟毛先得嘛!"
},
"S2": {
"prompt_audio": "example/audios/male_mandarin.wav",
"prompt_text": "呃,还有一个就是要跟大家纠正一点,就是我们在看电影的时候,尤其是游戏玩家,看电影的时候,在看到那个到西北那边的这个陕北民谣,嗯,这个可能在想,哎,是不是他是受到了黑神话的启发?",
"dialect_prompt": "<|Yue|>真係唔话得!徐生连标点符号都要拗到最啱先收货,成组人晚晚通顶改稿改到天光,呢种摞命搏嘅精神先至係最难得嘎!"
}
},
"text": [
["S1", "<|Yue|>哈囉大家好啊,歡迎收聽我哋嘅節目。喂,我今日想問你樣嘢啊,你覺唔覺得,嗯,而家揸電動車,最煩,最煩嘅一樣嘢係咩啊?"],
["S2", "<|Yue|>梗係充電啦。大佬啊,搵個位都已經好煩,搵到個位仲要喺度等,你話快極都要半個鐘一個鐘,真係,有時諗起都覺得好冇癮。"],
["S1", "<|Yue|>係咪先。如果我而家同你講,充電可以快到同入油差唔多時間,你信唔信先?喂你平時喺油站入滿一缸油,要幾耐啊?五六分鐘?"],
["S2", "<|Yue|>差唔多啦,七八分鐘,點都走得啦。電車喎,可以做到咁快?你咪玩啦。"]
]
}