mirror of
https://github.com/Soul-AILab/SoulX-Podcast.git
synced 2026-05-06 21:51:04 +08:00
add example
This commit is contained in:
1
.gitignore
vendored
1
.gitignore
vendored
@@ -3,6 +3,7 @@ __pycache__/
|
||||
*.py[codz]
|
||||
*$py.class
|
||||
pretrained_models/
|
||||
outputs/
|
||||
# C extensions
|
||||
*.so
|
||||
|
||||
|
||||
BIN
example/audios/female_mandarin.wav
Normal file
BIN
example/audios/female_mandarin.wav
Normal file
Binary file not shown.
BIN
example/audios/male_mandarin.wav
Normal file
BIN
example/audios/male_mandarin.wav
Normal file
Binary file not shown.
11
example/infer_dialogue.sh
Normal file
11
example/infer_dialogue.sh
Normal file
@@ -0,0 +1,11 @@
|
||||
export PYTHONPATH="$(cd "$(dirname "${BASH_SOURCE[0]}")"/.. && pwd)"
|
||||
echo "PYTHONPATH set to: $PYTHONPATH"
|
||||
|
||||
# Note: To infer Chinese dialects, set model_dir to "pretrained_models/SoulX-Podcast-1.7B-dialect
|
||||
model_dir=pretrained_models/SoulX-Podcast-1.7B
|
||||
input_file=example/podcast_script/script_mandarin.json
|
||||
|
||||
python cli/podcast.py \
|
||||
--json_path ${input_file} \
|
||||
--model_path ${model_dir} \
|
||||
--output_path outputs/mandarin.wav
|
||||
18
example/podcast_script/script_english.json
Normal file
18
example/podcast_script/script_english.json
Normal file
@@ -0,0 +1,18 @@
|
||||
{
|
||||
"speakers": {
|
||||
"S1": {
|
||||
"prompt_audio": "example/audios/female_mandarin.wav",
|
||||
"prompt_text": "喜欢攀岩、徒步、滑雪的语言爱好者,以及过两天要带着全部家当去景德镇做陶瓷的白日梦想家。"
|
||||
},
|
||||
"S2": {
|
||||
"prompt_audio": "example/audios/male_mandarin.wav",
|
||||
"prompt_text": "呃,还有一个就是要跟大家纠正一点,就是我们在看电影的时候,尤其是游戏玩家,看电影的时候,在看到那个到西北那边的这个陕北民谣,嗯,这个可能在想,哎,是不是他是受到了黑神话的启发?"
|
||||
}
|
||||
},
|
||||
"text": [
|
||||
["S1", "Hey, sorry for snapping earlier. That was totally unprofessional of me. Let’s get back to recapping the match."],
|
||||
["S2", "Yeah, no worries. Honestly, that was such an awesome match. You’ve gotta admit, Ali, even though your substitute didn’t win, it was almost legendary."],
|
||||
["S1", "Totally, one for the record books. Sam and Max were only supposed to have four bouts, but things got a little messy right from the start."],
|
||||
["S2", "Oh yeah, someone ran onto the field shouting something—I couldn’t hear a word. Honestly, I was just glad when the guards finally dragged them out. I just wanted to get back to the joust, but it really threw everything off, and it even got the crowd all hyped up, which was kinda surprising."]
|
||||
]
|
||||
}
|
||||
21
example/podcast_script/script_henan.json
Normal file
21
example/podcast_script/script_henan.json
Normal file
@@ -0,0 +1,21 @@
|
||||
{
|
||||
"speakers": {
|
||||
"S1": {
|
||||
"prompt_audio": "example/audios/female_mandarin.wav",
|
||||
"prompt_text": "喜欢攀岩、徒步、滑雪的语言爱好者,以及过两天要带着全部家当去景德镇做陶瓷的白日梦想家。",
|
||||
"dialect_prompt": "<|Henan|>哎哟俺哩个乖乖!叻老师这生活咋恁得劲咧!又是攀岩又是烧瓷,赶明儿怕不是要踩着雪板往窑洞里钻?"
|
||||
},
|
||||
"S2": {
|
||||
"prompt_audio": "example/audios/male_mandarin.wav",
|
||||
"prompt_text": "听到叻四老师关于自己身份的介绍,大家其实可以想象一下 叻四老师的生活有如此的丰富的状态。",
|
||||
"dialect_prompt": "<|Henan|>哎哟俺哩个乖乖!叻老师这生活咋恁得劲咧!又是攀岩又是烧瓷,赶明儿怕不是要踩着雪板往窑洞里钻?"
|
||||
}
|
||||
},
|
||||
"text": [
|
||||
["S1", "<|Henan|>哎,大家好啊,欢迎收听咱这一期嘞《瞎聊呗,就这么说》,我是恁嘞老朋友,燕子。"],
|
||||
["S2", "<|Henan|>大家好,我是老张。燕子啊,今儿瞅瞅你这个劲儿,咋着,是有啥可得劲嘞事儿想跟咱唠唠?"],
|
||||
["S1", "<|Henan|>哎哟,老张,你咋恁懂我嘞!我跟你说啊,最近我刷手机,老是刷住些可逗嘞方言视频,特别是咱河南话,咦~我哩个乖乖,一听我都憋不住笑,咋说嘞,得劲儿哩很,跟回到家一样。"],
|
||||
["S2", "<|Henan|>你这回可算说到根儿上了!河南话,咱往大处说说,中原官话,它真嘞是有一股劲儿搁里头。它可不光是说话,它脊梁骨后头藏嘞,是咱一整套、鲜鲜活活嘞过法儿,一种活人嘞道理。"],
|
||||
["S1", "<|Henan|>活人嘞道理?哎,这你这一说,我嘞兴致“腾”一下就上来啦!觉住咱这嗑儿,一下儿从搞笑视频蹿到文化顶上了。那你赶紧给我白话白话,这里头到底有啥道道儿?我特别想知道——为啥一提起咱河南人,好些人脑子里“蹦”出来嘞头一个词儿,就是实在?这个实在,骨子里到底是啥嘞? "]
|
||||
]
|
||||
}
|
||||
18
example/podcast_script/script_mandarin.json
Normal file
18
example/podcast_script/script_mandarin.json
Normal file
@@ -0,0 +1,18 @@
|
||||
{
|
||||
"speakers": {
|
||||
"S1": {
|
||||
"prompt_audio": "example/audios/female_mandarin.wav",
|
||||
"prompt_text": "喜欢攀岩、徒步、滑雪的语言爱好者,以及过两天要带着全部家当去景德镇做陶瓷的白日梦想家。"
|
||||
},
|
||||
"S2": {
|
||||
"prompt_audio": "example/audios/male_mandarin.wav",
|
||||
"prompt_text": "呃,还有一个就是要跟大家纠正一点,就是我们在看电影的时候,尤其是游戏玩家,看电影的时候,在看到那个到西北那边的这个陕北民谣,嗯,这个可能在想,哎,是不是他是受到了黑神话的启发?"
|
||||
}
|
||||
},
|
||||
"text": [
|
||||
["S1", "哈喽,AI时代的冲浪先锋们!欢迎收听《AI生活进行时》。啊,一个充满了未来感,然后,还有一点点,<|laughter|>神经质的播客节目,我是主持人小希。"],
|
||||
["S2", "哎,大家好呀!我是能唠,爱唠,天天都想唠的唠嗑!"],
|
||||
["S1", "最近活得特别赛博朋克哈!以前老是觉得AI是科幻片儿里的,<|sigh|> 现在,现在连我妈都用AI写广场舞文案了。"],
|
||||
["S2", "这个例子很生动啊。是的,特别是生成式AI哈,感觉都要炸了! 诶,那我们今天就聊聊AI是怎么走进我们的生活的哈!"]
|
||||
]
|
||||
}
|
||||
20
example/podcast_script/script_sichuan.json
Normal file
20
example/podcast_script/script_sichuan.json
Normal file
@@ -0,0 +1,20 @@
|
||||
{
|
||||
"speakers": {
|
||||
"S1": {
|
||||
"prompt_audio": "example/audios/female_mandarin.wav",
|
||||
"prompt_text": "喜欢攀岩、徒步、滑雪的语言爱好者,以及过两天要带着全部家当去景德镇做陶瓷的白日梦想家。",
|
||||
"dialect_prompt": "<|Sichuan|>哪个晓得耍耍哒哒的,倒把生科院的门门儿敲开啰!现在天天泡实验室,跟那些瓶瓶罐罐打交道,硬是闻到福尔马林的味道都比屋头泡菜坛子亲切喽!"
|
||||
},
|
||||
"S2": {
|
||||
"prompt_audio": "example/audios/male_mandarin.wav",
|
||||
"prompt_text": "呃,还有一个就是要跟大家纠正一点,就是我们在看电影的时候,尤其是游戏玩家,看电影的时候,在看到那个到西北那边的这个陕北民谣,嗯,这个可能在想,哎,是不是他是受到了黑神话的启发?",
|
||||
"dialect_prompt": "<|Sichuan|>哎哟喂,这个搞反了噻!黑神话里头唱曲子的王二浪早八百年就在黄土高坡吼秦腔喽,游戏组专门跑切录的原汤原水,听得人汗毛儿都立起来!"
|
||||
}
|
||||
},
|
||||
"text": [
|
||||
["S1", "<|Sichuan|>各位《巴适得板》的听众些,大家好噻!我是你们主持人晶晶。今儿天气硬是巴适,不晓得大家是在赶路嘛,还是茶都泡起咯,准备跟我们好生摆一哈龙门阵喃?"],
|
||||
["S2", "<|Sichuan|>晶晶好哦,大家安逸噻!我是李老倌。你刚开口就川味十足,摆龙门阵几个字一甩出来,我鼻子头都闻到茶香跟火锅香咯!"],
|
||||
["S1", "<|Sichuan|>就是得嘛!李老倌,我前些天带个外地朋友切人民公园鹤鸣茶社坐了一哈。他硬是搞不醒豁,为啥子我们一堆人围到杯茶就可以吹一下午壳子,从隔壁子王嬢嬢娃儿耍朋友,扯到美国大选,中间还掺几盘斗地主。他说我们四川人简直是把摸鱼刻进骨子里头咯!"],
|
||||
["S2", "<|Sichuan|>你那个朋友说得倒是有点儿趣,但他莫看到精髓噻。摆龙门阵哪是摸鱼嘛,这是我们川渝人特有的交际方式,更是一种活法。外省人天天说的松弛感,根根儿就在这龙门阵里头。今天我们就要好生摆一哈,为啥子四川人活得这么舒坦。就先从茶馆这个老窝子说起,看它咋个成了我们四川人的魂儿!"]
|
||||
]
|
||||
}
|
||||
20
example/podcast_script/script_yue.json
Normal file
20
example/podcast_script/script_yue.json
Normal file
@@ -0,0 +1,20 @@
|
||||
{
|
||||
"speakers": {
|
||||
"S1": {
|
||||
"prompt_audio": "example/audios/female_mandarin.wav",
|
||||
"prompt_text": "喜欢攀岩、徒步、滑雪的语言爱好者,以及过两天要带着全部家当去景德镇做陶瓷的白日梦想家。",
|
||||
"dialect_prompt": "<|Yue|>真係冇讲错啊!佢哋制作认真到连背景音乐嘅呼吸声都执到最啱拍子,出亲街访仲要自带三个后备电池,呢种专业精神边度搵啊?我哋成日话学嘢就要学佢哋咁龟毛先得嘛!"
|
||||
},
|
||||
"S2": {
|
||||
"prompt_audio": "example/audios/male_mandarin.wav",
|
||||
"prompt_text": "呃,还有一个就是要跟大家纠正一点,就是我们在看电影的时候,尤其是游戏玩家,看电影的时候,在看到那个到西北那边的这个陕北民谣,嗯,这个可能在想,哎,是不是他是受到了黑神话的启发?",
|
||||
"dialect_prompt": "<|Yue|>真係唔话得!徐生连标点符号都要拗到最啱先收货,成组人晚晚通顶改稿改到天光,呢种摞命搏嘅精神先至係最难得嘎!"
|
||||
}
|
||||
},
|
||||
"text": [
|
||||
["S1", "<|Yue|>哈囉大家好啊,歡迎收聽我哋嘅節目。喂,我今日想問你樣嘢啊,你覺唔覺得,嗯,而家揸電動車,最煩,最煩嘅一樣嘢係咩啊?"],
|
||||
["S2", "<|Yue|>梗係充電啦。大佬啊,搵個位都已經好煩,搵到個位仲要喺度等,你話快極都要半個鐘一個鐘,真係,有時諗起都覺得好冇癮。"],
|
||||
["S1", "<|Yue|>係咪先。如果我而家同你講,充電可以快到同入油差唔多時間,你信唔信先?喂你平時喺油站入滿一缸油,要幾耐啊?五六分鐘?"],
|
||||
["S2", "<|Yue|>差唔多啦,七八分鐘,點都走得啦。電車喎,可以做到咁快?你咪玩啦。"]
|
||||
]
|
||||
}
|
||||
Reference in New Issue
Block a user