diff --git a/.gitattributes b/.gitattributes index 4af4d66f886e69d1f36632fba64a469b1ae5e709..a6344aac8c09253b3b630fb776ae94478aa0275b 100644 --- a/.gitattributes +++ b/.gitattributes @@ -33,94 +33,3 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text *.zip filter=lfs diff=lfs merge=lfs -text *.zst filter=lfs diff=lfs merge=lfs -text *tfevents* filter=lfs diff=lfs merge=lfs -text -MiniMax_Speech.pdf filter=lfs diff=lfs merge=lfs -text -assets/audios/回忆男中年.wav filter=lfs diff=lfs merge=lfs -text -assets/audios/美妆女博主.wav filter=lfs diff=lfs merge=lfs -text -assets/audios/深度访谈男中年.wav filter=lfs diff=lfs merge=lfs -text -assets/audios/体育解说男青年.wav filter=lfs diff=lfs merge=lfs -text -assets/audios/游戏主播女青年.wav filter=lfs diff=lfs merge=lfs -text -assets/audios/直播带货女青年.wav filter=lfs diff=lfs merge=lfs -text -assets/audios/Breaking[[:space:]]Down[[:space:]]Mandarin_OneShot.mp3 filter=lfs diff=lfs merge=lfs -text -assets/audios/Breaking[[:space:]]Down[[:space:]]Mandarin_Prompt.WAV filter=lfs diff=lfs merge=lfs -text -assets/audios/Breaking[[:space:]]Down[[:space:]]Mandarin_Source.WAV filter=lfs diff=lfs merge=lfs -text -assets/audios/Breaking[[:space:]]Down[[:space:]]Mandarin_ZeroShot.mp3 filter=lfs diff=lfs merge=lfs -text -assets/audios/Breathy[[:space:]]ASMR_Sourse.wav filter=lfs diff=lfs merge=lfs -text -assets/audios/Breathy[[:space:]]ASMR.MP3 filter=lfs diff=lfs merge=lfs -text -assets/audios/CoCo_Sourse.mp3 filter=lfs diff=lfs merge=lfs -text -assets/audios/Compelling[[:space:]]and[[:space:]]Persuasive.wav filter=lfs diff=lfs merge=lfs -text -assets/audios/Condition1.wav filter=lfs diff=lfs merge=lfs -text -assets/audios/Condition2.wav filter=lfs diff=lfs merge=lfs -text -assets/audios/Conditon3.wav filter=lfs diff=lfs merge=lfs -text -assets/audios/Czech_Female_Sourse.wav filter=lfs diff=lfs merge=lfs -text -assets/audios/Czech.mp3 filter=lfs diff=lfs merge=lfs -text -assets/audios/ElevenLabs_Breaking[[:space:]]Down[[:space:]]Mandarin.mp3 filter=lfs diff=lfs 
merge=lfs -text -assets/audios/ElevenLabs_English-Mandarin.mp3 filter=lfs diff=lfs merge=lfs -text -assets/audios/ElevenLabs_Japanese_Dominant_Man.mp3 filter=lfs diff=lfs merge=lfs -text -assets/audios/ElevenLabs_Japanese-Korean.mp3 filter=lfs diff=lfs merge=lfs -text -assets/audios/ElevenLabs_Mandarin-English.mp3 filter=lfs diff=lfs merge=lfs -text -assets/audios/ElevenLabs_Neurotic[[:space:]]Teenage[[:space:]]English.mp3 filter=lfs diff=lfs merge=lfs -text -assets/audios/Emma_1.mp3 filter=lfs diff=lfs merge=lfs -text -assets/audios/Emma_2.mp3 filter=lfs diff=lfs merge=lfs -text -assets/audios/English_Radiant_Girl_Sourse.wav filter=lfs diff=lfs merge=lfs -text -assets/audios/English-Mandarin.wav filter=lfs diff=lfs merge=lfs -text -assets/audios/English-Spanish.wav filter=lfs diff=lfs merge=lfs -text -assets/audios/Explanatory[[:space:]]Broad[[:space:]]Emotional.wav filter=lfs diff=lfs merge=lfs -text -assets/audios/Explanatory[[:space:]]Supernatural[[:space:]]Prosody.MP3 filter=lfs diff=lfs merge=lfs -text -assets/audios/FlowVAE1.wav filter=lfs diff=lfs merge=lfs -text -assets/audios/FlowVAE2.wav filter=lfs diff=lfs merge=lfs -text -assets/audios/FlowVAE3.wav filter=lfs diff=lfs merge=lfs -text -assets/audios/Japanese_DominantMan_Sourse.mp3 filter=lfs diff=lfs merge=lfs -text -assets/audios/Japanese-Korean.mp3 filter=lfs diff=lfs merge=lfs -text -assets/audios/Japanese.mp3 filter=lfs diff=lfs merge=lfs -text -assets/audios/JosephBrodsky_Fast.mp3 filter=lfs diff=lfs merge=lfs -text -assets/audios/JosephBrodsky_PVC.mp3 filter=lfs diff=lfs merge=lfs -text -assets/audios/JosephBrodsky_Source.wav filter=lfs diff=lfs merge=lfs -text -assets/audios/Lucky[[:space:]]Robot_Sourse.wav filter=lfs diff=lfs merge=lfs -text -assets/audios/Lucky[[:space:]]Robot.mp3 filter=lfs diff=lfs merge=lfs -text -assets/audios/Lyrical[[:space:]]Cantonese_Oneshot.mp3 filter=lfs diff=lfs merge=lfs -text -assets/audios/Lyrical[[:space:]]Cantonese_Prompt.WAV filter=lfs diff=lfs merge=lfs -text 
-assets/audios/Lyrical[[:space:]]Cantonese_Source.WAV filter=lfs diff=lfs merge=lfs -text -assets/audios/Lyrical[[:space:]]Cantonese_ZeroShot.mp3 filter=lfs diff=lfs merge=lfs -text -assets/audios/Mandarin_Refreshing_Young_Man_Sourse.mp3 filter=lfs diff=lfs merge=lfs -text -assets/audios/Mandarin-Cantonese.wav filter=lfs diff=lfs merge=lfs -text -assets/audios/Mandarin-English.WAV filter=lfs diff=lfs merge=lfs -text -assets/audios/Marketing_Voice_Sourse.wav filter=lfs diff=lfs merge=lfs -text -assets/audios/Murmur-Excitement-Anger-[[:space:]]Whispers.MP3 filter=lfs diff=lfs merge=lfs -text -assets/audios/Nancy_1.mp3 filter=lfs diff=lfs merge=lfs -text -assets/audios/Nancy_2.mp3 filter=lfs diff=lfs merge=lfs -text -assets/audios/Neurotic[[:space:]]Teenage[[:space:]]English_OneShot.MP3 filter=lfs diff=lfs merge=lfs -text -assets/audios/Neurotic[[:space:]]Teenage[[:space:]]English_ZeroShot.MP3 filter=lfs diff=lfs merge=lfs -text -assets/audios/Neurotic[[:space:]]Teenage[[:space:]]English.MP3 filter=lfs diff=lfs merge=lfs -text -assets/audios/Neutral-Rage-Reminiscence-Weeping.MP3 filter=lfs diff=lfs merge=lfs -text -assets/audios/Onee-san_Sourse.wav filter=lfs diff=lfs merge=lfs -text -assets/audios/Onee-san.wav filter=lfs diff=lfs merge=lfs -text -assets/audios/OpenAI_Breaking[[:space:]]Down[[:space:]]Mandarin.mp3 filter=lfs diff=lfs merge=lfs -text -assets/audios/OpenAI_English-Mandarin.mp3 filter=lfs diff=lfs merge=lfs -text -assets/audios/OpenAI_Japanese-Korean.mp3 filter=lfs diff=lfs merge=lfs -text -assets/audios/OpenAI_Japanese.mp3 filter=lfs diff=lfs merge=lfs -text -assets/audios/OpenAI_Neurotic[[:space:]]Teenage[[:space:]]English.mp3 filter=lfs diff=lfs merge=lfs -text -assets/audios/Polish_Male_Sourse.wav filter=lfs diff=lfs merge=lfs -text -assets/audios/Powerful_Girl_Sourse.mp3 filter=lfs diff=lfs merge=lfs -text -assets/audios/Quirky[[:space:]]Female[[:space:]]English.MP3 filter=lfs diff=lfs merge=lfs -text -assets/audios/Radiant_Girl_1.mp3 filter=lfs 
diff=lfs merge=lfs -text -assets/audios/Science_Voice_Sourse.wav filter=lfs diff=lfs merge=lfs -text -assets/audios/ShiBanYu_Sourse.mp3 filter=lfs diff=lfs merge=lfs -text -assets/audios/ShuanQ_Sourse.mp3 filter=lfs diff=lfs merge=lfs -text -assets/audios/Sociology_Sourse.mp3 filter=lfs diff=lfs merge=lfs -text -assets/audios/Spanish-English.wav filter=lfs diff=lfs merge=lfs -text -assets/audios/Thai_Male_Sourse.wav filter=lfs diff=lfs merge=lfs -text -assets/audios/TianJin_PVC.mp3 filter=lfs diff=lfs merge=lfs -text -assets/audios/TianJin_Source.wav filter=lfs diff=lfs merge=lfs -text -assets/audios/VAE1.wav filter=lfs diff=lfs merge=lfs -text -assets/audios/VAE2.wav filter=lfs diff=lfs merge=lfs -text -assets/audios/VAE3.wav filter=lfs diff=lfs merge=lfs -text -assets/audios/Vietnamese_Female_Sourse.wav filter=lfs diff=lfs merge=lfs -text -assets/audios/Warm[[:space:]]and[[:space:]]Magnetic_Sourse.mp3 filter=lfs diff=lfs merge=lfs -text -assets/audios/Warm[[:space:]]and[[:space:]]Magnetic.mp3 filter=lfs diff=lfs merge=lfs -text -assets/audios/Wong_Sourse.mp3 filter=lfs diff=lfs merge=lfs -text -assets/images/header-bg.jpeg filter=lfs diff=lfs merge=lfs -text -assets/images/system-overview.jpg filter=lfs diff=lfs merge=lfs -text -*.wav filter=lfs diff=lfs merge=lfs -text -*.mp3 filter=lfs diff=lfs merge=lfs -text -*.WAV filter=lfs diff=lfs merge=lfs -text -*.MP3 filter=lfs diff=lfs merge=lfs -text diff --git a/Mandarin-Cantonese.wav b/Mandarin-Cantonese.wav deleted file mode 100644 index 31906154322eaab4eedf27b98d980f29e99d0775..0000000000000000000000000000000000000000 --- a/Mandarin-Cantonese.wav +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:58e92479f1bdcfe373512963369ce3656ea6526adb2e647e9a0165434d43b5f3 -size 12680134 diff --git a/MiniMax_Speech.pdf b/MiniMax_Speech.pdf deleted file mode 100644 index 723c027ae81ed29ded368d7022a4f1cffa9095a7..0000000000000000000000000000000000000000 --- a/MiniMax_Speech.pdf +++ /dev/null 
@@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:2d9498aa5fb7f8ca0382b1ddc28b3c57270198efa54e76e5cea0028c103df72b -size 1828673 diff --git a/Onee-san_Sourse.wav b/Onee-san_Sourse.wav deleted file mode 100644 index 8f45a99fe64a5031c866d83eade99fb5ecbb7ab2..0000000000000000000000000000000000000000 --- a/Onee-san_Sourse.wav +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:7b46285788ca5ff9bae286396f9a2aeeb6d3c1259b4e8c9e46caccf4b9dcd9e6 -size 13137536 diff --git a/README.md b/README.md index b35ac744d014c30f115ec28b8e1695c0a706b4a7..6ab188518e3bee2f8457c40ddeb38d796837ff6f 100644 --- a/README.md +++ b/README.md @@ -1,26 +1,10 @@ --- -title: MiniMax Speech Tech Report -emoji: 🎙️ +title: MiniMax Speech 02 +emoji: 📊 colorFrom: indigo colorTo: green sdk: static pinned: false --- -Here are our latest tech reports: - -- [MiniMax Speech Tech Report](https://minimax-ai.github.io/tts_tech_report/) - -Citation - -``` -@misc{minimax2025minimaxspeechintrinsiczeroshottexttospeech, - title={MiniMax-Speech: Intrinsic Zero-Shot Text-to-Speech with a Learnable Speaker Encoder}, - author={Bowen Zhang, Congchao Guo, Geng Yang, Hang Yu, Haozhe Zhang, Heidi Lei, Jialong Mai, Junjie Yan, Kaiyue Yang, Mingqi Yang, Peikai Huang, Ruiyang Jin, Sitan Jiang, Weihua Cheng, Yawei Li, Yichen Xiao, Yiying Zhou, Yongmao Zhang, Yuan Lu, Yucen He}, - year={2025}, - eprint={2505.07916}, - archivePrefix={arXiv}, - primaryClass={eess.AS}, - url={https://arxiv.org/abs/2505.07916}, -} -``` \ No newline at end of file +Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference diff --git a/assets/audios/Angry.mp3 b/assets/audios/Angry.mp3 deleted file mode 100644 index 9300322d72edc7f6bbdbeed866db54ce62eec223..0000000000000000000000000000000000000000 --- a/assets/audios/Angry.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid 
sha256:cb31b4518cccc69715e4eb05dafdcf8367c2d4bebefd2dc06b47e88540f077d5 -size 44972 diff --git a/assets/audios/Breaking Down Mandarin_OneShot.mp3 b/assets/audios/Breaking Down Mandarin_OneShot.mp3 deleted file mode 100644 index 8cb0b2bb18747b94d9d80478c00e3f24db6360cb..0000000000000000000000000000000000000000 --- a/assets/audios/Breaking Down Mandarin_OneShot.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d4f1094d3626532f61b59199c5cfa3a99b297006fc6624fa961858c427ca7b1b -size 178412 diff --git a/assets/audios/Breaking Down Mandarin_Prompt.WAV b/assets/audios/Breaking Down Mandarin_Prompt.WAV deleted file mode 100644 index 7e18e472743960f9ab49b829bb51556ae4aaa604..0000000000000000000000000000000000000000 --- a/assets/audios/Breaking Down Mandarin_Prompt.WAV +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:a2fdd1847813b850456b048197f6f7d4137eccb5f400b0784d924f5c903c9bcd -size 7525598 diff --git a/assets/audios/Breaking Down Mandarin_Source.WAV b/assets/audios/Breaking Down Mandarin_Source.WAV deleted file mode 100644 index eb74bf1cfc8373067c14cfd81b83a08cc28a5bb1..0000000000000000000000000000000000000000 --- a/assets/audios/Breaking Down Mandarin_Source.WAV +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:58c3cb652de3e0ff25cdff880dbf8679b9254c2985f5b803b3abbb47df749a9e -size 24609542 diff --git a/assets/audios/Breaking Down Mandarin_ZeroShot.mp3 b/assets/audios/Breaking Down Mandarin_ZeroShot.mp3 deleted file mode 100644 index fee0b8a45e32502736d487cd9074645ca842e46c..0000000000000000000000000000000000000000 --- a/assets/audios/Breaking Down Mandarin_ZeroShot.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:8f05dabe3e4d954cd51d7ceff25a924d649c841b269b94463b04c7cc3b46ad43 -size 171692 diff --git a/assets/audios/Breathy ASMR.MP3 b/assets/audios/Breathy ASMR.MP3 deleted file mode 100644 index 
7bb7d5fd60708e595e0b2438a297e5a0db335ca2..0000000000000000000000000000000000000000 --- a/assets/audios/Breathy ASMR.MP3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:722f596eb6c2b7a1b75442c35db631ded6e52db48b9b2cc94e7dd52745a21bdc -size 501183 diff --git a/assets/audios/Breathy ASMR_Sourse.wav b/assets/audios/Breathy ASMR_Sourse.wav deleted file mode 100644 index 11fbe3f4418a757d2b369b3451ab3fdd8397df40..0000000000000000000000000000000000000000 --- a/assets/audios/Breathy ASMR_Sourse.wav +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:961d88c6873af93776bb565086a8ce56c551f9ea5b57687ce214c0bda08f1102 -size 48650554 diff --git a/assets/audios/CoCo_Sourse.mp3 b/assets/audios/CoCo_Sourse.mp3 deleted file mode 100644 index e20d44a8210a98f0cdd917767b11d7ac7ba71b2f..0000000000000000000000000000000000000000 --- a/assets/audios/CoCo_Sourse.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:0880beb0ede519e88d7d250d8621490de0fea087636e8dd38c4adc715d4b1493 -size 469484 diff --git a/assets/audios/Compelling and Persuasive.wav b/assets/audios/Compelling and Persuasive.wav deleted file mode 100644 index bff0f110745f1cb1f8058f941c04a850d6ff75e8..0000000000000000000000000000000000000000 --- a/assets/audios/Compelling and Persuasive.wav +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:1b2dfcda010a1a5c9cfd347819e5e93f0f7798edefdc00247688a1e0cd3f5e88 -size 86784102 diff --git a/assets/audios/Condition1.wav b/assets/audios/Condition1.wav deleted file mode 100644 index b159ab70c4e152edcbfc7e2ccbe5922e49da002f..0000000000000000000000000000000000000000 --- a/assets/audios/Condition1.wav +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:5c8e467fd8fad0532bd1f07d18d9bf66ab49e9e41d5abd76ed7e7a732c48bae1 -size 1190502 diff --git a/assets/audios/Condition2.wav b/assets/audios/Condition2.wav deleted file mode 
100644 index dd85cc6658c3310b3c59f542b1ce6be63604a90a..0000000000000000000000000000000000000000 --- a/assets/audios/Condition2.wav +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:3423e027486d816a7cc42e00e4348d709fe1c5b2c2a204b7c9235fefd5fad3d2 -size 2402418 diff --git a/assets/audios/Conditon3.wav b/assets/audios/Conditon3.wav deleted file mode 100644 index 0820bace8be3b15bf81d1b88c53cefdcd9991800..0000000000000000000000000000000000000000 --- a/assets/audios/Conditon3.wav +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e2e0a030ac2458d3bfced27c02d41ae74bd9487892c5a196d194f21a65ba43ce -size 2525298 diff --git a/assets/audios/Czech.mp3 b/assets/audios/Czech.mp3 deleted file mode 100644 index 393100a4a62e50731569fa5e0fd9115e82019b04..0000000000000000000000000000000000000000 --- a/assets/audios/Czech.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:6861406b335a4c4f6834276b4ee692cef7954ee36dacc1deeed248501130be3d -size 258048 diff --git a/assets/audios/Czech_Female_Sourse.wav b/assets/audios/Czech_Female_Sourse.wav deleted file mode 100644 index 2a011d3bf545150689dd86464384d3969204b524..0000000000000000000000000000000000000000 --- a/assets/audios/Czech_Female_Sourse.wav +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:ce4148eddb7bb435ce47e7ec7a58ad3d0a49a927311b48470ae1ebae4911ecb3 -size 19901650 diff --git a/assets/audios/Disgusted.mp3 b/assets/audios/Disgusted.mp3 deleted file mode 100644 index ef3bf8bbe8df07b1d300753411549ea11ecf2267..0000000000000000000000000000000000000000 --- a/assets/audios/Disgusted.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:bf5021f78be6a17303092791b63043f5415dc5a85c88aec30f88bdc722144afa -size 49580 diff --git a/assets/audios/ElevenLabs_Breaking Down Mandarin.mp3 b/assets/audios/ElevenLabs_Breaking Down Mandarin.mp3 deleted file mode 100644 index 
a22a89048215b37aeaf17b8dfb31ec1f0dbb8dc8..0000000000000000000000000000000000000000 --- a/assets/audios/ElevenLabs_Breaking Down Mandarin.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:a2ecb8ae7c390bfef06a520857ce3686f0ed93d378120e5483720916eb317d83 -size 159212 diff --git a/assets/audios/ElevenLabs_Czech.mp3 b/assets/audios/ElevenLabs_Czech.mp3 deleted file mode 100644 index cdd98922ceaa71f0b99876fda78be47e1925cac3..0000000000000000000000000000000000000000 --- a/assets/audios/ElevenLabs_Czech.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:ad5799f0fa3b0eb76d7eca47b1fd9becbf04d6157d8e776c21ac338f13e3987c -size 66092 diff --git a/assets/audios/ElevenLabs_English-Mandarin.mp3 b/assets/audios/ElevenLabs_English-Mandarin.mp3 deleted file mode 100644 index 0acb55dbb0b81cce61fdf15500364505e79f76e3..0000000000000000000000000000000000000000 --- a/assets/audios/ElevenLabs_English-Mandarin.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:773a84baa079b800972b9d660473f1076c57d78906a6393aa58d7d7885e6e2fe -size 144236 diff --git a/assets/audios/ElevenLabs_English-Spanish.mp3 b/assets/audios/ElevenLabs_English-Spanish.mp3 deleted file mode 100644 index cafaccab99268348a0bbc6370f3fffb32bd3eced..0000000000000000000000000000000000000000 --- a/assets/audios/ElevenLabs_English-Spanish.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:4312e7436fb7f6c3eeea4ccb690e9c611e609d8f2b058f4dab7fdccb8ccc5ff3 -size 84716 diff --git a/assets/audios/ElevenLabs_Japanese-Korean.mp3 b/assets/audios/ElevenLabs_Japanese-Korean.mp3 deleted file mode 100644 index 6316cd1e4d0f1a025f6db10bf0bcb0fbdd1b9cbd..0000000000000000000000000000000000000000 --- a/assets/audios/ElevenLabs_Japanese-Korean.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:9b63a6e7e9a5f92cb6515dd076b6b2e9b85bc6d97328381c0828cb54819ce3f8 
-size 181292 diff --git a/assets/audios/ElevenLabs_Japanese_Dominant_Man.mp3 b/assets/audios/ElevenLabs_Japanese_Dominant_Man.mp3 deleted file mode 100644 index 220ac7956a5063c0fcf4ee672aa0ffa1b5c6a06f..0000000000000000000000000000000000000000 --- a/assets/audios/ElevenLabs_Japanese_Dominant_Man.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:efc0f1aecf60ddeef39f80e9dbcbc23495aec893284212fe3ef56e8ede136e36 -size 106604 diff --git a/assets/audios/ElevenLabs_Mandarin-English.mp3 b/assets/audios/ElevenLabs_Mandarin-English.mp3 deleted file mode 100644 index 251443fdc2ae3992a54eecf3c62464f23e47c312..0000000000000000000000000000000000000000 --- a/assets/audios/ElevenLabs_Mandarin-English.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c3ea274ace47a8b5e4d6c5d96296012abf8d9e1b2c7a610f8acca3ad927fe5c2 -size 221804 diff --git a/assets/audios/ElevenLabs_Neurotic Teenage English.mp3 b/assets/audios/ElevenLabs_Neurotic Teenage English.mp3 deleted file mode 100644 index c3f056650b332d74adf924b1dad974704d58c543..0000000000000000000000000000000000000000 --- a/assets/audios/ElevenLabs_Neurotic Teenage English.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:1d6f8d74ebe04c46b23f6546d2d7f52b697b0f37dbadaf05615508ea390adf46 -size 120428 diff --git a/assets/audios/ElevenLabs_Polish.mp3 b/assets/audios/ElevenLabs_Polish.mp3 deleted file mode 100644 index 14f0785a98f46462ccecc6f9054c63275cae6e43..0000000000000000000000000000000000000000 --- a/assets/audios/ElevenLabs_Polish.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:3ab31b881427dd7cd65603b62ed059035b8f817c930af4c12e478b437f84dd62 -size 59948 diff --git a/assets/audios/ElevenLabs_Polishmale.mp3 b/assets/audios/ElevenLabs_Polishmale.mp3 deleted file mode 100644 index 14f0785a98f46462ccecc6f9054c63275cae6e43..0000000000000000000000000000000000000000 --- 
a/assets/audios/ElevenLabs_Polishmale.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:3ab31b881427dd7cd65603b62ed059035b8f817c930af4c12e478b437f84dd62 -size 59948 diff --git a/assets/audios/ElevenLabs_Quirky Female English.mp3 b/assets/audios/ElevenLabs_Quirky Female English.mp3 deleted file mode 100644 index b950ae63b160d634bb127e0341f794e803d8679e..0000000000000000000000000000000000000000 --- a/assets/audios/ElevenLabs_Quirky Female English.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:def7580f004debe027500fd484d44551194db9c6de2bbe1db6002f14b5e88dd8 -size 72236 diff --git a/assets/audios/ElevenLabs_Thai.mp3 b/assets/audios/ElevenLabs_Thai.mp3 deleted file mode 100644 index 27dddff66c01c208e53e122dfb03856ff3862306..0000000000000000000000000000000000000000 --- a/assets/audios/ElevenLabs_Thai.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:209adbe0288e52cb78a0767e684e056bafcb6c492c6c1410832563b6aa06801e -size 59180 diff --git a/assets/audios/ElevenLabs_Vietnamese.mp3 b/assets/audios/ElevenLabs_Vietnamese.mp3 deleted file mode 100644 index 7df52c5eb1d2ad5451144f8edf002a699c40a016..0000000000000000000000000000000000000000 --- a/assets/audios/ElevenLabs_Vietnamese.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c36c8ab12fdb4cddd6d7ea6da3ef66d3fb55d32922eb406172b429dc98172cbb -size 52652 diff --git a/assets/audios/Emma_1.mp3 b/assets/audios/Emma_1.mp3 deleted file mode 100644 index 9d0a4b95dfc69930e4f5ae54143e25cadd845857..0000000000000000000000000000000000000000 --- a/assets/audios/Emma_1.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d6a7ae38ab8d1c9dd3fa0d302be6f326fdf65b117fec8130841e3e2c554945cc -size 173420 diff --git a/assets/audios/Emma_2.mp3 b/assets/audios/Emma_2.mp3 deleted file mode 100644 index 
020fb4e65b38641be8c7d4d223c1cecf48820240..0000000000000000000000000000000000000000 --- a/assets/audios/Emma_2.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e00591194b8e369d213ed962cb6d55ed4aad2452769dc34f30239f555491fb7a -size 207212 diff --git a/assets/audios/English-Mandarin.wav b/assets/audios/English-Mandarin.wav deleted file mode 100644 index 587558f6d91eb9ddf078004acdb2db98033e16a1..0000000000000000000000000000000000000000 --- a/assets/audios/English-Mandarin.wav +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:710e10dc1da70e2ad8a5018e3d7dffd6af95f15f8353df56aa92c8d4c58f0200 -size 13362242 diff --git a/assets/audios/English-Spanish.wav b/assets/audios/English-Spanish.wav deleted file mode 100644 index f9fcf3c92920b85fe14a07dcb74a6f6f205db80b..0000000000000000000000000000000000000000 --- a/assets/audios/English-Spanish.wav +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:9025271f908910cf7bc7d7bb23418af4ad7faefb472928bf67066731bc529def -size 4471252 diff --git a/assets/audios/English_Radiant_Girl_Sourse.wav b/assets/audios/English_Radiant_Girl_Sourse.wav deleted file mode 100644 index 28b50aa44f411db85abf3bd57486ac370837d83a..0000000000000000000000000000000000000000 --- a/assets/audios/English_Radiant_Girl_Sourse.wav +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:fcf70df56aeb03ee242a98d17563fde7695ccf068c89f20bebc6294bc3517bad -size 17280102 diff --git a/assets/audios/Explanatory Broad Emotional.wav b/assets/audios/Explanatory Broad Emotional.wav deleted file mode 100644 index 8754674bf5c1f8e1f2a673290e133f4134a8e0dc..0000000000000000000000000000000000000000 --- a/assets/audios/Explanatory Broad Emotional.wav +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:77db883f13fb78866e095ff1b36b2fe6506fada6e84fd95b438048300eea403a -size 52224102 diff --git 
a/assets/audios/Explanatory Supernatural Prosody.MP3 b/assets/audios/Explanatory Supernatural Prosody.MP3 deleted file mode 100644 index b57ffe5bd9f91d483e6ccfd0d13551d8db52e7bf..0000000000000000000000000000000000000000 --- a/assets/audios/Explanatory Supernatural Prosody.MP3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:4a9993a82a9d0519a695caf0091be9bbc2c623031b670151fabb85815f6f1852 -size 729068 diff --git a/assets/audios/Fearful.mp3 b/assets/audios/Fearful.mp3 deleted file mode 100644 index 7315f25b46edd524403b9d4d2e5ba5bc43976ac8..0000000000000000000000000000000000000000 --- a/assets/audios/Fearful.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:5fe3b587489c66d1a74ca52b6fae8ef87beda36389841c60a37f4264999e2082 -size 67244 diff --git a/assets/audios/FlowVAE1.wav b/assets/audios/FlowVAE1.wav deleted file mode 100644 index c1b68db4f3a3e666877863884325312b8c56626e..0000000000000000000000000000000000000000 --- a/assets/audios/FlowVAE1.wav +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:aad56ad937dc46634605218683693d66058839ae4d2d501e8562e29588db3a5c -size 1772754 diff --git a/assets/audios/FlowVAE2.wav b/assets/audios/FlowVAE2.wav deleted file mode 100644 index 2061e075b42fcba538307fc66efa6190e90f6e08..0000000000000000000000000000000000000000 --- a/assets/audios/FlowVAE2.wav +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:0a93bd69061671e7565c6015c317c2d3fcf757c969643b54dc370d693e365170 -size 1545390 diff --git a/assets/audios/FlowVAE3.wav b/assets/audios/FlowVAE3.wav deleted file mode 100644 index f6cecd0641e34a8e57f8a55b665691a808ee19ea..0000000000000000000000000000000000000000 --- a/assets/audios/FlowVAE3.wav +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f1deee73f88606cfd5e8a8f520fdbd3cd9d075c607d9a93167a64995580e02f2 -size 2004582 diff --git a/assets/audios/Happy.mp3 
b/assets/audios/Happy.mp3 deleted file mode 100644 index 7f1339ed1134f6a9b51e98fc8746f2de63af2566..0000000000000000000000000000000000000000 --- a/assets/audios/Happy.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:93bb9837b0989d5baa1063dc8e2d81561694f0852739518c044cb2b1c9a2341a -size 51884 diff --git a/assets/audios/Japanese-Korean.mp3 b/assets/audios/Japanese-Korean.mp3 deleted file mode 100644 index 7927355f177d4eccfcf33a192cc38f2ae96d6830..0000000000000000000000000000000000000000 --- a/assets/audios/Japanese-Korean.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:7c041606f741082540f2f732a55a9964b242b14957f01955f2a1acb879d238c0 -size 356588 diff --git a/assets/audios/Japanese.mp3 b/assets/audios/Japanese.mp3 deleted file mode 100644 index 2e9303f8cc291563291eabdd66ce629ab6bd10b5..0000000000000000000000000000000000000000 --- a/assets/audios/Japanese.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:56dff2d3624bad3195f5d4753c75c7ded64885fcb6362f985be4f240c8128036 -size 102572 diff --git a/assets/audios/Japanese_DominantMan_Sourse.mp3 b/assets/audios/Japanese_DominantMan_Sourse.mp3 deleted file mode 100644 index 4a393cda2e4c3ed829e8aa97e2d6edc2a0464236..0000000000000000000000000000000000000000 --- a/assets/audios/Japanese_DominantMan_Sourse.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:392b29ba63cf4cb42239104433515d389988e939a02f873b71b5270b0266a6c7 -size 477164 diff --git a/assets/audios/Joanna_1.mp3 b/assets/audios/Joanna_1.mp3 deleted file mode 100644 index c4eea8f50787935404ada5df7630f79a35cf8d0e..0000000000000000000000000000000000000000 --- a/assets/audios/Joanna_1.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d567615c7e52659de134b1842d8f8fcd05e8ab0c110831e0d2d0512806040548 -size 73196 diff --git a/assets/audios/Joanna_2.mp3 b/assets/audios/Joanna_2.mp3 
deleted file mode 100644 index 0ce38327ea6c0ba22f8f6e8d9adff917eaad1857..0000000000000000000000000000000000000000 --- a/assets/audios/Joanna_2.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:5acf931d0c797e1d76a3cdd494d487da4eb07fac41937003eaba995f7cc7f4b5 -size 87596 diff --git a/assets/audios/JosephBrodsky_Fast.mp3 b/assets/audios/JosephBrodsky_Fast.mp3 deleted file mode 100644 index d370e561b78d7084434f1c0dddab95d3a9006793..0000000000000000000000000000000000000000 --- a/assets/audios/JosephBrodsky_Fast.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c0ae4a684a675b8d031703c250fd2e93e485d64e933b9922319d2e5026f078ee -size 196076 diff --git a/assets/audios/JosephBrodsky_PVC.mp3 b/assets/audios/JosephBrodsky_PVC.mp3 deleted file mode 100644 index e53837d5299fe5d4b851b92e3d678bf84a87a867..0000000000000000000000000000000000000000 --- a/assets/audios/JosephBrodsky_PVC.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:fd799ec35ab00adff5874297cca0b22c528da17459544f64220ebd9601f6b251 -size 211820 diff --git a/assets/audios/JosephBrodsky_Source.wav b/assets/audios/JosephBrodsky_Source.wav deleted file mode 100644 index de336eb497d499cb04c0bab4d613e288f4bd7977..0000000000000000000000000000000000000000 --- a/assets/audios/JosephBrodsky_Source.wav +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:4c63dcdcb0418dca9a7460d50234472fd318e006927a024c034524c8c7a91091 -size 5376102 diff --git a/assets/audios/Korean.mp3 b/assets/audios/Korean.mp3 deleted file mode 100644 index ace82096b814c52c835afb4b35d6c6873a7a47d0..0000000000000000000000000000000000000000 --- a/assets/audios/Korean.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:16e281b47cc0208447ee106a7a5addaa4f31e95e852ee770d756e7fec2198611 -size 93164 diff --git a/assets/audios/Lucky Robot.mp3 b/assets/audios/Lucky Robot.mp3 deleted 
file mode 100644 index e412257e810e78b9154ac186d1dd86acc94e7515..0000000000000000000000000000000000000000 --- a/assets/audios/Lucky Robot.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:6e1dbc1756bcf6506ff6215df65b00bb2ad99cdd411e30452499d90d2b59544c -size 155948 diff --git a/assets/audios/Lucky Robot_Sourse.wav b/assets/audios/Lucky Robot_Sourse.wav deleted file mode 100644 index fd96160779e8ff3e1800a0387e040d570ea3e4a5..0000000000000000000000000000000000000000 --- a/assets/audios/Lucky Robot_Sourse.wav +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:ffd296e5170e7c35e7ac10d31624d37efbf97a5a0447fe7bc903d6cbf8606944 -size 6755334 diff --git a/assets/audios/Lyrical Cantonese_Oneshot.mp3 b/assets/audios/Lyrical Cantonese_Oneshot.mp3 deleted file mode 100644 index 31cb32e60ce28680ecc35603bc76d7cd1f4ae2d2..0000000000000000000000000000000000000000 --- a/assets/audios/Lyrical Cantonese_Oneshot.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:71ccfe7b699c56612403fb3c9b2fe1e3783f37b8c6ece6b5ee4a2939d1db1e30 -size 355628 diff --git a/assets/audios/Lyrical Cantonese_Prompt.WAV b/assets/audios/Lyrical Cantonese_Prompt.WAV deleted file mode 100644 index a304a03aa78ff402b81d8eaa8b5f12327daa7812..0000000000000000000000000000000000000000 --- a/assets/audios/Lyrical Cantonese_Prompt.WAV +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:892403bae0a7014ff19b6d774a9bc98a2f946312df2389071a9f1a5e5cae68f4 -size 7703926 diff --git a/assets/audios/Lyrical Cantonese_Source.WAV b/assets/audios/Lyrical Cantonese_Source.WAV deleted file mode 100644 index f7ede83c24bbf10b462ccbf40c74590515948f32..0000000000000000000000000000000000000000 --- a/assets/audios/Lyrical Cantonese_Source.WAV +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:dc1efa7f412ea28a22276167db006775e77a1026e50dfd9f4dcd4be0b4c39508 -size 
31653546 diff --git a/assets/audios/Lyrical Cantonese_ZeroShot.mp3 b/assets/audios/Lyrical Cantonese_ZeroShot.mp3 deleted file mode 100644 index 629f36e6f38504f0dc9e160879d14120fab21b4a..0000000000000000000000000000000000000000 --- a/assets/audios/Lyrical Cantonese_ZeroShot.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:9e4730cc68baabb905c68bf9a2a9657ea451626221bc95fb2188b2cf977e4472 -size 249644 diff --git a/assets/audios/Mandarin-Cantonese.MP3 b/assets/audios/Mandarin-Cantonese.MP3 deleted file mode 100644 index d7350653288d36c3b15f4611f3aecee054dc2539..0000000000000000000000000000000000000000 --- a/assets/audios/Mandarin-Cantonese.MP3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:80d84db1fd98b97a2c0e99a99ce0bb42e1b189dae47859348f6f08a9931b8952 -size 265036 diff --git a/assets/audios/Mandarin-Cantonese.wav b/assets/audios/Mandarin-Cantonese.wav deleted file mode 100644 index 31906154322eaab4eedf27b98d980f29e99d0775..0000000000000000000000000000000000000000 --- a/assets/audios/Mandarin-Cantonese.wav +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:58e92479f1bdcfe373512963369ce3656ea6526adb2e647e9a0165434d43b5f3 -size 12680134 diff --git a/assets/audios/Mandarin-English.WAV b/assets/audios/Mandarin-English.WAV deleted file mode 100644 index 831fdacc589e629cfdfca03abc36dbc3f3ff3078..0000000000000000000000000000000000000000 --- a/assets/audios/Mandarin-English.WAV +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:58e92479f1bdcfe373512963369ce3656ea6526adb2e647e9a0165434d43b5f3 -size 11145682 diff --git a/assets/audios/Mandarin_Refreshing_Young_Man_Sourse.mp3 b/assets/audios/Mandarin_Refreshing_Young_Man_Sourse.mp3 deleted file mode 100644 index 8c0829dc3a1cb9bc82e8cc96215aa69c3d8def80..0000000000000000000000000000000000000000 --- a/assets/audios/Mandarin_Refreshing_Young_Man_Sourse.mp3 +++ /dev/null @@ -1,3 +0,0 
@@ -version https://git-lfs.github.com/spec/v1 -oid sha256:46965e3f90f9b6a6271898645dfe44bb2964b9e623ad74775fc33bcff26e277c -size 514028 diff --git a/assets/audios/Marketing_Voice_Sourse.wav b/assets/audios/Marketing_Voice_Sourse.wav deleted file mode 100644 index 826f56c2566b3fa58c9ade964be605b4c91a49f0..0000000000000000000000000000000000000000 --- a/assets/audios/Marketing_Voice_Sourse.wav +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:5c258ea4ea588fd9ec228f49650bc97828151539c6d70e8f4f0a726505990430 -size 3951054 diff --git a/assets/audios/Murmur-Excitement-Anger- Whispers.MP3 b/assets/audios/Murmur-Excitement-Anger- Whispers.MP3 deleted file mode 100644 index 98de9d20adb21ed42c1a9a3f26552b3475bbe198..0000000000000000000000000000000000000000 --- a/assets/audios/Murmur-Excitement-Anger- Whispers.MP3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:ede011827c1e33855114063d7b4ddf59ce054011b2a81db8eaf1092b5f3d4e91 -size 689900 diff --git a/assets/audios/Nancy_1.mp3 b/assets/audios/Nancy_1.mp3 deleted file mode 100644 index 0bc9224822770ca82fa098278ce96e044e855011..0000000000000000000000000000000000000000 --- a/assets/audios/Nancy_1.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:9900e2e204c5bc0fa0ca7a1972facc30f0dc0222229ef6b66f37f4a14677e540 -size 172268 diff --git a/assets/audios/Nancy_2.mp3 b/assets/audios/Nancy_2.mp3 deleted file mode 100644 index 7cd5db6d7674e7b35fbe3fc1d19f83af1f291352..0000000000000000000000000000000000000000 --- a/assets/audios/Nancy_2.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:139a3236fec43393689ad11a2f1d55b868849dc5e820a9c17b462062098b452c -size 196844 diff --git a/assets/audios/Neurotic Teenage English.MP3 b/assets/audios/Neurotic Teenage English.MP3 deleted file mode 100644 index cc8421be0520293d4b1dc771b10f30a12320da41..0000000000000000000000000000000000000000 --- 
a/assets/audios/Neurotic Teenage English.MP3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e3e349a108a792e1a96fca6c0ab88e183712c0b0b5c3aa675cc6509f02242624 -size 360812 diff --git a/assets/audios/Neurotic Teenage English_OneShot.MP3 b/assets/audios/Neurotic Teenage English_OneShot.MP3 deleted file mode 100644 index 0921868a616aa29a54657ef2f425c548af20ab3c..0000000000000000000000000000000000000000 --- a/assets/audios/Neurotic Teenage English_OneShot.MP3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:69769c49b3d1ae0e834cbafc2e4badce3dd993fba41eddbad3e3991d8d141e78 -size 156908 diff --git a/assets/audios/Neurotic Teenage English_Prompt.MP3 b/assets/audios/Neurotic Teenage English_Prompt.MP3 deleted file mode 100644 index 2b3c7ad630099d23a434bb59dd12542d96b673cc..0000000000000000000000000000000000000000 --- a/assets/audios/Neurotic Teenage English_Prompt.MP3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:33774ed6215a44a8666eeec8287af06db36ff02b60ae890a2edb93cd22092a17 -size 91244 diff --git a/assets/audios/Neurotic Teenage English_ZeroShot.MP3 b/assets/audios/Neurotic Teenage English_ZeroShot.MP3 deleted file mode 100644 index 8ba6d5c38c0e3181ab07da2ac0bc8cf694610efd..0000000000000000000000000000000000000000 --- a/assets/audios/Neurotic Teenage English_ZeroShot.MP3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:afaeaedf6cda34ea2798ccbab5bd7743d9773708b2e707d1cc3e9841bf0b48f2 -size 275067 diff --git a/assets/audios/Neutral-Rage-Reminiscence-Weeping.MP3 b/assets/audios/Neutral-Rage-Reminiscence-Weeping.MP3 deleted file mode 100644 index d9b1aca9570d941f848db7537fe0d938f04f9487..0000000000000000000000000000000000000000 --- a/assets/audios/Neutral-Rage-Reminiscence-Weeping.MP3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid 
sha256:328892635a32b295d714b012f63696984b234d035a25dac8b7257df410cde2b5 -size 583148 diff --git a/assets/audios/Neutral1.mp3 b/assets/audios/Neutral1.mp3 deleted file mode 100644 index 24c669ed7752bac52b2bd54edafd110d780abc2b..0000000000000000000000000000000000000000 --- a/assets/audios/Neutral1.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:89cbaf00a66239d2b051ad41971a179315415873750e94aeb5d87d3cab0a9c5b -size 54764 diff --git a/assets/audios/Neutral2.mp3 b/assets/audios/Neutral2.mp3 deleted file mode 100644 index 74a91f73fddf4dc1973c3fc057dc871ec4475e4e..0000000000000000000000000000000000000000 --- a/assets/audios/Neutral2.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:eef5a109b7410875953975d99a2291cfee58dd8d5182ec78ac12cf2cad952e92 -size 49580 diff --git a/assets/audios/Neutral3.mp3 b/assets/audios/Neutral3.mp3 deleted file mode 100644 index 72cde73a0b1be9ea14c3ad502527d845c672dc5c..0000000000000000000000000000000000000000 --- a/assets/audios/Neutral3.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:aad98b334aa8b226a5ba31689e627c01bcc971e77c235b134a846c447e01fc9d -size 52844 diff --git a/assets/audios/Neutral4.mp3 b/assets/audios/Neutral4.mp3 deleted file mode 100644 index 7523d0f3c06660bfaaf3d625e3bc4fa1bcdbb24b..0000000000000000000000000000000000000000 --- a/assets/audios/Neutral4.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:7e1200fc067de254dcb2fd839867f453b43136a35047ee870750fec3de88af38 -size 48428 diff --git a/assets/audios/Neutral5.mp3 b/assets/audios/Neutral5.mp3 deleted file mode 100644 index 3b6d1df980f46dc9cf735b3d3d2f59680da213d1..0000000000000000000000000000000000000000 --- a/assets/audios/Neutral5.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:cf4dade1010e6981c7c81076a8dbcf5630a05235c78ecd9b0b57b45eb8bf31ba -size 49388 diff --git 
a/assets/audios/Neutral6.mp3 b/assets/audios/Neutral6.mp3 deleted file mode 100644 index dfe9ba8c066393bb52b864920e291a5a65cce3a9..0000000000000000000000000000000000000000 --- a/assets/audios/Neutral6.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d1647071eab3a1a45918d99eb68e4bbc9229dadd1fcddbc253c3687f66f2a526 -size 51116 diff --git a/assets/audios/Onee-san.wav b/assets/audios/Onee-san.wav deleted file mode 100644 index 9180faf93069302a8d57aa6e7cb366038e6c411f..0000000000000000000000000000000000000000 --- a/assets/audios/Onee-san.wav +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:a11dfcafd395d37d2b8109d61bfdb699eeeccc2ce42e3e4cc5e3e95acaf9a8f1 -size 13071638 diff --git a/assets/audios/Onee-san_Sourse.MP3 b/assets/audios/Onee-san_Sourse.MP3 deleted file mode 100644 index 4074090c4498fb86d379ab05e481ccbc419fc2ad..0000000000000000000000000000000000000000 --- a/assets/audios/Onee-san_Sourse.MP3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d1832d908a6cf4a2cfd58f6253b6191f3fa128d0f386778677360a181ae87ecc -size 548412 diff --git a/assets/audios/Onee-san_Sourse.wav b/assets/audios/Onee-san_Sourse.wav deleted file mode 100644 index 8f45a99fe64a5031c866d83eade99fb5ecbb7ab2..0000000000000000000000000000000000000000 --- a/assets/audios/Onee-san_Sourse.wav +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:7b46285788ca5ff9bae286396f9a2aeeb6d3c1259b4e8c9e46caccf4b9dcd9e6 -size 13137536 diff --git a/assets/audios/OpenAI_Breaking Down Mandarin.mp3 b/assets/audios/OpenAI_Breaking Down Mandarin.mp3 deleted file mode 100644 index 25902884d129faf51f17bb64a474bfcb2b5393d2..0000000000000000000000000000000000000000 --- a/assets/audios/OpenAI_Breaking Down Mandarin.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d54a12566ade2b019755eb020f1dd2030cb18744a5ddb4cb4c2888589ac3b018 -size 188012 
diff --git a/assets/audios/OpenAI_Czech.mp3 b/assets/audios/OpenAI_Czech.mp3 deleted file mode 100644 index fa783b85b3955778d1772813a595a897cbe3fe74..0000000000000000000000000000000000000000 --- a/assets/audios/OpenAI_Czech.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:97cd63e2404914ead4aedf42385ebcca1fa3fe93e03fb4a21cc1701632bf4dbf -size 67628 diff --git a/assets/audios/OpenAI_English-Mandarin.mp3 b/assets/audios/OpenAI_English-Mandarin.mp3 deleted file mode 100644 index 8fd30cde75d2275b166d8c658d896ce8068ec5c3..0000000000000000000000000000000000000000 --- a/assets/audios/OpenAI_English-Mandarin.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:bb9578930207d8d452b8f6c75c212c8630a5cc035b312ba1454a490ff9ea9108 -size 114284 diff --git a/assets/audios/OpenAI_English-Spanish.mp3 b/assets/audios/OpenAI_English-Spanish.mp3 deleted file mode 100644 index e4f02d1dd91a3e2f984d1482a8bc9be445277f26..0000000000000000000000000000000000000000 --- a/assets/audios/OpenAI_English-Spanish.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d7b29ef11732d2b7f659d719be14fa8426fbdd7dced16dc123d4b8c8834c6a99 -size 81644 diff --git a/assets/audios/OpenAI_Japanese-Korean.mp3 b/assets/audios/OpenAI_Japanese-Korean.mp3 deleted file mode 100644 index 4e9338983322c9ebba44ca7d0112c3428a339316..0000000000000000000000000000000000000000 --- a/assets/audios/OpenAI_Japanese-Korean.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:a06a7e38f98936b20487901c30ac3eddc1794e9623be21c9c4ebdf9d3fb7a57b -size 183596 diff --git a/assets/audios/OpenAI_Japanese.mp3 b/assets/audios/OpenAI_Japanese.mp3 deleted file mode 100644 index 3a763c202302787e60e6f7199e12a737988f22f0..0000000000000000000000000000000000000000 --- a/assets/audios/OpenAI_Japanese.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid 
sha256:e308471decd55206332a8b0de6de28b32d51250c9a0b9b7acb406ec460e165ff -size 106412 diff --git a/assets/audios/OpenAI_Mandarin-English.mp3 b/assets/audios/OpenAI_Mandarin-English.mp3 deleted file mode 100644 index 73e305871053f5a18dab5ce30e5aeb3f7f99dc96..0000000000000000000000000000000000000000 --- a/assets/audios/OpenAI_Mandarin-English.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:353b140d040b5592a24b13f3047c7ec96391d10a8f6ccb868610fc8a1b7586a3 -size 86828 diff --git a/assets/audios/OpenAI_Mandarine-English.mp3 b/assets/audios/OpenAI_Mandarine-English.mp3 deleted file mode 100644 index b862f1cce0256e87dc78f27ad62d0c11485df1ec..0000000000000000000000000000000000000000 --- a/assets/audios/OpenAI_Mandarine-English.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:00b4f1e7efa77233bbf76bb7c65e5052f53afbde140b8b04f2c55ecd5c49fb76 -size 86252 diff --git a/assets/audios/OpenAI_Neurotic Teenage English.mp3 b/assets/audios/OpenAI_Neurotic Teenage English.mp3 deleted file mode 100644 index 768452f7fde7bec9d761deb074e8852efac9cfab..0000000000000000000000000000000000000000 --- a/assets/audios/OpenAI_Neurotic Teenage English.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:2014bc438916965f449881f2dd0895dc2970431689ab0b9b4a9262076787015d -size 126572 diff --git a/assets/audios/OpenAI_Polish.mp3 b/assets/audios/OpenAI_Polish.mp3 deleted file mode 100644 index 0ac18906c5c251d2b08a343f4aed07ef20fa977f..0000000000000000000000000000000000000000 --- a/assets/audios/OpenAI_Polish.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:bb3810b88541848a4b341acad3b4be61ff59eaaa2fcf13cade10fd8ec45ceb40 -size 70508 diff --git a/assets/audios/OpenAI_Quirky Female English.mp3 b/assets/audios/OpenAI_Quirky Female English.mp3 deleted file mode 100644 index 
af492e43bcda8d2296b84e1d6b4a3547da74e77c..0000000000000000000000000000000000000000 --- a/assets/audios/OpenAI_Quirky Female English.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:ac7264a517bc0843af80624f3ddc7a6a33dc364f5ae5454a6aa61bbc61dc09fa -size 71660 diff --git a/assets/audios/OpenAI_Thai.mp3 b/assets/audios/OpenAI_Thai.mp3 deleted file mode 100644 index eae2349ecbbd162117b9d6decca4df2050c0746e..0000000000000000000000000000000000000000 --- a/assets/audios/OpenAI_Thai.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:2be05801106cd9a352ec9e25e555883f204cba9141a1fcd3fc83924a8176c384 -size 69164 diff --git a/assets/audios/OpenAI_Vietnamese.mp3 b/assets/audios/OpenAI_Vietnamese.mp3 deleted file mode 100644 index 789c0a0eca0981f0b52e28606c1ee195fc7e0ad8..0000000000000000000000000000000000000000 --- a/assets/audios/OpenAI_Vietnamese.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:1ae7ac7888e37c4a952aa4f10d4c8aee9026919dac078cf6e571ec8c934d38e3 -size 59948 diff --git a/assets/audios/Polish.mp3 b/assets/audios/Polish.mp3 deleted file mode 100644 index 44b203dc50f3690a99c38aa537b065a6ac6356db..0000000000000000000000000000000000000000 --- a/assets/audios/Polish.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:bf38f2b8fc3abb8e9929be81939cbb94c397cc4ead7de2fff46115f6d5963481 -size 66092 diff --git a/assets/audios/Polish_Male_Sourse.wav b/assets/audios/Polish_Male_Sourse.wav deleted file mode 100644 index 17a650db3bc3ae7452afb9e00e49d0091e64a204..0000000000000000000000000000000000000000 --- a/assets/audios/Polish_Male_Sourse.wav +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:7b46285788ca5ff9bae286396f9a2aeeb6d3c1259b4e8c9e46caccf4b9dcd9e6 -size 48291666 diff --git a/assets/audios/Powerful_Girl_Sourse.mp3 b/assets/audios/Powerful_Girl_Sourse.mp3 deleted file mode 100644 
index 8d0788ccfa61617c42915e1e4deb23a30286aa1c..0000000000000000000000000000000000000000 --- a/assets/audios/Powerful_Girl_Sourse.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:25db4fa4c7f4c50fc3f7e2c731880f7b9f160f9416bd2767ef7b01cf30cba060 -size 454892 diff --git a/assets/audios/Quirky Female English.MP3 b/assets/audios/Quirky Female English.MP3 deleted file mode 100644 index 9d87ad666740de4f00d70c7320e5bae1afbecd73..0000000000000000000000000000000000000000 --- a/assets/audios/Quirky Female English.MP3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:ae17c5fa4a781ee1299ade2d2717686a1ae1fe6d1eb6dc79534df3fb160e4030 -size 490604 diff --git a/assets/audios/Quirky Female English_OneShot.MP3 b/assets/audios/Quirky Female English_OneShot.MP3 deleted file mode 100644 index f608c9754770a2dddcf0a054a5c9e56caeb3b1e7..0000000000000000000000000000000000000000 --- a/assets/audios/Quirky Female English_OneShot.MP3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:62d65e9bc39b4f898c2a4a9e5e088233015c67e39c1099730ca0e481a337338d -size 78317 diff --git a/assets/audios/Quirky Female English_Prompt.MP3 b/assets/audios/Quirky Female English_Prompt.MP3 deleted file mode 100644 index d29f315edca50b4d8463220a38ed5fcc972cb041..0000000000000000000000000000000000000000 --- a/assets/audios/Quirky Female English_Prompt.MP3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:66524a476efc04f9c3fbb6fcf9f49418c9b435b150b0ed88d8a704ec87b2f6c2 -size 74864 diff --git a/assets/audios/Quirky Female English_ZeroShot.MP3 b/assets/audios/Quirky Female English_ZeroShot.MP3 deleted file mode 100644 index 82d92c1e8db1e0d23233773161906a192aeed313..0000000000000000000000000000000000000000 --- a/assets/audios/Quirky Female English_ZeroShot.MP3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid 
sha256:d8637e2e6898c10214576bb53f06f8cdbd46569c0b8ff31370b9d9c702876513 -size 75884 diff --git a/assets/audios/Radiant_Girl_1.mp3 b/assets/audios/Radiant_Girl_1.mp3 deleted file mode 100644 index 406e2b1e0fd000e7ddcab52c41a3de13cd5ea08b..0000000000000000000000000000000000000000 --- a/assets/audios/Radiant_Girl_1.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f3fbc2cdb0ec704bfc7fcec64b3baf2ce725bcd29c5f7b3589677c935939b680 -size 106604 diff --git a/assets/audios/Radiant_Girl_2.mp3 b/assets/audios/Radiant_Girl_2.mp3 deleted file mode 100644 index cce21f6c644508f064f49a65170665ab39743af5..0000000000000000000000000000000000000000 --- a/assets/audios/Radiant_Girl_2.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c565c87db9f581d94f5c51122a67e8120e27f5eb359b4aa54763421d76635215 -size 98540 diff --git a/assets/audios/Ruth_1.mp3 b/assets/audios/Ruth_1.mp3 deleted file mode 100644 index b221b51603f90c0792d8089a6348320127f95742..0000000000000000000000000000000000000000 --- a/assets/audios/Ruth_1.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:0c90c219330024ebd82db7624fcbf11c9ad7d2d3d5b812de080b5173144be013 -size 75308 diff --git a/assets/audios/Ruth_2.mp3 b/assets/audios/Ruth_2.mp3 deleted file mode 100644 index 1a679af767559ca04190ba4ceff269575c2da888..0000000000000000000000000000000000000000 --- a/assets/audios/Ruth_2.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:0d0065238c7f4c4a7acca63aef2fb3ae6fc53f819448b85750a525f8545629e4 -size 94700 diff --git a/assets/audios/Sad.mp3 b/assets/audios/Sad.mp3 deleted file mode 100644 index 36ecaeff5646da298b604572031350c9444ab208..0000000000000000000000000000000000000000 --- a/assets/audios/Sad.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:fce94c8fbe84446aba1d4082f7bf35f1415e86ca4aaa719bae0bc96e69477a25 -size 60332 diff --git 
a/assets/audios/Science_Voice_Sourse.wav b/assets/audios/Science_Voice_Sourse.wav deleted file mode 100644 index c4663b0b3583f655e0a1584adc59832573d5969d..0000000000000000000000000000000000000000 --- a/assets/audios/Science_Voice_Sourse.wav +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e42476b02d2176bc2d4b475d08e6d0c8713a3ce1acf981a65d3f20f738712685 -size 3871032 diff --git a/assets/audios/ShiBanYu_Sourse.mp3 b/assets/audios/ShiBanYu_Sourse.mp3 deleted file mode 100644 index 7bfad95f5c88c9577e8cc08ed36dfcb9d4615470..0000000000000000000000000000000000000000 --- a/assets/audios/ShiBanYu_Sourse.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:7aec0d2c2e83fbf2569e48500b9c0f2b1e66a071d35a7d08e047ba973e5e977a -size 1391468 diff --git a/assets/audios/ShuanQ_Sourse.mp3 b/assets/audios/ShuanQ_Sourse.mp3 deleted file mode 100644 index 26c71eea220ce56be7620b4b26b77d809892c927..0000000000000000000000000000000000000000 --- a/assets/audios/ShuanQ_Sourse.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:daaf4bbbc9aeaee5d801e80bcc5b081054b78839b25e974aa6643a3027cba415 -size 482304 diff --git a/assets/audios/Sociology_Sourse.mp3 b/assets/audios/Sociology_Sourse.mp3 deleted file mode 100644 index b05566b5cafd9b5c1d2b1f8135fc9dd19a4268df..0000000000000000000000000000000000000000 --- a/assets/audios/Sociology_Sourse.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:b32b7921a59e87541a88d0f83e50bfbea2886cd55f4ba8cf5f11862e6f608c98 -size 1390700 diff --git a/assets/audios/Spanish-English.wav b/assets/audios/Spanish-English.wav deleted file mode 100644 index 5ce724ce2101785c747c82bcde1885ef2123cb73..0000000000000000000000000000000000000000 --- a/assets/audios/Spanish-English.wav +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:61fc6458581e0156292f69253e72d11b76d48fd3447e7c118f27ac30a0941111 
-size 9731014 diff --git a/assets/audios/Surprised.mp3 b/assets/audios/Surprised.mp3 deleted file mode 100644 index b8cae771d56da321e9a6639735dadb29944460bf..0000000000000000000000000000000000000000 --- a/assets/audios/Surprised.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:382669e20f8556fc1e3baad28069fec33d1c8c3bb2bbea232b87415a938fb642 -size 48812 diff --git a/assets/audios/Thai.mp3 b/assets/audios/Thai.mp3 deleted file mode 100644 index bd9b20770d39b61202b6cfd30203502a37305437..0000000000000000000000000000000000000000 --- a/assets/audios/Thai.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:0b125f1a649eaab3995f8b0d732e0f7cf299f13f91cc450b34b629fc2a9e5fb8 -size 56300 diff --git a/assets/audios/Thai_Male_Sourse.wav b/assets/audios/Thai_Male_Sourse.wav deleted file mode 100644 index 145f779eebfa1cd16f0ce0f250107b0aed89dbba..0000000000000000000000000000000000000000 --- a/assets/audios/Thai_Male_Sourse.wav +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:99a90ee75e66ce8037d32ca8bd02efbf3ceb65bc8fd5d8227c3d807b621d1a7d -size 54158698 diff --git a/assets/audios/TianJin_Fast.mp3 b/assets/audios/TianJin_Fast.mp3 deleted file mode 100644 index 5ff719005d73156a0a7038260d0082a858040850..0000000000000000000000000000000000000000 --- a/assets/audios/TianJin_Fast.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:9d000fb45879701cd022bfc3d8d798e07480e37eda87a304ba34270ea704e2f8 -size 88364 diff --git a/assets/audios/TianJin_PVC.mp3 b/assets/audios/TianJin_PVC.mp3 deleted file mode 100644 index 1b191328fc03b8fcfb72295cde62b1726979b4e2..0000000000000000000000000000000000000000 --- a/assets/audios/TianJin_PVC.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:b5958a4426ca15648d32acbd0523eb1001576ea598f22387ec9f5e05b8c0734e -size 103340 diff --git a/assets/audios/TianJin_Source.wav 
b/assets/audios/TianJin_Source.wav deleted file mode 100644 index 733c0d844fa1d1286def4e1dd821b0b6ffb47165..0000000000000000000000000000000000000000 --- a/assets/audios/TianJin_Source.wav +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:b9b928ca7516794261fb3e9c33e5c4d033d3df89308941e1c6010fbe40948f57 -size 5683302 diff --git a/assets/audios/VAE1.wav b/assets/audios/VAE1.wav deleted file mode 100644 index 51d5c2fd09eeba5f2dd4f032f97ccb1cfa1a9430..0000000000000000000000000000000000000000 --- a/assets/audios/VAE1.wav +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c3688a8d6e6c1928a119edaf8c047dcb119a36ad5080434b2f95d580846534c8 -size 1772754 diff --git a/assets/audios/VAE2.wav b/assets/audios/VAE2.wav deleted file mode 100644 index e1205d6a1d4cc8b2f1f2e0c3730fd37307187900..0000000000000000000000000000000000000000 --- a/assets/audios/VAE2.wav +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:685a8003e0ce6ddfca126480aaabe1ed788f8d7107b63fd16ba0b48a4f44822b -size 1545390 diff --git a/assets/audios/VAE3.wav b/assets/audios/VAE3.wav deleted file mode 100644 index 339a14d60d3cee6fef6f384e520e10faa467a16c..0000000000000000000000000000000000000000 --- a/assets/audios/VAE3.wav +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:11f27142e2b5ed1429474d558c2691ad0dd9504fff0dd56e7bccc887d26821f8 -size 2004582 diff --git a/assets/audios/Vietnamese.mp3 b/assets/audios/Vietnamese.mp3 deleted file mode 100644 index 6065bdfd040990229ee67f84c452bbf76609b679..0000000000000000000000000000000000000000 --- a/assets/audios/Vietnamese.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c2a4a323f3469efeb40952c7cba38b79a443223785eca152099d9ead3901eb5c -size 43052 diff --git a/assets/audios/Vietnamese_Female_Sourse.wav b/assets/audios/Vietnamese_Female_Sourse.wav deleted file mode 100644 index 
29848c7da99ce40f000e0b80a440b6e386fb9c6c..0000000000000000000000000000000000000000 --- a/assets/audios/Vietnamese_Female_Sourse.wav +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d6e56209d5307da27769fc366177b68efe2823043dbf806e8fcf2460dfb68a4b -size 30102082 diff --git a/assets/audios/Warm and Magnetic.mp3 b/assets/audios/Warm and Magnetic.mp3 deleted file mode 100644 index 09b206960c6b0b54bc9df5861364c7a3f2211722..0000000000000000000000000000000000000000 --- a/assets/audios/Warm and Magnetic.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:ecef1157b2f24175e96029ec81b0a2d15106ede51ebd51dd9f530751c22ccbde -size 249260 diff --git a/assets/audios/Warm and Magnetic_Sourse.mp3 b/assets/audios/Warm and Magnetic_Sourse.mp3 deleted file mode 100644 index 9c2a910cd1d311cc34c6c537ee1445f774748e30..0000000000000000000000000000000000000000 --- a/assets/audios/Warm and Magnetic_Sourse.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e32ca8567897e81347c59548795c3f1da7b5e5ddbc35342de957dfc261457dc5 -size 719852 diff --git a/assets/audios/Wong_Sourse.mp3 b/assets/audios/Wong_Sourse.mp3 deleted file mode 100644 index f62409cfcd4d252bf582397ab60d01167136591d..0000000000000000000000000000000000000000 --- a/assets/audios/Wong_Sourse.mp3 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:06081146374d6b4a41a2bc12285c8e384b403197087213aeab1fab0b9f28e9f8 -size 178796 diff --git "a/assets/audios/\344\275\223\350\202\262\350\247\243\350\257\264\347\224\267\351\235\222\345\271\264.wav" "b/assets/audios/\344\275\223\350\202\262\350\247\243\350\257\264\347\224\267\351\235\222\345\271\264.wav" deleted file mode 100644 index e98429d6190cdf6b9da20d874aea5438db7f0b42..0000000000000000000000000000000000000000 --- "a/assets/audios/\344\275\223\350\202\262\350\247\243\350\257\264\347\224\267\351\235\222\345\271\264.wav" +++ /dev/null @@ -1,3 +0,0 
@@ -version https://git-lfs.github.com/spec/v1 -oid sha256:606ad746e2c471a1182b19f7fdf7e6556e0e2fd0e7c2962b7a823571b7765b08 -size 5606838 diff --git "a/assets/audios/\345\233\236\345\277\206\347\224\267\344\270\255\345\271\264.wav" "b/assets/audios/\345\233\236\345\277\206\347\224\267\344\270\255\345\271\264.wav" deleted file mode 100644 index f7ee8379b36943e31ab5883d715361c171b46c06..0000000000000000000000000000000000000000 --- "a/assets/audios/\345\233\236\345\277\206\347\224\267\344\270\255\345\271\264.wav" +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e917abfe6bae2c3021dc593f457c2622b7e159d95880fc41ae010e9f1347eef8 -size 7162758 diff --git "a/assets/audios/\346\267\261\345\272\246\350\256\277\350\260\210\347\224\267\344\270\255\345\271\264.wav" "b/assets/audios/\346\267\261\345\272\246\350\256\277\350\260\210\347\224\267\344\270\255\345\271\264.wav" deleted file mode 100644 index 8aa714c49f797dadeb720502a12f8be52d4aedc8..0000000000000000000000000000000000000000 --- "a/assets/audios/\346\267\261\345\272\246\350\256\277\350\260\210\347\224\267\344\270\255\345\271\264.wav" +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:acc56f0c43fae339823f9131f54f66f9ca127459a9d2f2179839cb9295912eb6 -size 6770438 diff --git "a/assets/audios/\346\270\270\346\210\217\344\270\273\346\222\255\345\245\263\351\235\222\345\271\264.wav" "b/assets/audios/\346\270\270\346\210\217\344\270\273\346\222\255\345\245\263\351\235\222\345\271\264.wav" deleted file mode 100644 index 08cea2e5d76ef29efdef11da388fa76581a9afb0..0000000000000000000000000000000000000000 --- "a/assets/audios/\346\270\270\346\210\217\344\270\273\346\222\255\345\245\263\351\235\222\345\271\264.wav" +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:88f7f5e965c1bfd86c4ca2c50bce067c9e0dccb6a583dd89427233b071486ee6 -size 4345158 diff --git 
"a/assets/audios/\347\233\264\346\222\255\345\270\246\350\264\247\345\245\263\351\235\222\345\271\264.wav" "b/assets/audios/\347\233\264\346\222\255\345\270\246\350\264\247\345\245\263\351\235\222\345\271\264.wav" deleted file mode 100644 index a13238779c4287bc652c7773760818b424ad45f6..0000000000000000000000000000000000000000 --- "a/assets/audios/\347\233\264\346\222\255\345\270\246\350\264\247\345\245\263\351\235\222\345\271\264.wav" +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:2976ba7f37bf9a19892041f36b36ca82d6731a807313427495be96eabb141ac4 -size 5722758 diff --git "a/assets/audios/\347\276\216\345\246\206\345\245\263\345\215\232\344\270\273.wav" "b/assets/audios/\347\276\216\345\246\206\345\245\263\345\215\232\344\270\273.wav" deleted file mode 100644 index fac62fc49379cdab79b5c3e77d75ae716a180ec6..0000000000000000000000000000000000000000 --- "a/assets/audios/\347\276\216\345\246\206\345\245\263\345\215\232\344\270\273.wav" +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:dce4e52442b09c6e1b23e4edb5a094e92535335d5c7e65e3a3d75053fcc9d5e5 -size 5361638 diff --git a/assets/images/header-bg.jpeg b/assets/images/header-bg.jpeg deleted file mode 100644 index d05ef88541b5082629aa0fb890e69da8a6ff505b..0000000000000000000000000000000000000000 --- a/assets/images/header-bg.jpeg +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:fbff99d252d597cd09f47c2d1ad49cfbd81f26303a1773a9491d45e138f882c4 -size 135383 diff --git a/assets/images/system-overview.jpg b/assets/images/system-overview.jpg deleted file mode 100644 index 618d33051df32b4ad98d6cdc58f56f25345aa4c8..0000000000000000000000000000000000000000 --- a/assets/images/system-overview.jpg +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e478da546bf88d449ac9ca0c04db10ad810b3757f9041213b0dcdfc06a7711f2 -size 379909 diff --git a/index.html b/index.html index 
a53780f4c3a3446439ee1a91027a8e97a50de825..b0c4b3666032a737f3903db53e6a8a9272483e28 100644 --- a/index.html +++ b/index.html @@ -1,1070 +1,19 @@ - - - - - - - MiniMax-Speech Tech Report | Intrinsic Zero-Shot Text-to-Speech with a Learnable Speaker Encoder - - - - - - - - - - - -
-

MiniMax-Speech

-

Intrinsic Zero-Shot Text-to-Speech - with a - Learnable Speaker - Encoder

-

- MiniMax Team May 2025
- [Tech - Report] - [Multilingual Test Set] - [GitHub] -

-
- -
-

Abstract

-

- We introduce MiniMax-Speech, an autoregressive Transformer-based Text-to-Speech (TTS) model that generates - high-quality - speech. A key innovation is our learnable speaker encoder, which extracts timbre features from a reference audio - without - requiring its transcription. This enables MiniMax-Speech to produce highly expressive speech with timbre - consistent with - the reference in a zero-shot manner, while also supporting one-shot voice cloning with exceptionally high - similarity to - the reference voice. In addition, the overall quality of the synthesized audio is enhanced through the proposed - Flow-VAE. Our model supports 32 languages and demonstrates excellent performance across multiple objective and - subjective evaluations metrics. Notably, it achieves state-of-the-art (SOTA) results on objective voice cloning - metrics - (Word Error Rate and Speaker Similarity) and has secured the top position on the public TTS Arena leaderboard. - Another - key strength of MiniMax-Speech, granted by the robust and disentangled representations from the speaker encoder, - is its - extensibility without modifying the base model, enabling various applications such as: arbitrary voice emotion - control - via LoRA; text to voice (T2V) by synthesizing timbre features directly from text description; and professional - voice - cloning (PVC) by fine-tuning timbre features with additional data. -

-
- - - -
-
-
-

Architecture Overview

-
- System Architecture -
- An overview of the architecture of MiniMax-Speech. -
-
-
- -
-

Expressiveness Demonstrations

-

Showcase with High Versatility

-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
DescriptionSource AudioGenerated Audio
- A Compelling and Persuasive Speaker Voice - - - - -
- A Clear and Explanatory Voice with Broad Emotional Dynamics Across Different Texts - - - - -
- Another Explanatory Voice with Supernatural Prosody,
- Featuring Distinct Ethnic and Age Characteristics -
- - - -
- A Warm and Magnetic Voice that Brings Comfort - - - - -
- An ASMR Whispering Voice with Generated Breathing and Sound Effects - - - - -
- A Robotic Voice with Rich Bass Resonance and Spatial Presence - - - - -
- A Sardonic Mature Female Voice - - - - -
-
- -

Showcase with Multiple Generation Attempts, Post-Processing - Audio Effects and Added Sound Effects

-
- - - - - - - - - - - - - - - -
DescriptionGenerated Audio
- A Husky Male Voice: From Soft Murmur to Excitement to Anger, then to Whispers - - -
- An Angry Female Voice: From Soft Murmur to Rage to Reminiscence, then to Weeping - - -
-
-
- -
-

Zero-Shot vs. One-Shot Demonstrations

-

- ZeroShot maintains speaker identity while generating more natural emotions, pauses, and other expressive - features based - on the text content, whereas OneShot adheres more strictly to the speaker characteristics (prosody, speech - rate, - emotions, etc.). For details of Zero-Shot and One-Shot, refer to the technical report. -

-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
Source AudioTextZero-Shot VersionOne-Shot VersionElevenlabs Multilingual_v2
- - - 命运就算颠沛流离,
- 命运就算曲折离奇,
- 命运就算恐吓着你,
- 做人没趣味。
- 别流泪,心酸,更不应舍弃。
- 我愿能,一生永远陪伴你。 -
- - Preserving Distinctive Voice
- Timbre and Expressive
- Prosody with Regularized
- Pausing and Speech Rate -
- - Better Reproduction of
- Prompt's Exaggerated Speech
- Rate and Characteristic
- Phrase-Initial Pauses -
- Cantonese not supported -
- - - 你们这些躲在道德高地的懦夫,
- 敢承认自己对本我的恐惧吗?
- 回答我!嗯?你回答我!
- Look in my eyes!
- 老子写梦的解析时
- 你们还在玩泥巴,
- 我精神分析引论每个字母都能
- 刺穿文明社会的虚伪面具,
- 我解剖潜意识就像
- 外科医生划开皮肤。
- 是不是啊?说话! -
- - Capable of Generating
- Relatively Calmer Emotions
- while Preserving Voice
- Identity -
- - Consistently Reproducing the
- Angry Emotion from Prompt
- in Every Utterance -
- -
- - - Would you believe what happened at the
- grocery store today? My goodness! The
- avocados were on sale - half price! Half
- price! I bought twenty of them! -
- - Effectively follows textual cues
- for both longer and shorter
- inter-sentence pauses -
- - Better reproduces the
- exaggerated high pitch
- characteristic of anime voices
-
- -
- - - Oh my gosh, like, I literally can't believe
- what just happened! Um, so basically, I was,
- you know, just sitting there in class,
- right? And then, ugh, this totally weird
- thing happened - like, seriously weird! Wait,
- wait... Should I even be talking about this?
- Ugh, whatever. -
- - Effectively follows textual cues
- for both longer and shorter
- inter-sentence pauses -
- - Better reproduces the
- exaggerated high pitch
- characteristic of anime voices
-
- -
-
-
- -
-

Multilingual and Cross-Lingual Capabilities - Demonstrations

-

Speech-02-HD maintains high naturalness in less common languages while demonstrating significant advantages - in - Standard - Chinese pronunciation accuracy.

-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
LanguagesSource AudioTextMiniMax
Speech_02_HD
ElevenLabs
Multilingual_v2
OpenAI
TTS_1_HD
(*not cloned voice)
Thai - - - สวัสดีค่ะ วันนี้อากาศดีมากเลย
- คุณจะไปทานอาหารกลางวันที่ไหนคะ
- ฉันกำลังคิดว่าจะไปร้านอาหารไทยแถวนี้
-
- - - Thai not perfectly supported - - - -
Vietnamese - - - Tôi đang đọc một cuốn sách rất hay về lịch sử Việt Nam.
- Những câu chuyện về văn hóa truyền
- thống thật sự rất thú vị.
-
- - - Vietnamese not perfectly supported - - - -
Czech - - - Ranní mlha se pomalu zvedá nad řekou,
- zatímco první paprsky slunce prosvítají mezi stromy.
- Ptáci začínají svůj ranní koncert.
-
- - - - - -
Polish - - - Młoda sowa siedzi cicho na gałęzi sosny,
- obserwując leśną polanę w świetle księżyca.
- Wiatr delikatnie porusza liśćmi drzew.
-
- - - - - -
Japanese - - - 電車が遅延している影響で、渋谷駅がとても混雑
- しています。次の山手線は約10分後に到着
- 予定です。お急ぎのお客様は、他の路線も
- ご利用ください。 -
- - - - - -
-
-

Speech-02-HD has superior performance in zero-shot cross-lingual scenarios.

-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
Original LanguageSource AudioMixed LanguageTextMiniMax
Speech_02_HD
ElevenLabs
Multilingual_v2
OpenAI
TTS_1_HD
(*not cloned voice)
English - - English + Mandarin - Kiddo! Come come come, 学如逆水行舟,不进则退。
- I see you're using AI tools already - so smart!
- But eh, cannot just rely on tools only lah!
- The future belongs to those who can work alongside AI,
- not those scared of it. -
- - - - - -
Mandarin - - Mandarin + Cantonese - 老铁啊,多谢晒你送我呢本,广州话正音字典,咁好嘢喎!
- 我呢个大老爷们儿学广州话真系好难㗎!成日都分唔清声调啊。
- 嗱,而家有咗呢本书,什么都好啦。 -
- - - Cantonese not supported - - Cantonese not supported -
Mandarin - - Mandarin + English - The people said, 桂林's scenery is the first under heaven.
- Yet in my opinion, 阳朔 scenery is better than 桂林。
- 群峰倒影山浮水,无水无山不入神。 -
- - - - - -
English - - English + Spanish - Mi abuelita always told me "el que persevera, alcanza".
- If you persevere, you'll achieve your dreams!
- Guess what! They chose me to play the lead role in our BIG show! -
- - - - - -
Japanese - - Japanese + Korean - 最近の天気予報によりますと、今週末は桜の開花に最適
- な気温になる予定です。
- 東京都内の各公園では花見客で賑わうことが予想されますが、
- 서울에서도 벚꽃이 피기 시작했다고 하네요.
- 이번 주말에는 여의도 공원에서 벚꽃 축제가 열린다고 하니
- 많은 분들이 찾아오실 것 같습니다. -
- - - - - -
-
-

*Although OpenAI currently does not support voice cloning functionality, we still wish to conduct comparative - listening - tests with its excellent naturalness as a reference.

-
- -
-

Flow-VAE vs. VAE Comparison

-

Flow-VAE is less likely to produce the following instabilities.

-
- - - - - - - - - - - - - - - - - - - - - - - - - - - -
Source AudioFlow-VAEVAEDifferences
- - - - - - - Flow-VAE reproduces more continuous
- and natural reverberation -
- - - - - - - VAE introduces unwanted
- high-frequency components -
- - - - - - - VAE produces electronic-sounding
- artifacts at the beginning -
-
-
- -
-

Professional Voice Clone (PVC) Demonstrations

-

For more complex dialectal accents and tonal characteristics, PVC can reproduce these features while - maintaining high - naturalness based on the text content.

-
- - - - - - - - - - - - - - - - - - - - - -
Source AudioZero-ShotPVCDifferences
- - - - - - - Like the ZeroShot version, the PVC
- version has rising sentence-final intonation,
- but distinctively sustains this
- elevated pitch instead of the typical
- pitch declination found in common
- declarative sentences -
- - - - - - - With more materials, the model not only
- reproduces the speaker's voice characteristics
- but also accurately captures more
- dialectal features -
-
-
- -
-

Emotion Control Demonstrations

-

Source Audio for Refreshing Young Man

- -

DEMO

-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
NeutralEmotionTextEmotion Control Audio
- - - Surprised - - 天哪!我完全没想到会在这里遇见你,
- 都过去这么多年了,你一点都没变! -
- -
- - - Disgusted - - 这个地方实在太脏乱了,到处都是垃圾和难闻的气味儿,
- 我一秒钟都不想多待。 -
- -
- - - Fearful - - 深夜回家的路上,我清楚地听见身后有脚步声在跟着我,
- 可是回头却什么都看不见。 -
- -
- - - Angry - - 我付出了这么多,换来的却是这样的背叛!
- 你怎么可以这样对待我的信任! -
- -
- - - Sad - - 躺在床上翻来覆去,心里压着说不出的难过和沮丧,
- 昨天晚上又失眠了。 -
- -
- - - Happy - - 和好朋友一起在院子里烧烤,聊着有趣的故事,
- 享受着美食和欢乐的时光。 -
- -
-
-
- -
-

Text-Prompted Voice Generation Demonstrations

-
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
PromptTextAudio
- 男性中年声音,说中文,音色浑厚醇厚,带有自然的磁性,
- 语速偏慢,音量适中,音调偏低沉。声音整体给人沉稳可靠的感觉,
- 在深度访谈场景中表现出专业性和亲和力,音质清晰,吐字规整有力。 -
- 在这个安静的夜晚,让我们一起走进《人生笔记》这本书。
- 作者用平实的文字记录下生活中的点点滴滴,
- 让我们看到平凡中的真善美。
- 今天,我们先来读第一章:'生活的痕迹'...... -
- -
- 说中文的女青年,音色偏甜美,语速比较快,
- 说话时带着一种轻快的感觉,整体音调较高,像是在直播带货,
- 整体氛围比较活跃,声音清晰,听起来很有亲和力。 -
- 亲爱的宝宝们,等了好久的神仙面霜终于到货啦!
- 你们看这个包装是不是超级精致?
- 我自己已经用了一个月了,效果真的绝绝子!
- 而且这次活动价真的太划算了,错过真的会后悔的哦~ -
- -
- 中国男性声音,听着像是青年,音色清亮,语速比较快,
- 说话很有激情,像是在解说比赛,声音中带着紧张和兴奋的感觉。 -
- 漂亮!这个进攻太精彩了!张伟突破防线,
- 一个漂亮的转身,球传到禁区,王超跟上,射门!
- 球进了!难以置信的精彩配合,现场观众都沸腾了! -
- -
- 中国女青年的声音,音色清脆,说话速度偏快,语调活泼,
- 像是在做游戏直播,声音中带着愉快的感觉,整体音调较高,
- 整体氛围比较轻松。 -
- 啊!这里有个宝箱!让我们看看里面是什么~
- 哇!是传说中的紫色装备!运气也太好了吧!
- 谢谢小伙伴们的打赏,我们继续往前探索...... -
- -
- English-speaking female voice, sounding relatively young,
- with a sweet and pleasant tone. Speaking at a moderate pace
- with a touch of energy, similar to someone narrating a
- beauty/makeup tutorial video. The overall atmosphere is
- relaxed and cheerful. -
- Hi everyone! Today I'll be sharing a soft, romantic
- makeup look that's perfect for dates. Many of you have
- been asking how to apply this eyeshadow naturally - the
- key is using gentle techniques. Let's go through the
- steps together... -
- -
- English-speaking middle-aged male voice, slightly husky,
- speaking at a moderate-to-slow pace with a deep tone. Like
- someone telling an old story, conveying a nostalgic feeling,
- with a relaxed and composed manner of speaking. -
- That was back in the late 1970s. I remember when our
- village first got electricity - everyone was so excited.
- In the evenings, people would bring their stools and
- gather under the big banyan tree by the village committee
- office to watch movies projected on the wall. Even now,
- thinking back to those moments still fills me with warmth. -
- -
-
-
- -
-

Comparison of voice naturalness - with the previous generation products

-

The new model demonstrates significant advantages in naturalness compared to the previous version.

-

Source Audio for Radiant_Girl

- -

DEMO

-
- - - - - - - - - - - - - - - - - - - - - -
TextMiniMax
Speech_02_HD
Microsoft
Azure TTS
AWS
Polly
- I sat alone in the empty room, staring at the old photographs,
- wondering how everything could change so quickly,
- how a lifetime of memories could fade away just like that. -
- - - - - -
- The moment I held my acceptance letter, my heart burst with joy -
- all those sleepless nights finally paid off, and I couldn't stop
- dancing around the room, calling everyone I knew to share this amazing news! -
- - - - - -
-
-
- -
-

Citation

-
-
-						
-@misc{minimax2025minimaxspeechintrinsiczeroshottexttospeech,
-	title={MiniMax-Speech: Intrinsic Zero-Shot Text-to-Speech with a Learnable Speaker Encoder},
-	author={Bowen Zhang, Congchao Guo, Geng Yang, Hang Yu, Haozhe Zhang, Heidi Lei, Jialong Mai, Junjie Yan, Kaiyue Yang,
-	Mingqi Yang, Peikai Huang, Ruiyang Jin, Sitan Jiang, Weihua Cheng, Yawei Li, Yichen Xiao, Yiying Zhou, Yongmao Zhang,
-	Yuan Lu, Yucen He},
-	year={2025},
-	eprint={2505.07916},
-	archivePrefix={arXiv},
-	primaryClass={eess.AS},
-	url={https://arxiv.org/abs/2505.07916},
-}
-					
-
-
-
-
- - - - - - \ No newline at end of file + + + + + + My static Space + + + +
+

Welcome to your static Space!

+

You can modify this app directly by editing index.html in the Files and versions tab.

+

+ Also don't forget to check the + Spaces documentation. +

+
+ + diff --git a/style.css b/style.css index 45425b088cc7911762573fa578d5010cc9b1bc92..114adf441e9032febb46bc056b2a8bb651075f0d 100644 --- a/style.css +++ b/style.css @@ -1,843 +1,28 @@ -/*! - * LaTeX.css (https://latex.vercel.app/) - * - * Source: https://github.com/vincentdoerig/latex-css - * Licensed under MIT (https://github.com/vincentdoerig/latex-css/blob/master/LICENSE) -*/ - -@font-face { - font-family: 'Latin Modern'; - font-style: normal; - font-weight: normal; - font-display: swap; - src: url('./fonts/LM-regular.woff2') format('woff2'), - url('./fonts/LM-regular.woff') format('woff'), - url('./fonts/LM-regular.ttf') format('truetype'); -} - -@font-face { - font-family: 'Latin Modern'; - font-style: italic; - font-weight: normal; - font-display: swap; - src: url('./fonts/LM-italic.woff2') format('woff2'), - url('./fonts/LM-italic.woff') format('woff'), - url('./fonts/LM-italic.ttf') format('truetype'); -} - -@font-face { - font-family: 'Latin Modern'; - font-style: normal; - font-weight: bold; - font-display: swap; - src: url('./fonts/LM-bold.woff2') format('woff2'), - url('./fonts/LM-bold.woff') format('woff'), - url('./fonts/LM-bold.ttf') format('truetype'); -} - -@font-face { - font-family: 'Latin Modern'; - font-style: italic; - font-weight: bold; - font-display: swap; - src: url('./fonts/LM-bold-italic.woff2') format('woff2'), - url('./fonts/LM-bold-italic.woff') format('woff'), - url('./fonts/LM-bold-italic.ttf') format('truetype'); -} - -@font-face { - font-family: 'Libertinus'; - font-style: normal; - font-weight: normal; - font-display: swap; - src: url('./fonts/Libertinus-regular.woff2') format('woff2'); -} - -@font-face { - font-family: 'Libertinus'; - font-style: italic; - font-weight: normal; - font-display: swap; - src: url('./fonts/Libertinus-italic.woff2') format('woff2'); -} - -@font-face { - font-family: 'Libertinus'; - font-style: normal; - font-weight: bold; - font-display: swap; - src: url('./fonts/Libertinus-bold.woff2') 
format('woff2'); -} - -@font-face { - font-family: 'Libertinus'; - font-style: italic; - font-weight: bold; - font-display: swap; - src: url('./fonts/Libertinus-bold-italic.woff2') format('woff2'); -} - -@font-face { - font-family: 'Libertinus'; - font-style: normal; - font-weight: 600; - font-display: swap; - src: url('./fonts/Libertinus-semibold.woff2') format('woff2'); -} - -@font-face { - font-family: 'Libertinus'; - font-style: italic; - font-weight: 600; - font-display: swap; - src: url('./fonts/Libertinus-semibold-italic.woff2') format('woff2'); -} - -/* Box sizing rules */ -*, -*::before, -*::after { - box-sizing: border-box; -} - -:root { - --body-color: hsl(0, 5%, 10%); - --body-bg-color: hsl(210, 20%, 98%); - --link-visited: hsl(0, 100%, 33%); - --link-focus-outline: hsl(220, 90%, 52%); - --pre-bg-color: hsl(210, 28%, 93%); - --kbd-bg-color: hsl(210, 5%, 100%); - --kbd-border-color: hsl(210, 5%, 70%); - --table-border-color: black; - --border-width-thin: 1.36px; - --border-color-thin: rgba(0, 0, 0, 0.1); - --border-width-thick: 2.27px; - --sidenote-target-border-color: hsl(55, 55%, 70%); - --footnotes-border-color: hsl(0, 0%, 39%); - --text-indent-size: 1.463rem; /* In 12pt [Latin Modern font] LaTeX article - \parindent =~ 17.625pt; taking also into account the ratio - 1pt[LaTeX] = (72 / 72.27) * 1pt[HTML], with default 12pt/1rem LaTeX.css font - size, the identation value in rem CSS units is: - \parindent =~ 17.625 * (72 / 72.27) / 12 = 1.463rem. 
*/ -} - -.latex-dark { - --body-color: hsl(0, 0%, 86%); - --body-bg-color: hsl(0, 0%, 16%); - --link-visited: hsl(196 80% 77%); - --link-focus-outline: hsl(215, 63%, 73%); - --pre-bg-color: hsl(0, 1%, 25%); - --kbd-bg-color: hsl(0, 0%, 16%); - --kbd-border-color: hsl(210, 5%, 70%); - --table-border-color: white; - --sidenote-target-border-color: hsl(0, 0%, 59%); - --footnotes-border-color: hsl(0, 0%, 59%); - --proof-symbol-filter: invert(80%); -} - -@media (prefers-color-scheme: dark) { - .latex-dark-auto { - --body-color: hsl(0, 0%, 86%); - --body-bg-color: hsl(0, 0%, 16%); - --link-visited: hsl(196 80% 77%); - --link-focus-outline: hsl(215, 63%, 73%); - --pre-bg-color: hsl(0, 1%, 25%); - --kbd-bg-color: hsl(0, 0%, 16%); - --kbd-border-color: hsl(210, 5%, 70%); - --table-border-color: white; - --sidenote-target-border-color: hsl(0, 0%, 59%); - --footnotes-border-color: hsl(0, 0%, 59%); - --proof-symbol-filter: invert(80%); - } -} - -/* Remove default margin */ -body, -h1, -h2, -h3, -h4, -p, -ul[class], -ol[class], -li, -figure, -figcaption, -dl, -dd { - margin: 0; -} - -/* Make default font-size 1rem and add smooth scrolling to anchors */ -html { - font-size: 1rem; -} -@media (prefers-reduced-motion: no-preference) { - html { - scroll-behavior: smooth; - } -} - -body.libertinus { - font-family: 'Libertinus', Georgia, Cambria, 'Times New Roman', Times, serif; -} - -.text-justify { - text-align: justify; -} - body { - font-family: 'Latin Modern', Georgia, Cambria, 'Times New Roman', Times, serif; - line-height: 1.8; - - max-width: 60vw; - min-height: 100vh; - overflow-x: hidden; - margin: 0 auto; - padding: 2rem 1.25rem; - - counter-reset: theorem definition sidenote-counter; - - color: var(--body-color); - background-color: var(--body-bg-color); - - text-rendering: optimizeLegibility; - - /* Allow automatic hyphenation for all text in the document */ - hyphens: auto; - -webkit-hyphens: auto; - -moz-hyphens: auto; -} - -@media (min-width: 1050px) { - body { - 
max-width: 80vw; - } -} - -@media (max-width: 768px) { - body { - max-width: 90vw; - } -} - -p { - margin-top: 1rem; -} - -/* Indents paragraphs like in LaTeX documents*/ -.indent-pars p { - text-indent: var(--text-indent-size); -} - -.indent-pars p.no-indent, -p.no-indent { - text-indent: 0; -} - -.indent-pars ol p, -.indent-pars ul p { - text-indent: 0; -} - -.indent-pars h2 + p, -.indent-pars h3 + p, -.indent-pars h4 + p { - text-indent: 0; -} - -/* A elements that don't have a class get default styles */ -a:not([class]) { - text-decoration-skip-ink: auto; -} - -/* Make links red */ -a, -a:visited { - color: var(--link-visited); -} - -a:focus { - outline-offset: 2px; - outline: 2px solid var(--link-focus-outline); -} - -/* Allow line breaks between any two characters */ -.break-all { - /* - NOTE: Whith `break-all` value no hyphens are shown, even if the word breaks - at a hyphenation point - */ - word-break: break-all; -} - -/* Make images easier to work with */ -img { - max-width: 100%; - height: auto; - display: block; -} - -audio { - display: block; - width: 100%; - margin: 0.7rem auto; -} - -.audio-sm { - min-width: 190px; -} - -.audio-md { - min-width: 220px; -} - -.audio-lg { - min-width: 300px; -} - - - -/* Inherit fonts for inputs and buttons */ -input, -button, -textarea, -select { - font: inherit; -} - -/* Prevent textarea from overflowing */ -textarea { - width: 100%; -} - -/* Natural flow and rhythm in articles by default */ -article > * + * { - margin-top: 1em; -} - -.article-block { - border-radius: 8px; - box-shadow: 0 10px 30px rgba(0, 0, 0, 0.1); - padding: 2rem; - margin: 3rem 0; - box-sizing: border-box; - -} - -.article-block h2 { - margin-top: 0 !important; -} - -.article-block p { - font-size: 1.1rem; - line-height: 1.6; -} - -/* Styles for inline code or code snippets */ -code, -pre, -kbd { - font-family: Menlo, Monaco, Consolas, 'Liberation Mono', 'Courier New', - monospace; - font-size: 85%; - hyphens: none; - text-align: left; -} -pre { 
- padding: 1rem 1.4rem; - max-width: 100%; - overflow: auto; - border-radius: 4px; - background: var(--pre-bg-color); -} -pre code { - font-size: 95%; - position: relative; -} -kbd { - background: var(--kbd-bg-color); - border: 1px solid var(--kbd-border-color); - border-radius: 2px; - padding: 2px 4px; - font-size: 75%; -} - -/* Better tables */ -table:not(.borders-custom) { - border-collapse: collapse; - border-spacing: 0; - width: auto; - max-width: 100%; - border-top: var(--border-width-thick) solid var(--table-border-color); - border-bottom: var(--border-width-thick) solid var(--table-border-color); - /* display: block; */ - overflow-x: auto; /* does not work because element is not block */ - /* white-space: nowrap; */ - counter-increment: caption; -} -/* add bottom border on column table headings */ -table:not(.borders-custom) tr > th[scope='col'] { - border-bottom: var(--border-width-thin) solid var(--table-border-color); -} -/* add right border on row table headings */ -table:not(.borders-custom) tr > th[scope='row'] { - border-right: var(--border-width-thin) solid var(--table-border-color); -} -table:not(.borders-custom) > tbody > tr:first-child > td, -table:not(.borders-custom) > tbody > tr:first-child > th { - border-top: var(--border-width-thin) solid var(--table-border-color); -} -table:not(.borders-custom) > tbody > tr:last-child > td, -table:not(.borders-custom) > tbody > tr:last-child > th { - border-bottom: var(--border-width-thin) solid var(--table-border-color); -} - -th, -td { - text-align: left; - padding: 0.5rem; - line-height: 1.1; -} - -/* Table caption */ -caption { - text-align: left; - font-size: 0.923em; - /* border-bottom: 2pt solid #000; */ - padding: 0 0.25em 0.25em; - width: 100%; - margin-left: 0; -} - -caption::before { - content: 'Table ' counter(caption) '. 
'; - font-weight: bold; -}abstract - -/* allow scroll on the x-axis */ -.scroll-wrapper, .article-block .scroll-wrapper { - overflow-x: auto; - width: 100%; -} - -/* if a table is wrapped in a scroll wrapper, - the table cells shouldn't wrap */ -.scroll-wrapper > table td, .article-block .scroll-wrapper > table td { - white-space: nowrap; -} - -/* Table custom borders */ -table.borders-custom { - border-collapse: collapse; - border-spacing: 0; - width: auto; - max-width: 100%; - overflow-x: auto; - counter-increment: caption; -} - -.border-top-thick { - border-top: var(--border-width-thick) solid var(--table-border-color); -} -.border-right-thick { - border-right: var(--border-width-thick) solid var(--table-border-color); -} -.border-bottom-thick { - border-bottom: var(--border-width-thick) solid var(--table-border-color); -} -.border-left-thick { - border-left: var(--border-width-thick) solid var(--table-border-color); -} - -.border-top-thin { - border-top: var(--border-width-thin) solid var(--table-border-color); -} -.border-right-thin { - border-right: var(--border-width-thin) solid var(--table-border-color); -} -.border-bottom-thin { - border-bottom: var(--border-width-thin) solid var(--border-color-thin); -} -.border-left-thin { - border-left: var(--border-width-thin) solid var(--table-border-color); -} - -/* Table column alignment */ -.col-1-l tr > :nth-child(1), -.col-2-l tr > :nth-child(2), -.col-3-l tr > :nth-child(3), -.col-4-l tr > :nth-child(4), -.col-5-l tr > :nth-child(5), -.col-6-l tr > :nth-child(6), -.col-7-l tr > :nth-child(7), -.col-8-l tr > :nth-child(8), -.col-9-l tr > :nth-child(9), -.col-10-l tr > :nth-child(10), -.col-11-l tr > :nth-child(11), -.col-12-l tr > :nth-child(12) { - text-align: left; -} -.col-1-c tr > :nth-child(1), -.col-2-c tr > :nth-child(2), -.col-3-c tr > :nth-child(3), -.col-4-c tr > :nth-child(4), -.col-5-c tr > :nth-child(5), -.col-6-c tr > :nth-child(6), -.col-7-c tr > :nth-child(7), -.col-8-c tr > :nth-child(8), 
-.col-9-c tr > :nth-child(9), -.col-10-c tr > :nth-child(10), -.col-11-c tr > :nth-child(11), -.col-12-c tr > :nth-child(12) { - text-align: center; -} -.col-1-r tr > :nth-child(1), -.col-2-r tr > :nth-child(2), -.col-3-r tr > :nth-child(3), -.col-4-r tr > :nth-child(4), -.col-5-r tr > :nth-child(5), -.col-6-r tr > :nth-child(6), -.col-7-r tr > :nth-child(7), -.col-8-r tr > :nth-child(8), -.col-9-r tr > :nth-child(9), -.col-10-r tr > :nth-child(10), -.col-11-r tr > :nth-child(11), -.col-12-r tr > :nth-child(12) { - text-align: right; -} - -/* Format figure captions (based on table captions) */ -figure { - counter-increment: figcaption; -} -figcaption { - text-align: left; - font-size: 0.923em; - padding: 0.25em 0.25em 0; - width: 100%; - margin-left: 0; -} -figcaption::before { - content: 'Figure ' counter(figcaption) '. '; - font-weight: bold; -} - -/* Center align the title */ -h1:first-child { - text-align: center; -} - -/* Nested ordered list for ToC */ -nav ol { - counter-reset: item; - padding-left: 2rem; -} -nav ol > li { - display: block; -} -nav ol > li::before { - content: counters(item, '.') ' '; - counter-increment: item; - padding-right: 0.85rem; -} - -/* Center definitions (most useful for display equations) */ -dl dd { - text-align: center; -} - -/* Theorem */ -.theorem { - counter-increment: theorem; - display: block; - margin: 12px 0; - font-style: italic; -} -.theorem::before { - content: 'Theorem ' counter(theorem) '. '; - font-weight: bold; - font-style: normal; -} - -/* Lemma */ -.lemma { - counter-increment: theorem; - display: block; - margin: 12px 0; - font-style: italic; -} -.lemma::before { - content: 'Lemma ' counter(theorem) '. '; - font-weight: bold; - font-style: normal; -} - -/* Proof */ -.proof { - display: block; - margin: 12px 0; - font-style: normal; - position: relative; -} -.proof::before { - content: 'Proof. 
' attr(title); - font-style: italic; -} -.proof::after { - content: '◾️'; - filter: var(--proof-symbol-filter); - position: absolute; - right: -12px; - bottom: -2px; -} - -/* Definition */ -.definition { - counter-increment: definition; - display: block; - margin: 12px 0; - font-style: normal; -} -.definition::before { - content: 'Definition ' counter(definition) '. '; - font-weight: bold; - font-style: normal; -} - -/* Center align author name, use small caps and add vertical spacing */ -.author { - margin: 0.85rem 0; - text-align: center; -} - -.date { - margin-left: 1.5rem; -} - -/* Sidenotes */ - -.sidenote { - font-size: 0.8rem; - float: right; - clear: right; - width: 18vw; - margin-right: -20vw; - margin-bottom: 1em; - text-indent: 0; - /* Right sidenotes explicitly aligned to left for wide screens */ - text-align: left; -} - -.sidenote.left { - float: left; - margin-left: -20vw; - margin-bottom: 1em; - text-indent: 0; - /* Left sidenotes explicitly aligned to right for wide screens */ - text-align: right; + padding: 2rem; + font-family: -apple-system, BlinkMacSystemFont, "Arial", sans-serif; } -/* Justify all sidenotes for wide screens when `text-justify` class is used */ -body.text-justify .sidenote, -body.text-justify .sidenote.left { - text-align: justify; -} - -/* (WIP) add border when a sidenote is clicked on */ -.sidenote:target { - border: var(--sidenote-target-border-color) 1.5px solid; - padding: 0 .5rem; - scroll-margin-block-start: 10rem; -} - -/* sidenote counter */ -.sidenote-number { - counter-increment: sidenote-counter; -} - -.sidenote-number::after, -.sidenote::before { - position: relative; - vertical-align: baseline; -} - -/* add number in main content */ -.sidenote-number::after { - content: counter(sidenote-counter); - font-size: 0.7rem; - top: -0.5rem; - left: 0.1rem; -} - -/* add number in front of the sidenote */ -.sidenote-number ~ .sidenote::before { - content: counter(sidenote-counter) ' '; - font-size: 0.7rem; - top: -0.5rem; -} 
- -label.sidenote-toggle:not(.sidenote-number) { - display: none; -} - -/* sidenotes inside blockquotes are indented more */ -blockquote .sidenote { - margin-right: -24vw; - width: 18vw; -} - - -label.sidenote-toggle { - display: inline; - cursor: pointer; -} - -input.sidenote-toggle { - display: none; -} - -@media (max-width: 1050px) { - label.sidenote-toggle:not(.sidenote-number) { - display: inline; - } - .sidenote { - display: none; - } - .sidenote-toggle:checked + .sidenote { - display: block; - margin: 0.5rem 1.25rem 1rem 0.5rem; - float: left; - left: 1rem; - clear: both; - width: 95%; - } - - /* All sidenotes explicitly aligned to left for narrow screens */ - .sidenote-toggle:checked + .sidenote.left { - text-align: left; - } - - /* Justify all sidenotes for narrow screens when `text-justify` class is used */ - body.text-justify .sidenote-toggle:checked + .sidenote.left { - text-align: justify; - } - - /* tweak indentation of sidenote inside a blockquote */ - blockquote .sidenote { - margin-right: -25vw; - width: 16vw; - } -} - -/* Make footnote text smaller */ -.footnotes p { - line-height: 1.5; - font-size: 85%; - margin-bottom: 0.4rem; -} -.footnotes { - border-top: 1px solid var(--footnotes-border-color); -} - -/* Center title and paragraph */ -.abstract, -.abstract p { - text-align: center; - margin-top: 0; -} -.abstract { - margin: 2.25rem 0; -} -.abstract > h2 { - font-size: 1rem; - margin-bottom: -0.2rem; -} - -/* Format the LaTeX symbol correctly (a higher up, e lower) */ -.latex span:nth-child(1) { - text-transform: uppercase; - font-size: 0.75em; - vertical-align: 0.28em; - margin-left: -0.48em; - margin-right: -0.15em; - line-height: 1ex; -} - -.latex span:nth-child(2) { - text-transform: uppercase; - vertical-align: -0.5ex; - margin-left: -0.1667em; - margin-right: -0.125em; - line-height: 1ex; -} - -/* Prevent line breaks inside an element */ -.whitespace-nowrap { - white-space: nowrap; -} - -/* Heading typography */ h1 { - font-size: 2.5rem; 
- line-height: 3.25rem; - margin-bottom: 1.625rem; -} - -h2 { - font-size: 1.8rem; - line-height: 2.1rem; - margin-top: 4rem; -} - -h3 { - font-size: 1.4rem; - margin-top: 3rem; -} - -h4 { - font-size: 1.2rem; - margin-top: 2rem; -} - -h5 { - font-size: 1rem; - margin-top: 1.8rem; + font-size: 16px; + margin-top: 0; } -h6 { - font-size: 1rem; - font-style: italic; - font-weight: normal; - margin-top: 2.5rem; -} - -h3, -h4, -h5, -h6 { - line-height: 1.625rem; -} - -h1 + h2 { - margin-top: 1.625rem; +p { + color: rgb(107, 114, 128); + font-size: 15px; + margin-bottom: 10px; + margin-top: 5px; } -h2 + h3, -h3 + h4, -h4 + h5 { - margin-top: 1.4rem; +.card { + max-width: 620px; + margin: 0 auto; + padding: 16px; + border: 1px solid lightgray; + border-radius: 16px; } -h5 + h6 { - margin-top: -0.8rem; +.card p:last-child { + margin-bottom: 0; } - -h2, -h3, -h4, -h5, -h6 { - text-align: left; - margin-bottom: 1rem; -} \ No newline at end of file