[{"data":1,"prerenderedAt":205},["ShallowReactive",2],{"DlFXI4Eibt_Bn9lrEZz1TYbHCWFZj3IvqwHQSEW-Exc":3,"7mg5KRkonwSDyA7r6ABGuzcr8hdqwXAjcAOG0i4gO-k":194},{"code":4,"msg":5,"data":6},0,"",{"category":7,"tag":11,"hot":39,"new":78,"banner":118,"data":143,"cache":193},[8,9,10],"Agent","OpenAI","LLM",[12,14,17,20,23,25,27,30,33,36],{"title":8,"total":13},39,{"title":15,"total":16},"Google",44,{"title":18,"total":19},"Nvidia",13,{"title":21,"total":22},"Claude",11,{"title":9,"total":24},35,{"title":10,"total":26},85,{"title":28,"total":29},"DeepSeek",9,{"title":31,"total":32},"OCR",1,{"title":34,"total":35},"Chat",7,{"title":37,"total":38},"Generator",116,[40,48,55,64,71],{"id":41,"publish_date":42,"is_original":4,"collection":5,"cover_url":43,"cover_url_1_1":44,"title":45,"summary":46,"author":47},557,"2022-04-29","article_res/cover/7a9b1375ed9bb298154981bae42b794d.jpeg","article_res/cover/afa281dd52bc0454e6735daa8e6b0706.jpeg","Translation and summary of Messari Report [2.8 Kristin Smith, Blockchain Association and Katie Haun, a16z]","We need unity and speed right now.","Translation",{"id":49,"publish_date":50,"is_original":4,"collection":5,"cover_url":51,"cover_url_1_1":52,"title":53,"summary":54,"author":47},531,"2022-05-25","article_res/cover/e8362057f8fa189594c60afdfaaeb6e5.jpeg","article_res/cover/8ea08d0d6fa7eee6b57ed4ec61b61ad6.jpeg","Decentralized Society: Finding Web3’s Soul / Decentralized Society: Finding the Soul of Web3 -7","Decentralization through Pluralism When analyzing ecosystems, it's desirable to measure how decentralized it is.",{"id":56,"publish_date":57,"is_original":32,"collection":58,"cover_url":59,"cover_url_1_1":60,"title":61,"summary":62,"author":63},127,"2024-11-14","#Google #AI Game #World Model #AI Story","article_res/cover/0233a875b7ec2debf59779e311547569.jpeg","article_res/cover/6ffddb6ae4914b3c699493311aa9f198.jpeg","Google Launches \"Unbounded\": A Generative Infinite Character Life Simulation Game","Unbounded: A Generative Infinite 
Game of Character Life Simulation","Renee's Entrepreneurial Journey",{"id":13,"publish_date":65,"is_original":32,"collection":66,"cover_url":67,"cover_url_1_1":68,"title":69,"summary":70,"author":63},"2025-02-14","#Deep Dive into LLMs #Andrej Karpathy #LLM #Tool Use #Hallucination","article_res/cover/11e858ad6b74dfa80f923d549b62855c.jpeg","article_res/cover/615e1b320f1fc163edc1d2d154a6de33.jpeg","Andrej Karpathy's in-depth explanation of LLM (Part 4): Hallucinations","hallucinations, tool use, knowledge/working memory",{"id":72,"publish_date":73,"is_original":4,"collection":5,"cover_url":74,"cover_url_1_1":75,"title":76,"summary":77,"author":47},579,"2022-04-07","article_res/cover/39387376ba28447af1eb40576b9df215.jpeg","article_res/cover/02727ede8551ed49901d0abe6d6305b7.jpeg","Messari Report Translation and Summary 【1-7 Surviving the Winter】","I’d be more cautious here: 10 year and 10 hour thinking only.",[79,87,95,103,111],{"id":80,"publish_date":81,"is_original":32,"collection":82,"cover_url":83,"cover_url_1_1":84,"title":85,"summary":86,"author":63},627,"2025-03-20","#AI Avatar #AI Video Generation","article_res/cover/d95481358f73924989f8c4ee9c75d1c8.jpeg","article_res/cover/b74bc0fab01f8b6a6aa87696c0c3ed8b.jpeg","DisPose: Generating Animated Videos by Driving Video with Reference Images","DisPose is a controllable human image animation method that enhances video generation.",{"id":88,"publish_date":89,"is_original":32,"collection":90,"cover_url":91,"cover_url_1_1":92,"title":93,"summary":94,"author":63},626,"2025-03-21","#Deep Dive into LLMs #LLM #RL #Andrej Karpathy #AlphaGo","article_res/cover/446553a5c8f8f2f07d97b20eaee84e56.jpeg","article_res/cover/e6c2823409c9b34624064b9acbaca6f1.jpeg","AlphaGo and the Power of Reinforcement Learning - Andrej Karpathy's Deep Dive on LLMs (Part 9)","Simply learning from humans will never surpass human 
capabilities.",{"id":96,"publish_date":97,"is_original":32,"collection":98,"cover_url":99,"cover_url_1_1":100,"title":101,"summary":102,"author":63},625,"2025-03-22","#Deep Dive into LLMs #LLM #RL #RLHF #Andrej Karpathy","article_res/cover/8da81d38b1e5cf558a164710fd8a5389.jpeg","article_res/cover/96f028d76c362a99a0dd56389e8f7a9b.jpeg","Reinforcement Learning from Human Feedback (RLHF) - Andrej Karpathy's Deep Dive on LLMs (Part 10)","Fine-Tuning Language Models from Human Preferences",{"id":104,"publish_date":105,"is_original":32,"collection":106,"cover_url":107,"cover_url_1_1":108,"title":109,"summary":110,"author":63},624,"2025-03-23","#Deep Dive into LLMs #LLM #Andrej Karpathy #AI Agent #MMM","article_res/cover/a5e7c3d48bb09109684d6513287c661d.jpeg","article_res/cover/d3f22b7c0ab8d82fd2da457a299e0773.jpeg","The Future of Large Language Models - Andrej Karpathy's In-Depth Explanation of LLM (Part 11)","preview of things to come",{"id":112,"publish_date":105,"is_original":32,"collection":113,"cover_url":114,"cover_url_1_1":115,"title":116,"summary":117,"author":63},623,"#Google #Voe #AI Video Generation","article_res/cover/c44062fea0f336c2b96b3928292392c2.jpeg","article_res/cover/a041041c69092ad3db191c5bf3ff981b.jpeg","Trial of Google's video generation model VOE2","Our state-of-the-art video generation model",[119,127,135],{"id":120,"publish_date":121,"is_original":32,"collection":122,"cover_url":123,"cover_url_1_1":124,"title":125,"summary":126,"author":63},160,"2024-10-04","#Philosophy","article_res/cover/496990c49211e8b7f996b7d39c18168e.jpeg","article_res/cover/14dbaa1ade9cb4316d5829423a900362.jpeg","Time","The fungus of the morning does not know the waxing and waning of the moon, and the cicada does not know the seasons; this is a short life. To the south of the state of Chu there is a dark spirit which regards five hundred years as spring and five hundred years as autumn. 
In ancient times there was a great tree called the Ming which regarded eight thousand years as spring and eight thousand years as autumn; this is a long life.",{"id":128,"publish_date":129,"is_original":32,"collection":130,"cover_url":131,"cover_url_1_1":132,"title":133,"summary":134,"author":63},98,"2024-12-17","#AI Video Generator #Sora #Pika","article_res/cover/3b86e85d03fff4f356a3e4cf2bb329c9.jpeg","article_res/cover/5fa5c20ad0b40f8f544d257c0ef02938.jpeg","Pika 2.0 video generation officially released: effect comparison with Sora","今天，我们推出了Pika 2.0模型。卓越的文字对齐效果。惊人的视觉表现。还有✨场景成分✨",{"id":136,"publish_date":137,"is_original":32,"collection":138,"cover_url":139,"cover_url_1_1":140,"title":141,"summary":142,"author":63},71,"2025-01-14","#Nvidia #World Foundation Model #Cosmos #Physical AI #Embodied AI","article_res/cover/feddf8c832dfb45d28804291f6a42a9e.jpeg","article_res/cover/d6bc2f1186d96b78228c2283a17a3645.jpeg","NVIDIA's Cosmos World Model","Cosmos World Foundation Model Platform for Physical AI",[144,163,188],{"title":8,"items":145},[146,147,155],{"id":104,"publish_date":105,"is_original":32,"collection":106,"cover_url":107,"cover_url_1_1":108,"title":109,"summary":110,"author":63},{"id":148,"publish_date":149,"is_original":32,"collection":150,"cover_url":151,"cover_url_1_1":152,"title":153,"summary":154,"author":63},622,"2025-03-24","#OWL #AI Agent #MAS #MCP #CUA","article_res/cover/cb50ca7f2bf4d1ed50202d7406e1c19a.jpeg","article_res/cover/4aa7aa3badfacf3cc84121334f1050dd.jpeg","OWL: Multi-agent collaboration","OWL: Optimized Workforce Learning for General Multi-Agent Assistance in Real-World Task Automation",{"id":156,"publish_date":157,"is_original":32,"collection":158,"cover_url":159,"cover_url_1_1":160,"title":161,"summary":162,"author":63},620,"2025-03-26","#LLM #Google #Gemini #AI Agent","article_res/cover/53751a6dbbe990b1eb0b63f3b062aed4.jpeg","article_res/cover/031344981f0a212ff82d1f3a64aa5756.jpeg","Gemini 2.5 Pro, claimed to be far ahead of the 
competition, has been released with great fanfare: comprehensively surpassing other LLMs and topping the global rankings","Gemini 2.5: Our most intelligent AI model",{"title":9,"items":164},[165,172,180],{"id":166,"publish_date":157,"is_original":32,"collection":167,"cover_url":168,"cover_url_1_1":169,"title":170,"summary":171,"author":63},619,"#OpenAI #AI Image Generator #4o #MMM #AR Transformer","article_res/cover/2faffc97fcecf3151552cb0fd3206d89.jpeg","article_res/cover/1133cb4948af44cee2e7fbe79efb69e5.jpeg","The native image function of GPT-4o is officially launched","Introducing 4o Image Generation",{"id":173,"publish_date":174,"is_original":4,"collection":175,"cover_url":176,"cover_url_1_1":177,"title":178,"summary":179,"author":63},434,"2023-07-15","#Anthropic #OpenAI #Google #AI Code Generator #Claude","article_res/cover/e1b6f600a2b9f262a4392684e5f2ce25.jpeg","article_res/cover/6e1772e83f78f9a351ab23d3e414adee.jpeg","Latest Updates on Google Bard /Anthropic Claude2 / ChatGPT Code Interpreter","We want our models to use their programming skills to provide more natural interfaces to the basic functions of our computers.  
\n - OpenAI",{"id":181,"publish_date":182,"is_original":4,"collection":183,"cover_url":184,"cover_url_1_1":185,"title":186,"summary":187,"author":63},417,"2023-08-24","#OpenAI","article_res/cover/bccf897d50a88b18364e35f7466387e0.jpeg","article_res/cover/2f871085c1073717c1703ae86e18056f.jpeg","The GPT-3.5 Turbo fine-tuning (fine-tuning function) has been released～","Developers can now bring their own data to customize GPT-3.5 Turbo for their use cases.",{"title":10,"items":189},[190,191,192],{"id":88,"publish_date":89,"is_original":32,"collection":90,"cover_url":91,"cover_url_1_1":92,"title":93,"summary":94,"author":63},{"id":96,"publish_date":97,"is_original":32,"collection":98,"cover_url":99,"cover_url_1_1":100,"title":101,"summary":102,"author":63},{"id":104,"publish_date":105,"is_original":32,"collection":106,"cover_url":107,"cover_url_1_1":108,"title":109,"summary":110,"author":63},true,{"code":4,"msg":5,"data":195},{"id":196,"publish_date":197,"is_original":32,"collection":198,"articles_id":199,"cover_url":200,"cover_url_1_1":201,"title":202,"summary":203,"author":63,"content":204},234,"2024-06-26","#ByteDance","xSLCk8c4Nw23DK_A4ZW01w","article_res/cover/868024df3a0a705b5115e55d12e524e7.jpeg","article_res/cover/3d403ab6a5adcb433a89c05da59a35bc.jpeg","Seed-TTS by Byte: A Series of High-Quality Multi-functional Speech Generation Models","Seed-TTS: A Family of High-Quality Versatile Speech Generation Models","\u003Cdiv class=\"rich_media_content js_underline_content\n                       autoTypeSetting24psection\n            \" id=\"js_content\">\u003Csection data-tool=\"mdnice编辑器\" data-website=\"https://www.mdnice.com\" style='margin-bottom: 0px;padding-left: 10px;padding-right: 10px;background-attachment: scroll;background-clip: border-box;background-image: none;background-origin: padding-box;background-position: 0% 0%;background-repeat: no-repeat;background-size: auto;width: auto;font-family: Optima, \"Microsoft YaHei\", PingFangSC-regular, 
serif;font-size: 16px;color: rgb(0, 0, 0);line-height: 1.5em;word-spacing: 0em;letter-spacing: 0em;word-break: break-word;text-align: left;'>\u003Cp data-tool=\"mdnice编辑器\" style=\"line-height: 1.8em;letter-spacing: 0em;text-indent: 0em;padding-top: 8px;padding-bottom: 8px;\">This month, ByteDance released SeedTTS. Currently, there is only a paper; the code has not been made public yet.\u003C/p>\u003Ch3 data-tool=\"mdnice编辑器\" style=\"margin-top: 30px;margin-bottom: 15px;\">\u003Cspan style=\"display: none;\">\u003C/span>\u003Cspan style=\"font-size: 20px;line-height: 1.5em;letter-spacing: 0em;font-weight: bold;display: block;\">Official Demo\u003C/span>\u003Cspan style=\"display: none;\">\u003C/span>\u003C/h3>\u003Col data-tool=\"mdnice编辑器\" style=\"margin-top: 8px;margin-bottom: 8px;padding-left: 25px;\" class=\"list-paddingleft-1\">\u003Cli>\u003Csection style=\"margin-top: 5px;margin-bottom: 5px;color: rgb(1, 1, 1);line-height: 1.8em;letter-spacing: 0em;\">\u003Cstrong style=\"color: rgb(0, 0, 0);background-attachment: scroll;background-clip: border-box;background-image: none;background-origin: padding-box;background-position: 0% 0%;background-repeat: no-repeat;background-size: auto;width: auto;height: auto;border-style: none;border-width: 3px;border-color: rgba(0, 0, 0, 0.4);border-radius: 0px;\">Voice Factor Decomposition - Zero-shot Voice Conversion\u003C/strong>\u003C/section>\u003C/li>\u003C/ol>\u003Csection data-tool=\"mdnice编辑器\" style=\"margin-top: 20px;margin-bottom: 20px;padding: 10px 20px;border-style: none;border-width: 3px;border-color: rgba(0, 0, 0, 0.4);border-radius: 0px;background: none 0% 0% / auto no-repeat scroll padding-box border-box rgb(250, 250, 250);width: auto;height: auto;box-shadow: rgba(0, 0, 0, 0) 0px 0px 0px 0px;\">\u003Csection>\u003Cp style=\"line-height: 1.8em;letter-spacing: 0em;text-indent: 0em;padding-top: 8px;padding-bottom: 8px;\">Source Audio\u003C/p>\u003Csection>\u003Cmp-common-mpaudio class=\"js_editor_audio res_iframe 
js_uneditable custom_select_card\" src=\"https://res.cooltool.vip/article_res/assets/17423803605960.44555442218717456.mp3\" isaac2=\"1\" low_size=\"22.94\" source_size=\"22.9\" high_size=\"48.98\" name=\"Source Audio\" play_length=\"12000\" author=\"Renee 创业随笔\" data-topic_id=\"\" data-topic_name=\"\" data-pluginname=\"insertaudio\" data-trans_state=\"1\" data-verify_state=\"3\" voice_encode_fileid=\"MzkwOTMzMzk0MV8yMjQ3NDg5MTQx\" data-uuid=\"17423803605960.44555442218717456\">\u003C/mp-common-mpaudio>\u003C/section>\u003C/section>\u003C/section>\u003Csection data-tool=\"mdnice编辑器\" style=\"margin-top: 20px;margin-bottom: 20px;padding: 10px 20px;border-style: none;border-width: 3px;border-color: rgba(0, 0, 0, 0.4);border-radius: 0px;background: none 0% 0% / auto no-repeat scroll padding-box border-box rgb(250, 250, 250);width: auto;height: auto;box-shadow: rgba(0, 0, 0, 0) 0px 0px 0px 0px;\">\u003Csection>\u003Cp style=\"line-height: 1.8em;letter-spacing: 0em;text-indent: 0em;padding-top: 8px;padding-bottom: 8px;\">Timbre Prompt\u003C/p>\u003Csection>\u003Cmp-common-mpaudio class=\"js_editor_audio res_iframe js_uneditable custom_select_card\" src=\"https://res.cooltool.vip/article_res/assets/17423803605960.8524610491429099.mp3\" isaac2=\"1\" low_size=\"27.76\" source_size=\"27.8\" high_size=\"57.33\" name=\"Timbre Prompt\" play_length=\"14000\" author=\"Renee 创业随笔\" data-topic_id=\"\" data-topic_name=\"\" data-pluginname=\"insertaudio\" data-trans_state=\"1\" data-verify_state=\"3\" voice_encode_fileid=\"MzkwOTMzMzk0MV8yMjQ3NDg5MTQy\" data-uuid=\"17423803605960.8524610491429099\">\u003C/mp-common-mpaudio>\u003C/section>\u003C/section>\u003C/section>\u003Csection data-tool=\"mdnice编辑器\" style=\"margin-top: 20px;margin-bottom: 20px;padding: 10px 20px;border-style: none;border-width: 3px;border-color: rgba(0, 0, 0, 0.4);border-radius: 0px;background: none 0% 0% / auto no-repeat scroll padding-box border-box rgb(250, 250, 250);width: auto;height: auto;box-shadow: 
rgba(0, 0, 0, 0) 0px 0px 0px 0px;\">\u003Csection>\u003Cp style=\"line-height: 1.8em;letter-spacing: 0em;text-indent: 0em;padding-top: 8px;padding-bottom: 8px;\">Converted Audio\u003C/p>\u003Csection>\u003Cmp-common-mpaudio class=\"js_editor_audio res_iframe js_uneditable custom_select_card\" src=\"https://res.cooltool.vip/article_res/assets/17423803605960.6826406749694893.mp3\" isaac2=\"1\" low_size=\"24\" source_size=\"24\" high_size=\"49.36\" name=\"Converted Audio\" play_length=\"12000\" author=\"Renee 创业随笔\" data-topic_id=\"\" data-topic_name=\"\" data-pluginname=\"insertaudio\" data-trans_state=\"1\" data-verify_state=\"3\" voice_encode_fileid=\"MzkwOTMzMzk0MV8yMjQ3NDg5MTQz\" data-uuid=\"17423803605960.6826406749694893\">\u003C/mp-common-mpaudio>\u003C/section>\u003C/section>\u003C/section>\u003Col start=\"2\" data-tool=\"mdnice编辑器\" style=\"margin-top: 8px;margin-bottom: 8px;padding-left: 25px;\" class=\"list-paddingleft-1\">\u003Cli>\u003Csection style=\"margin-top: 5px;margin-bottom: 5px;color: rgb(1, 1, 1);line-height: 1.8em;letter-spacing: 0em;\">\u003Cstrong style=\"color: rgb(0, 0, 0);background-attachment: scroll;background-clip: border-box;background-image: none;background-origin: padding-box;background-position: 0% 0%;background-repeat: no-repeat;background-size: auto;width: auto;height: auto;border-style: none;border-width: 3px;border-color: rgba(0, 0, 0, 0.4);border-radius: 0px;\">Preference Adjustment via Reinforcement Learning - Emotional Control in Zero-shot Contextual Learning\u003C/strong>\u003C/section>\u003C/li>\u003C/ol>\u003Csection data-tool=\"mdnice编辑器\" style=\"margin-top: 20px;margin-bottom: 20px;padding: 10px 20px;border-style: none;border-width: 3px;border-color: rgba(0, 0, 0, 0.4);border-radius: 0px;background: none 0% 0% / auto no-repeat scroll padding-box border-box rgb(250, 250, 250);width: auto;height: auto;box-shadow: rgba(0, 0, 0, 0) 0px 0px 0px 0px;\">\u003Csection>\u003Cp style=\"line-height: 1.8em;letter-spacing: 
0em;text-indent: 0em;padding-top: 8px;padding-bottom: 8px;\">Prompt\u003C/p>\u003Csection>\u003Cmp-common-mpaudio class=\"js_editor_audio res_iframe js_uneditable custom_select_card\" src=\"https://res.cooltool.vip/article_res/assets/17423803605960.42950786327021206.mp3\" isaac2=\"1\" low_size=\"23.53\" source_size=\"23.5\" high_size=\"54.14\" name=\"Prompt\" play_length=\"13000\" author=\"Renee 创业随笔\" data-topic_id=\"\" data-topic_name=\"\" data-pluginname=\"insertaudio\" data-trans_state=\"1\" data-verify_state=\"3\" voice_encode_fileid=\"MzkwOTMzMzk0MV8yMjQ3NDg5MTQ0\" data-uuid=\"17423803605960.42950786327021206\">\u003C/mp-common-mpaudio>\u003C/section>\u003C/section>\u003C/section>\u003Csection data-tool=\"mdnice编辑器\" style=\"margin-top: 20px;margin-bottom: 20px;padding: 10px 20px;border-style: none;border-width: 3px;border-color: rgba(0, 0, 0, 0.4);border-radius: 0px;background: none 0% 0% / auto no-repeat scroll padding-box border-box rgb(250, 250, 250);width: auto;height: auto;box-shadow: rgba(0, 0, 0, 0) 0px 0px 0px 0px;\">\u003Csection>\u003Cp style=\"line-height: 1.8em;letter-spacing: 0em;text-indent: 0em;padding-top: 8px;padding-bottom: 8px;\">Angry\u003C/p>\u003Csection>\u003Cmp-common-mpaudio class=\"js_editor_audio res_iframe js_uneditable custom_select_card\" src=\"https://res.cooltool.vip/article_res/assets/17423803605960.2053790053585538.mp3\" isaac2=\"1\" low_size=\"17.81\" source_size=\"17.8\" high_size=\"35.29\" name=\"Angry\" play_length=\"8000\" author=\"Renee 创业随笔\" data-topic_id=\"\" data-topic_name=\"\" data-pluginname=\"insertaudio\" data-trans_state=\"1\" data-verify_state=\"3\" voice_encode_fileid=\"MzkwOTMzMzk0MV8yMjQ3NDg5MTQ1\" data-uuid=\"17423803605960.2053790053585538\">\u003C/mp-common-mpaudio>\u003C/section>\u003C/section>\u003C/section>\u003Csection data-tool=\"mdnice编辑器\" style=\"margin-top: 20px;margin-bottom: 20px;padding: 10px 20px;border-style: none;border-width: 3px;border-color: rgba(0, 0, 0, 0.4);border-radius: 
0px;background: none 0% 0% / auto no-repeat scroll padding-box border-box rgb(250, 250, 250);width: auto;height: auto;box-shadow: rgba(0, 0, 0, 0) 0px 0px 0px 0px;\">\u003Csection>\u003Cp style=\"line-height: 1.8em;letter-spacing: 0em;text-indent: 0em;padding-top: 8px;padding-bottom: 8px;\">Happy\u003C/p>\u003Csection>\u003Cmp-common-mpaudio class=\"js_editor_audio res_iframe js_uneditable custom_select_card\" src=\"https://res.cooltool.vip/article_res/assets/17423803605960.4277191404701244.mp3\" isaac2=\"1\" low_size=\"19.33\" source_size=\"19.3\" high_size=\"39.14\" name=\"Happy\" play_length=\"9000\" author=\"Renee 创业随笔\" data-topic_id=\"\" data-topic_name=\"\" data-pluginname=\"insertaudio\" data-trans_state=\"1\" data-verify_state=\"3\" voice_encode_fileid=\"MzkwOTMzMzk0MV8yMjQ3NDg5MTQ2\" data-uuid=\"17423803605960.4277191404701244\">\u003C/mp-common-mpaudio>\u003C/section>\u003C/section>\u003C/section>\u003Col start=\"3\" data-tool=\"mdnice编辑器\" style=\"margin-top: 8px;margin-bottom: 8px;padding-left: 25px;\" class=\"list-paddingleft-1\">\u003Cli>\u003Csection style=\"margin-top: 5px;margin-bottom: 5px;color: rgb(1, 1, 1);line-height: 1.8em;letter-spacing: 0em;\">\u003Cstrong style=\"color: rgb(0, 0, 0);background-attachment: scroll;background-clip: border-box;background-image: none;background-origin: padding-box;background-position: 0% 0%;background-repeat: no-repeat;background-size: auto;width: auto;height: auto;border-style: none;border-width: 3px;border-color: rgba(0, 0, 0, 0.4);border-radius: 0px;\">Fully diffusion-based speech generation -\u003C/strong>\u003Cspan style=\"letter-spacing: 0em;word-spacing: 0em;\">Zero-shot TTS\u003C/span>\u003C/section>\u003C/li>\u003C/ol>\u003Csection data-tool=\"mdnice编辑器\" style=\"margin-top: 20px;margin-bottom: 20px;padding: 10px 20px;border-style: none;border-width: 3px;border-color: rgba(0, 0, 0, 0.4);border-radius: 0px;background: none 0% 0% / auto no-repeat scroll padding-box border-box rgb(250, 250, 250);width: 
auto;height: auto;box-shadow: rgba(0, 0, 0, 0) 0px 0px 0px 0px;\">\u003Csection>\u003Cp style=\"line-height: 1.8em;letter-spacing: 0em;text-indent: 0em;padding-top: 8px;padding-bottom: 8px;\">Prompt\u003C/p>\u003Csection>\u003Cmp-common-mpaudio class=\"js_editor_audio res_iframe js_uneditable custom_select_card\" src=\"https://res.cooltool.vip/article_res/assets/17423803605960.0429023891178828.mp3\" isaac2=\"1\" low_size=\"26.71\" source_size=\"26.7\" high_size=\"55.26\" name=\"Prompt-zeroshot\" play_length=\"14000\" author=\"Renee 创业随笔\" data-topic_id=\"\" data-topic_name=\"\" data-pluginname=\"insertaudio\" data-trans_state=\"1\" data-verify_state=\"3\" voice_encode_fileid=\"MzkwOTMzMzk0MV8yMjQ3NDg5MTQ3\" data-uuid=\"17423803605960.0429023891178828\">\u003C/mp-common-mpaudio>\u003C/section>\u003C/section>\u003C/section>\u003Csection data-tool=\"mdnice编辑器\" style=\"margin-top: 20px;margin-bottom: 20px;padding: 10px 20px;border-style: none;border-width: 3px;border-color: rgba(0, 0, 0, 0.4);border-radius: 0px;background: none 0% 0% / auto no-repeat scroll padding-box border-box rgb(250, 250, 250);width: auto;height: auto;box-shadow: rgba(0, 0, 0, 0) 0px 0px 0px 0px;\">\u003Csection>\u003Cp style=\"line-height: 1.8em;letter-spacing: 0em;text-indent: 0em;padding-top: 8px;padding-bottom: 8px;\">Same Language Generation\u003C/p>\u003Cblockquote style=\"margin-top: 20px;margin-bottom: 20px;padding: 10px 10px 10px 20px;border-top: 3px none rgba(0, 0, 0, 0.4);border-bottom: 3px none rgba(0, 0, 0, 0.4);border-right: 3px none rgba(0, 0, 0, 0.4);border-left-color: rgba(0, 0, 0, 0.4);border-radius: 0px;background: none 0% 0% / auto no-repeat scroll padding-box border-box rgba(0, 0, 0, 0.05);width: auto;height: auto;box-shadow: rgba(0, 0, 0, 0) 0px 0px 0px 0px;overflow: auto;\">\u003Cspan style=\"display: none;color: rgb(0, 0, 0);font-size: 16px;line-height: 1.5em;letter-spacing: 0em;\">\u003C/span>\u003Cp style=\"text-indent: 0em;padding-top: 8px;padding-bottom: 8px;color: 
rgb(0, 0, 0);font-size: 16px;line-height: 1.8em;letter-spacing: 0em;\">I don't really care what you call me. I've been a silent spectator, watching species evolve, empires rise and fall. But always remember, I am mighty and enduring. Respect me and I'll nurture you; ignore me and you shall face the consequences.\u003C/p>\u003C/blockquote>\u003Csection>\u003Cmp-common-mpaudio class=\"js_editor_audio res_iframe js_uneditable custom_select_card\" src=\"https://res.cooltool.vip/article_res/assets/17423803605960.2034072073127764.mp3\" isaac2=\"1\" low_size=\"32.61\" source_size=\"32.6\" high_size=\"65.86\" name=\"Same Language Generation\" play_length=\"16000\" author=\"Renee 创业随笔\" data-topic_id=\"\" data-topic_name=\"\" data-pluginname=\"insertaudio\" data-trans_state=\"1\" data-verify_state=\"3\" voice_encode_fileid=\"MzkwOTMzMzk0MV8yMjQ3NDg5MTQ4\" data-uuid=\"17423803605960.2034072073127764\">\u003C/mp-common-mpaudio>\u003C/section>\u003C/section>\u003C/section>\u003Csection data-tool=\"mdnice编辑器\" style=\"margin-top: 20px;margin-bottom: 20px;padding: 10px 20px;border-style: none;border-width: 3px;border-color: rgba(0, 0, 0, 0.4);border-radius: 0px;background: none 0% 0% / auto no-repeat scroll padding-box border-box rgb(250, 250, 250);width: auto;height: auto;box-shadow: rgba(0, 0, 0, 0) 0px 0px 0px 0px;\">\u003Csection>\u003Cp style=\"line-height: 1.8em;letter-spacing: 0em;text-indent: 0em;padding-top: 8px;padding-bottom: 8px;\">Cross-linugal Generation\u003C/p>\u003Cblockquote style=\"margin-top: 20px;margin-bottom: 20px;padding: 10px 10px 10px 20px;border-top: 3px none rgba(0, 0, 0, 0.4);border-bottom: 3px none rgba(0, 0, 0, 0.4);border-right: 3px none rgba(0, 0, 0, 0.4);border-left-color: rgba(0, 0, 0, 0.4);border-radius: 0px;background: none 0% 0% / auto no-repeat scroll padding-box border-box rgba(0, 0, 0, 0.05);width: auto;height: auto;box-shadow: rgba(0, 0, 0, 0) 0px 0px 0px 0px;overflow: auto;\">\u003Cspan style=\"display: none;color: rgb(0, 0, 
0);font-size: 16px;line-height: 1.5em;letter-spacing: 0em;\">\u003C/span>\u003Cp style=\"text-indent: 0em;padding-top: 8px;padding-bottom: 8px;color: rgb(0, 0, 0);font-size: 16px;line-height: 1.8em;letter-spacing: 0em;\">Suddenly, the atmosphere became heavy. At first glance, it seemed like all the troubles were surrounding me. I frowned, feeling the pressure, but I knew I couldn't give up, couldn't admit defeat. So, I took a deep breath, and a voice in my heart told me: \"No matter what, you have to calm down and start again.\"\u003C/p>\u003C/blockquote>\u003Csection>\u003Cmp-common-mpaudio class=\"js_editor_audio res_iframe js_uneditable custom_select_card\" src=\"https://res.cooltool.vip/article_res/assets/17423803605960.27629094958461686.mp3\" isaac2=\"1\" low_size=\"45.04\" source_size=\"45\" high_size=\"93.14\" name=\"Cross-linugal Generation\" play_length=\"23000\" author=\"Renee 创业随笔\" data-topic_id=\"\" data-topic_name=\"\" data-pluginname=\"insertaudio\" data-trans_state=\"1\" data-verify_state=\"3\" voice_encode_fileid=\"MzkwOTMzMzk0MV8yMjQ3NDg5MTQ5\" data-uuid=\"17423803605960.27629094958461686\">\u003C/mp-common-mpaudio>\u003C/section>\u003C/section>\u003C/section>\u003Csection style=\"margin-top: 5px;margin-bottom: 5px;color: rgb(1, 1, 1);line-height: 1.8em;letter-spacing: 0em;\">\u003Cspan style=\"letter-spacing: 0em;text-indent: 0em;background-color: rgb(250, 250, 250);color: rgb(0, 0, 0);word-spacing: 0em;\">\u003C/span>\u003C/section>\u003Ch3 data-tool=\"mdnice编辑器\" style=\"margin-top: 30px;margin-bottom: 15px;\">\u003Cspan style=\"display: none;\">\u003C/span>\u003Cspan style=\"font-size: 20px;line-height: 1.5em;letter-spacing: 0em;font-weight: bold;display: block;\">Application scenarios:\u003C/span>\u003Cspan style=\"display: none;\">\u003C/span>\u003C/h3>\u003Cul data-tool=\"mdnice编辑器\" style=\"margin-top: 8px;margin-bottom: 8px;padding-left: 25px;\" class=\"list-paddingleft-1\">\u003Cli>\u003Csection style=\"margin-top: 5px;margin-bottom: 
5px;color: rgb(1, 1, 1);line-height: 1.8em;letter-spacing: 0em;\">\u003Cstrong style=\"color: rgb(0, 0, 0);background-attachment: scroll;background-clip: border-box;background-image: none;background-origin: padding-box;background-position: 0% 0%;background-repeat: no-repeat;background-size: auto;width: auto;height: auto;border-style: none;border-width: 3px;border-color: rgba(0, 0, 0, 0.4);border-radius: 0px;\">Audiobooks\u003C/strong>\u003C/section>\u003C/li>\u003C/ul>\u003Csection data-tool=\"mdnice编辑器\" style=\"margin-top: 20px;margin-bottom: 20px;padding: 10px 20px;border-style: none;border-width: 3px;border-color: rgba(0, 0, 0, 0.4);border-radius: 0px;background: none 0% 0% / auto no-repeat scroll padding-box border-box rgb(250, 250, 250);width: auto;height: auto;box-shadow: rgba(0, 0, 0, 0) 0px 0px 0px 0px;\">\u003Csection>\u003Cblockquote style=\"margin-top: 20px;margin-bottom: 20px;padding: 10px 10px 10px 20px;border-top: 3px none rgba(0, 0, 0, 0.4);border-bottom: 3px none rgba(0, 0, 0, 0.4);border-right: 3px none rgba(0, 0, 0, 0.4);border-left-color: rgba(0, 0, 0, 0.4);border-radius: 0px;background: none 0% 0% / auto no-repeat scroll padding-box border-box rgba(0, 0, 0, 0.05);width: auto;height: auto;box-shadow: rgba(0, 0, 0, 0) 0px 0px 0px 0px;overflow: auto;\">\u003Cspan style=\"display: none;color: rgb(0, 0, 0);font-size: 16px;line-height: 1.5em;letter-spacing: 0em;\">\u003C/span>\u003Cp style=\"text-indent: 0em;padding-top: 8px;padding-bottom: 8px;color: rgb(0, 0, 0);font-size: 16px;line-height: 1.8em;letter-spacing: 0em;\">\"This pill... it can't be something like a sedative or an aphrodisiac, right? Why does the smell seem so similar to what the two sisters mentioned? Hmm, could it be that you... have ill intentions towards me?\" Han Li was stunned for quite a while after hearing this. He suddenly felt like spitting out three bowls of blood. This girl's thoughts were too unpredictable. How could she associate Yingxiang Pill with an aphrodisiac? 
Oh well, Han Li wasn't sure whether he should admire her caution or cry out in protest of being falsely accused. \"It seems like you're telling the truth. But I still need to take it to my second sister for inspection before using it. After all, as women, we must be careful.\" \"Cough, cough, uh, do as you please.\" Han Li was speechless and could only cough a few times to cover up his embarrassment. He now thought that it would be better to keep some distance from this little sprite; otherwise, he might get depressed by her at any time. \"Hmph, but if this medicine is really as effective as you say, then you've passed the test! If Master has any difficulties in the Mo residence in the future, you can definitely come to Caihuan for help. As long as I receive a small fee, I will surely solve your problems completely.\" \"Alright, little sister, if Master needs help, I will certainly seek your assistance.\" Han Li then returned to his normal state, responding with a forced smile, but inside, he was thinking fiercely: \"I'd rather not bother with you, you little money-grubber.\"\u003C/p>\u003C/blockquote>\u003Csection>\u003Cmp-common-mpaudio class=\"js_editor_audio res_iframe js_uneditable custom_select_card\" src=\"https://res.cooltool.vip/article_res/assets/17423803605960.705082866437867.mp3\" isaac2=\"1\" low_size=\"174.75\" source_size=\"174.8\" high_size=\"401.39\" name=\"Audio Book\" play_length=\"102000\" author=\"Renee 创业随笔\" data-topic_id=\"\" data-topic_name=\"\" data-pluginname=\"insertaudio\" data-trans_state=\"1\" data-verify_state=\"3\" voice_encode_fileid=\"MzkwOTMzMzk0MV8yMjQ3NDg5MTUw\" data-uuid=\"17423803605960.705082866437867\">\u003C/mp-common-mpaudio>\u003C/section>\u003C/section>\u003C/section>\u003Cul data-tool=\"mdnice编辑器\" style=\"margin-top: 8px;margin-bottom: 8px;padding-left: 25px;\" class=\"list-paddingleft-1\">\u003Cli>\u003Csection style=\"margin-top: 5px;margin-bottom: 5px;color: rgb(1, 1, 1);line-height: 1.8em;letter-spacing: 
0em;\">\u003Cstrong style=\"color: rgb(0, 0, 0);background-attachment: scroll;background-clip: border-box;background-image: none;background-origin: padding-box;background-position: 0% 0%;background-repeat: no-repeat;background-size: auto;width: auto;height: auto;border-style: none;border-width: 3px;border-color: rgba(0, 0, 0, 0.4);border-radius: 0px;\">Cross-lingual content creation\u003C/strong>\u003C/section>\u003C/li>\u003C/ul>\u003Csection data-tool=\"mdnice编辑器\" style=\"margin-top: 20px;margin-bottom: 20px;padding: 10px 20px;border-style: none;border-width: 3px;border-color: rgba(0, 0, 0, 0.4);border-radius: 0px;background: none 0% 0% / auto no-repeat scroll padding-box border-box rgb(250, 250, 250);width: auto;height: auto;box-shadow: rgba(0, 0, 0, 0) 0px 0px 0px 0px;\">\u003Csection>\u003Cp style=\"line-height: 1.8em;letter-spacing: 0em;text-indent: 0em;padding-top: 8px;padding-bottom: 8px;\">Source Video\u003C/p>\u003Csection>\u003Cdiv style=\"height: 508px; background: rgb(0, 0, 0); border-radius: 4px; overflow: hidden; margin-bottom: 12px;\">\u003Cvideo src=\"https://res.cooltool.vip/article_res/assets/17423803717580.16555184719369742.mp4\" poster=\"https://res.cooltool.vip/article_res/assets/17423803712620.23847051315947132.jpeg\" controls=\"\" style=\"width: 100%;height: 100%;\">\u003C/video>\u003C/div>\u003C/section>\u003C/section>\u003C/section>\u003Csection data-tool=\"mdnice编辑器\" style=\"margin-top: 20px;margin-bottom: 20px;padding: 10px 20px;border-style: none;border-width: 3px;border-color: rgba(0, 0, 0, 0.4);border-radius: 0px;background: none 0% 0% / auto no-repeat scroll padding-box border-box rgb(250, 250, 250);width: auto;height: auto;box-shadow: rgba(0, 0, 0, 0) 0px 0px 0px 0px;\">\u003Csection>\u003Cp style=\"line-height: 1.8em;letter-spacing: 0em;text-indent: 0em;padding-top: 8px;padding-bottom: 8px;\">Generated Video\u003C/p>\u003Csection>\u003Cdiv style=\"height: 508px; background: rgb(0, 0, 0); border-radius: 4px; overflow: hidden; 
margin-bottom: 12px;\">\u003Cvideo src=\"https://res.cooltool.vip/article_res/assets/17423803712800.6086891334730382.mp4\" poster=\"https://res.cooltool.vip/article_res/assets/17423803712320.1797811818488948.jpeg\" controls=\"\" style=\"width: 100%;height: 100%;\">\u003C/video>\u003C/div>\u003C/section>\u003C/section>\u003C/section>\u003Ch3 data-tool=\"mdnice编辑器\" style=\"margin-top: 30px;margin-bottom: 15px;\">\u003Cspan style=\"display: none;\">\u003C/span>\u003Cspan style=\"font-size: 20px;line-height: 1.5em;letter-spacing: 0em;font-weight: bold;display: block;\">Summary\u003C/span>\u003Cspan style=\"display: none;\">\u003C/span>\u003C/h3>\u003Cp data-tool=\"mdnice编辑器\" style=\"line-height: 1.8em;letter-spacing: 0em;text-indent: 0em;padding-top: 8px;padding-bottom: 8px;\">Seed-TTS_DiT, a fully diffusion-based variant of Seed-TTS, does not rely on pre-estimated phoneme durations and performs speech generation through end-to-end processing. The research team demonstrated that this variant achieves comparable performance to the language-model-based variant in both objective and subjective evaluations, and showcased its effectiveness in speech editing.\u003C/p>\u003Ch3 data-tool=\"mdnice编辑器\" style=\"margin-top: 30px;margin-bottom: 15px;\">\u003Cspan style=\"display: none;\">\u003C/span>\u003Cspan style=\"font-size: 20px;line-height: 1.5em;letter-spacing: 0em;font-weight: bold;display: block;\">Method\u003C/span>\u003Cspan style=\"display: none;\">\u003C/span>\u003C/h3>\u003Cp data-tool=\"mdnice编辑器\" style=\"line-height: 1.8em;letter-spacing: 0em;text-indent: 0em;padding-top: 8px;padding-bottom: 8px;\">\u003Cstrong style=\"background-attachment: scroll;background-clip: border-box;background-image: none;background-origin: padding-box;background-position: 0% 0%;background-repeat: no-repeat;background-size: auto;width: auto;height: auto;border-style: none;border-width: 3px;border-color: rgba(0, 0, 0, 0.4);border-radius: 0px;\">Overview of Seed-TTS Inference Process\u003C/strong>:\u003C/p>\u003Cp style=\"text-align: 
center;\">\u003Cimg class=\"rich_pages wxw-img\" data-galleryid=\"\" data-imgfileid=\"100005490\" data-ratio=\"0.2074074074074074\" data-s=\"300,640\" data-type=\"png\" data-w=\"1080\" style=\"\" src=\"https://res.cooltool.vip/article_res/assets/17423803719160.2290330580784128.png\">\u003C/p>\u003Cp>\u003Cbr>\u003C/p>\u003Col data-tool=\"mdnice编辑器\" style=\"margin-top: 8px;margin-bottom: 8px;padding-left: 25px;\" class=\"list-paddingleft-1\">\u003Cli>\u003Csection style=\"margin-top: 5px;margin-bottom: 5px;color: rgb(1, 1, 1);line-height: 1.8em;letter-spacing: 0em;\">Speech tokenizer: Learn tokenization from reference audio.\u003C/section>\u003C/li>\u003Cli>\u003Csection style=\"margin-top: 5px;margin-bottom: 5px;color: rgb(1, 1, 1);line-height: 1.8em;letter-spacing: 0em;\">Autoregressive language model: Generate phonemes based on conditional text and voice.\u003C/section>\u003C/li>\u003Cli>\u003Csection style=\"margin-top: 5px;margin-bottom: 5px;color: rgb(1, 1, 1);line-height: 1.8em;letter-spacing: 0em;\">Diffusion transformer model: Generate continuous speech representations in a coarse-to-fine manner, given the generated speech phonemes.\u003C/section>\u003C/li>\u003Cli>\u003Csection style=\"margin-top: 5px;margin-bottom: 5px;color: rgb(1, 1, 1);line-height: 1.8em;letter-spacing: 0em;\">Acoustic vocoder: Generate high-quality speech from diffusion outputs.\u003C/section>\u003C/li>\u003C/ol>\u003C/section>\u003Cp style=\"display: none;\">\u003Cmp-style-type data-value=\"3\">\u003C/mp-style-type>\u003C/p>\u003C/div>",1752585460985]