[{"data":1,"prerenderedAt":380},["ShallowReactive",2],{"$fgukOamtKU1RtUiMFsqdObttmqPPQz0uc7bl_gj_LyX0":3,"$fwJp8_tqDvjONqtqFax27YHnEKhAchVYryeHStGOVvEo":245,"article-454":379},{"code":4,"msg":5,"data":6},0,"",{"category":7,"tag":11,"popular":19,"latest":86,"banner":126,"list":151,"cache":244},[8,9,10],"Agent","OpenAI","LLM",[8,12,13,14,9,10,15,16,17,18],"Google","Nvidia","Claude","DeepSeek","OCR","Chat","Generator",[20,29,37,45,54,62,70,79],{"id":21,"publish_date":22,"is_original":23,"collection":5,"cover_url":24,"cover_url_1_1":25,"title":26,"summary":27,"author":28},411,"2023-09-10",1,"article_res/cover/451ef50c225a8dc61c4336506794d13b.jpeg","article_res/cover/3ba9dc7a72f87d40b20fc2d225289ee3.jpeg","Idealism","Reality is created by the mind, we can change our reality by changing our mind. - Plato","Renee's Entrepreneurial Journey",{"id":30,"publish_date":31,"is_original":23,"collection":32,"cover_url":33,"cover_url_1_1":34,"title":35,"summary":36,"author":28},108,"2024-12-07","#LLM #AGI #AI Agent","article_res/cover/0039044422e4ec9f61c18e8ee1693bb0.jpeg","article_res/cover/4220971b108a91d21407d87bb02fbaa6.jpeg","Freysa.ai: The World's First Adversarial AI Agent Game","说服 Freysa 把钱包里的钱都拿出来",{"id":38,"publish_date":39,"is_original":23,"collection":40,"cover_url":41,"cover_url_1_1":42,"title":43,"summary":44,"author":28},12,"2025-03-09","#Oxford #Reasoning #LLM #Tool Use","article_res/cover/d448e9b3617a0b5302e1bd10c438bca9.jpeg","article_res/cover/864a468f9cc4c9317efadb3811909888.jpeg","Agentic Reasoning Framework - Significantly enhance the reasoning ability of LLMs through the integration of external tools using agents","Agentic Reasoning: Reasoning LLMs with Tools for Deep Research",{"id":46,"publish_date":47,"is_original":4,"collection":48,"cover_url":49,"cover_url_1_1":50,"title":51,"summary":52,"author":53},480,"2023-04-14","#Stable Diffusion","article_res/cover/0bdbe7cb1de4a78e54536e5d9afa7ec9.jpeg","article_res/cover/b3d6ffec0608dcfaf18c5a69906d1490.jpeg","【AIGC Learning】Generate Prompts Using Word Graphs - Stable Diffusion Web UI Series 13","AI will become a powerful tool in education, transforming the way we learn and deliver instruction.  \n- Reid Hoffman","--",{"id":55,"publish_date":56,"is_original":4,"collection":57,"cover_url":58,"cover_url_1_1":59,"title":60,"summary":61,"author":28},413,"2023-09-08","#Neuroscience","article_res/cover/74f8302d78a23d9430f22171eae136b6.jpeg","article_res/cover/87ca08af81bb304746be5261160964c0.jpeg","Can machines be conscious?","Do we have an ethical obligation to not turn off conscious machines? Would turning them off be murder? No. I don't lose any sleep over unplugging a conscious machine.\n- Jeff Hawkins, \"A Thousand Brains\"",{"id":63,"publish_date":64,"is_original":23,"collection":65,"cover_url":66,"cover_url_1_1":67,"title":68,"summary":69,"author":28},178,"2024-09-09","#Entrepreneurship","article_res/cover/a7224f025b55d1820408085faef63079.jpeg","article_res/cover/11a9995b096cbf64465ef01b8673b154.jpeg","37signals company","This damn sense of relaxation",{"id":71,"publish_date":72,"is_original":4,"collection":73,"cover_url":74,"cover_url_1_1":75,"title":76,"summary":77,"author":78},460,"2023-05-12","#Google","article_res/cover/b970687b12faa52da976f91248c2aa7b.jpeg","article_res/cover/d1e71b52cfd2c63bc6e71f3e85ff135c.jpeg","Learn what BRC-20 and Ordinals are using Google Bard","Ordinals - a new protocol that allows users to store arbitrary data on the Bitcoin blockchain","Google Bard mainly writes",{"id":80,"publish_date":81,"is_original":23,"collection":5,"cover_url":82,"cover_url_1_1":83,"title":84,"summary":85,"author":28},309,"2024-03-26","article_res/cover/9877f95894ee88532d0e6012c23a2df3.jpeg","article_res/cover/20092164ddc109ce6ae56b1984246751.jpeg","Learning the Cancun Upgrade with lepton and perplexity","Building a quick conversation-based search demo with Lepton AI.",[87,95,103,111,119],{"id":88,"publish_date":89,"is_original":23,"collection":90,"cover_url":91,"cover_url_1_1":92,"title":93,"summary":94,"author":28},627,"2025-03-20","#AI Avatar #AI Video Generation","article_res/cover/d95481358f73924989f8c4ee9c75d1c8.jpeg","article_res/cover/b74bc0fab01f8b6a6aa87696c0c3ed8b.jpeg","DisPose: Generating Animated Videos by Driving Video with Reference Images","DisPose is a controllable human image animation method that enhances video generation.",{"id":96,"publish_date":97,"is_original":23,"collection":98,"cover_url":99,"cover_url_1_1":100,"title":101,"summary":102,"author":28},626,"2025-03-21","#Deep Dive into LLMs #LLM #RL #Andrej Karpathy #AlphaGo","article_res/cover/446553a5c8f8f2f07d97b20eaee84e56.jpeg","article_res/cover/e6c2823409c9b34624064b9acbaca6f1.jpeg","AlphaGo and the Power of Reinforcement Learning - Andrej Karpathy's Deep Dive on LLMs (Part 9)","Simply learning from humans will never surpass human capabilities.",{"id":104,"publish_date":105,"is_original":23,"collection":106,"cover_url":107,"cover_url_1_1":108,"title":109,"summary":110,"author":28},625,"2025-03-22","#Deep Dive into LLMs #LLM #RL #RLHF #Andrej Karpathy","article_res/cover/8da81d38b1e5cf558a164710fd8a5389.jpeg","article_res/cover/96f028d76c362a99a0dd56389e8f7a9b.jpeg","Reinforcement Learning from Human Feedback (RLHF) - Andrej Karpathy's Deep Dive on LLMs (Part 10)","Fine-Tuning Language Models from Human Preferences",{"id":112,"publish_date":113,"is_original":23,"collection":114,"cover_url":115,"cover_url_1_1":116,"title":117,"summary":118,"author":28},624,"2025-03-23","#Deep Dive into LLMs #LLM #Andrej Karpathy #AI Agent #MMM","article_res/cover/a5e7c3d48bb09109684d6513287c661d.jpeg","article_res/cover/d3f22b7c0ab8d82fd2da457a299e0773.jpeg","The Future of Large Language Models - Andrej Karpathy's In-Depth Explanation of LLM (Part 11)","preview of things to come",{"id":120,"publish_date":113,"is_original":23,"collection":121,"cover_url":122,"cover_url_1_1":123,"title":124,"summary":125,"author":28},623,"#Google #Voe #AI Video Generation","article_res/cover/c44062fea0f336c2b96b3928292392c2.jpeg","article_res/cover/a041041c69092ad3db191c5bf3ff981b.jpeg","Trial of Google's video generation model VOE2","Our state-of-the-art video generation model",[127,135,143],{"id":128,"publish_date":129,"is_original":23,"collection":130,"cover_url":131,"cover_url_1_1":132,"title":133,"summary":134,"author":28},300,"2024-04-16","#AI in Science #AGI","article_res/cover/6bf01e793e0f33e848572412eebdf9b0.jpeg","article_res/cover/91a5ee21dafecb914fabeb9430d46ec1.jpeg","Would Einstein lose his job - AI and Quantum Computing: A Glimpse into the Near Future","So Einstein's job is still safe.",{"id":136,"publish_date":137,"is_original":23,"collection":138,"cover_url":139,"cover_url_1_1":140,"title":141,"summary":142,"author":28},101,"2024-12-14","#Nvidia #AI 3D Generator","article_res/cover/693e07c85980c5c0c8fde3f037733f23.jpeg","article_res/cover/9ea8edff2d5d303ff3fffff3f6f9c3d9.jpeg","NVIDIA's open-source 3D project LLaMA-Mesh","LLaMA-Mesh: Unifying 3D Mesh Generation with Language Models",{"id":144,"publish_date":145,"is_original":23,"collection":146,"cover_url":147,"cover_url_1_1":148,"title":149,"summary":150,"author":28},131,"2024-11-10","#OpenAI","article_res/cover/87f8ed353ce39f31960e7cdfaf075a35.jpeg","article_res/cover/f597a63935f5cd32e484b4aadd6019e8.jpeg","ChatGPT has launched the Search function","Get fast, timely answers with links to relevant web sources.",{"big":152,"small":214},[153,181],{"title":154,"list":155},"AGENT",[156,157,165,173],{"id":112,"publish_date":113,"is_original":23,"collection":114,"cover_url":115,"cover_url_1_1":116,"title":117,"summary":118,"author":28},{"id":158,"publish_date":159,"is_original":23,"collection":160,"cover_url":161,"cover_url_1_1":162,"title":163,"summary":164,"author":28},622,"2025-03-24","#OWL #AI Agent #MAS #MCP #CUA","article_res/cover/cb50ca7f2bf4d1ed50202d7406e1c19a.jpeg","article_res/cover/4aa7aa3badfacf3cc84121334f1050dd.jpeg","OWL: Multi-agent collaboration","OWL: Optimized Workforce Learning for General Multi-Agent Assistance in Real-World Task Automation",{"id":166,"publish_date":167,"is_original":23,"collection":168,"cover_url":169,"cover_url_1_1":170,"title":171,"summary":172,"author":28},620,"2025-03-26","#LLM #Google #Gemini #AI Agent","article_res/cover/53751a6dbbe990b1eb0b63f3b062aed4.jpeg","article_res/cover/031344981f0a212ff82d1f3a64aa5756.jpeg","Gemini 2.5 Pro, claimed to be far ahead of the competition, has been released with great fanfare: comprehensively surpassing other LLMs and topping the global rankings","Gemini 2.5: Our most intelligent AI model",{"id":174,"publish_date":175,"is_original":23,"collection":176,"cover_url":177,"cover_url_1_1":178,"title":179,"summary":180,"author":28},616,"2025-03-29","#MAS #AI Agent #AI Coder #MetaGPT #MGX","article_res/cover/9dcd702ad2035902e5e77967c34a1f1e.jpeg","article_res/cover/0a97fc4a922753c8f46ff38792020df8.jpeg","MGX - An automated website-building platform composed of multiple AI Agents","Your 24/7 AI Team | Dream, Chat, Create.",{"title":182,"list":183},"OPENAI",[184,191,199,206],{"id":185,"publish_date":167,"is_original":23,"collection":186,"cover_url":187,"cover_url_1_1":188,"title":189,"summary":190,"author":28},619,"#OpenAI #AI Image Generator #4o #MMM #AR Transformer","article_res/cover/2faffc97fcecf3151552cb0fd3206d89.jpeg","article_res/cover/1133cb4948af44cee2e7fbe79efb69e5.jpeg","The native image function of GPT-4o is officially launched","Introducing 4o Image Generation",{"id":192,"publish_date":193,"is_original":4,"collection":194,"cover_url":195,"cover_url_1_1":196,"title":197,"summary":198,"author":28},434,"2023-07-15","#Anthropic #OpenAI #Google #AI Code Generator #Claude","article_res/cover/e1b6f600a2b9f262a4392684e5f2ce25.jpeg","article_res/cover/6e1772e83f78f9a351ab23d3e414adee.jpeg","Latest Updates on Google Bard /Anthropic Claude2 / ChatGPT Code Interpreter","We want our models to use their programming skills to provide more natural interfaces to the basic functions of our computers.  \n - OpenAI",{"id":200,"publish_date":201,"is_original":4,"collection":146,"cover_url":202,"cover_url_1_1":203,"title":204,"summary":205,"author":28},417,"2023-08-24","article_res/cover/bccf897d50a88b18364e35f7466387e0.jpeg","article_res/cover/2f871085c1073717c1703ae86e18056f.jpeg","The GPT-3.5 Turbo fine-tuning (fine-tuning function) has been released～","Developers can now bring their own data to customize GPT-3.5 Turbo for their use cases.",{"id":207,"publish_date":208,"is_original":4,"collection":209,"cover_url":210,"cover_url_1_1":211,"title":212,"summary":213,"author":28},407,"2023-09-22","#OpenAI #AI Image Generator","article_res/cover/c59005e903d35cfc32346e2756e2728a.jpeg","article_res/cover/ba011d265e6d84b5c8cb6fd6b757b6cc.jpeg","Dall-E 3","DALL·E 3 understands significantly more nuance and detail, allowing you to easily translate your ideas into images.",[215,221,241],{"title":10,"list":216},[217,218,219,220],{"id":96,"publish_date":97,"is_original":23,"collection":98,"cover_url":99,"cover_url_1_1":100,"title":101,"summary":102,"author":28},{"id":104,"publish_date":105,"is_original":23,"collection":106,"cover_url":107,"cover_url_1_1":108,"title":109,"summary":110,"author":28},{"id":112,"publish_date":113,"is_original":23,"collection":114,"cover_url":115,"cover_url_1_1":116,"title":117,"summary":118,"author":28},{"id":166,"publish_date":167,"is_original":23,"collection":168,"cover_url":169,"cover_url_1_1":170,"title":171,"summary":172,"author":28},{"title":222,"list":223},"GOOGLE",[224,225,226,234],{"id":120,"publish_date":113,"is_original":23,"collection":121,"cover_url":122,"cover_url_1_1":123,"title":124,"summary":125,"author":28},{"id":166,"publish_date":167,"is_original":23,"collection":168,"cover_url":169,"cover_url_1_1":170,"title":171,"summary":172,"author":28},{"id":227,"publish_date":228,"is_original":23,"collection":229,"cover_url":230,"cover_url_1_1":231,"title":232,"summary":233,"author":28},615,"2025-03-30","#AI Researcher #AI Science #HKU #Google #AI Agent","article_res/cover/21fadf906067714bb0db31ae13a77c15.jpeg","article_res/cover/2697999a72bd26b22e85f0e92936d3ed.jpeg","AI-Researcher: LLM-driven全自动 scientific research assistant","AI-Researcher: Fully-Automated Scientific Discovery with LLM Agents  \nOpen-Sourced Alternative to Google AI Co-Scientist",{"id":235,"publish_date":236,"is_original":23,"collection":73,"cover_url":237,"cover_url_1_1":238,"title":239,"summary":240,"author":28},463,"2023-05-09","article_res/cover/89800f207723acdb55fc53bf999ebdc9.jpeg","article_res/cover/5764f369b4accd8f83e94aa4c077a175.jpeg","The Smallville sandbox world - A town with 25 virtual residents","Believable proxies of human behavior can empower interactive apps: Immersive environment, Rehearsal space, Prototyping tool",{"title":242,"list":243},"NVIDIA",[],true,{"code":4,"msg":5,"data":246},{"id":247,"publish_date":248,"is_original":23,"collection":249,"articles_id":250,"cover_url":251,"cover_url_1_1":252,"title":253,"summary":254,"author":28,"content":255,"popular":256,"list":321,"category":377,"tag":378},454,"2023-05-23","#AI Audio Generator","dYYYAJnxPLTEznL3VIxIaQ","article_res/cover/1e70875d4849ffa4f5d888fb70dfa02f.jpeg","article_res/cover/b8cdd05f2b0e85ca053d0dedba60f57f.jpeg","【AIGC Learning】Bark Text-To-Speech(2) Generating Long Audio","📕 Long-form generation, voice consistency enhancements and other examples are now documented in a new notebooks section","\u003Cdiv class=\"rich_media_content js_underline_content\n                       autoTypeSetting24psection\n            \" id=\"js_content\">\u003Cp data-tool=\"mdnice编辑器\" style='margin-bottom: 0px;padding-top: 8px;padding-bottom: 8px;color: black;font-family: Optima-Regular, Optima, PingFangSC-light, PingFangTC-light, \"PingFang SC\", Cambria, Cochin, Georgia, Times, \"Times New Roman\", serif;font-size: 16px;letter-spacing: normal;text-align: left;white-space: normal;line-height: 26px;'>However, this tool originally could only generate audio clips no longer than 13 seconds. But they released a new version last month specifically designed for long audio production.\u003C/p>\u003Cp data-tool=\"mdnice编辑器\" style='margin-bottom: 0px;padding-top: 8px;padding-bottom: 8px;color: black;font-family: Optima-Regular, Optima, PingFangSC-light, PingFangTC-light, \"PingFang SC\", Cambria, Cochin, Georgia, Times, \"Times New Roman\", serif;font-size: 16px;letter-spacing: normal;text-align: left;white-space: normal;line-height: 26px;'>\u003Cspan style=\"letter-spacing: 0px;\">https://github.com/suno-ai/bark/blob/main/notebooks/long_form_generation.ipynb\u003C/span>\u003C/p>\u003Cp data-tool=\"mdnice编辑器\" style='margin-bottom: 0px;padding-top: 8px;padding-bottom: 8px;color: black;font-family: Optima-Regular, Optima, PingFangSC-light, PingFangTC-light, \"PingFang SC\", Cambria, Cochin, Georgia, Times, \"Times New Roman\", serif;font-size: 16px;letter-spacing: normal;text-align: left;white-space: normal;line-height: 26px;'>Before we begin, we also need to download the relevant environment first.\u003C/p>\u003Cpre data-tool=\"mdnice编辑器\" style=\"margin-top: 10px;margin-bottom: 10px;color: rgb(0, 0, 0);font-size: 16px;letter-spacing: normal;text-align: left;border-radius: 5px;box-shadow: rgba(0, 0, 0, 0.55) 0px 2px 10px;\">\u003Cspan style='margin-bottom: -7px;display: block;background: url(\"./assets/17434960258880.5213815918277045.svg\") 10px 10px / 40px no-repeat rgb(40, 44, 52);height: 30px;width: 558px;border-radius: 5px;'>\u003C/span>\u003Ccode style='padding: 15px 16px 16px;overflow-x: auto;color: rgb(171, 178, 191);display: -webkit-box;font-family: \"Operator Mono\", Consolas, Monaco, Menlo, monospace;font-size: 12px;background: rgb(40, 44, 52);border-radius: 5px;'>\u003Cspan style=\"color: rgb(92, 99, 112);font-style: italic;line-height: 26px;\">#@title Install Environment - Must run regardless of what type of audio you are producing.\u003C/span>\u003Cbr>! pip install git+https://github.com/suno-ai/bark.git\u003Cbr>\u003Cbr>\u003Cspan style=\"color: rgb(198, 120, 221);line-height: 26px;\">from\u003C/span> bark \u003Cspan style=\"color: rgb(198, 120, 221);line-height: 26px;\">import\u003C/span> SAMPLE_RATE, generate_audio, preload_models\u003Cbr>\u003Cspan style=\"color: rgb(198, 120, 221);line-height: 26px;\">from\u003C/span> IPython.display \u003Cspan style=\"color: rgb(198, 120, 221);line-height: 26px;\">import\u003C/span> Audio\u003Cbr>\u003Cbr>\u003Cspan style=\"color: rgb(198, 120, 221);line-height: 26px;\">import\u003C/span> os\u003Cbr>\u003Cspan style=\"color: rgb(198, 120, 221);line-height: 26px;\">import\u003C/span> nltk\u003Cbr>nltk.download(\u003Cspan style=\"color: rgb(152, 195, 121);line-height: 26px;\">'punkt'\u003C/span>)\u003Cbr>\u003Cbr>os.environ[\u003Cspan style=\"color: rgb(152, 195, 121);line-height: 26px;\">\"CUDA_VISIBLE_DEVICES\"\u003C/span>] = \u003Cspan style=\"color: rgb(152, 195, 121);line-height: 26px;\">\"0\"\u003C/span>\u003Cbr>\u003Cspan style=\"color: rgb(198, 120, 221);line-height: 26px;\">import\u003C/span> nltk  \u003Cspan style=\"color: rgb(92, 99, 112);font-style: italic;line-height: 26px;\"># we'll use this to split into sentences\u003C/span>\u003Cbr>\u003Cspan style=\"color: rgb(198, 120, 221);line-height: 26px;\">import\u003C/span> numpy \u003Cspan style=\"color: rgb(198, 120, 221);line-height: 26px;\">as\u003C/span> np\u003Cbr>\u003Cbr>\u003Cspan style=\"color: rgb(198, 120, 221);line-height: 26px;\">from\u003C/span> bark.generation \u003Cspan style=\"color: rgb(198, 120, 221);line-height: 26px;\">import\u003C/span> (\u003Cbr>    generate_text_semantic,\u003Cbr>    preload_models,\u003Cbr>)\u003Cbr>\u003Cspan style=\"color: rgb(198, 120, 221);line-height: 26px;\">from\u003C/span> bark.api \u003Cspan style=\"color: rgb(198, 120, 221);line-height: 26px;\">import\u003C/span> semantic_to_waveform\u003Cbr>\u003Cbr>preload_models()\u003Cbr>\u003C/code>\u003C/pre>\u003Cp data-tool=\"mdnice编辑器\" style='margin-bottom: 0px;padding-top: 8px;padding-bottom: 8px;color: black;font-family: Optima-Regular, Optima, PingFangSC-light, PingFangTC-light, \"PingFang SC\", Cambria, Cochin, Georgia, Times, \"Times New Roman\", serif;font-size: 16px;letter-spacing: normal;text-align: left;white-space: normal;line-height: 26px;'>I tried some long-form examples:\u003C/p>\u003Cpre data-tool=\"mdnice编辑器\" style=\"margin-top: 10px;margin-bottom: 10px;color: rgb(0, 0, 0);font-size: 16px;letter-spacing: normal;text-align: left;border-radius: 5px;box-shadow: rgba(0, 0, 0, 0.55) 0px 2px 10px;\">\u003Cspan style='margin-bottom: -7px;display: block;background: url(\"./assets/17434960258880.5213815918277045.svg\") 10px 10px / 40px no-repeat rgb(40, 44, 52);height: 30px;width: 558px;border-radius: 5px;'>\u003C/span>\u003Ccode style='padding: 15px 16px 16px;overflow-x: auto;color: rgb(171, 178, 191);display: -webkit-box;font-family: \"Operator Mono\", Consolas, Monaco, Menlo, monospace;font-size: 12px;background: rgb(40, 44, 52);border-radius: 5px;'>\u003Cspan style=\"color: rgb(92, 99, 112);font-style: italic;line-height: 26px;\">#@title Generating long audio\u003C/span>\u003Cbr>\u003Cbr>speaker = \u003Cspan style=\"color: rgb(152, 195, 121);line-height: 26px;\">\"v2/en_speaker_6\"\u003C/span>\u003Cbr>\u003Cbr>script = \u003Cspan style=\"color: rgb(152, 195, 121);line-height: 26px;\">\"\"\"\u003Cbr>Hey, have you heard about this new text-to-audio model called \"Bark\"? \u003Cbr>Apparently, it's the most realistic and natural-sounding text-to-audio model \u003Cbr>out there right now. People are saying it sounds just like a real person speaking. \u003Cbr>I think it uses advanced machine learning algorithms to analyze and understand the \u003Cbr>nuances of human speech, and then replicates those nuances in its own speech output. \u003Cbr>It's pretty impressive, and I bet it could be used for things like audiobooks or podcasts. \u003Cbr>In fact, I heard that some publishers are already starting to use Bark to create audiobooks. \u003Cbr>It would be like having your own personal voiceover artist. I really think Bark is going to \u003Cbr>be a game-changer in the world of text-to-audio technology! [end]\u003Cbr>\"\"\"\u003C/span>.replace(\u003Cspan style=\"color: rgb(152, 195, 121);line-height: 26px;\">\"\\n\"\u003C/span>, \u003Cspan style=\"color: rgb(152, 195, 121);line-height: 26px;\">\" \"\u003C/span>).strip()\u003Cbr>\u003Cbr>sentences = nltk.sent_tokenize(script)\u003Cbr>\u003Cbr>GEN_TEMP = \u003Cspan style=\"color: rgb(209, 154, 102);line-height: 26px;\">0.6\u003C/span>\u003Cbr>\u003Cbr>silence = np.zeros(int(\u003Cspan style=\"color: rgb(209, 154, 102);line-height: 26px;\">0.1\u003C/span> * SAMPLE_RATE)) \u003Cbr>\u003Cbr>pieces = []\u003Cbr>\u003Cspan style=\"color: rgb(198, 120, 221);line-height: 26px;\">for\u003C/span> sentence \u003Cspan style=\"color: rgb(198, 120, 221);line-height: 26px;\">in\u003C/span> sentences:\u003Cbr>    semantic_tokens = generate_text_semantic(\u003Cbr>        sentence,\u003Cbr>        history_prompt=speaker,\u003Cbr>        temp=GEN_TEMP,\u003Cbr>        min_eos_p=\u003Cspan style=\"color: rgb(209, 154, 102);line-height: 26px;\">0.05\u003C/span>, \u003Cbr>    )\u003Cbr>\u003Cbr>    audio_array = semantic_to_waveform(semantic_tokens, history_prompt=speaker,)\u003Cbr>    pieces += [audio_array, silence.copy()]\u003Cbr>\u003Cbr>Audio(np.concatenate(pieces), rate=SAMPLE_RATE)\u003Cbr>\u003C/code>\u003C/pre>\u003Cp data-tool=\"mdnice编辑器\" style='margin-bottom: 0px;padding-top: 8px;padding-bottom: 8px;color: black;font-family: Optima-Regular, Optima, PingFangSC-light, PingFangTC-light, \"PingFang SC\", Cambria, Cochin, Georgia, Times, \"Times New Roman\", serif;font-size: 16px;letter-spacing: normal;text-align: left;white-space: normal;line-height: 26px;'>This is the audio effect:\u003C/p>\u003Csection>\u003Cmpvoice class=\"js_editor_audio res_iframe js_uneditable custom_select_card\" src=\"/cgi-bin/readtemplate?t=tmpl/audio_tmpl&amp;name=bark%20long%20script&amp;play_length=01:05\" isaac2=\"1\" low_size=\"120.9\" source_size=\"120.9\" high_size=\"257.67\" name=\"bark long script\" play_length=\"65000\" voice_encode_fileid=\"MzkwOTMzMzk0MV8yMjQ3NDg1MjY2\" data-topic_id=\"\" data-topic_name=\"\" data-pluginname=\"insertaudio\" data-trans_state=\"1\" data-verify_state=\"3\">\u003C/mpvoice>\u003C/section>\u003Cp data-tool=\"mdnice编辑器\" style='margin-bottom: 0px;padding-top: 8px;padding-bottom: 8px;color: black;font-family: Optima-Regular, Optima, PingFangSC-light, PingFangTC-light, \"PingFang SC\", Cambria, Cochin, Georgia, Times, \"Times New Roman\", serif;font-size: 16px;letter-spacing: normal;text-align: left;white-space: normal;line-height: 26px;'>We can also generate long conversations:\u003C/p>\u003Cpre data-tool=\"mdnice编辑器\" style=\"margin-top: 10px;margin-bottom: 10px;color: rgb(0, 0, 0);font-size: 16px;letter-spacing: normal;text-align: left;border-radius: 5px;box-shadow: rgba(0, 0, 0, 0.55) 0px 2px 10px;\">\u003Cspan style='margin-bottom: -7px;display: block;background: url(\"./assets/17434960258880.5213815918277045.svg\") 10px 10px / 40px no-repeat rgb(40, 44, 52);height: 30px;width: 558px;border-radius: 5px;'>\u003C/span>\u003Ccode style='padding: 15px 16px 16px;overflow-x: auto;color: rgb(171, 178, 191);display: -webkit-box;font-family: \"Operator Mono\", Consolas, Monaco, Menlo, monospace;font-size: 12px;background: rgb(40, 44, 52);border-radius: 5px;'>\u003Cspan style=\"color: rgb(92, 99, 112);font-style: italic;line-height: 26px;\">#@title Generating long conversations\u003C/span>\u003Cbr>\u003Cbr>speaker_lookup = {\u003Cspan style=\"color: rgb(152, 195, 121);line-height: 26px;\">\"Samantha\"\u003C/span>: \u003Cspan style=\"color: rgb(152, 195, 121);line-height: 26px;\">\"v2/en_speaker_9\"\u003C/span>, \u003Cspan style=\"color: rgb(152, 195, 121);line-height: 26px;\">\"John\"\u003C/span>: \u003Cspan style=\"color: rgb(152, 195, 121);line-height: 26px;\">\"v2/en_speaker_6\"\u003C/span>}\u003Cbr>\u003Cbr>script = \u003Cspan style=\"color: rgb(152, 195, 121);line-height: 26px;\">\"\"\"\u003Cbr>Samantha: Hey, have you heard about this new text-to-audio model called \"Bark\"?\u003Cbr>John: No, I haven't. What's so special about it?\u003Cbr>Samantha: Well, apparently it's the most realistic and natural-sounding text-to-audio model out there right now. People are saying it sounds just like a real person speaking.\u003Cbr>John: Wow, that sounds amazing. How does it work?\u003Cbr>Samantha: I think it uses advanced machine learning algorithms to analyze and understand the nuances of human speech, and then replicates those nuances in its own speech output.\u003Cbr>John: That's pretty impressive. Do you think it could be used for things like audiobooks or podcasts?\u003Cbr>Samantha: Definitely! In fact, I heard that some publishers are already starting to use Bark to create audiobooks. And I bet it would be great for podcasts too.\u003Cbr>John: I can imagine. It would be like having your own personal voiceover artist.\u003Cbr>Samantha: Exactly! I think Bark is going to be a game-changer in the world of text-to-audio technology.\"\"\"\u003C/span>\u003Cbr>script = script.strip().split(\u003Cspan style=\"color: rgb(152, 195, 121);line-height: 26px;\">\"\\n\"\u003C/span>)\u003Cbr>script = [s.strip() \u003Cspan style=\"color: rgb(198, 120, 221);line-height: 26px;\">for\u003C/span> s \u003Cspan style=\"color: rgb(198, 120, 221);line-height: 26px;\">in\u003C/span> script \u003Cspan style=\"color: rgb(198, 120, 221);line-height: 26px;\">if\u003C/span> s]\u003Cbr>script\u003Cbr>\u003Cbr>pieces = []\u003Cbr>silence = np.zeros(int(\u003Cspan style=\"color: rgb(209, 154, 102);line-height: 26px;\">0.1\u003C/span>*SAMPLE_RATE))\u003Cbr>\u003Cspan style=\"color: rgb(198, 120, 221);line-height: 26px;\">for\u003C/span> line \u003Cspan style=\"color: rgb(198, 120, 221);line-height: 26px;\">in\u003C/span> script:\u003Cbr>    speaker, text = line.split(\u003Cspan style=\"color: rgb(152, 195, 121);line-height: 26px;\">\": \"\u003C/span>)\u003Cbr>    audio_array = generate_audio(text, history_prompt=speaker_lookup[speaker], )\u003Cbr>    pieces += [audio_array, silence.copy()]\u003Cbr>\u003Cbr>Audio(np.concatenate(pieces), rate=SAMPLE_RATE)\u003Cbr>\u003C/code>\u003C/pre>\u003Cp data-tool=\"mdnice编辑器\" style='margin-bottom: 0px;padding-top: 8px;padding-bottom: 8px;color: black;font-family: Optima-Regular, Optima, PingFangSC-light, PingFangTC-light, \"PingFang SC\", Cambria, Cochin, Georgia, Times, \"Times New Roman\", serif;font-size: 16px;letter-spacing: normal;text-align: left;white-space: normal;line-height: 26px;'>This is the audio effect:\u003C/p>\u003Csection>\u003Cmpvoice class=\"js_editor_audio res_iframe js_uneditable custom_select_card\" src=\"/cgi-bin/readtemplate?t=tmpl/audio_tmpl&amp;name=bark%20conversation&amp;play_length=01:21\" isaac2=\"1\" low_size=\"152.42\" source_size=\"152.4\" high_size=\"318.04\" name=\"bark conversation\" play_length=\"81000\" voice_encode_fileid=\"MzkwOTMzMzk0MV8yMjQ3NDg1MjY3\" data-topic_id=\"\" data-topic_name=\"\" data-pluginname=\"insertaudio\" data-trans_state=\"1\" data-verify_state=\"3\">\u003C/mpvoice>\u003C/section>\u003Cp data-tool=\"mdnice编辑器\" style='margin-bottom: 0px;padding-top: 8px;padding-bottom: 8px;color: black;font-family: Optima-Regular, Optima, PingFangSC-light, PingFangTC-light, \"PingFang SC\", Cambria, Cochin, Georgia, Times, \"Times New Roman\", serif;font-size: 16px;letter-spacing: normal;text-align: left;white-space: normal;line-height: 26px;'>Supported sound effects:\u003C/p>\u003Cul data-tool=\"mdnice编辑器\" class=\"list-paddingleft-1\" style='margin-top: 8px;margin-bottom: 8px;padding-left: 25px;width: 557.438px;color: black;font-family: Optima-Regular, Optima, PingFangSC-light, PingFangTC-light, \"PingFang SC\", Cambria, Cochin, Georgia, Times, \"Times New Roman\", serif;font-size: 16px;letter-spacing: normal;text-align: left;white-space: normal;'>\u003Cli>\u003Csection style=\"margin-top: 5px;margin-bottom: 5px;line-height: 26px;color: rgb(1, 1, 1);\">[laughter]，[laughs]，[sighs]，[music]，[gasps]，[clears throat]\u003C/section>\u003C/li>\u003Cli>\u003Csection style=\"margin-top: 5px;margin-bottom: 5px;line-height: 26px;color: rgb(1, 1, 1);\">— or ... for hesitations\u003C/section>\u003C/li>\u003Cli>\u003Csection style=\"margin-top: 5px;margin-bottom: 5px;line-height: 26px;color: rgb(1, 1, 1);\">♪ for song lyrics\u003C/section>\u003C/li>\u003Cli>\u003Csection style=\"margin-top: 5px;margin-bottom: 5px;line-height: 26px;color: rgb(1, 1, 1);\">CAPITALIZATION for emphasis of a word\u003C/section>\u003C/li>\u003Cli>\u003Csection style=\"margin-top: 5px;margin-bottom: 5px;line-height: 26px;color: rgb(1, 1, 1);\">[MAN] and [WOMAN]\u003C/section>\u003C/li>\u003C/ul>\u003Cp data-tool=\"mdnice编辑器\" style='margin-bottom: 0px;padding-top: 8px;padding-bottom: 8px;color: black;font-family: Optima-Regular, Optima, PingFangSC-light, PingFangTC-light, \"PingFang SC\", Cambria, Cochin, Georgia, Times, \"Times New Roman\", serif;font-size: 16px;letter-spacing: normal;text-align: left;white-space: normal;line-height: 26px;'>You can also modify the language and voice:\u003C/p>\u003Cp data-tool=\"mdnice编辑器\" style='margin-bottom: 0px;padding-top: 8px;padding-bottom: 8px;color: black;font-family: Optima-Regular, Optima, PingFangSC-light, PingFangTC-light, \"PingFang SC\", Cambria, Cochin, Georgia, Times, \"Times New Roman\", serif;font-size: 16px;letter-spacing: normal;text-align: left;white-space: normal;line-height: 26px;'>All have yielded good results, and they are under the MIT license, which is business-friendly for commercial use～\u003C/p>\u003Cp style=\"display: none;\">\u003Cmp-style-type data-value=\"3\">\u003C/mp-style-type>\u003C/p>\u003C/div>",[257,266,274,282,290,298,306,313],{"id":258,"title_md5":259,"publish_date":260,"author_md5":261,"is_original":23,"collection":262,"summary_md5":263,"cover_url":264,"cover_url_1_1":265},205,"68cfbb38bc5bc0fe0de8a3449522ba3a","2024-08-03","bc27fa490c4d0d525bac812fc0793534","#Prompt Engineering #Nature #Research","65714bda1cad1a317992c3ad58f0f1fe","article_res/cover/2cc284608cd4a665b016ef5a48a21194.jpeg","article_res/cover/43f34dc7688b84136e5db6fde3662937.jpeg",{"id":267,"title_md5":268,"publish_date":269,"author_md5":261,"is_original":4,"collection":270,"summary_md5":271,"cover_url":272,"cover_url_1_1":273},270,"32ea6bbe9aaaa7661a244726d3069bb3","2024-05-20","#AI Agent","554eb3e287a5edf99b36a70f58c04c0a","article_res/cover/df3dfd94230da278a801bb28d27ae25b.jpeg","article_res/cover/377a030c5b17b3ad7fe9125d9b3346e6.jpeg",{"id":275,"title_md5":276,"publish_date":277,"author_md5":278,"is_original":4,"collection":5,"summary_md5":279,"cover_url":280,"cover_url_1_1":281},554,"5c5ca223c42ba689bf3130ab1b859e9e","2022-05-02","70997a2931a60561e615f5171df5f9a5","20d4fd7a8a95643eafcb19d8476fa89e","article_res/cover/5e0e1b6c5a43cc8e35ce6e45e8250f50.jpeg","article_res/cover/fbbab82bf840d89770767f59c7dd43b7.jpeg",{"id":283,"title_md5":284,"publish_date":285,"author_md5":261,"is_original":23,"collection":286,"summary_md5":287,"cover_url":288,"cover_url_1_1":289},111,"4d30c2782ffe1cd1d2d4930d3922cdcd","2024-12-04","#AI Code Generator","551fd817e5b5de2b5df09154dae3ed13","article_res/cover/0e0b713e5d196fc895a6be2fc5ea76ed.jpeg","article_res/cover/6195f5450ab450d5cb5d33fd649dd770.jpeg",{"id":291,"title_md5":292,"publish_date":293,"author_md5":294,"is_original":4,"collection":5,"summary_md5":295,"cover_url":296,"cover_url_1_1":297},598,"ccefbb37d14339b2167b7e38646e4faf","2022-03-19","8b3607d0f4181a3cb6ffdccf7185f09b","f4486bc5ab843101ef9327e41afc7967","article_res/cover/c0b3c15d1af9917e4888e30976e49606.jpeg","article_res/cover/9812ac9f3a9898718353dda47d933a29.jpeg",{"id":299,"title_md5":300,"publish_date":301,"author_md5":261,"is_original":23,"collection":302,"summary_md5":303,"cover_url":304,"cover_url_1_1":305},250,"4b1f4ea79f9a2fc09e0215ab9f734403","2024-06-10","#Buffett","5d486a61280ae734954903488db589a5","article_res/cover/c9692e2e7fee823ceb6e502de7b605a3.jpeg","article_res/cover/1e32882d197c58725ec0d28c0bf797ad.jpeg",{"id":307,"title_md5":308,"publish_date":309,"author_md5":261,"is_original":23,"collection":286,"summary_md5":310,"cover_url":311,"cover_url_1_1":312},132,"72360ca016a2d73c79a994732a6c9985","2024-11-09","a9784420ab50b718dc3fe1ca40c467f8","article_res/cover/f331019b22da4c731e5cbb950f2151cf.jpeg","article_res/cover/e0236f165f8989e216a34876d6afead7.jpeg",{"id":314,"title_md5":315,"publish_date":316,"author_md5":261,"is_original":23,"collection":317,"summary_md5":318,"cover_url":319,"cover_url_1_1":320},127,"980f31d18e225c9d65278075f5db1207","2024-11-14","#Google #AI Game #World Model #AI Story","87de00b51aa83516eaa2eac7df1d322c","article_res/cover/0233a875b7ec2debf59779e311547569.jpeg","article_res/cover/6ffddb6ae4914b3c699493311aa9f198.jpeg",{"related":322,"small":362},[323,331,338,346,354],{"id":324,"publish_date":325,"is_original":4,"collection":5,"cover_url":326,"cover_url_1_1":327,"title":328,"summary":329,"author":330},604,"2022-03-13","article_res/cover/b1e7e12d55932a445e91d45f896c486a.jpeg","article_res/cover/0c07557158250cca3a12a1ea1b9d9a48.jpeg","How to read financial statements - CF Statement of Cash Flows","Why focus on cash flows? Because a share of stock is a","Course notes",{"id":332,"publish_date":333,"is_original":4,"collection":146,"cover_url":334,"cover_url_1_1":335,"title":336,"summary":337,"author":28},382,"2023-11-10","article_res/cover/f3614fc55023f05303030c499936e0f3.jpeg","article_res/cover/63d26a9fb3be7c181f32c9c9f630fd4b.jpeg","GPTs Experience (Upper Chapter)","You can now create custom versions of ChatGPT that combine instructions, extra knowledge, and any combination of skills.",{"id":339,"publish_date":340,"is_original":23,"collection":341,"cover_url":342,"cover_url_1_1":343,"title":344,"summary":345,"author":28},466,"2023-05-06","#LLM","article_res/cover/aac8df76a76b1290258d2661a57ce8c0.jpeg","article_res/cover/ce25a2edb9fbec73f6af894d85173982.jpeg","LangChain Reads PDFs (Part I)","Artificial intelligence is not a separate entity from us, but a reflection of our own mind. \n-《Impromptu》",{"id":347,"publish_date":348,"is_original":23,"collection":349,"cover_url":350,"cover_url_1_1":351,"title":352,"summary":353,"author":28},243,"2024-06-17","#AI Avatar #Tencent","article_res/cover/18411086f214e950ca1ad80957d15d52.jpeg","article_res/cover/fa639bdf4a5ba7330027539519841b0c.jpeg","Two models from Tencent that make Avatars talk: V-Express and MuseTalk","V-Express aims to generate a talking head video under the control of a reference image and an audio.",{"id":355,"publish_date":356,"is_original":23,"collection":357,"cover_url":358,"cover_url_1_1":359,"title":360,"summary":361,"author":28},121,"2024-11-23","#AI Avatar #Alibaba","article_res/cover/454b11e6d0ae30c7908f91f72da1aad5.jpeg","article_res/cover/f4d4b8d4705c488aabfc335f36546c7c.jpeg","Alibaba releases EchoMimic_V2, a half-body digital human","Towards Striking, Simplified, and Semi-Body Human Animation",[363,369,375],{"title":10,"list":364},[365,366,367,368],{"id":96,"publish_date":97,"is_original":23,"collection":98,"cover_url":99,"cover_url_1_1":100,"title":101,"summary":102,"author":28},{"id":104,"publish_date":105,"is_original":23,"collection":106,"cover_url":107,"cover_url_1_1":108,"title":109,"summary":110,"author":28},{"id":112,"publish_date":113,"is_original":23,"collection":114,"cover_url":115,"cover_url_1_1":116,"title":117,"summary":118,"author":28},{"id":166,"publish_date":167,"is_original":23,"collection":168,"cover_url":169,"cover_url_1_1":170,"title":171,"summary":172,"author":28},{"title":222,"list":370},[371,372,373,374],{"id":120,"publish_date":113,"is_original":23,"collection":121,"cover_url":122,"cover_url_1_1":123,"title":124,"summary":125,"author":28},{"id":166,"publish_date":167,"is_original":23,"collection":168,"cover_url":169,"cover_url_1_1":170,"title":171,"summary":172,"author":28},{"id":227,"publish_date":228,"is_original":23,"collection":229,"cover_url":230,"cover_url_1_1":231,"title":232,"summary":233,"author":28},{"id":235,"publish_date":236,"is_original":23,"collection":73,"cover_url":237,"cover_url_1_1":238,"title":239,"summary":240,"author":28},{"title":242,"list":376},[],[8,9,10],[8,12,13,14,9,10,15,16,17,18],["Reactive",245],1754646411073]