Alibaba DAMO Academy Creates World’s Largest AI Pre-Training Model, With Parameters Far Exceeding Those of Google and Microsoft
On Monday, Alibaba DAMO Academy announced the latest version of its multi-modal large model M6, whose parameter count has jumped from 1 trillion to 10 trillion, far exceeding the trillion-parameter models previously released by Google and Microsoft and making it the world’s largest AI pre-training model.
According to the company, M6 has achieved industry-leading low carbon emissions and high efficiency, using 512 GPUs to train a usable 10-trillion-parameter model within 10 days. Compared with GPT-3, a large model released last year, M6 achieves the same parameter scale while consuming only 1% of its energy.
M6 is a general-purpose AI model developed by DAMO Academy with multi-modal and multi-task capabilities. Its cognitive and creative abilities surpass those of traditional AI, and it is especially good at design, writing and Q&A. It can be applied widely across fields such as e-commerce, manufacturing, literature and art, and scientific research. Compared with traditional AI, the large model has hundreds or thousands of times as many “neurons” and is pre-trained on vast amounts of data, giving it a human-like ability to draw inferences about new cases from a single example.
According to Alibaba, as the first commercialized multi-modal large model in China, M6 has been applied in over 40 scenarios, with a daily call volume in the hundreds of millions.
At the same time, DAMO Academy has also launched MUGE, currently the largest Chinese multi-modal evaluation dataset, which covers image captioning, text-to-image generation and cross-modal retrieval tasks, filling the gap caused by the lack of authoritative Chinese evaluation benchmarks.
Zhou Jingren, Head of the Data Analytics and Intelligence Lab at DAMO Academy, said, “Next, we will deeply study the cognitive mechanisms of the brain and strive to bring the cognitive ability of M6 close to the human level. For example, we will build the underlying framework of general AI algorithms by simulating the way humans extract and understand cross-modal knowledge. At the same time, we will continue to enhance M6’s creativity in different scenarios so that it delivers outstanding application value.”