[{"_1":2,"_548":-5,"_549":-5},"loaderData",{"_3":4,"_312":313},"root",{"_5":-5,"_6":7,"_8":9,"_16":17,"_306":307},"user","language","en","languageConfig",{"_10":7,"_11":12,"_13":14,"_15":-5},"code","name","English","dir","ltr","subdomain","translations",{"_18":19,"_30":31,"_56":57,"_76":77,"_28":100,"_127":128,"_139":140,"_92":162,"_170":171,"_82":176,"_198":199,"_22":204},"header",{"_20":21,"_22":23,"_24":25,"_26":27,"_28":29},"home","Home","about","About","signIn","Sign in","signOut","Sign out","search","Search","footer",{"_32":33,"_34":35,"_36":37,"_38":39,"_40":41,"_42":43,"_44":45,"_46":47,"_48":49,"_50":51,"_52":53,"_54":55},"tagline","Everything about China's Innovation","description","Pandaily is a tech media based in Beijing. Our mission is to deliver premium content and contextual insights on China's technology scene to the worldwide tech community.","aboutUs","About Us","joinUs","Join Us","contactUs","Contact Us","writeForUs","Write for Us","donateToUs","Donate To Us","partnership","Partnership","trade","Trade","techBuzzChina","TechBuzz China","backToTop","Back to top","copyright","© 2017 - {{year}} Pandaily. 
All rights reserved.","categories",{"_58":59,"_60":61,"_62":63,"_64":65,"_66":67,"_68":69,"_70":71,"_72":73,"_74":75},"news","News","industry","Industry","startups","Startups","ai","AI","culture","Culture","market","Market","gadgets","Gadgets","auto","Auto","gaming","Gaming","common",{"_78":79,"_80":81,"_82":83,"_84":85,"_86":87,"_88":89,"_90":91,"_92":93,"_94":95,"_96":97,"_98":99},"readMore","Read more","loading","Loading...","error","Error","notFound","Not found","goBack","Go back","share","Share","enterHere","Enter here","posts","Posts","previous","Previous","next","Next","minRead","min read",{"_101":102,"_103":104,"_105":106,"_107":108,"_109":110,"_119":120,"_121":122,"_123":124,"_125":126},"placeholder","Search articles, categories, tags...","searching","Searching...","close","Close search","tipsTitle","Search Tips:","tips",{"_111":112,"_113":114,"_115":116,"_117":118},"autoSearch","Search is performed automatically as you type","exactPhrase","Use quotes for exact phrases: \"artificial intelligence\"","searchScope","Search works across article titles, content, categories, and tags","closeShortcut","to close","noResults","No results found for \"{{query}}\"","noResultsHint","Try adjusting your search terms or browse our categories","resultsCount","Found {{count}} result for \"{{query}}\"","resultsCount_plural","Found {{count}} results for \"{{query}}\"","category",{"_129":130,"_131":132,"_133":134,"_135":136,"_137":138},"title","Category","showing","Showing {{count}} of {{total}} posts in this category","noPosts","No posts found in this category","noPostsDescription","This category doesn't have any published posts yet.","browseAllPosts","Browse All Posts","homepage",{"_141":142,"_143":144,"_145":146,"_147":148,"_149":150,"_151":152,"_153":154,"_155":156},"featuredStory","Featured Story","featuredNews","Featured News","exploreByCategory","Explore by Category","latestNews","Latest News","exploreAllNews","Explore All News","noMorePosts","No more posts to 
load","loadingMore","Loading more news...","newsletter",{"_157":158,"_34":159,"_160":161},"stayUpdated","Stay Updated","Get the latest China tech news delivered to your inbox","subscribe","Subscribe to Newsletter",{"_163":164,"_131":165,"_133":166,"_135":167,"_94":95,"_96":97,"_168":169},"allPosts","All Posts","Showing {{count}} of {{total}} posts","No posts found","Check back later for new content.","backToAllPosts","Back to All Posts","tag",{"_129":172,"_131":173,"_133":174,"_135":175},"Tag","Showing {{count}} of {{total}} posts with this tag","No posts with this tag","This tag does not have any published posts yet.",{"_177":178,"_182":183,"_186":187,"_190":191,"_192":193,"_194":195,"_196":197},"404",{"_129":179,"_180":181},"Page Not Found","message","The page you're looking for doesn't exist or has been moved. Let's get you back on track!","500",{"_129":184,"_180":185},"Server Error","Our servers are having a moment. Our team has been notified and is working to fix this.","general",{"_129":188,"_180":189},"Oops! Something went wrong","We're sorry, but something unexpected happened. Please try again.","backToHome","Back to Home","tryAgain","Try Again","funTitle","Don't worry, this happens to the best of us!","funMessage","While you're here, why not explore our latest articles on China's tech scene? We have amazing insights waiting for you on our homepage.","meta",{"_129":200,"_34":201,"_202":203},"Pandaily - China Tech News, AI & Electric Vehicle Insights","Premier English-language source for Chinese technology news, AI breakthroughs, and electric vehicle developments. 
Deep insights from Beijing's tech landscape for the global community.","keywords","China tech news, Chinese technology, AI news China, electric vehicles China, Chinese startups, fintech China, Pandaily, TechBuzz China podcast",{"_198":205,"_209":210,"_220":221,"_234":235,"_281":282,"_298":299},{"_129":206,"_34":207,"_202":208},"About Pandaily - Premier China Tech News & Insights","Learn about Pandaily, Beijing's premier English-language media company delivering contextual insights on Chinese technology, business, and innovation to the global community.","Pandaily, China tech news, Chinese technology, TechBuzz China podcast, DecodeChina, Pandata, China business insights","hero",{"_129":211,"_212":213,"_214":215,"_216":217,"_218":219},"About Pandaily","subtitle","Beijing's premier English-language media company delivering contextual insights on Chinese technology, business, and innovation to the global community.","location","Beijing, China","globalAudience","Global Audience","millionsReached","Millions Reached","whoWeAre",{"_129":222,"_34":223,"_224":225},"Who We Are","Pandaily is a Beijing-based media company equipped with a deep understanding of China's technology landscape and the unicorns that drive its innovation. 
Our mission is to deliver premium content with contextual insights on Chinese technology, business, sports, and culture to the worldwide community.","stats",{"_226":227,"_228":229,"_230":231,"_232":233},"productLines","Product Lines","reach","Reach","podcast","Podcast","events","Events","whatWeDo",{"_129":236,"_212":237,"_238":239,"_252":253,"_267":268},"What We Do","Pandaily operates three core product lines designed to bridge the gap between China's dynamic tech ecosystem and the global community.","onlineContent",{"_129":240,"_241":242,"_230":245,"_248":249},"Online English Content","pandaily",{"_129":243,"_34":244},"Pandaily.com","Our website publishes English content on industrial insights, tech company moves, product reviews, and cultural pieces with a focus on North American and Asian readers.",{"_129":246,"_34":247},"TechBuzz China Podcast","Weekly insights from China experts Rui Ma & Ying-Ying Lu, uncovering unique perspectives on Chinese tech news that don't make it into English coverage.","video",{"_129":250,"_34":251},"Pandaily Video Series","In-depth reviews of smart devices and insider exploration of China's tech scene for all technology enthusiasts.","community",{"_129":254,"_255":256},"Community Connection","decodeChina",{"_129":257,"_34":258,"_259":260},"DecodeChina","A one-week intensive immersion into China's tech scene, occurring bi-monthly to broaden participants' understanding through:","items",{"_261":262,"_263":264,"_265":266},"visits","Company visits and networking","courses","Pandaily-designed courses","workshops","Workshops and cultural excursions","data",{"_129":269,"_270":271},"Data Service","pandata",{"_129":272,"_34":273,"_259":274},"Pandata","A comprehensive database containing information on China's most influential tech companies, including:",{"_275":276,"_277":278,"_279":280},"overviews","Company overviews","biographies","Executive team biographies","stories","Origin stories and 
developments","byTheNumbers",{"_129":283,"_34":284,"_224":285},"By the Numbers","As one of the most popular sources for the international community to learn about China, Pandaily has reached millions around the globe. Though our subscribers hail from all corners of the world, our goal is persistent: to break through the language barrier and strengthen our readers' understanding of China.",{"_286":287,"_288":289,"_290":291,"_292":293,"_294":295,"_296":297},"millions","Millions","millionsLabel","Global Readers Reached","weekly","Weekly","weeklyLabel","Podcast Episodes","global","Global","globalLabel","Subscriber Community","cta",{"_129":300,"_34":301,"_302":303,"_304":305},"Join Our Community","Stay connected with China's evolving tech landscape through our comprehensive coverage and expert insights.","readLatestNews","Read Latest News","listenToPodcast","Listen to Podcast","ENV",{"_308":309,"_310":311},"STRAPI_BASE_URL","https://cms.pandaily.com","GA_MEASUREMENT_ID","G-FZLJC5WJDF","routes/$slug",{"_314":315,"_371":372,"_6":7,"_547":328},"post",{"_316":317,"_129":318,"_319":320,"_321":322,"_323":324,"_325":326,"_327":328,"_329":330,"_331":332,"_333":334,"_6":7,"_335":336,"_337":-5,"_338":339,"_340":341,"_56":342,"_348":349,"_361":362,"_363":-5,"_364":-5,"_365":366,"_367":368,"_369":370},"documentId","b61o9ap2hatw0pea3ik934gp","HIT Shenzhen Team Develops Multimodal Large Model 'JiuTian', Tops OpenCompass Ranking","slug","hit-shenzhen-team-develops-multimodal-large-model-jiutian-tops-opencompass-ranking","excerpt","The first multimodal large-scale model 'JiuTian' has topped the OpenCompass multimodal large-scale model ranking upon its debut evaluation.","content","\n

Harbin Institute of Technology (Shenzhen) Computing and Intelligence Research Institute team, relying on Shenzhen Hashen Asset Management Co., Ltd. for achievement transformation, has established a multimodal large-scale model development enterprise - Shenzhen Ruoyu Technology Co., Ltd. (abbreviated as 'Ruo Yu Technology')

\n\n\n\n

The first multimodal large-scale model 'JiuTian' under Shenzhen Ruoyu Technology Co., Ltd. has topped the OpenCompass multimodal large-scale model ranking upon its debut evaluation.

\n\n\n\n

'123 billion parameters', '120 million image-text pairs', '5.5 million bilingual language samples', '1.2 million fine-tuning data samples', “500,000 reinforcement data samples”... The improvement of core parameters brings about a qualitative change in the model's capabilities. JiuTian multimodal large-scale model has achieved remarkable performance in logical reasoning, relational reasoning, and perceptual abilities.

\n\n\n\n

With over billions of parameters, JiuTian has achieved multimodal fusion of text, images, audio, and video. Its intelligent understanding and response capabilities not only cover fields such as natural language processing, computer vision, and speech recognition but also effectively break down the information barriers between different modalities, integrating them into a unified 'JiuTian'.

\n\n\n\n

'The 'JiuTian' symbolizes the highest celestial realm in ancient Chinese mythology, representing our boundless pursuit of technological progress and longing for an intelligent future. This model transcends the boundaries of various modes such as text, images, audio, and video with its powerful understanding and responsive capabilities, achieving true multimodal fusion.' Dr. Sun Teng, CEO of Ruoyu Technology, explained: 'By finding bridges that connect various fields from a disordered and fragmented information world, integrating information from different domains such as natural language processing, computer vision, and speech recognition breaks down the information silos between modalities and truly achieves orderly flow and communication of information.'

\n\n\n\n

Harbin Institute of Technology Shenzhen Campus has established an asset joint-stock company to encourage the transformation and implementation of achievements by faculty and staff. HIT (Shenzhen) receives policy support for the integration of production, education, and research. If Shenzhen Ruoyu Technology Co., Ltd. had been established from the beginning with the school as an initial shareholder, it would have provided strong support for the company's development.

\n\n\n\n

Recently, the well-known magazine IEEE Intelligent Systems announced its list of 'AI's 10 to Watch' for the year 2022. Professor Nie Liqiang was included in this list due to his contributions in the field of multimodal research. Professor Nie is a recipient of the DAMO Academy Qingcheng Award and TR35 China Award. He stated that the achievements of Harbin Institute of Technology (Shenzhen) in the field of artificial intelligence should not only exist within laboratories but also be transformed into practical applications to serve national defense, aerospace, and society.

\n\n\n\n

If Ruoyu Technology Co., Ltd. has another AI expert as a co-founder, it would be Professor Zhang Min. Professor Zhang is the Assistant President of Harbin Institute of Technology (Shenzhen), the first distinguished young scholar in NLP field in China, a national \"Top Talent\" recipient, a mid-career expert with outstanding contributions recognized by the state, and he also enjoys special allowances from the State Council. Harbin Institute of Technology ranks first among Chinese research institutions in NLP direction according to CSRankings (2022-2023), an authoritative ranking list in computer science. Professor Zhang is the most influential person at Harbin Institute of Technology in this field.

\n\n\n\n

Dr. Sun Teng, co-founder and CEO of Ruoyu Technology Co., Ltd. , is also a core expert in the company's research and development team. Dr. Sun's research has always focused on multimedia computing, with related achievements published in CCF A-class conferences and IEEE/ACM Trans. Dr. Sun has previous successful entrepreneurial experience and possesses full-process experience in the application of artificial intelligence technology in vertical fields as well as company management expertise.

\n\n\n\n

Geng Chen, another co-founder of Ruoyu Technology Co., Ltd. , serves as the company's strategic advisor. He has been repeatedly recognized as the best technology analyst by New Fortune magazine and has accumulated rich industry resources throughout his years of research career. He is responsible for investment and financing activities as well as connecting industrial resources for the company's implementation purposes.

\n\n\n\n

‘If Ruoyu Technology Co., Ltd. was established at this time, it has its historical mission and ideals. As cutting-edge researchers, we deeply feel the transformative impact of artificial intelligence on future society. The productivity explosion brought by generative AI will redefine production relationships in various industries. It is our honor and mission to have the opportunity to participate in it. ’Computing power, data, and talent are the three major barriers for entering the field of large-scale models, and Ruoyu Technology Co., Ltd. has gathered these core elements from its inception. The internally developed research and development team led by top talents has formed independent iterative capabilities. In the future, under the leadership of technical experts, ‘JiuTian’will continue to iterate.

\n\n\n\n

With top-notch entrepreneurial team, core capabilities in self-developed multimodal large models, and successful practical experience, Ruo Yu Technology expresses that it will bring a touch of brilliance to the 'Battle of Hundred Models'.

\n\n\n\n

Based on the foundation of large-scale model capabilities, reshaping each track has become an industry consensus. According to OpenAI's development path, when models reach a certain size, new abilities will emerge, especially some previously unseen capabilities.

\n\n\n\n

If JiuTian will continue to iterate in the future, Dr. Sun Teng said: 'JiuTian' is still iterating towards both larger and smaller directions. On one hand, it is increasing the scale of parameters to explore nodes that support the emergence of universal multimodal large models. On the other hand, in order to meet the application needs of industry users and achieve maximum effects with minimal computing power, it is necessary to compress large models into lightweight ones and combine them with edge computing devices.

\n\n\n\n

Based on the multimodal framework of 'JiuTian', Ruo Yu Technology's business model has a fundamental difference from the AI 1.0 era. In the past, the business model required redeveloping algorithms for each specific demand, operating on a project basis. With 'JiuTian' as a unified multimodal foundation, there is no need to redesign the framework; only minor adjustments based on different industry data are necessary to obtain corresponding industry models. Customers can even make secondary adjustments themselves according to their specific domain requirements using their own data.

\n\n\n\n

The difficulty of multimodal large models lies in the fusion of multimodal information. Common fusion methods include linear addition, cascading, and other relatively crude means. However, the final effect is often not as impressive as that of a single modality. This is because some technical teams lack experience and capabilities in fine-tuning multimodal data, integrating and aligning multimodal features.

\n\n\n\n

JiuTian has a fully integrated model training framework for autonomous development of multimodal feature extraction, alignment, fusion, and inference, as well as a comprehensive and meticulous process for collecting and cleaning multimodal data. The model's top ranking on the multimodal large-scale model list proves the team's leading capabilities in the field of multimodal large-scale models.

\n\n\n\n

Robots are system-level application products in the industrial field, and they are a key direction empowered by the multimodal large model base of 'Ruo Yu-Jiu Tian'. Harbin Institute of Technology currently has deep industry-academia-research accumulation in the field of robotics. In the future, embodied robots will require the fusion of multimodal information such as speech, vision, decision-making, and control to form a closed loop. The multimodal large model base of 'JiuTian' will further integrate research based on Harbin Institute of Technology's accumulated expertise in robotics and has already established deep cooperation with several large consumer electronics/automotive companies.

\n\n\n\n

With the 'JiuTian' multimodal large model base, Ruo Yu Technology has the ability to provide personalized and customized services for users in different fields through fine-tuning of existing multimodal large model bases. It provides capabilities such as language pre-training large models, multimodal pre-training large models, and vertical domain pre-training large models, aiming to build a future AI general-purpose platform and infrastructure.

\n","publishedDate","2023-08-09T21:48:43.000Z","featured",false,"viewCount",0,"readingTime",7,"status","draft","originalWordPressId",160296,"featuredImage","featuredImageUrl","https://assets.pandaily.com/uploads/2023/08/未命名的设计-4-1.jpg","gallery",[],[343],{"_316":344,"_11":65,"_319":64,"_345":346,"_34":347},"ou7tkn9cq6eba9jr68hqiwch","color","#000000","","tags",[350,353,357],{"_316":351,"_11":65,"_319":64,"_345":352,"_34":347},"ji5tef72gjtbd7bx0er6q9jv","#6366f1",{"_316":354,"_11":355,"_319":356,"_345":352,"_34":347},"j45fwu61bg7hx57fo10s37oq","China","china",{"_316":358,"_11":359,"_319":360,"_345":352,"_34":347},"mo0hxge43fpc98n7st8ovkxx","Computer Science","computer-science","authors",[],"seo","externalVideo","createdAt","2025-06-24T22:31:05.550Z","updatedAt","2025-06-24T23:45:48.413Z","publishedAt","2025-06-24T23:45:48.447Z","featuredPosts",[373,419,454,486,516],{"_316":374,"_129":375,"_319":376,"_321":377,"_323":378,"_325":379,"_327":380,"_329":330,"_331":332,"_333":381,"_6":7,"_335":-5,"_337":382,"_338":-5,"_56":392,"_348":394,"_361":415,"_363":-5,"_364":-5,"_365":416,"_367":417,"_369":418},"mmse2foiyudc0uk3mom59kb9","Lenovo Built the AI Engine Behind the 2026 World Cup — Here's How It Performed on Opening Night","lenovo-built-the-ai-engine-behind-the-2026-world-cup-here-s-how-it-performed-on-opening-night","For the global tech industry, the real story was unfolding behind the broadcast feed. Every one of those pivotal moments — the early goal, the VAR-reviewed red cards, the offside checks — ran through AI systems built and deployed by Lenovo, FIFA's official technology partner and the first Chinese company ever to occupy that role at a World Cup.","On the evening of June 12, inside Mexico City's legendary Estadio Azteca, host nation Mexico dispatched South Africa 2–0 in the opening match of the 2026 FIFA World Cup. 
Julián Quiñones struck in the ninth minute — the fastest opening-match goal since 2006 — and Raúl Jiménez headed in a second midway through the second half. Three red cards, a World Cup record for an opener, added to the drama.\nBut for the global tech industry, the real story was unfolding behind the broadcast feed. Every one of those pivotal moments — the early goal, the VAR-reviewed red cards, the offside checks — ran through AI systems built and deployed by Lenovo, FIFA's official technology partner and the first Chinese company ever to occupy that role at a World Cup.\n## From Shaky Bodycam to Broadcast-Grade First-Person View\nThe most visible piece of Lenovo's technology stack was the Referee View Al Stabilizer. Match officials have worn chest-mounted cameras for years, but the raw footage — captured while sprinting and pivoting through physical confrontations — has always been too jittery for live broadcast. Lenovo's AI-driven image stabilization pipeline processes the feed in real time with sub-two-second latency, reducing motion distortion by up to 50% while preserving the authentic first-person perspective.\n![101781440114_.pic.jpg](https://cms-image.pandaily.com/101781440114_pic_17ff1e6f17.jpg)\nFor the first time in World Cup history, billions of viewers could watch a goal unfold from the referee's own line of sight. When Quiñones fired his low shot past the goalkeeper, audiences around the world experienced the moment not from a distant camera tower but from the vantage point of the official standing meters away. Later, when South Africa's Siyabonga Siswana was sent off following a VAR review, the referee-cam replay offered an unprecedented window into the split-second judgment calls that define the modern game.\n## 3D Digital Avatars and \"Scalp-Level\" Offside Calls\nLenovo's **3D Digital Avatars** tackled what is perhaps the sport's most contentious flashpoint: offside decisions. 
Trained on hundreds of thousands of body-scan data points, the system auto-generated accurate 3D digital replicas of all 1,248 players in the tournament — an industry first. Rather than relying on flat 2D broadcast angles, VAR officials can now rotate a fully rendered 3D scene to verify offside positions down to what FIFA internally calls \"scalp-level precision.\"\nIn the opener, the technology was put to immediate use. All three red-card incidents and multiple offside calls were rendered through the 3D visualization pipeline, giving both officials and viewers a transparent, angle-independent view of each decision. Johannes Holzmüller, FIFA's Director of Innovation, has described the system as a major leap in both the accuracy and the public credibility of refereeing.\n## An AI Tactical Brain That Turns Two Days Into Two Hours\nLess visible to viewers but potentially more transformative for the sport itself is the **FIFA AI Pro** — the first FIFA-certified generative AI knowledge assistant for football. The system ingests millions of data points per match across more than 2,000 performance metrics. Coaching staffs can query it in natural language: ask for a comparison of set-piece conversion rates, request a tactical breakdown of an opponent's high-press patterns, or generate a scouting report on a substitute.\nPost-match analysis that previously required two full days of manual video review can now be completed in roughly two hours. For a tournament that has expanded to 48 teams across 16 cities in three countries, that kind of efficiency gain is not a luxury — it is an operational necessity.\n## The Infrastructure Beneath the AI\nNone of these AI applications would function without the edge-computing backbone Lenovo installed across all tournament venues. 
Pure cloud solutions cannot meet the latency and reliability requirements of live global broadcasting, so Lenovo deployed on-site **ThinkSystem servers** to handle real-time data throughput for streaming, predictive fault scheduling, and decision-support systems. ThinkPad laptops and Lenovo smartphones round out the device fleet powering day-to-day tournament operations. Across the three host countries, Intelligent Command Center and Technology Command Center Observability give organizers a unified, AI-augmented view of every venue simultaneously.\nThe scale of the challenge is staggering. The 2026 World Cup is the largest ever staged — 48 teams, 104 matches, an estimated 60 billion cumulative viewers, and data volumes projected at thousands of times the 2022 edition. Operating under near-zero tolerance for downtime, the opening match served as a high-stakes systems integration test that Lenovo's hybrid AI architecture passed cleanly.\n## A 24-Year Arc: From the Pitch to the Tech Stack\nThe narrative symmetry was hard to miss. On the same evening, a gala dinner in Mexico City — hosted by Tencent News and titled \"Night of Dreams: Civilization and Intelligence\" — brought together football legend Bora Milutinović, Lenovo Group vice president Carol Chen, sports broadcasters, and cultural figures. Milutinović, who coached Mexico to the quarterfinals at Azteca in 1986 and later led China to its only World Cup appearance in 2002, reflected on the arc: twenty-four years ago, Chinese football reached the World Cup stage through its players; today, Chinese technology is embedded in the tournament's core operating system.\nThe shift mirrors a broader evolution for Chinese companies on the global sports stage. Earlier generations of Chinese brands participated in international events primarily as sponsors — logo placements on perimeter boards. Lenovo's role at this World Cup is fundamentally different. 
The company is not buying visibility; it is building the technical infrastructure that makes the event function. From the Olympics to Formula 1 and now FIFA, Lenovo has moved from hardware supplier to end-to-end AI solutions provider for the world's most demanding live-event environments.\n## Beyond the Stadium: Community Football and Consumer AI\nLenovo is also using the World Cup moment to push its AI capabilities downstream. Through its global \"Work For Humankind\" initiative and the \"Your Club, Your Canvas\" program, the company brought generative AI tools to grassroots football. A community team in Beijing called \"Wellness United\" used Lenovo's AI system Qira (Tianxi AI in China) to design custom jerseys that fuse street-culture aesthetics with football identity. The team's designers then connected remotely with elementary school students in rural Yunnan province, guiding the children through their first-ever AI-assisted creative project — designing their own team kits from over 2,000 kilometers away.\nMeanwhile, on the consumer front, Lenovo launched a \"World Cup Prediction: Human vs. AI\" campaign in Beijing, pitting its Qira (Tianxi in China) AI agent against 11 leading Chinese AI models — including DeepSeek, Kimi, Ernie Bot, and Qwen — in a tournament-long prediction contest open to public participation. The initiative transforms passive viewership into interactive engagement while stress-testing multiple AI systems in a sustained, real-world scenario across all 104 matches.\n## What Comes Next\nCarol Chen framed the opening match as a beginning rather than a culmination. \"The World Cup is just a starting point,\" she said. \"As hybrid AI matures, it will gradually integrate into athletic training, event operations, content distribution, and fan interaction. We want to take the capabilities validated on the World Cup stage and distill them into replicable, scalable solutions.\"\nLenovo has already begun that process domestically. 
A strategic partnership with the Chinese Football Association will bring World Cup-grade smart-sports technology to the Chinese Super League. Parallel initiatives target youth academies and school football programs, aiming to democratize access to the same analytical and visualization tools now available to World Cup coaching staffs.\nThe opening whistle at Azteca was, in one sense, just the start of a football tournament. In another, it marked the moment that AI stopped being a sideshow add-on to elite sport and became part of the operating system — and that a Chinese technology company proved it could build that system for the biggest stage on earth.","2026-06-14T12:59:50.311Z",true,"published",{"_316":383,"_384":385,"_386":-5,"_387":-5,"_388":389,"_390":391},"n85jgvoo6wl8jozem1xclw8x","url","https://cms-image.pandaily.com/81781439606_pic_d0513e77eb.jpg","alternativeText","caption","width",600,"height",339,[393],{"_316":344,"_11":65,"_319":64,"_345":346,"_34":347},[395,399,403,407,411],{"_316":396,"_11":397,"_319":398,"_345":352,"_34":-5},"hvio3sza2xrdrp3z0u8wfjcu","World Cup 2026","world-cup-2026-tag",{"_316":400,"_11":401,"_319":402,"_345":352,"_34":347},"n2uu4sdwz1gizjdenghn1e0v","Lenovo","lenovo",{"_316":404,"_11":405,"_319":406,"_345":352,"_34":347},"cioqpkdtdi1m78uxfpyrckvh","Artificial Intelligence","artificial-intelligence",{"_316":408,"_11":409,"_319":410,"_345":352,"_34":-5},"qj8wznxhxz877vp5stkozhua","Technologies","technologies-1",{"_316":412,"_11":413,"_319":414,"_345":352,"_34":347},"zjc80kqzgfezdi6z7o5z2b35","3D","3d",[],"2026-06-14T12:50:09.325Z","2026-06-14T12:59:50.140Z","2026-06-14T12:59:50.265Z",{"_316":420,"_129":421,"_319":422,"_321":423,"_323":424,"_325":425,"_327":380,"_329":330,"_331":426,"_333":381,"_6":7,"_335":-5,"_337":427,"_338":-5,"_56":432,"_348":437,"_361":450,"_363":-5,"_364":-5,"_365":451,"_367":452,"_369":453},"y1lqw0bqzwqxad7ocyw7tg91","BYD Secretly Develops Humanoid Robot Codename 'Yao-Shun-Yu' as Auto Giants Race Into 
Embodied AI","byd-secretly-develops-humanoid-robot-codename-yao-shun--jun2026","BYD Secretly Develops Humanoid Robot Codename 'Yao-Shun-Yu' as Auto Giants Race Into Embodied AI\n\nBYD, China's largest electric vehicle manufacturer, has confirmed it is secretly developing humanoid robots under a project codenamed \"Yao-Shun-Yu.\" The revelation came from BYD Executive Vice President Li Ke in a recent interview, shedding light on the automaker's ambitions beyond electric vehicles and into the rapidly emerging field of embodied AI. The project was initiated in 2022 and operates under BYD's 15th Business Unit, which focuses on electronic integration and intelligence.","BYD Secretly Develops Humanoid Robot Codename 'Yao-Shun-Yu' as Auto Giants Race Into Embodied AI\n\nBYD, China's largest electric vehicle manufacturer, has confirmed it is secretly developing humanoid robots under a project codenamed \"Yao-Shun-Yu.\" The revelation came from BYD Executive Vice President Li Ke in a recent interview, shedding light on the automaker's ambitions beyond electric vehicles and into the rapidly emerging field of embodied AI.\n\nThe project was initiated in 2022 and operates under BYD's 15th Business Unit, which focuses on electronic integration and intelligence. Li Ke highlighted BYD's unique advantages in developing humanoid robots, noting the company's deep expertise in motors, batteries, electronics, precision manufacturing, and chips. The automaker also boasts a 4,000-plus engineer autonomous driving team and plans to invest 100 billion RMB in AI and automotive intelligence initiatives.\n\n\"The fundamental challenge in this space is that China's robots lack a brain, while US robots have strong brains but weak limbs,\" Li Ke said. 
\"BYD aims to produce robots that excel in both dimensions.\" This dual focus on hardware and intelligence differentiates BYD's approach from many competitors who prioritize one over the other.\n\nThe company is taking a pragmatic approach to production. The final humanoid robot product may not be entirely self-manufactured; BYD could adopt an open platform strategy, allowing third-party components and software integration. This mirrors BYD's \"technology fish pond\" corporate strategy, where the company prepares a wide range of technologies in advance and deploys them when market conditions are right.\n\nBYD would likely serve as its own largest customer for the robots. Potential use cases include deploying the humanoids as store greeters at BYD's expanding retail network and in factory floor roles across its manufacturing facilities. This captive demand provides a concrete revenue pathway that many robotics startups lack.\n\nBYD is far from alone in this race. Tesla has begun mass production of its Optimus Gen-3 humanoid robot, with 50 units already deployed at its Shanghai factory. XPeng plans to mass produce its IRON humanoid by the end of 2026, and Li Auto has its own internal project codenamed Nexus. 
The convergence of automakers into humanoid robotics reflects a broader recognition that the manufacturing and AI capabilities developed for autonomous vehicles transfer naturally to general-purpose robots.\n\nAs China's largest EV maker doubles down on embodied AI, the distinction between automaker and robotics company continues to blur, with BYD positioning itself at the intersection of both worlds.","2026-06-08T18:44:49.203Z",2,{"_316":428,"_384":429,"_386":-5,"_387":-5,"_388":430,"_390":431},"z9ual6eoll14vcacp5toc0c4","https://cms-image.pandaily.com/image_1780625733478_fc097aa549.jpeg",2000,1040,[433],{"_316":434,"_11":435,"_319":436,"_345":346,"_34":-5},"gwhfszki8m2h9k8f37u4cfyx","Robotics","robotics",[438,442,446],{"_316":439,"_11":440,"_319":441,"_345":352,"_34":347},"qa70r9uewj9vxf51cj452r18","BYD","byd",{"_316":443,"_11":444,"_319":445,"_345":352,"_34":347},"pjr9or9yxn9bsbltp19m6g5s","humanoid robot","humanoid-robot",{"_316":447,"_11":448,"_319":449,"_345":352,"_34":-5},"p3udk12s3pkcjp19xn11md06","Embodied AI Benchmark","embodied-ai-benchmark",[],"2026-06-05T01:55:53.724Z","2026-06-08T18:44:49.109Z","2026-06-08T18:44:49.174Z",{"_316":455,"_129":456,"_319":457,"_321":458,"_323":459,"_325":460,"_327":380,"_329":330,"_331":426,"_333":381,"_6":7,"_335":-5,"_337":461,"_338":-5,"_56":466,"_348":471,"_361":482,"_363":-5,"_364":-5,"_365":483,"_367":484,"_369":485},"f4ufsfsxnn63g9dn2hbm9l72","Unitree Files for IPO, Aiming to Become 'First Embodied Intelligence Stock'","unitree-files-ipo-embodied-intelligence-jun2026","Unitree Technology, a globally leading high-performance general-purpose robotics company, is set to have its initial public offering reviewed by the Shanghai St...","Unitree Technology, a globally leading high-performance general-purpose robotics company, is set to have its initial public offering reviewed by the Shanghai Stock Exchange's listing committee on June 1. 
The company, which shipped the highest number of humanoid robots globally in 2025, is positioning itself to become the \"first embodied intelligence stock\" on China's A-share market.\n\nAccording to Unitree's prospectus, the company's revenue surged from RMB 159 million to RMB 1.699 billion between 2023 and 2025, representing a compound annual growth rate of 226.78%. During the same period, net profit after deductions swung from a loss of RMB 18 million to a profit of RMB 591 million. However, in the first quarter of 2026, while revenue grew 68.49% year-on-year, net profit after deductions declined 52.55%, primarily due to a RMB 38.3 million increase in R&D expenses and significantly higher sales costs.\n\nIndustry experts view this \"strategic loss\" as acceptable given the company's heavy R&D investment in cutting-edge robotics technology. The STAR Market, China's sci-tech board, actively supports hard-tech enterprises, and Unitree's increased R&D spending is viewed favorably as long as investments remain focused on core technologies.\n\nUnitree's journey from performing on China's Spring Festival Gala stage to deploying robots at Tokyo's Haneda Airport demonstrates its expanding real-world applications, spanning quadrupedal robots to dual-arm semi-humanoid robots. The company has built an extensive ecosystem spanning component supply, application deployment, and indirect investment networks.\n\nWith policy support and capital market backing, China's domestic robotics industry is transitioning from a \"theme-driven\" phase to an \"independent pricing\" phase, with Unitree's listing potentially catalyzing a revaluation of the entire supply chain. The IPO is expected to unlock capital for further R&D and capacity expansion, benefiting the broader robotics supply chain including core components such as sensors, servo systems, and AI algorithms. 
The successful listing would mark a significant milestone for China's embodied AI sector, paving the way for more robotics companies to access public capital markets.","2026-06-08T18:44:13.621Z",{"_316":462,"_384":463,"_386":-5,"_387":-5,"_388":464,"_390":465},"tshleg1vz84jap4m3u9blbo1","https://cms-image.pandaily.com/dee3dbfd8ad66cc78818c426b8cb4339_3334ab035d.jpg",1438,960,[467],{"_316":468,"_11":469,"_319":470,"_345":346,"_34":-5},"hue01g6mx1gm4uk1amww98ca","IPO","ipo",[472,476,480],{"_316":473,"_11":474,"_319":475,"_345":352,"_34":-5},"d3syfednz11ilypi5unzasei","Unitree","unitree-tag",{"_316":477,"_11":478,"_319":479,"_345":352,"_34":-5},"n19frogo9ky15d3jk7p59y6c","Humanoid Robot","humanoid-robot-tag",{"_316":481,"_11":469,"_319":470,"_345":352,"_34":347},"uynky0cbzoo762qnvien2vdr",[],"2026-06-01T01:11:23.874Z","2026-06-08T18:44:13.508Z","2026-06-08T18:44:13.578Z",{"_316":487,"_129":488,"_319":489,"_321":490,"_323":491,"_325":492,"_327":380,"_329":330,"_331":493,"_333":381,"_6":7,"_335":-5,"_337":494,"_338":-5,"_56":499,"_348":501,"_361":512,"_363":-5,"_364":-5,"_365":513,"_367":514,"_369":515},"i2dv879a47clu2n5x0qfffjt","China’s AI Stack Is No Longer Catching Up — It’s Setting the Pace","china-s-ai-stack-is-no-longer-catching-up-it-s-setting-the-pace","For years, the narrative around China’s AI industry was framed as a race to close the gap with the West — faster chips, bigger models, more data. But a quiet shift has occurred.\n Driven by Huawei’s innovative “cluster + SuperPoD” architecture and the open‑source CANN framework, a complete end‑to‑end ecosystem has taken shape, providing a tangible alternative that is no longer merely theoretical.","For years, the narrative around China’s AI industry was framed as a race to close the gap with the West — faster chips, bigger models, more data. But a quiet shift has occurred. 
Judging by the numbers coming out of OpenRouter and the engineering choices behind DeepSeek V4, that framing is now out of date.\n\nChina’s AI ecosystem hasn’t just caught up. In key dimensions, it has moved ahead — and it’s built on a foundation that is architecturally distinct from anything Silicon Valley has produced.\n\n## The Token Consumption Tells the Story\n\nThe clearest signal of China’s AI maturity is usage data. According to continuous tracking from OpenRouter throughout March and April 2026, Chinese large models have consistently ranked first globally in weekly token consumption for multiple consecutive weeks.\n\nIn the week of March 9, Chinese model companies claimed the top two spots in the platform’s monthly statistics for the first time. By early April, all six of the top-ranked global models were Chinese.\n\nTo put that in context: China’s daily token consumption has surged from roughly 100 billion to 140 trillion. That’s not the kind of growth you see from researchers running experiments. That’s what AI becoming infrastructure looks like — the same category as electricity or broadband, not a demonstration project.\n\nThe significance of that scale goes beyond bragging rights. Token consumption is a proxy for economic integration. Every enterprise workflow automated, every developer tool powered, every consumer product enhanced — each generates usage that feeds back into model improvement and ecosystem depth. At 140 trillion tokens a day, Chinese AI companies are accumulating real-world training signal and deployment experience at a pace that is very difficult to replicate from behind.\n\nWhile much of the Western tech industry is still debating when AI applications will become real, in China, the answer is already embedded in the daily usage numbers.\n\n## DeepSeek V4 Changes the Chip Conversation\n\nThe release of DeepSeek V4 was a technical milestone, but perhaps not for the reason most people assume. 
Yes, the model’s capabilities are impressive. But the more significant story is what happened at the infrastructure level.\n\nWhen Huawei announced full support for DeepSeek V4 at the same moment the model launched, it shattered a long-standing assumption in the industry: that Chinese chips were perpetually a half-step behind, requiring adaptation work after the fact. The “release-as-launch” model turned that assumption on its head.\n\nThis wasn’t a transplant-and-adapt process. DeepSeek V4 and the Atlas SuperPoD product were co-designed — the model’s fine-grained Expert Parallel (EP) architecture was built with the hardware in mind from the start. As DeepSeek’s technical report states in Section 3.1: “We have verified this fine-grained expert parallel scheme on both the NVIDIA GPU and Huawei Ascend NPU platforms.” The scheme splits MoE experts into waves and continuously overlaps computation, dispatch, and result-sending — delivering a 1.5x to 1.73x performance improvement on the Atlas SuperPoD product, with gains reaching up to 1.96x on latency-sensitive RL rollouts. That’s not “usable.” That’s a performance advantage.\n\nTo appreciate why this matters, consider how NVIDIA built its dominance. It wasn’t just chips — it was two decades of models, frameworks, and libraries all optimized for NVIDIA hardware, creating a self-reinforcing loop where the best models ran best on NVIDIA. 
DeepSeek V4’s co-design with the Atlas SuperPoD product is the first convincing evidence that China is building its own version of that loop — and that it’s already producing results.\n\nFor a global AI industry that has grown accustomed to NVIDIA as the only serious option, this represents a genuine alternative — one that is no longer theoretical.\n\n## The System Shift: From Stacking Chips to SuperPoD\n\nUnderstanding why this matters requires stepping back from individual chip specs and looking at how large-scale AI training and inference actually work.\n\nThe bottleneck in modern AI computing is no longer single-chip performance. It’s cluster efficiency. When you’re running clusters of thousands — or tens of thousands — of accelerators, two problems dominate:\n\n**Communication overhead.** Data synchronization across chips introduces latency that eats into raw computing power. The larger the cluster, the worse the linear speedup ratio degrades.\n\n**Memory constraints.** Large MoE models have parameter counts that no single chip can hold. That requires cross-node unified addressing and efficient memory access at the system level.\n\nNo matter how fast a single chip runs at peak, the cluster’s bottleneck brings the effective throughput down to the weakest link. This is why the industry’s competitive focus has shifted from “peak FLOPS per chip” to “effective throughput per cluster.” Simply buying and stacking more chips — the approach that worked in earlier AI generations — stops scaling efficiently past a certain point.\n\nHuawei’s answer is an innovative “cluster + SuperPoD” architecture, and the latest SuperPoD product — a system-level re-think rather than an incremental hardware upgrade.\n\nAt the heart of this is the Atlas 950 SuperPoD (AI computing) and TaiShan 950 SuperPoD (general computing). 
The Atlas 950 SuperPoD supports up to 8,192 cards interconnected via Huawei’s UnifiedBus interconnect, delivering ultra-high bandwidth, ultra-low latency, and unified memory addressing across the entire cluster. That last feature matters most: unified memory addressing means the software doesn’t need to explicitly manage address mapping for data transmission between nodes — from the model’s perspective, the cluster behaves like a single large-memory system, which is exactly what MoE architectures need to run efficiently at scale. It is currently the only AI SuperPoD in China to have achieved large-scale commercial deployment.\n\nThe TaiShan 950 SuperPoD extends this architectural logic to general-purpose computing — and goes further. It introduces TB-level interconnect bandwidth, hundred-ns-level latency, and memory pooling that enables cross-node data transfer via memory semantics, fundamentally addressing the long-standing challenges of high latency, data movement overhead, and coordination inefficiency in general compute workloads. This also makes it a foundational architecture for IT infrastructure in the Agentic AI era. \n\n## The Ecosystem Question: CANN’s Open-Source Play\n\nHardware is only half the story. The other half — and historically, the more difficult half for Chinese tech — is the software ecosystem.\n\nDevelopers don’t adopt new hardware because the specs look good. They adopt it when the migration cost is low and the tooling is mature. 
This is precisely where challengers to NVIDIA have consistently stumbled: AMD’s ROCm ecosystem, for instance, offers competitive hardware but has struggled to attract the developer base needed to match CUDA’s depth of tooling and documentation.\n\nHuawei’s open-source strategy for CANN (Compute Architecture for Neural Networks) is designed to address exactly this concern — by meeting developers where they already are rather than asking them to start over.\n\nCANN supports Ascend C and PyPTO, and is compatible with major programming frameworks including Triton and TileLang. More than 70 mainstream models — Chinese and international — work out of the box. The library includes 1,500+ basic operators and 100+ fusion operators. The system is integrated with more than 90 open-source communities.\n\nCANN went fully open-source in 2025. In the five months since, 65 open-source projects have launched in the community — roughly one new project every three days. Monthly active developers in the community now exceed 3,000.\n\nThat pace of ecosystem growth is meaningful. Developer ecosystems are notoriously slow to build and fast to abandon. The open-source model distributes the development cost across the community while creating genuine ownership — the same playbook that made PyTorch and Linux what they are. The numbers suggest this one is gaining genuine momentum.\n\n## What This Means for the Global AI Industry\n\nThe picture that emerges from all of this is not simply “China has good AI chips now.” It’s something more structural.\n\nChina’s AI stack — from the Atlas 950 SuperPoD and TaiShan 950 SuperPoD at the infrastructure layer, through the CANN open-source framework, to models like DeepSeek V4 at the application layer — now constitutes an end-to-end, domestically innovated ecosystem. 
The chip-to-model closed loop that the industry once assumed only NVIDIA and its partners could provide is no longer exclusive.\n\nFor global customers and developers, this changes the calculus in a meaningful way. There is now a new option for the Agentic AI era: one with competitive performance benchmarks, a growing open-source ecosystem, and a computing stack purpose-built for the demands of persistent, multi-step AI workloads that define where the industry is heading.\n\nWhether that option gets adopted widely will depend on factors beyond technology: trust, enterprise inertia, and developer familiarity all play a role. But the technical foundation is real, and it is no longer being built — it has been built.\n\nThe more interesting question now is how fast the rest of the world notices.\n\n","2026-06-08T18:43:22.545Z",8,{"_316":495,"_384":496,"_386":-5,"_387":-5,"_388":497,"_390":498},"fs9k878gmvvc5ueohd4aa0yz","https://cms-image.pandaily.com/feature_945d0048ae.jpg",1430,804,[500],{"_316":344,"_11":65,"_319":64,"_345":346,"_34":347},[502,507],{"_316":503,"_11":504,"_319":505,"_345":352,"_34":506},"jponyn46ilsnjscx0pzd1529","China AI ecosystem","china-ai-ecosystem","The integrated network of Chinese hardware, models, software frameworks, and deployment infrastructure that has achieved full-stack independence. Unlike earlier “copy-and-adapt” approaches, this ecosystem is architecturally distinct—exemplified by co-designed solutions like DeepSeek V4 running on Huawei’s Ascend NPUs via the open-source CANN framework. Its scale (140 trillion tokens/day) signals AI as infrastructure, not experimentation.",{"_316":508,"_11":509,"_319":510,"_345":352,"_34":511},"rt6nwbeo4i0vqej4micc0bq3","SuperPoD architecture","super-po-d-architecture","A cluster-level computing design from Huawei that treats thousands of accelerators as a single, unified memory system. 
The Atlas 950 SuperPoD (AI) and TaiShan 950 SuperPoD (general computing) overcome traditional bottlenecks—communication overhead and memory constraints—by using high-bandwidth interconnects and memory pooling. This enables efficient MoE model training/inference where simply stacking chips fails, delivering up to 1.96× performance gains for latency-sensitive workloads.",[],"2026-06-01T11:06:17.775Z","2026-06-08T18:43:22.399Z","2026-06-08T18:43:22.493Z",{"_316":517,"_129":518,"_319":519,"_321":520,"_323":521,"_325":522,"_327":380,"_329":330,"_331":523,"_333":381,"_6":7,"_335":-5,"_337":524,"_338":-5,"_56":527,"_348":530,"_361":543,"_363":-5,"_364":-5,"_365":544,"_367":545,"_369":546},"eiompattwon08cp12frjjf4j","From DeepSeek to DeepRoute: Why a Top AI Researcher Bet on the Physical World","from-deep-seek-to-deep-route-why-a-top-ai-researcher-bet-on-the-physical-world","At the 2026 Beijing Auto Show, DeepRoute.ai signaled its shift from ADAS supplier to Physical AI infrastructure builder, combining a unified foundation model, large-scale real-world data, and the addition of ex-DeepSeek scientist Ruan Chong to bet on AI for the physical world.","### A Stage, Not a Product Launch\n\nOn April 25, 2026, in Hall A4 of the China International Exhibition Center in Beijing, DeepRoute.ai held a press conference that stood apart from the spectacle of concept cars and glossy spec sheets filling the surrounding halls. There was no vehicle on display. By leaving the showroom floor empty of hardware, DeepRoute sent a clear message: they aren't a carmaker, but the 'brain' builder. Instead of a product launch, CEO Maxwell Zhou used the stage to lay out a broader thesis: that the true horizon for autonomous driving isn't just better cars, but the creation of AI infrastructure for the physical world.\n\n![微信图片_20260428225041_9_1958.jpg](https://cms-image.pandaily.com/20260428225041_9_1958_0e1504bac3.jpg)\n\nThe event was a deliberate full-stack declaration. 
In the span of one afternoon, DeepRoute unveiled its top-level strategic framing (Physical AI), its core technical architecture (the Foundation Model), a glimpse of new product direction (a cabin-driving integrated Agent), a vision statement (\"make peace of mind the norm\"), and a market position: one in every three new urban NOA-equipped vehicles in China now runs on DeepRoute's system — over 300,000 cars on the road.\n\n![微信图片_20260428225040_8_1958.jpg](https://cms-image.pandaily.com/20260428225040_8_1958_21f461b8d3.jpg)\n\nBut perhaps the most significant moment came midway through the event, when Chief Scientist Ruan Chong — formerly the head of R&D at DeepSeek and a core researcher in multimodal AI — stepped onto a public stage for the first time since joining the company. His presence, as much as anything he said, sent a signal that the industry is reading carefully.\n\n### From Better Supplier to Infrastructure Builder\n\nThe autonomous driving industry has long competed on feature benchmarks: which system handles rain better, which detects corner cases faster. DeepRoute's framing at this year's Beijing Auto Show broke from that paradigm entirely. Maxwell Zhou articulated a vision not of a better ADAS supplier, but of a company building the foundational AI layer for the physical world, \"like electricity or telecommunications,\" as he put it, \"infrastructure that supports how the real world runs.\"\n\nThis is a meaningful conceptual shift. \"Software-defined vehicle\" framing, which dominated the industry's self-description for the better part of a decade, ultimately remained product-centric: software as the differentiator within a vehicle context. \"Physical AI infrastructure\" is capability-centric — it points to a layer of AI competence that can be deployed across a wide range of embodied agents, beginning with autonomous vehicles but explicitly not ending there.\n\nMaxwell Zhou was direct in his reasoning: \"What I care about most is safety. 
Ninety percent of what matters is safety — everything else is ten points.\" The aspiration for 1,000+ kilometer MPCI (Miles Per Critical Intervention) by the end of 2026 is the concrete expression of that belief. \"Tesla has already done this,\" he said during the media roundtable. \"If someone else can do it, we can do it too.\"\n\nThe underlying argument is that this level of reliability is simply not achievable via the small-model paradigm. \"Whatever you do in the small-model world, you cannot get ten times better by working harder,\" Zhou said. \"That's not the path.\"\n\n### The Signal in the Talent Migration\n\nWhen Ruan Chong left DeepSeek to join DeepRoute as Chief Scientist, the industry took notice. His public debut at Beijing Auto Show made that bet official.\n\nIn the media roundtable, Ruan was characteristically direct about his reasoning. \"I don't like working on things with diminishing marginal returns,\" he said. \"Language models are very mature — almost any task can be handled by one model. But in multimodal and embodied intelligence, we're nowhere near that stage. I'd rather be part of a frontier than a mature field.\" He also cited a sense of mission: \"If my presence or absence makes no difference, why am I doing it?\"\n\nThis isn't an isolated move. Maxwell Zhou framed it as a broader trend: \"Today, the heads of multimodal research at major internet companies are coming into autonomous driving. That's because once multimodal has a breakthrough, you can do precise experimental prediction — and then it generates impact in the physical world.\" Gemini's advances in early 2026, he argued, represented a capability inflection that made the physical-AI bet credible in a way it wasn't in 2024 or 2025.\n\nThis talent migration matters beyond optics. 
In an industry where R&D approach determines everything, the arrival of researchers who built frontier LLM systems changes what kinds of problems a company can even attempt to solve.\n\n### The Architecture: One Model to Drive, Understand, and Judge\n\nRuan Chong's keynote was titled \"Being AI-Native in the Post-LLM Era\" — a deliberate framing that locates DeepRoute's technical approach within the broader trajectory of AI development, rather than within the narrower history of ADAS.\n\nThe core argument: traditional autonomous driving systems are built around many small, specialized models — one for pedestrian detection, one for traffic lights, one for trajectory planning, and so on. This creates what Ruan called \"cognitive fragmentation\" — brittle hand-offs between models, difficulty integrating new data, and a ceiling on what the overall system can learn.\n\nDeepRoute's Foundation Model unifies three capabilities under a single architecture:\n\nThe Driver Model handles actual driving decisions — taking sensor inputs and outputting actions (steering, braking, acceleration).\n\nThe Analyst Model integrates language modality. It can explain why the vehicle is making a given decision in natural language — \"approaching an intersection with a blind corner, decelerating to account for potential pedestrian emergence\" — while simultaneously handling data annotation across the R&D pipeline.\n\nThe Critic Model enables learning from negative data — not just mimicking good driving behavior, but understanding why certain behaviors (running red lights, competing for right-of-way) are bad, and actively avoiding them. \"In the small-model era, you could only use positive data,\" Ruan explained. \"Now we can tell the model what bad looks like, and let it learn to avoid those patterns.\"\n\nThe practical result of this architecture is a compression of the R&D iteration cycle from approximately five days to twelve hours. 
That number deserves more attention than it typically gets. It doesn't just mean faster development — it means a qualitatively different research process: one where the team can run experiments, observe results, and adjust approach on a daily cadence rather than a weekly one. At scale, that compounds into a significant capability advantage.\n\nRuan was also candid about the deployment challenge. Large models face real constraints on edge hardware. His answer was two-pronged: distillation (using the large model to train a smaller one, yielding a small model far superior to one trained from scratch) and time (\"trust the trajectory of hardware — a 50MB model that seemed huge in 2017 looks trivial now; the same will happen at every scale\").\n\n### Data as Infrastructure: The Flywheel Logic\n\nDeepRoute's current market position is not incidental to its technical strategy — it is the strategy. The 300,000+ vehicles on the road running DeepRoute's system have generated over 1.3 billion kilometers of real-world driving data and 44.8 million hours of active usage in the past year alone.\n\nThis isn't primarily a commercial achievement — it's a data flywheel. Physical AI systems, unlike language models, cannot be trained primarily on pre-existing internet data. The data has to come from real-world deployment. Every additional vehicle running DeepRoute's system produces more training signal for the Foundation Model, which improves the system, which makes it more attractive to OEM partners, which expands deployment. The 2026 target of one million vehicles on road is, in this light, not just a sales goal — it's a model training goal.\n\nZhou was explicit about the inflection point: \"Once you're above two million vehicles per year, the marginal cost of additional data decreases. 
At that point, data stops being the bottleneck.\" The current 300,000-vehicle position is designed to get DeepRoute to that threshold.\n\nThe roadmap is ambitious but specific: 1,000+ km MPCI by end of 2026, user high-frequency activation rate above 50%, and the cabin-driving integrated Agent entering production. These targets are interdependent — higher MPCI builds user trust, higher activation generates more data, more data improves MPCI.\n\n### Path Competition: A Global Frame\n\nThe Physical AI frame places DeepRoute in a global competition that extends beyond the autonomous driving market. The key technical contenders — Tesla, Waymo, and an increasingly capable Chinese ecosystem — are converging on a similar insight: that the path to reliable autonomous systems runs through unified foundation models trained at scale on real-world data, not through the progressive refinement of specialized small models.\n\nZhou was respectful but direct about Tesla's position: \"Tesla has already hit 1,000 km MPCI. We don't know if they can go from 1,000 to 10,000 — that depends on whether their multimodal approach can scale further. But if it can, that's a USD 4 trillion company. That's what Musk is betting on.\"\n\nThe roundtable discussion surfaced a more nuanced debate on technical architecture. Xu Yinghao, formerly of Ant Group's embodied intelligence team, argued that VLA (Vision-Language-Action) models and world models are not competing approaches but complementary ones: VLA provides the deployment-ready capability, world models provide the data synthesis that makes VLA training possible at scale. Alibaba Cloud's Huo Jian pointed to reinforcement learning as the paradigm most likely to break the ceiling on both: \"The pattern of labeled data driving model improvement is being superseded.\"\n\nWhere does DeepRoute fit in this picture? 
Its approach — unified foundation model plus scaled real-world data — is neither pure simulation-dependent nor purely end-to-end in the Tesla sense. The 12-hour data flywheel is designed precisely to make the distinction less important: if you can run high-quality experiments fast enough, the choice of architectural paradigm becomes less determinative than the quality of the iteration process itself. \"True leadership isn't a model at a point in time,\" Ruan said. \"It's how you organize the research process to keep improving.\"\n\n### The Power Structure Question\n\nIf Physical AI becomes a genuine infrastructure layer — comparable in significance to mobile connectivity or cloud computing — then the competitive dynamics between three categories of players will be reshaped: technology giants (who own foundation model capabilities), automakers (who own manufacturing scale and real-world deployment channels), and autonomous driving specialists (who own the engineering bridgework between the two).\n\nMaxwell Zhou's framing at the roundtable was pointed on this: the companies that will define the outcome are not those that capture the largest market share in the near term, but those that build capabilities that cannot be easily replicated. In his view, the Physical AI infrastructure layer will ultimately be owned by whoever does the hard foundational work — the architecture-level research, the data systems, the iteration methodology — not by whoever deploys the most aggressively in the short term. It is a bet on depth over speed, and on compound returns from genuine technical ownership rather than execution against a borrowed blueprint.\n\nDeepRoute's self-positioning as infrastructure — not product, not feature set — is a deliberate move in this dynamic. Infrastructure companies are not typically winner-take-all markets in the way software products are; they tend toward oligopoly with high switching costs. 
If that logic holds for Physical AI, a 200,000-vehicles-per-year operation generating unique training data from real-world deployment is a more defensible position than any single model architecture.\n\n### The China Advantage — and Its Limits\n\nChina's role in this story is worth examining carefully. The country's EV market penetration rate, complex urban environments, and regulatory tolerance for large-scale testing have created conditions that are, at minimum, highly favorable for the kind of data-intensive Physical AI development DeepRoute is pursuing. \"One in every three new urban NOA vehicles in China runs on our system\" is not just a commercial metric — it reflects the density of real-world physical AI deployment that is simply harder to achieve at comparable scale elsewhere.\n\nThe \"technology-scenario-data-business\" rapid iteration loop that Zhou described is arguably more executable in China's current market than in any other geography. The combination of willingness to deploy partially-capable AI systems at scale, a manufacturing ecosystem that can execute on high-volume OEM agreements, and a talent pipeline shaped by years of foundation model research — including researchers like Ruan Chong who have worked at the frontier of both language and multimodal AI — creates a specific advantage.\n\nThe harder question is whether that advantage compounds over time or faces ceiling effects. Physical AI deployment generates unique value from diversity and complexity of scenarios, not just volume. China's urban environments provide the former. But trust, regulation, and societal willingness to rely on AI systems for safety-critical physical tasks will determine how far the deployment envelope can extend — in China and globally.\n\n### What This Moment Means\n\nDeepRoute's Beijing Auto Show announcement was, in the end, not about any single product or metric. 
It was about a bet on which kind of AI company matters in the next decade.\n\nThe claim that Physical AI represents the next major competitive arena after language AI is not unique to DeepRoute — it's becoming a consensus view across the industry. What DeepRoute is arguing is that within that arena, the decisive advantage will go to companies that can close the data-model-deployment flywheel fastest, at the highest level of real-world complexity, with the talent capable of operating frontier research methods in a physical context.\n\nRuan Chong's arrival, the 12-hour iteration cycle, the 300,000-vehicle data asset, and the 1,000 km MPCI target are all components of the same argument. Whether that argument proves correct — whether DeepRoute can translate a strong market position in Chinese urban NOA into genuine Physical AI infrastructure — will be one of the more consequential questions in global technology over the next few years.\n\nWhat is already visible is that the framing of competition has changed. The question is no longer which ADAS supplier has the best performance on a benchmark. It's which company is building the layer of AI capability that the physical world will run on. 
That's a different kind of race, and it's one that Beijing Auto Show 2026 made unmistakably clear has begun.","2026-04-29T06:58:17.435Z",12,{"_316":525,"_384":526,"_386":-5,"_387":-5,"_388":430,"_390":431},"a57b9ioczo7u8568tx4h7co1","https://cms-image.pandaily.com/Deep_Route_1_3c590209d3.png",[528],{"_316":529,"_11":59,"_319":58,"_345":346,"_34":347},"u9uewvwvdfl4hd8yy6xyqkwq",[531,535,539],{"_316":532,"_11":533,"_319":534,"_345":352,"_34":347},"dlqtconq7x9fwzf6kepwq94w","DeepRoute.ai","deeproute-ai",{"_316":536,"_11":537,"_319":538,"_345":352,"_34":347},"mlhvdd2f7cr9wfoqefxbf6d5","ADAS","adas",{"_316":540,"_11":541,"_319":542,"_345":352,"_34":347},"l42xhcsepyvfcsemx6tdd8p2","DeepSeek","deepseek",[],"2026-04-28T14:49:28.298Z","2026-04-29T06:58:17.307Z","2026-04-29T06:58:17.389Z","isDraft","actionData","errors"]