{"payload":{"pageCount":1,"repositories":[{"type":"Public","name":"LightZero","owner":"opendilab","isFork":false,"description":"[NeurIPS 2023 Spotlight] LightZero: A Unified Benchmark for Monte Carlo Tree Search in General Sequential Decision Scenarios","allTopics":["board-game","reinforcement-learning","pytorch","gym","mcts","gomoku","tictactoe","atari","alpha-beta-pruning","monte-carlo-tree-search","continuous-control","board-games","alphazero","self-play","mcts-algorithm","muzero","stochastic-muzero","efficientzero","sampled-muzero","gumbel-muzero"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":11,"issueCount":5,"starsCount":903,"forksCount":80,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-31T06:20:02.435Z"}},{"type":"Public","name":"DI-engine","owner":"opendilab","isFork":false,"description":"OpenDILab Decision AI Engine","allTopics":["impala","reinforcement-learning-algorithms","minigrid","atari","imitation-learning","distributed-system","drl","inverse-reinforcement-learning","r2d2","smac","mujoco","multiagent-reinforcement-learning","pytorch-rl","self-play","model-based-reinforcement-learning","exploration-exploitation","distributed-reinforcement-learning","offline-rl","python","reinforcement-learning"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":10,"issueCount":4,"starsCount":2653,"forksCount":342,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-30T08:14:46.009Z"}},{"type":"Public","name":"PPOxFamily","owner":"opendilab","isFork":false,"description":"PPO x Family DRL Tutorial Course(决策智能入门级公开课:8节课帮你盘清算法理论,理顺代码逻辑,玩转决策AI应用实践 )","allTopics":["python","course","reinforcement-learning","deep-reinforcement-learning","decision-intelligence"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":42,"issueCount":13,"starsCount":1768,"forksCount":161,"license":"Apache License 2.0","participation":[1,3,2,0,1,0,4,6,1,1,7,0,1,0,0,0,0,0,2,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-15T11:44:33.821Z"}},{"type":"Public","name":"DI-engine-docs","owner":"opendilab","isFork":false,"description":"DI-engine docs (Chinese and English)","allTopics":["reinforcement-learning","deep-learning","reinforcement-learning-algorithms","imitation-learning","inverse-reinforcement-learning","pytorch-rl","model-based-reinforcement-learning","multi-agent-reinforcement-learning","offline-rl"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":2,"issueCount":0,"starsCount":253,"forksCount":58,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-08T09:33:37.095Z"}},{"type":"Public","name":"DI-star","owner":"opendilab","isFork":false,"description":"An artificial intelligence platform for the StarCraft II with large-scale distributed training and grand-master agents.","allTopics":["league","artificial-intelligence","starcraft2","self-play","reinforcment-learning","deep-learning","deep-reinforcement-learning"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":1177,"forksCount":111,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-06T03:08:47.648Z"}},{"type":"Public","name":"SmartRefine","owner":"opendilab","isFork":false,"description":"[CVPR 2024] SmartRefine: An Scenario-Adaptive Refinement Framework for Efficient Motion Prediction","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":5,"starsCount":56,"forksCount":4,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-03-22T12:31:33.976Z"}},{"type":"Public","name":"SO2","owner":"opendilab","isFork":false,"description":"[AAAI2024] A Perspective of Q-value Estimation on Offline-to-Online Reinforcement Learning","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":1,"starsCount":255,"forksCount":2,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-01-23T06:51:44.260Z"}},{"type":"Public","name":"InterFuser","owner":"opendilab","isFork":false,"description":"[CoRL 2022] InterFuser: Safety-Enhanced Autonomous Driving Using Interpretable Sensor Fusion Transformer","allTopics":["transformer","autonomous-driving","bird-view-image"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":56,"starsCount":481,"forksCount":42,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-01-20T14:08:54.147Z"}},{"type":"Public","name":"DI-toolkit","owner":"opendilab","isFork":false,"description":"A simple toolkit package for opendilab","allTopics":["python","toolkit"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":101,"forksCount":3,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-01-17T12:37:33.903Z"}},{"type":"Public","name":"CodeMorpheus","owner":"opendilab","isFork":false,"description":"CodeMorpheus: Generate code self-portraits with one click(一键生成代码自画像,决策型 AI + 生成式 AI)","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":39,"forksCount":2,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-01-08T14:49:47.913Z"}},{"type":"Public","name":"huggingface_ding","owner":"opendilab","isFork":false,"description":"Auxiliary code for pulling, loading reinforcement learning models based on DI-engine from the Huggingface Hub, or pushing them onto Huggingface Hub with auto-created model card.","allTopics":["decision-making","huggingface","reinforcement-learning"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":29,"forksCount":1,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-12-12T06:03:21.066Z"}},{"type":"Public","name":"LLMRiddles","owner":"opendilab","isFork":false,"description":"Open-Source Reproduction/Demo of the LLM Riddles Game","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":3,"issueCount":0,"starsCount":485,"forksCount":34,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-11-29T16:18:55.701Z"}},{"type":"Public","name":"treevalue","owner":"opendilab","isFork":false,"description":"Here are the most awesome tree structure computing solutions, make your life easier. (这里有目前性能最优的树形结构计算解决方案)","allTopics":["tree","framework","nested-structures","python3","data-structures","tree-structure"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":4,"starsCount":223,"forksCount":3,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-10-22T19:24:50.939Z"}},{"type":"Public","name":"DI-treetensor","owner":"opendilab","isFork":false,"description":"Let DI-treetensor help you simplify the structure processing!(树形运算一不小心就逻辑混乱?DI-treetensor快速帮你搞定)","allTopics":["reinforcement-learning","deep-learning","numpy","tree-structure","tensor","python","pytorch"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":2,"issueCount":1,"starsCount":187,"forksCount":5,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-09-19T09:46:39.764Z"}},{"type":"Public","name":"GoBigger","owner":"opendilab","isFork":false,"description":"[ICLR 2023] Come & try Decision-Intelligence version of \"Agar\"! Gobigger could also help you with multi-agent decision intelligence study.","allTopics":["game","python","environment","league","multi-agent","gym","rl-environment","reinforcement-learning"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":440,"forksCount":35,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-08-31T05:41:03.711Z"}},{"type":"Public","name":"DOS","owner":"opendilab","isFork":false,"description":"[CVPR 2023] ReasonNet: End-to-End Driving with Temporal and Global Reasoning","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":8,"starsCount":120,"forksCount":10,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-06-29T08:09:46.085Z"}},{"type":"Public","name":"DI-smartcross","owner":"opendilab","isFork":false,"description":"Decision Intelligence platform for Traffic Crossing Signal Control","allTopics":["traffic-signal-control","traffic-light-control","reinforcement-learning"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":217,"forksCount":4,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-03-22T03:18:23.171Z"}},{"type":"Public","name":"Gobigger-Explore","owner":"opendilab","isFork":false,"description":"Still struggling with the high threshold or looking for the appropriate baseline? Come here and new starters can also play with your own multi-agents! ","allTopics":["multi-agent","reinforcement-learning"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":0,"starsCount":174,"forksCount":9,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-02-20T10:25:22.776Z"}},{"type":"Public","name":"DI-sheep","owner":"opendilab","isFork":false,"description":"羊了个羊 + 深度强化学习(Deep Reinforcement Learning + 3 Tiles Game)","allTopics":["react","javascript","typescript","reinforcement-learning","deep-reinforcement-learning","artificial-intelligence","di-engine","python"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":0,"starsCount":390,"forksCount":24,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-02-13T11:39:56.665Z"}},{"type":"Public","name":"LightTuner","owner":"opendilab","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":0,"starsCount":159,"forksCount":2,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2022-12-26T04:56:42.845Z"}},{"type":"Public","name":"DI-adventure","owner":"opendilab","isFork":false,"description":"Decision Intelligence Adventure for Beginners","allTopics":["python","reinforcement-learning","deep-reinforcement-learning"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":61,"forksCount":5,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2022-12-09T10:41:34.007Z"}},{"type":"Public","name":"ACE","owner":"opendilab","isFork":false,"description":"[AAAI 2023] Official PyTorch implementation of paper \"ACE: Cooperative Multi-agent Q-learning with Bidirectional Action-Dependency\".","allTopics":["reinforcement-learning","multi-agent","smac","multi-agent-reinforcement-learning","gfootball"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":1,"starsCount":190,"forksCount":9,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2022-12-07T06:59:13.560Z"}},{"type":"Public","name":"DIgging","owner":"opendilab","isFork":false,"description":"Decision Intelligence for digging best parameters in target environment.","allTopics":["evolutionary-algorithm","bayesian-optimization","searching","reinforcement-learning"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":88,"forksCount":0,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2022-10-12T05:51:35.805Z"}},{"type":"Public","name":"DI-drive","owner":"opendilab","isFork":false,"description":"Decision Intelligence Platform for Autonomous Driving simulation.","allTopics":["pytorch","imitation-learning","autodrive","carla","metadrive","reinforcement-learning","autonomous-driving"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":1,"starsCount":542,"forksCount":59,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2022-10-10T06:44:07.033Z"}},{"type":"Public","name":"DI-bioseq","owner":"opendilab","isFork":false,"description":"Decision Intelligence platform for Biological Sequence Searching","allTopics":["biological-data-analysis","biological-sequence-analysis","reinforcement-learning"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":105,"forksCount":1,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2022-10-10T06:37:35.273Z"}},{"type":"Public","name":"GoBigger-Challenge-2021","owner":"opendilab","isFork":false,"description":"Interested in multi-agents? The 1st Go-Bigger Multi-Agent Decision Intelligence Challenge is coming and a big bonus is waiting for you!","allTopics":["challenge","reinforcement-learning","gym","gobigger"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":1,"starsCount":195,"forksCount":34,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2022-10-09T03:23:23.998Z"}},{"type":"Public","name":"DI-hpc","owner":"opendilab","isFork":false,"description":"OpenDILab RL HPC OP Lib","allTopics":["reinforcement-learning","hpc","cuda","pytorch","lstm"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":2,"issueCount":0,"starsCount":204,"forksCount":6,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2022-10-08T05:19:10.212Z"}}],"repositoryCount":27,"userInfo":null,"searchable":true,"definitions":[],"typeFilters":[{"id":"all","text":"All"},{"id":"public","text":"Public"},{"id":"source","text":"Sources"},{"id":"fork","text":"Forks"},{"id":"archived","text":"Archived"},{"id":"template","text":"Templates"}],"compactMode":false},"title":"Repositories"}