{"payload":{"pageCount":2,"repositories":[{"type":"Public","name":"LightZero","owner":"opendilab","isFork":false,"description":"[NeurIPS 2023 Spotlight] LightZero: A Unified Benchmark for Monte Carlo Tree Search in General Sequential Decision Scenarios (awesome MCTS)","allTopics":["board-game","reinforcement-learning","pytorch","gym","mcts","gomoku","tictactoe","atari","alpha-beta-pruning","monte-carlo-tree-search","continuous-control","board-games","alphazero","self-play","mcts-algorithm","muzero","stochastic-muzero","efficientzero","sampled-muzero","gumbel-muzero"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":18,"issueCount":5,"starsCount":1055,"forksCount":109,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-09-20T10:50:29.048Z"}},{"type":"Public","name":"DI-engine","owner":"opendilab","isFork":false,"description":"OpenDILab Decision AI Engine. The Most Comprehensive Reinforcement Learning Framework B.P.","allTopics":["python","reinforcement-learning","impala","reinforcement-learning-algorithms","minigrid","atari","imitation-learning","distributed-system","drl","inverse-reinforcement-learning","r2d2","smac","mujoco","multiagent-reinforcement-learning","pytorch-rl","self-play","model-based-reinforcement-learning","exploration-exploitation","distributed-reinforcement-learning","offline-rl"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":13,"issueCount":5,"starsCount":2979,"forksCount":364,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-09-20T07:37:52.971Z"}},{"type":"Public","name":"PsyDI","owner":"opendilab","isFork":false,"description":"PsyDI: Towards a Personalized and Progressively In-depth Chatbot for Psychological Measurements. (e.g. MBTI Measurement Agent)","allTopics":["reinforcement-learning","chatbot","mbti","vlm","llm"],"primaryLanguage":{"name":"TypeScript","color":"#3178c6"},"pullRequestCount":1,"issueCount":1,"starsCount":111,"forksCount":10,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,0,0,1,4,7,38,5,1,28,0,2,0,0,0,0,4,4,5,11,9,10,0,10,14,7,6,3,0,1,0,3,1,0,1,2,1,0,3,1,4,0,0,0,0,0,1],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-09-19T08:42:38.221Z"}},{"type":"Public","name":"GenerativeRL","owner":"opendilab","isFork":false,"description":"Python library for solving reinforcement learning (RL) problems using generative models (e.g. Diffusion Models).","allTopics":["reinforcement-learning","generative-model","rl","diffusion","flow-model","diffusion-models","offline-rl","generative-ai","diffusion-policy"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":0,"starsCount":56,"forksCount":4,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,5,7,1,0,1,3,1,1,1,2,0,0,2,0,1],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-09-14T13:16:09.220Z"}},{"type":"Public","name":"treevalue","owner":"opendilab","isFork":false,"description":"Here are the most awesome tree structure computing solutions, make your life easier. (这里有目前性能最优的树形结构计算解决方案)","allTopics":["tree","framework","nested-structures","python3","data-structures","tree-structure"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":4,"starsCount":229,"forksCount":3,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-09-12T08:32:49.939Z"}},{"type":"Public","name":"awesome-exploration-rl","owner":"opendilab","isFork":false,"description":"A curated list of awesome exploration RL resources (continually updated)","allTopics":["awesome","reinforcement-learning","exploration","reinforcement-learning-algorithms","awesome-list","exploratory","exploration-exploitation","sparse-reward-algorithms","delayed-rewards","hard-exploration"],"primaryLanguage":null,"pullRequestCount":0,"issueCount":0,"starsCount":372,"forksCount":9,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,2,0,0,0,0,1,0,0,0,0,0,0,0,0,2,0,0,0,0,0,0,0,0,0,0,2,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-08-30T15:58:59.509Z"}},{"type":"Public","name":"awesome-multi-modal-reinforcement-learning","owner":"opendilab","isFork":false,"description":"A curated list of Multi-Modal Reinforcement Learning resources (continually updated)","allTopics":[],"primaryLanguage":null,"pullRequestCount":1,"issueCount":0,"starsCount":374,"forksCount":10,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-08-30T09:43:13.710Z"}},{"type":"Public","name":"awesome-decision-transformer","owner":"opendilab","isFork":false,"description":"A curated list of Decision Transformer resources (continually updated)","allTopics":["awesome","reinforcement-learning","reinforcement-learning-algorithms","awesome-list","imitation-learning","decision-transformers"],"primaryLanguage":null,"pullRequestCount":1,"issueCount":0,"starsCount":672,"forksCount":25,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-08-30T09:40:55.932Z"}},{"type":"Public","name":"awesome-RLHF","owner":"opendilab","isFork":false,"description":"A curated list of reinforcement learning with human feedback resources (continually updated)","allTopics":["deep-reinforcement-learning","large-language-models","human-feedback","rlhf","reinforcement-learning","deep-learning"],"primaryLanguage":null,"pullRequestCount":3,"issueCount":0,"starsCount":3255,"forksCount":200,"license":"Apache License 2.0","participation":[0,0,0,0,1,1,0,0,0,0,2,0,1,0,0,1,0,0,1,1,0,1,0,2,0,3,1,0,1,1,0,0,1,0,0,1,0,0,0,1,0,0,0,1,0,0,0,0,1,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-08-30T09:38:58.748Z"}},{"type":"Public","name":"SmartRefine","owner":"opendilab","isFork":false,"description":"[CVPR 2024] SmartRefine: A Scenario-Adaptive Refinement Framework for Efficient Motion Prediction","allTopics":["autonomous-driving","trajectory-prediction","motion-prediction"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":12,"starsCount":101,"forksCount":8,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,4,0,8,0,0,0,0,0,0,0,0,0,0,3,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-08-27T17:56:35.976Z"}},{"type":"Public","name":"awesome-model-based-RL","owner":"opendilab","isFork":false,"description":"A curated list of awesome model based RL resources (continually updated)","allTopics":["awesome","reinforcement-learning-algorithms","awesome-list","model-based-rl","model-based-reinforcement-learning","reinforcement-learning"],"primaryLanguage":null,"pullRequestCount":0,"issueCount":0,"starsCount":870,"forksCount":46,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-08-26T10:25:32.079Z"}},{"type":"Public","name":"awesome-ui-agents","owner":"opendilab","isFork":false,"description":"A curated list of of awesome UI agents resources, encompassing Web, App, OS, and beyond (continually updated)","allTopics":[],"primaryLanguage":null,"pullRequestCount":1,"issueCount":0,"starsCount":41,"forksCount":4,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-08-16T09:11:41.336Z"}},{"type":"Public","name":"LLMRiddles","owner":"opendilab","isFork":false,"description":"Open-Source Reproduction/Demo of the LLM Riddles Game","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":2,"issueCount":0,"starsCount":516,"forksCount":36,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-30T09:22:46.898Z"}},{"type":"Public","name":"DI-1024","owner":"opendilab","isFork":false,"description":"1024 + 深度强化学习(Deep Reinforcement Learning + 1024 Game/ 2048 Game)","allTopics":["javascript","python","reinforcement-learning","deep-reinforcement-learning","2048","2048-game","1024-game"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":109,"forksCount":3,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-23T10:36:08.665Z"}},{"type":"Public","name":"DI-engine-docs","owner":"opendilab","isFork":false,"description":"DI-engine docs (Chinese and English)","allTopics":["reinforcement-learning","deep-learning","reinforcement-learning-algorithms","imitation-learning","inverse-reinforcement-learning","pytorch-rl","model-based-reinforcement-learning","multi-agent-reinforcement-learning","offline-rl"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":2,"issueCount":0,"starsCount":279,"forksCount":62,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-11T12:36:20.864Z"}},{"type":"Public","name":"LMDrive","owner":"opendilab","isFork":false,"description":"[CVPR 2024] LMDrive: Closed-Loop End-to-End Driving with Large Language Models","allTopics":[],"primaryLanguage":{"name":"Jupyter Notebook","color":"#DA5B0B"},"pullRequestCount":0,"issueCount":43,"starsCount":616,"forksCount":51,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-07T06:10:13.691Z"}},{"type":"Public","name":"pytorch_sphinx_theme","owner":"opendilab","isFork":true,"description":"PyTorch Sphinx Theme","allTopics":[],"primaryLanguage":{"name":"CSS","color":"#563d7c"},"pullRequestCount":0,"issueCount":0,"starsCount":50,"forksCount":138,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-07T04:29:52.112Z"}},{"type":"Public","name":"DI-hpc","owner":"opendilab","isFork":false,"description":"OpenDILab RL HPC OP Lib, including CUDA and Triton kernel","allTopics":["reinforcement-learning","hpc","cuda","pytorch","lstm","triton"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":0,"starsCount":219,"forksCount":7,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-04T08:00:02.212Z"}},{"type":"Public","name":"awesome-diffusion-model-in-rl","owner":"opendilab","isFork":false,"description":"A curated list of Diffusion Model in RL resources (continually updated)","allTopics":["deep-reinforcement-learning","diffusion-model","reinfocement-learning","diffusion-models"],"primaryLanguage":null,"pullRequestCount":2,"issueCount":0,"starsCount":742,"forksCount":41,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-25T04:46:08.897Z"}},{"type":"Public","name":"SO2","owner":"opendilab","isFork":false,"description":"[AAAI2024] A Perspective of Q-value Estimation on Offline-to-Online Reinforcement Learning","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":1,"starsCount":286,"forksCount":4,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-22T01:04:02.260Z"}},{"type":"Public","name":"PPOxFamily","owner":"opendilab","isFork":false,"description":"PPO x Family DRL Tutorial Course(决策智能入门级公开课:8节课帮你盘清算法理论,理顺代码逻辑,玩转决策AI应用实践 )","allTopics":["python","course","reinforcement-learning","deep-reinforcement-learning","decision-intelligence"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":42,"issueCount":14,"starsCount":1899,"forksCount":172,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-15T11:44:33.821Z"}},{"type":"Public","name":"awesome-AI-based-protein-design","owner":"opendilab","isFork":false,"description":"A collection of research papers for AI-based protein design","allTopics":["awesome","protein-structure","artificial-intelligence","protein","awesome-list"],"primaryLanguage":null,"pullRequestCount":0,"issueCount":0,"starsCount":217,"forksCount":13,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-13T05:37:22.642Z"}},{"type":"Public","name":"DI-star","owner":"opendilab","isFork":false,"description":"An artificial intelligence platform for the StarCraft II with large-scale distributed training and grand-master agents.","allTopics":["league","artificial-intelligence","starcraft2","self-play","reinforcment-learning","deep-learning","deep-reinforcement-learning"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":1216,"forksCount":114,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-06T03:08:47.648Z"}},{"type":"Public","name":"OpenPaL","owner":"opendilab","isFork":false,"description":"Building open-ended embodied agent in battle royale FPS game","allTopics":["embodied-agent","embodied-ai","large-language-models","open-ended-learning"],"primaryLanguage":null,"pullRequestCount":0,"issueCount":1,"starsCount":33,"forksCount":1,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-02-06T16:26:45.188Z"}},{"type":"Public","name":"InterFuser","owner":"opendilab","isFork":false,"description":"[CoRL 2022] InterFuser: Safety-Enhanced Autonomous Driving Using Interpretable Sensor Fusion Transformer","allTopics":["transformer","autonomous-driving","bird-view-image"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":61,"starsCount":527,"forksCount":44,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-01-20T14:08:54.147Z"}},{"type":"Public","name":"DI-toolkit","owner":"opendilab","isFork":false,"description":"A simple toolkit package for opendilab","allTopics":["python","toolkit"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":113,"forksCount":3,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-01-17T12:37:33.903Z"}},{"type":"Public","name":"CodeMorpheus","owner":"opendilab","isFork":false,"description":"CodeMorpheus: Generate code self-portraits with one click(一键生成代码自画像,决策型 AI + 生成式 AI)","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":45,"forksCount":3,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-01-08T14:49:47.913Z"}},{"type":"Public","name":"huggingface_ding","owner":"opendilab","isFork":false,"description":"Auxiliary code for pulling, loading reinforcement learning models based on DI-engine from the Huggingface Hub, or pushing them onto Huggingface Hub with auto-created model card.","allTopics":["decision-making","huggingface","reinforcement-learning"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":46,"forksCount":1,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-12-12T06:03:21.066Z"}},{"type":"Public","name":"DI-treetensor","owner":"opendilab","isFork":false,"description":"Let DI-treetensor help you simplify the structure processing!(树形运算一不小心就逻辑混乱?DI-treetensor快速帮你搞定)","allTopics":["reinforcement-learning","deep-learning","numpy","tree-structure","tensor","python","pytorch"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":2,"issueCount":1,"starsCount":202,"forksCount":4,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-09-19T09:46:39.764Z"}},{"type":"Public","name":"GoBigger","owner":"opendilab","isFork":false,"description":"[ICLR 2023] Come & try Decision-Intelligence version of \"Agar\"! Gobigger could also help you with multi-agent decision intelligence study.","allTopics":["game","python","environment","league","multi-agent","gym","rl-environment","reinforcement-learning"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":457,"forksCount":34,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-08-31T05:41:03.711Z"}}],"repositoryCount":47,"userInfo":null,"searchable":true,"definitions":[],"typeFilters":[{"id":"all","text":"All"},{"id":"public","text":"Public"},{"id":"source","text":"Sources"},{"id":"fork","text":"Forks"},{"id":"archived","text":"Archived"},{"id":"template","text":"Templates"}],"compactMode":false},"title":"opendilab repositories"}