{"payload":{"pageCount":2,"repositories":[{"type":"Public","name":"LightZero","owner":"opendilab","isFork":false,"description":"[NeurIPS 2023 Spotlight] LightZero: A Unified Benchmark for Monte Carlo Tree Search in General Sequential Decision Scenarios","allTopics":["board-game","reinforcement-learning","pytorch","gym","mcts","gomoku","tictactoe","atari","alpha-beta-pruning","monte-carlo-tree-search","continuous-control","board-games","alphazero","self-play","mcts-algorithm","muzero","stochastic-muzero","efficientzero","sampled-muzero","gumbel-muzero"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":11,"issueCount":5,"starsCount":903,"forksCount":80,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-31T06:20:02.435Z"}},{"type":"Public","name":"DI-engine","owner":"opendilab","isFork":false,"description":"OpenDILab Decision AI Engine","allTopics":["impala","reinforcement-learning-algorithms","minigrid","atari","imitation-learning","distributed-system","drl","inverse-reinforcement-learning","r2d2","smac","mujoco","multiagent-reinforcement-learning","pytorch-rl","self-play","model-based-reinforcement-learning","exploration-exploitation","distributed-reinforcement-learning","offline-rl","python","reinforcement-learning"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":10,"issueCount":4,"starsCount":2652,"forksCount":342,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-30T08:14:46.009Z"}},{"type":"Public","name":"awesome-RLHF","owner":"opendilab","isFork":false,"description":"A curated list of reinforcement learning with human feedback resources (continually updated)","allTopics":["deep-reinforcement-learning","large-language-models","human-feedback","rlhf","reinforcement-learning","deep-learning"],"primaryLanguage":null,"pullRequestCount":2,"issueCount":0,"starsCount":2876,"forksCount":186,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-26T11:17:50.336Z"}},{"type":"Public","name":"PsyDI","owner":"opendilab","isFork":false,"description":"PsyDI: A MBTI agent that helps you understand your personality type through a relaxed multi-modal interaction.","allTopics":["reinforcement-learning","chatbot","mbti","vlm","llm"],"primaryLanguage":{"name":"TypeScript","color":"#3178c6"},"pullRequestCount":0,"issueCount":0,"starsCount":41,"forksCount":2,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,4,7,38,5,1,28,0,2,0,0,0,0,4,4,5,11,9,10,0,10,14,7,6,3,0,1,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-21T08:57:13.948Z"}},{"type":"Public","name":"awesome-model-based-RL","owner":"opendilab","isFork":false,"description":"A curated list of awesome model based RL resources (continually updated)","allTopics":["awesome","reinforcement-learning-algorithms","awesome-list","model-based-rl","model-based-reinforcement-learning","reinforcement-learning"],"primaryLanguage":null,"pullRequestCount":0,"issueCount":0,"starsCount":752,"forksCount":42,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-20T10:01:29.080Z"}},{"type":"Public","name":"PPOxFamily","owner":"opendilab","isFork":false,"description":"PPO x Family DRL Tutorial Course（决策智能入门级公开课：8节课帮你盘清算法理论，理顺代码逻辑，玩转决策AI应用实践 ）","allTopics":["python","course","reinforcement-learning","deep-reinforcement-learning","decision-intelligence"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":42,"issueCount":13,"starsCount":1768,"forksCount":161,"license":"Apache License 2.0","participation":[1,3,2,0,1,0,4,6,1,1,7,0,1,0,0,0,0,0,2,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-15T11:44:33.821Z"}},{"type":"Public","name":"awesome-AI-based-protein-design","owner":"opendilab","isFork":false,"description":"A collection of research papers for AI-based protein design","allTopics":["awesome","protein-structure","artificial-intelligence","protein","awesome-list"],"primaryLanguage":null,"pullRequestCount":0,"issueCount":0,"starsCount":191,"forksCount":12,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-13T05:37:22.642Z"}},{"type":"Public","name":"awesome-decision-transformer","owner":"opendilab","isFork":false,"description":"A curated list of Decision Transformer resources (continually updated)","allTopics":["awesome","reinforcement-learning","reinforcement-learning-algorithms","awesome-list","imitation-learning","decision-transformers"],"primaryLanguage":null,"pullRequestCount":0,"issueCount":0,"starsCount":585,"forksCount":21,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-10T06:06:07.545Z"}},{"type":"Public","name":"awesome-multi-modal-reinforcement-learning","owner":"opendilab","isFork":false,"description":"A curated list of Multi-Modal Reinforcement Learning resources (continually updated)","allTopics":[],"primaryLanguage":null,"pullRequestCount":0,"issueCount":0,"starsCount":332,"forksCount":10,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-10T06:05:22.970Z"}},{"type":"Public","name":"DI-engine-docs","owner":"opendilab","isFork":false,"description":"DI-engine docs (Chinese and English)","allTopics":["reinforcement-learning","deep-learning","reinforcement-learning-algorithms","imitation-learning","inverse-reinforcement-learning","pytorch-rl","model-based-reinforcement-learning","multi-agent-reinforcement-learning","offline-rl"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":2,"issueCount":0,"starsCount":253,"forksCount":58,"license":"Apache License 2.0","participation":[0,2,0,2,0,1,1,4,3,0,2,2,0,0,1,0,0,0,3,2,0,2,0,0,1,2,1,0,0,5,1,1,0,0,3,0,0,0,0,0,0,2,0,0,0,2,0,0,2,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-08T09:33:37.095Z"}},{"type":"Public","name":"DI-star","owner":"opendilab","isFork":false,"description":"An artificial intelligence platform for the StarCraft II with large-scale distributed training and grand-master agents.","allTopics":["league","artificial-intelligence","starcraft2","self-play","reinforcment-learning","deep-learning","deep-reinforcement-learning"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":1177,"forksCount":111,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-06T03:08:47.648Z"}},{"type":"Public","name":"awesome-diffusion-model-in-rl","owner":"opendilab","isFork":false,"description":"A curated list of Diffusion Model in RL resources (continually updated)","allTopics":["deep-reinforcement-learning","diffusion-model","reinfocement-learning","diffusion-models"],"primaryLanguage":null,"pullRequestCount":1,"issueCount":0,"starsCount":606,"forksCount":34,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-19T11:18:19.295Z"}},{"type":"Public","name":"LMDrive","owner":"opendilab","isFork":false,"description":"[CVPR 2024] LMDrive: Closed-Loop End-to-End Driving with Large Language Models","allTopics":[],"primaryLanguage":{"name":"Jupyter Notebook","color":"#DA5B0B"},"pullRequestCount":0,"issueCount":34,"starsCount":483,"forksCount":47,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-12T08:32:10.691Z"}},{"type":"Public","name":"GenerativeRL","owner":"opendilab","isFork":false,"description":"","allTopics":[],"primaryLanguage":null,"pullRequestCount":0,"issueCount":0,"starsCount":5,"forksCount":0,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-11T05:45:37.403Z"}},{"type":"Public","name":"awesome-exploration-rl","owner":"opendilab","isFork":false,"description":"A curated list of awesome exploration RL resources (continually updated)","allTopics":["awesome","reinforcement-learning","exploration","reinforcement-learning-algorithms","awesome-list","exploratory","exploration-exploitation","sparse-reward-algorithms","delayed-rewards","hard-exploration"],"primaryLanguage":null,"pullRequestCount":0,"issueCount":0,"starsCount":310,"forksCount":7,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-09T04:11:13.509Z"}},{"type":"Public","name":"SmartRefine","owner":"opendilab","isFork":false,"description":"[CVPR 2024] SmartRefine: An Scenario-Adaptive Refinement Framework for Efficient Motion Prediction","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":5,"starsCount":56,"forksCount":4,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-03-22T12:31:33.976Z"}},{"type":"Public","name":"OpenPaL","owner":"opendilab","isFork":false,"description":"Building open-ended embodied agent in battle royale FPS game","allTopics":["embodied-agent","embodied-ai","large-language-models","open-ended-learning"],"primaryLanguage":null,"pullRequestCount":0,"issueCount":1,"starsCount":27,"forksCount":1,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-02-06T16:26:45.188Z"}},{"type":"Public","name":"SO2","owner":"opendilab","isFork":false,"description":"[AAAI2024] A Perspective of Q-value Estimation on Offline-to-Online Reinforcement Learning","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":1,"starsCount":255,"forksCount":2,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-01-23T06:51:44.260Z"}},{"type":"Public","name":"InterFuser","owner":"opendilab","isFork":false,"description":"[CoRL 2022] InterFuser: Safety-Enhanced Autonomous Driving Using Interpretable Sensor Fusion Transformer","allTopics":["transformer","autonomous-driving","bird-view-image"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":56,"starsCount":481,"forksCount":42,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-01-20T14:08:54.147Z"}},{"type":"Public","name":"DI-toolkit","owner":"opendilab","isFork":false,"description":"A simple toolkit package for opendilab","allTopics":["python","toolkit"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":101,"forksCount":3,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-01-17T12:37:33.903Z"}},{"type":"Public","name":"CodeMorpheus","owner":"opendilab","isFork":false,"description":"CodeMorpheus: Generate code self-portraits with one click（一键生成代码自画像，决策型 AI + 生成式 AI）","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":39,"forksCount":2,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-01-08T14:49:47.913Z"}},{"type":"Public","name":"huggingface_ding","owner":"opendilab","isFork":false,"description":"Auxiliary code for pulling, loading reinforcement learning models based on DI-engine from the Huggingface Hub, or pushing them onto Huggingface Hub with auto-created model card.","allTopics":["decision-making","huggingface","reinforcement-learning"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":29,"forksCount":1,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-12-12T06:03:21.066Z"}},{"type":"Public","name":"LLMRiddles","owner":"opendilab","isFork":false,"description":"Open-Source Reproduction/Demo of the LLM Riddles Game","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":3,"issueCount":0,"starsCount":485,"forksCount":34,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-11-29T16:18:55.701Z"}},{"type":"Public","name":"treevalue","owner":"opendilab","isFork":false,"description":"Here are the most awesome tree structure computing solutions, make your life easier. （这里有目前性能最优的树形结构计算解决方案）","allTopics":["tree","framework","nested-structures","python3","data-structures","tree-structure"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":4,"starsCount":223,"forksCount":3,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-10-22T19:24:50.939Z"}},{"type":"Public","name":"DI-treetensor","owner":"opendilab","isFork":false,"description":"Let DI-treetensor help you simplify the structure processing!（树形运算一不小心就逻辑混乱？DI-treetensor快速帮你搞定）","allTopics":["reinforcement-learning","deep-learning","numpy","tree-structure","tensor","python","pytorch"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":2,"issueCount":1,"starsCount":187,"forksCount":5,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-09-19T09:46:39.764Z"}},{"type":"Public","name":"GoBigger","owner":"opendilab","isFork":false,"description":"[ICLR 2023] Come &amp; try Decision-Intelligence version of \"Agar\"! Gobigger could also help you with multi-agent decision intelligence study.","allTopics":["game","python","environment","league","multi-agent","gym","rl-environment","reinforcement-learning"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":440,"forksCount":35,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-08-31T05:41:03.711Z"}},{"type":"Public","name":"awesome-end-to-end-autonomous-driving","owner":"opendilab","isFork":false,"description":"A curated list of awesome End-to-End Autonomous Driving resources (continually updated)","allTopics":["autonomous-driving","imitation-learning","paper-list","reinforcement-learning"],"primaryLanguage":null,"pullRequestCount":0,"issueCount":0,"starsCount":298,"forksCount":13,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-08-13T10:21:30.231Z"}},{"type":"Public","name":"DOS","owner":"opendilab","isFork":false,"description":"[CVPR 2023] ReasonNet: End-to-End Driving with Temporal and Global Reasoning","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":8,"starsCount":120,"forksCount":10,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-06-29T08:09:46.085Z"}},{"type":"Public","name":"miniwob-plusplus","owner":"opendilab","isFork":true,"description":"MiniWoB++: a web interaction benchmark for reinforcement learning","allTopics":[],"primaryLanguage":{"name":"HTML","color":"#e34c26"},"pullRequestCount":0,"issueCount":0,"starsCount":9,"forksCount":44,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-04-01T06:46:44.328Z"}},{"type":"Public","name":"DI-smartcross","owner":"opendilab","isFork":false,"description":"Decision Intelligence platform for Traffic Crossing Signal Control","allTopics":["traffic-signal-control","traffic-light-control","reinforcement-learning"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":217,"forksCount":4,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-03-22T03:18:23.171Z"}}],"repositoryCount":46,"userInfo":null,"searchable":true,"definitions":[],"typeFilters":[{"id":"all","text":"All"},{"id":"public","text":"Public"},{"id":"source","text":"Sources"},{"id":"fork","text":"Forks"},{"id":"archived","text":"Archived"},{"id":"template","text":"Templates"}],"compactMode":false},"title":"Repositories"}