{"payload":{"pageCount":2,"repositories":[{"type":"Public","name":"LightZero","owner":"opendilab","isFork":false,"description":"[NeurIPS 2023 Spotlight] LightZero: A Unified Benchmark for Monte Carlo Tree Search in General Sequential Decision Scenarios (awesome MCTS)","allTopics":["board-game","reinforcement-learning","pytorch","gym","mcts","gomoku","tictactoe","atari","alpha-beta-pruning","monte-carlo-tree-search","continuous-control","board-games","alphazero","self-play","mcts-algorithm","muzero","stochastic-muzero","efficientzero","sampled-muzero","gumbel-muzero"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":16,"issueCount":8,"starsCount":1012,"forksCount":103,"license":"Apache License 2.0","participation":[6,0,5,3,2,0,0,3,8,4,6,2,3,1,2,7,2,3,2,1,0,0,0,0,3,0,1,2,1,5,4,5,0,5,4,1,1,1,0,0,1,0,1,1,2,4,3,7,2,5,0,2],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-08-19T11:11:53.048Z"}},{"type":"Public","name":"awesome-ui-agents","owner":"opendilab","isFork":false,"description":"A curated list of of awesome UI agents resources, encompassing Web, App, OS, and beyond (continually updated)","allTopics":[],"primaryLanguage":null,"pullRequestCount":0,"issueCount":0,"starsCount":29,"forksCount":3,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,7,0,0,0,0,0,0,3],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-08-16T09:11:41.336Z"}},{"type":"Public","name":"DI-engine","owner":"opendilab","isFork":false,"description":"OpenDILab Decision AI Engine. The Most Comprehensive Reinforcement Learning Framework B.P.","allTopics":["python","reinforcement-learning","impala","reinforcement-learning-algorithms","minigrid","atari","imitation-learning","distributed-system","drl","inverse-reinforcement-learning","r2d2","smac","mujoco","multiagent-reinforcement-learning","pytorch-rl","self-play","model-based-reinforcement-learning","exploration-exploitation","distributed-reinforcement-learning","offline-rl"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":12,"issueCount":5,"starsCount":2897,"forksCount":358,"license":"Apache License 2.0","participation":[7,4,4,5,5,0,1,2,7,1,7,1,0,0,0,1,4,4,6,0,2,1,5,8,0,0,1,0,1,2,0,0,2,4,2,2,0,5,0,1,2,0,1,5,2,4,0,1,0,1,0,1],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-08-14T13:49:41.971Z"}},{"type":"Public","name":"GenerativeRL","owner":"opendilab","isFork":false,"description":"Python library for solving reinforcement learning (RL) problems using generative models (e.g. Diffusion Models).","allTopics":["reinforcement-learning","generative-model","rl","diffusion","flow-model","diffusion-models","offline-rl","generative-ai","diffusion-policy"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":45,"forksCount":3,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,6,6,1,1,0,3,1,2,0,2],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-08-13T16:02:00.403Z"}},{"type":"Public","name":"PsyDI","owner":"opendilab","isFork":false,"description":"PsyDI: Towards a Personalized and Progressively In-depth Chatbot for Psychological Measurements. (e.g. MBTI Measurement Agent)","allTopics":["reinforcement-learning","chatbot","mbti","vlm","llm"],"primaryLanguage":{"name":"TypeScript","color":"#3178c6"},"pullRequestCount":1,"issueCount":0,"starsCount":69,"forksCount":1,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,1,6,5,43,0,7,22,0,2,0,0,0,0,4,4,5,11,13,6,3,7,14,8,5,3,0,1,0,3,1,1,0,2,1,0,3,1,4,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-08-08T06:12:08.221Z"}},{"type":"Public","name":"LLMRiddles","owner":"opendilab","isFork":false,"description":"Open-Source Reproduction/Demo of the LLM Riddles Game","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":2,"issueCount":0,"starsCount":515,"forksCount":36,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,0,0,0,0,0,75,2,1,2,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,1,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-30T09:22:46.898Z"}},{"type":"Public","name":"DI-1024","owner":"opendilab","isFork":false,"description":"1024 + 深度强化学习(Deep Reinforcement Learning + 1024 Game/ 2048 Game)","allTopics":["javascript","python","reinforcement-learning","deep-reinforcement-learning","2048","2048-game","1024-game"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":108,"forksCount":3,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,2,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-23T10:36:08.665Z"}},{"type":"Public","name":"awesome-RLHF","owner":"opendilab","isFork":false,"description":"A curated list of reinforcement learning with human feedback resources (continually updated)","allTopics":["deep-reinforcement-learning","large-language-models","human-feedback","rlhf","reinforcement-learning","deep-learning"],"primaryLanguage":null,"pullRequestCount":2,"issueCount":0,"starsCount":3167,"forksCount":201,"license":"Apache License 2.0","participation":[2,0,1,0,1,0,0,0,0,1,1,0,0,0,0,2,0,1,0,0,1,0,0,2,0,1,0,1,1,0,3,1,1,0,1,0,0,1,0,1,0,0,0,0,1,0,0,1,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-21T09:10:24.748Z"}},{"type":"Public","name":"DI-engine-docs","owner":"opendilab","isFork":false,"description":"DI-engine docs (Chinese and English)","allTopics":["reinforcement-learning","deep-learning","reinforcement-learning-algorithms","imitation-learning","inverse-reinforcement-learning","pytorch-rl","model-based-reinforcement-learning","multi-agent-reinforcement-learning","offline-rl"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":2,"issueCount":0,"starsCount":275,"forksCount":62,"license":"Apache License 2.0","participation":[2,0,0,1,0,0,1,2,2,0,2,0,0,1,2,1,0,0,5,1,1,0,2,1,0,0,0,0,0,0,2,0,0,0,2,0,0,2,0,0,0,0,1,1,0,1,2,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-11T12:36:20.864Z"}},{"type":"Public","name":"LMDrive","owner":"opendilab","isFork":false,"description":"[CVPR 2024] LMDrive: Closed-Loop End-to-End Driving with Large Language Models","allTopics":[],"primaryLanguage":{"name":"Jupyter Notebook","color":"#DA5B0B"},"pullRequestCount":0,"issueCount":39,"starsCount":587,"forksCount":52,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,9,5,1,2,3,5,3,1,0,0,0,3,1,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-07T06:10:13.691Z"}},{"type":"Public","name":"awesome-decision-transformer","owner":"opendilab","isFork":false,"description":"A curated list of Decision Transformer resources (continually updated)","allTopics":["awesome","reinforcement-learning","reinforcement-learning-algorithms","awesome-list","imitation-learning","decision-transformers"],"primaryLanguage":null,"pullRequestCount":0,"issueCount":0,"starsCount":657,"forksCount":25,"license":"Apache License 2.0","participation":[0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,1,0,1,0,0,0,0,0,0,1,0,0,0,0,1,1,0,0,0,1,0,0,1,0,0,0,0,1,0,0,1,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-07T04:34:23.932Z"}},{"type":"Public","name":"pytorch_sphinx_theme","owner":"opendilab","isFork":true,"description":"PyTorch Sphinx Theme","allTopics":[],"primaryLanguage":{"name":"CSS","color":"#563d7c"},"pullRequestCount":0,"issueCount":0,"starsCount":50,"forksCount":137,"license":"MIT License","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-07T04:29:52.112Z"}},{"type":"Public","name":"DI-hpc","owner":"opendilab","isFork":false,"description":"OpenDILab RL HPC OP Lib, including CUDA and Triton kernel","allTopics":["reinforcement-learning","hpc","cuda","pytorch","lstm","triton"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":0,"starsCount":218,"forksCount":7,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,2,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-04T08:00:02.212Z"}},{"type":"Public","name":"awesome-diffusion-model-in-rl","owner":"opendilab","isFork":false,"description":"A curated list of Diffusion Model in RL resources (continually updated)","allTopics":["deep-reinforcement-learning","diffusion-model","reinfocement-learning","diffusion-models"],"primaryLanguage":null,"pullRequestCount":1,"issueCount":0,"starsCount":708,"forksCount":39,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-25T04:46:08.897Z"}},{"type":"Public","name":"SO2","owner":"opendilab","isFork":false,"description":"[AAAI2024] A Perspective of Q-value Estimation on Offline-to-Online Reinforcement Learning","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":284,"forksCount":4,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-22T01:04:02.260Z"}},{"type":"Public","name":"awesome-model-based-RL","owner":"opendilab","isFork":false,"description":"A curated list of awesome model based RL resources (continually updated)","allTopics":["awesome","reinforcement-learning-algorithms","awesome-list","model-based-rl","model-based-reinforcement-learning","reinforcement-learning"],"primaryLanguage":null,"pullRequestCount":0,"issueCount":0,"starsCount":849,"forksCount":46,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-17T05:51:07.079Z"}},{"type":"Public","name":"awesome-multi-modal-reinforcement-learning","owner":"opendilab","isFork":false,"description":"A curated list of Multi-Modal Reinforcement Learning resources (continually updated)","allTopics":[],"primaryLanguage":null,"pullRequestCount":0,"issueCount":0,"starsCount":366,"forksCount":10,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-16T15:57:48.710Z"}},{"type":"Public","name":"awesome-exploration-rl","owner":"opendilab","isFork":false,"description":"A curated list of awesome exploration RL resources (continually updated)","allTopics":["awesome","reinforcement-learning","exploration","reinforcement-learning-algorithms","awesome-list","exploratory","exploration-exploitation","sparse-reward-algorithms","delayed-rewards","hard-exploration"],"primaryLanguage":null,"pullRequestCount":0,"issueCount":0,"starsCount":364,"forksCount":9,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-11T16:14:03.509Z"}},{"type":"Public","name":"SmartRefine","owner":"opendilab","isFork":false,"description":"[CVPR 2024] SmartRefine: A Scenario-Adaptive Refinement Framework for Efficient Motion Prediction","allTopics":["autonomous-driving","trajectory-prediction","motion-prediction"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":11,"starsCount":94,"forksCount":6,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-06T12:42:48.976Z"}},{"type":"Public","name":"PPOxFamily","owner":"opendilab","isFork":false,"description":"PPO x Family DRL Tutorial Course(决策智能入门级公开课:8节课帮你盘清算法理论,理顺代码逻辑,玩转决策AI应用实践 )","allTopics":["python","course","reinforcement-learning","deep-reinforcement-learning","decision-intelligence"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":42,"issueCount":14,"starsCount":1869,"forksCount":169,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-15T11:44:33.821Z"}},{"type":"Public","name":"awesome-AI-based-protein-design","owner":"opendilab","isFork":false,"description":"A collection of research papers for AI-based protein design","allTopics":["awesome","protein-structure","artificial-intelligence","protein","awesome-list"],"primaryLanguage":null,"pullRequestCount":0,"issueCount":0,"starsCount":215,"forksCount":13,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-13T05:37:22.642Z"}},{"type":"Public","name":"DI-star","owner":"opendilab","isFork":false,"description":"An artificial intelligence platform for the StarCraft II with large-scale distributed training and grand-master agents.","allTopics":["league","artificial-intelligence","starcraft2","self-play","reinforcment-learning","deep-learning","deep-reinforcement-learning"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":1211,"forksCount":113,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-06T03:08:47.648Z"}},{"type":"Public","name":"OpenPaL","owner":"opendilab","isFork":false,"description":"Building open-ended embodied agent in battle royale FPS game","allTopics":["embodied-agent","embodied-ai","large-language-models","open-ended-learning"],"primaryLanguage":null,"pullRequestCount":0,"issueCount":1,"starsCount":32,"forksCount":1,"license":null,"participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,3,0,0,0,0,0,0,17,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-02-06T16:26:45.188Z"}},{"type":"Public","name":"InterFuser","owner":"opendilab","isFork":false,"description":"[CoRL 2022] InterFuser: Safety-Enhanced Autonomous Driving Using Interpretable Sensor Fusion Transformer","allTopics":["transformer","autonomous-driving","bird-view-image"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":62,"starsCount":519,"forksCount":43,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,2,0,2,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-01-20T14:08:54.147Z"}},{"type":"Public","name":"DI-toolkit","owner":"opendilab","isFork":false,"description":"A simple toolkit package for opendilab","allTopics":["python","toolkit"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":112,"forksCount":3,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-01-17T12:37:33.903Z"}},{"type":"Public","name":"CodeMorpheus","owner":"opendilab","isFork":false,"description":"CodeMorpheus: Generate code self-portraits with one click(一键生成代码自画像,决策型 AI + 生成式 AI)","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":45,"forksCount":3,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-01-08T14:49:47.913Z"}},{"type":"Public","name":"huggingface_ding","owner":"opendilab","isFork":false,"description":"Auxiliary code for pulling, loading reinforcement learning models based on DI-engine from the Huggingface Hub, or pushing them onto Huggingface Hub with auto-created model card.","allTopics":["decision-making","huggingface","reinforcement-learning"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":45,"forksCount":1,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,0,0,2,0,0,0,0,0,0,2,2,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-12-12T06:03:21.066Z"}},{"type":"Public","name":"treevalue","owner":"opendilab","isFork":false,"description":"Here are the most awesome tree structure computing solutions, make your life easier. (这里有目前性能最优的树形结构计算解决方案)","allTopics":["tree","framework","nested-structures","python3","data-structures","tree-structure"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":4,"starsCount":228,"forksCount":3,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-10-22T19:24:50.939Z"}},{"type":"Public","name":"DI-treetensor","owner":"opendilab","isFork":false,"description":"Let DI-treetensor help you simplify the structure processing!(树形运算一不小心就逻辑混乱?DI-treetensor快速帮你搞定)","allTopics":["reinforcement-learning","deep-learning","numpy","tree-structure","tensor","python","pytorch"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":2,"issueCount":1,"starsCount":201,"forksCount":4,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-09-19T09:46:39.764Z"}},{"type":"Public","name":"GoBigger","owner":"opendilab","isFork":false,"description":"[ICLR 2023] Come & try Decision-Intelligence version of \"Agar\"! Gobigger could also help you with multi-agent decision intelligence study.","allTopics":["game","python","environment","league","multi-agent","gym","rl-environment","reinforcement-learning"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":456,"forksCount":34,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-08-31T05:41:03.711Z"}}],"repositoryCount":47,"userInfo":null,"searchable":true,"definitions":[],"typeFilters":[{"id":"all","text":"All"},{"id":"public","text":"Public"},{"id":"source","text":"Sources"},{"id":"fork","text":"Forks"},{"id":"archived","text":"Archived"},{"id":"template","text":"Templates"}],"compactMode":false},"title":"opendilab repositories"}