{"payload":{"pageCount":1,"repositories":[{"type":"Public","name":"Open-Assistant","owner":"LAION-AI","isFork":false,"description":"OpenAssistant is a chat-based assistant that understands tasks, can interact with third-party systems, and retrieve information dynamically to do so.","allTopics":["python","machine-learning","ai","nextjs","discord-bot","assistant","language-model","chatgpt","rlhf"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":65,"issueCount":223,"starsCount":36747,"forksCount":3194,"license":"Apache License 2.0","participation":[17,36,16,5,4,4,3,20,8,10,4,4,4,1,0,0,0,0,0,0,0,1,1,1,0,7,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-07T03:03:27.093Z"}},{"type":"Public","name":"annotate-collection","owner":"LAION-AI","isFork":false,"description":"A repository with data for annotation.","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":1,"forksCount":0,"license":null,"participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,8,11,3,0,0,2,0,0,17,1,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-01T21:07:59.250Z"}},{"type":"Public","name":"Discord-Scrapers","owner":"LAION-AI","isFork":false,"description":"Implementation of a discord channel scraper to generate datasets.","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":47,"forksCount":5,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,65,21,23,1,1,11,0,4,1,6,0,0,0,0,0,0,0,0,2,0,0,0,0,1,6,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-03-25T17:16:39.675Z"}},{"type":"Public","name":"natural_voice_assistant","owner":"LAION-AI","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":4,"starsCount":417,"forksCount":32,"license":"MIT License","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,7,14,17,1,0,0,3,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-27T09:29:23.162Z"}},{"type":"Public","name":"audio-dataset","owner":"LAION-AI","isFork":false,"description":"Audio Dataset for training CLAP and other models","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":5,"issueCount":32,"starsCount":592,"forksCount":53,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-02-05T21:08:13.149Z"}},{"type":"Public","name":"CLAP","owner":"LAION-AI","isFork":false,"description":"Contrastive Language-Audio Pretraining","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":41,"starsCount":1198,"forksCount":118,"license":"Creative Commons Zero v1.0 Universal","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-02-05T20:58:38.181Z"}},{"type":"Public","name":"Open-Instruction-Generalist","owner":"LAION-AI","isFork":false,"description":"Open Instruction Generalist is an assistant trained on massive synthetic instructions to perform many millions of tasks","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":6,"starsCount":203,"forksCount":19,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-01-13T00:19:36.879Z"}},{"type":"Public","name":"riverbed","owner":"LAION-AI","isFork":false,"description":"Tools for content datamining and NLP at scale","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":40,"forksCount":6,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-11-12T06:15:36.624Z"}},{"type":"Public","name":"Text-to-speech","owner":"LAION-AI","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":1,"starsCount":59,"forksCount":6,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-11-04T10:10:21.518Z"}},{"type":"Public","name":"phenaki","owner":"LAION-AI","isFork":false,"description":"A phenaki reproduction using pytorch.","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":3,"issueCount":5,"starsCount":219,"forksCount":22,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-10-23T05:03:23.739Z"}},{"type":"Public","name":"math_problems-step-by-step_solutions","owner":"LAION-AI","isFork":false,"description":"Here we provide and collect many functions to generate math problem and step by step solutions for LLM training","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":16,"forksCount":0,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-06-21T09:59:43.865Z"}},{"type":"Public","name":"CLIP-based-NSFW-Detector","owner":"LAION-AI","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":12,"starsCount":274,"forksCount":29,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-05-30T21:06:23.060Z"}},{"type":"Public","name":"Conditional-Pretraining-of-Large-Language-Models","owner":"LAION-AI","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":0,"starsCount":36,"forksCount":8,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-05-07T22:08:33.189Z"}},{"type":"Public","name":"blade2blade","owner":"LAION-AI","isFork":false,"description":"Adversarial Training and SFT for Bot Safety Models","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":38,"forksCount":7,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-04-18T08:05:03.690Z"}},{"type":"Public","name":"dalle2-laion","owner":"LAION-AI","isFork":false,"description":"Pretrained Dalle2 from laion","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":2,"issueCount":10,"starsCount":496,"forksCount":66,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-04-15T15:16:22.423Z"}},{"type":"Public","name":"Anh","owner":"LAION-AI","isFork":false,"description":"Anh - LAION's multilingual assistant datasets and models","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":27,"forksCount":5,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-04-05T02:21:52.257Z"}},{"type":"Public","name":"LionizeR","owner":"LAION-AI","isFork":false,"description":"Experiments with Summarization, Long Context and Retrieval","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":4,"forksCount":3,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-03-23T21:07:36.717Z"}},{"type":"Public","name":"dataset-inference","owner":"LAION-AI","isFork":false,"description":"The new repository for the genral inference pipeline.","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":3,"forksCount":2,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-01-31T08:39:46.654Z"}},{"type":"Public","name":"Big-Interleaved-Dataset","owner":"LAION-AI","isFork":false,"description":"Big-Interleaved-Dataset","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":15,"starsCount":56,"forksCount":8,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-01-21T22:43:52.455Z"}},{"type":"Public","name":"temporal-embedding-aggregation","owner":"LAION-AI","isFork":false,"description":"Aggregating embeddings over time ","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":2,"issueCount":19,"starsCount":30,"forksCount":4,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-01-19T17:26:08.453Z"}},{"type":"Public","name":"LAION-5B-WatermarkDetection","owner":"LAION-AI","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":2,"starsCount":89,"forksCount":14,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-01-10T17:56:27.391Z"}},{"type":"Public","name":"GIF","owner":"LAION-AI","isFork":false,"description":"General / Global Inference Framework","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":5,"starsCount":3,"forksCount":1,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2022-11-20T22:19:57.314Z"}},{"type":"Public","name":"safety-pipeline","owner":"LAION-AI","isFork":false,"description":"A collection of safety classifiers and models to process image and texts.","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":4,"forksCount":1,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2022-11-14T22:06:08.198Z"}},{"type":"Public","name":"laion-dedup","owner":"LAION-AI","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":4,"starsCount":12,"forksCount":1,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2022-11-07T19:32:00.190Z"}},{"type":"Public","name":"laionide","owner":"LAION-AI","isFork":false,"description":"This repository contains training code and checkpoitns for finetuning glide.","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":12,"forksCount":1,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2022-08-17T22:52:01.221Z"}},{"type":"Public","name":"ldm-finetune","owner":"LAION-AI","isFork":false,"description":"Home of `erlich` and `ongo`. Finetune latent-diffusion/glid-3-xl text2image on your own data.","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":10,"starsCount":179,"forksCount":19,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2022-08-05T14:58:27.658Z"}},{"type":"Public","name":"conditioned-prior","owner":"LAION-AI","isFork":false,"description":"(wip) Use LAION-AI's CLIP \"conditoned prior\" to generate CLIP image embeds from CLIP text embeds.","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":24,"forksCount":2,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2022-07-14T15:55:12.020Z"}},{"type":"Public","name":"watermark-detection","owner":"LAION-AI","isFork":false,"description":"A repository containing datasets and tools to train a watermark classifier.","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":1,"starsCount":53,"forksCount":12,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2022-06-22T17:36:48.754Z"}},{"type":"Public","name":"dataset-spec","owner":"LAION-AI","isFork":false,"description":"Describe the format of image/text datasets","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":11,"forksCount":1,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2022-04-26T09:02:03.561Z"}},{"type":"Public","name":"crawlingathome","owner":"LAION-AI","isFork":true,"description":"A client library for Crawling@Home's effort to filter CommonCrawl with CLIP, building a large scale image-text dataset.","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":1,"forksCount":7,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2022-04-04T07:39:17.551Z"}}],"repositoryCount":30,"userInfo":null,"searchable":true,"definitions":[],"typeFilters":[{"id":"all","text":"All"},{"id":"public","text":"Public"},{"id":"source","text":"Sources"},{"id":"fork","text":"Forks"},{"id":"archived","text":"Archived"},{"id":"template","text":"Templates"}],"compactMode":false},"title":"Repositories"}