KodCode-V1 is the largest fully-synthetic open-source dataset providing verifiable solutions and tests for coding tasks.
Project Website | 📄 Technical Report | 💾 Github Repo | 🤗 KodCode-V1 (For RL) | 🤗 KodCode-V1-SFT-R1 (for SFT)\n
","classNames":"hf-sanitized hf-sanitized-W9jLb_GG8-S3ATDYnvbHs"},"users":[{"_id":"653df1323479e9ebbe3eb6cc","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/653df1323479e9ebbe3eb6cc/K_g-r1iMRNKj99LXPuYF3.jpeg","isPro":true,"fullname":"Zhangchen Xu","user":"zhangchenxu","type":"user"},{"_id":"637c88b6d55081513c5690d8","avatarUrl":"/avatars/6766e23ebf46b46d6c8b48351c571907.svg","isPro":false,"fullname":"Yang Liu","user":"nlpyang","type":"user"},{"_id":"605e8dfd5abeb13e714c4c18","avatarUrl":"/avatars/bc27a0ed17b2bd4311e89d3028fa327b.svg","isPro":true,"fullname":"yueqin yin","user":"yyqoni","type":"user"},{"_id":"68bf55bedec59c87bff929a0","avatarUrl":"/avatars/7d6734f535a076a3cd1714bfdd07dd17.svg","isPro":false,"fullname":"Radha Poovendran","user":"poovendran","type":"user"}],"userCount":4,"collections":[{"slug":"KodCode/kodcode-v1-67c28236e5911f17dbe1769a","title":"KodCode-V1","description":"KodCode-V1 is the largest fully-synthetic open-source dataset providing verifiable solutions and tests for coding tasks.","gating":false,"lastUpdated":"2025-04-02T05:15:36.389Z","owner":{"_id":"67b42f0de9a5a43b0de32a59","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/653df1323479e9ebbe3eb6cc/PXYB67R9dgSLPARIhySGr.jpeg","fullname":"KodCode","name":"KodCode","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":31,"isUserFollowing":false},"items":[{"_id":"67c2823ca237c1ac224d9d38","position":0,"type":"dataset","note":{"html":"For RL.","text":"For RL."},"author":"KodCode","downloads":1433,"gated":false,"id":"KodCode/KodCode-V1","lastModified":"2025-03-17T07:56:27.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":487432,"libraries":["datasets","dask","mlcroissant","polars"],"formats":["parquet"],"modalities":["tabular","text"]},"private":false,"repoType":"dataset","likes":102,"isLikedByUser":false,"isBenchmark":false},{"_id":"67ecc7e56a89505ee1555c25","position":1,"type":"dataset","note":{"html":"For 
RL.","text":"For RL."},"author":"KodCode","downloads":1403,"gated":false,"id":"KodCode/KodCode-Light-RL-10K","lastModified":"2025-04-02T05:13:01.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":10000,"libraries":["datasets","pandas","mlcroissant","polars"],"formats":["parquet"],"modalities":["tabular","text"]},"private":false,"repoType":"dataset","likes":8,"isLikedByUser":false,"isBenchmark":false},{"_id":"67c2aacb6748b10a82a92538","position":2,"type":"dataset","note":{"html":"for SFT.","text":"for SFT."},"author":"KodCode","downloads":1165,"gated":false,"id":"KodCode/KodCode-V1-SFT-R1","lastModified":"2025-03-17T07:57:30.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":483437,"libraries":["datasets","dask","mlcroissant","polars"],"formats":["parquet"],"modalities":["tabular","text"]},"private":false,"repoType":"dataset","likes":36,"isLikedByUser":false,"isBenchmark":false},{"_id":"67d749e1ba098a0651cf235a","position":3,"type":"dataset","note":{"html":"For SFT.","text":"For 
SFT."},"author":"KodCode","downloads":86,"gated":false,"id":"KodCode/KodCode-V1-SFT-4o","lastModified":"2025-03-16T21:59:33.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":409552,"libraries":["datasets","dask","mlcroissant","polars"],"formats":["parquet"],"modalities":["tabular","text"]},"private":false,"repoType":"dataset","likes":10,"isLikedByUser":false,"isBenchmark":false}],"position":0,"theme":"orange","private":false,"shareUrl":"https://hf.co/collections/KodCode/kodcode-v1","upvotes":5,"isUpvotedByUser":false}],"datasets":[{"author":"KodCode","downloads":1403,"gated":false,"id":"KodCode/KodCode-Light-RL-10K","lastModified":"2025-04-02T05:13:01.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":10000,"libraries":["datasets","pandas","mlcroissant","polars"],"formats":["parquet"],"modalities":["tabular","text"]},"private":false,"repoType":"dataset","likes":8,"isLikedByUser":false,"isBenchmark":false},{"author":"KodCode","downloads":1165,"gated":false,"id":"KodCode/KodCode-V1-SFT-R1","lastModified":"2025-03-17T07:57:30.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":483437,"libraries":["datasets","dask","mlcroissant","polars"],"formats":["parquet"],"modalities":["tabular","text"]},"private":false,"repoType":"dataset","likes":36,"isLikedByUser":false,"isBenchmark":false},{"author":"KodCode","downloads":1433,"gated":false,"id":"KodCode/KodCode-V1","lastModified":"2025-03-17T07:56:27.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":487432,"libraries":["datasets","dask","mlcroissant","polars"],"formats":["parquet"],"modalities":["tabular","text"]},"private":false,"repoType":"dataset","likes":102,"isLikedByUser":false,"isBenchmark":false},{"author":"KodCode","downloads":86,"gated":false,"id":"KodCode/KodCode-V1-SFT-4o","lastModified":"2025-03-16T21:59:33.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":409552,"libraries":["datasets","dask","mlcroissant","polars"],"formats":["parquet"],"modalities":["tabular","text"]},"private":false,"
repoType":"dataset","likes":10,"isLikedByUser":false,"isBenchmark":false}],"models":[],"paperPreviews":[],"spaces":[],"buckets":[],"numBuckets":0,"numDatasets":4,"numModels":0,"numSpaces":1,"lastOrgActivities":[],"acceptLanguages":["*"],"canReadRepos":false,"canReadSpaces":false,"blogPosts":[],"currentRepoPage":0,"filters":{},"paperView":false}">
AI & ML interests
Better coding data for all 🧡
Organization Card
🐱 KodCode: A Diverse, Challenging, and Verifiable Synthetic Dataset for Coding
KodCode is the largest fully-synthetic open-source dataset providing verifiable solutions and tests for coding tasks. It contains 12 distinct subsets spanning various domains (from algorithmic to package-specific knowledge) and difficulty levels (from basic coding exercises to interview and competitive programming challenges). KodCode is designed for both supervised fine-tuning (SFT) and RL tuning.
🕸️ Project Website | 📄 Technical Report | 💾 Github Repo | 🤗 KodCode-V1 (For RL) | 🤗 KodCode-V1-SFT-R1 (for SFT)
models
0
None public yet