Collections of publicly available datasets
Indic Verse
community
Hugging Face Hub\n\n
\n","classNames":"hf-sanitized hf-sanitized-zSFid4v9KrnprAnVw8HVE"},"users":[{"_id":"630bc25d4c0945d20b880e9a","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/630bc25d4c0945d20b880e9a/CjDLfmCGcCkOS4E1t756M.jpeg","isPro":false,"fullname":"Divi Eswar Chowdary","user":"eswardivi","type":"user"},{"_id":"6274b2221c67dcb7144993a1","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/6274b2221c67dcb7144993a1/4NDu6MhAirfUtJeutzaky.png","isPro":false,"fullname":"Nikhil Chowdary Paleti","user":"LightFury9","type":"user"}],"userCount":2,"collections":[{"slug":"indiehackers/telugu-datasets-65d6e3bc56cb514b482200de","title":"Telugu Datasets","description":"Collections of publicly available datasets","gating":false,"lastUpdated":"2024-02-22T06:05:40.950Z","owner":{"_id":"65bbf3cc40bed843e1c5ac53","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/630bc25d4c0945d20b880e9a/rVbC8dtQpSGnhYG8UQPyK.jpeg","fullname":"Indic Verse","name":"indiehackers","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":3,"isUserFollowing":false},"items":[{"_id":"65d6e40d51bdab3cabc777ea","position":0,"type":"dataset","author":"indiehackers","downloads":13,"gated":false,"id":"indiehackers/telugu_dataset","lastModified":"2024-02-16T03:40:32.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":344539,"libraries":["datasets","dask","mlcroissant","polars"],"formats":["parquet"],"modalities":["text"]},"private":false,"repoType":"dataset","likes":0,"isLikedByUser":false,"isBenchmark":false},{"_id":"65d6e43490f11951bcf8660a","position":1,"type":"dataset","author":"indiehackers","downloads":27,"gated":false,"id":"indiehackers/telugu_instruction_dataset","lastModified":"2024-02-01T06:16:00.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":145048,"libraries":["datasets","pandas","mlcroissant","polars"],"formats":["parquet"],"modalities":["text"]},"private":false,"repoType":"dataset","likes":0,"isLikedByUser":false,"isBenchmark
":false}],"position":0,"theme":"green","private":false,"shareUrl":"https://hf.co/collections/indiehackers/telugu-datasets","upvotes":1,"isUpvotedByUser":false},{"slug":"indiehackers/telugu-romanized-datasets-65d6e472c178e22ac89948ed","title":"Telugu Romanized Datasets","description":"Transliterated Telugu Dataset to English","gating":false,"lastUpdated":"2024-02-22T06:07:21.479Z","owner":{"_id":"65bbf3cc40bed843e1c5ac53","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/630bc25d4c0945d20b880e9a/rVbC8dtQpSGnhYG8UQPyK.jpeg","fullname":"Indic Verse","name":"indiehackers","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":3,"isUserFollowing":false},"items":[{"_id":"65d6e490550694a180fbb001","position":0,"type":"dataset","author":"indiehackers","downloads":11,"gated":false,"id":"indiehackers/tenglish_dataset","lastModified":"2024-02-16T19:12:24.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":344539,"libraries":["datasets","dask","mlcroissant","polars"],"formats":["parquet"],"modalities":["text"]},"private":false,"repoType":"dataset","likes":1,"isLikedByUser":false,"isBenchmark":false},{"_id":"65d6e4992eddc83926261ba8","position":1,"type":"dataset","author":"indiehackers","downloads":6,"gated":false,"id":"indiehackers/tenglish_wikipedia","lastModified":"2024-02-16T19:13:53.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":87854,"libraries":["datasets","pandas","mlcroissant","polars"],"formats":["parquet"],"modalities":["text"]},"private":false,"repoType":"dataset","likes":0,"isLikedByUser":false,"isBenchmark":false}],"position":1,"theme":"orange","private":false,"shareUrl":"https://hf.co/collections/indiehackers/telugu-romanized-datasets","upvotes":0,"isUpvotedByUser":false},{"slug":"indiehackers/telugu-instruction-dataset-65e3520d84e0784eecb2eb0e","title":"Telugu Instruction 
Dataset","description":"","gating":false,"lastUpdated":"2024-03-02T16:22:05.569Z","owner":{"_id":"65bbf3cc40bed843e1c5ac53","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/630bc25d4c0945d20b880e9a/rVbC8dtQpSGnhYG8UQPyK.jpeg","fullname":"Indic Verse","name":"indiehackers","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":3,"isUserFollowing":false},"items":[{"_id":"65e3522df70c00af960bc8b2","position":0,"type":"dataset","author":"indiehackers","downloads":27,"gated":false,"id":"indiehackers/telugu_instruction_dataset","lastModified":"2024-02-01T06:16:00.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":145048,"libraries":["datasets","pandas","mlcroissant","polars"],"formats":["parquet"],"modalities":["text"]},"private":false,"repoType":"dataset","likes":0,"isLikedByUser":false,"isBenchmark":false}],"position":2,"theme":"purple","private":false,"shareUrl":"https://hf.co/collections/indiehackers/telugu-instruction-dataset","upvotes":1,"isUpvotedByUser":false}],"datasets":[{"author":"indiehackers","downloads":6,"gated":false,"id":"indiehackers/hellaswag-telugu-custom-2k","lastModified":"2024-04-23T08:58:36.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":2009,"libraries":["datasets","pandas","mlcroissant","polars"],"formats":["parquet"],"modalities":["tabular","text"]},"private":false,"repoType":"dataset","likes":2,"isLikedByUser":false,"isBenchmark":false},{"author":"indiehackers","downloads":7,"gated":false,"id":"indiehackers/hellaswag-telugu-custom","lastModified":"2024-04-22T02:24:12.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":10042,"libraries":["datasets","pandas","mlcroissant","polars"],"formats":["parquet"],"modalities":["tabular","text"]},"private":false,"repoType":"dataset","likes":1,"isLikedByUser":false,"isBenchmark":false},{"author":"indiehackers","downloads":7,"gated":false,"id":"indiehackers/winogrande_debiased-telugu_filtered","lastModified":"2024-04-21T04:46:34.000Z","datasetsServerInf
o":{"viewer":"viewer","numRows":11672,"libraries":["datasets","pandas","mlcroissant","polars"],"formats":["parquet"],"modalities":["text"]},"private":false,"repoType":"dataset","likes":0,"isLikedByUser":false,"isBenchmark":false},{"author":"indiehackers","downloads":5,"gated":false,"id":"indiehackers/databricks-dolly-15k-Telugu-romanized","lastModified":"2024-04-17T13:16:52.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":15011,"libraries":["datasets","pandas","mlcroissant","polars"],"formats":["parquet"],"modalities":["text"]},"private":false,"repoType":"dataset","likes":0,"isLikedByUser":false,"isBenchmark":false},{"author":"indiehackers","downloads":6,"gated":false,"id":"indiehackers/winogrande_debiased-telugu-romanized-nodict","lastModified":"2024-04-06T14:36:30.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":12282,"libraries":["datasets","pandas","mlcroissant","polars"],"formats":["parquet"],"modalities":["text"]},"private":false,"repoType":"dataset","likes":0,"isLikedByUser":false,"isBenchmark":false},{"author":"indiehackers","downloads":14,"gated":false,"id":"indiehackers/winogrande_debiased-telugu-romanized","lastModified":"2024-04-06T14:20:25.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":12282,"libraries":["datasets","pandas","mlcroissant","polars"],"formats":["parquet"],"modalities":["text"]},"private":false,"repoType":"dataset","likes":0,"isLikedByUser":false,"isBenchmark":false},{"author":"indiehackers","downloads":12,"gated":false,"id":"indiehackers/winogrande_debiased-telugu","lastModified":"2024-04-06T13:57:55.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":12282,"libraries":["datasets","pandas","mlcroissant","polars"],"formats":["parquet"],"modalities":["text"]},"private":false,"repoType":"dataset","likes":0,"isLikedByUser":false,"isBenchmark":false},{"author":"indiehackers","downloads":4,"gated":false,"id":"indiehackers/telugu_romanized_2000_mistral","lastModified":"2024-04-06T03:35:36.000Z","datasetsServerInfo":{"vi
ewer":"viewer","numRows":127416,"libraries":["datasets","pandas","mlcroissant","polars"],"formats":["parquet"],"modalities":["text"]},"private":false,"repoType":"dataset","likes":0,"isLikedByUser":false,"isBenchmark":false},{"author":"indiehackers","downloads":6,"gated":false,"id":"indiehackers/telugu_romanized_2048_mistral","lastModified":"2024-04-02T19:48:55.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":125414,"libraries":["datasets","pandas","mlcroissant","polars"],"formats":["parquet"],"modalities":["text"]},"private":false,"repoType":"dataset","likes":0,"isLikedByUser":false,"isBenchmark":false},{"author":"indiehackers","downloads":6,"gated":false,"id":"indiehackers/telugu_romanized","lastModified":"2024-04-02T07:08:54.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":87854,"libraries":["datasets","pandas","mlcroissant","polars"],"formats":["parquet"],"modalities":["text"]},"private":false,"repoType":"dataset","likes":0,"isLikedByUser":false,"isBenchmark":false}],"models":[{"author":"indiehackers","authorData":{"_id":"65bbf3cc40bed843e1c5ac53","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/630bc25d4c0945d20b880e9a/rVbC8dtQpSGnhYG8UQPyK.jpeg","fullname":"Indic Verse","name":"indiehackers","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":3,"isUserFollowing":false},"downloads":0,"gated":false,"id":"indiehackers/gemma7b-telugu-instruct","availableInferenceProviders":[],"lastModified":"2024-04-20T17:29:36.000Z","likes":0,"private":false,"repoType":"model","isLikedByUser":false},{"author":"indiehackers","authorData":{"_id":"65bbf3cc40bed843e1c5ac53","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/630bc25d4c0945d20b880e9a/rVbC8dtQpSGnhYG8UQPyK.jpeg","fullname":"Indic 
Verse","name":"indiehackers","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":3,"isUserFollowing":false},"downloads":0,"gated":false,"id":"indiehackers/gemma2b-telugu-instruct","availableInferenceProviders":[],"lastModified":"2024-04-20T12:52:53.000Z","likes":0,"private":false,"repoType":"model","isLikedByUser":false},{"author":"indiehackers","authorData":{"_id":"65bbf3cc40bed843e1c5ac53","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/630bc25d4c0945d20b880e9a/rVbC8dtQpSGnhYG8UQPyK.jpeg","fullname":"Indic Verse","name":"indiehackers","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":3,"isUserFollowing":false},"downloads":0,"gated":false,"id":"indiehackers/llama3-telugu-instruct","availableInferenceProviders":[],"lastModified":"2024-04-20T10:04:20.000Z","likes":0,"private":false,"repoType":"model","isLikedByUser":false},{"author":"indiehackers","authorData":{"_id":"65bbf3cc40bed843e1c5ac53","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/630bc25d4c0945d20b880e9a/rVbC8dtQpSGnhYG8UQPyK.jpeg","fullname":"Indic Verse","name":"indiehackers","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":3,"isUserFollowing":false},"downloads":0,"gated":false,"id":"indiehackers/gemma-telugu-instruct-test1","availableInferenceProviders":[],"lastModified":"2024-04-19T12:58:47.000Z","likes":0,"private":false,"repoType":"model","isLikedByUser":false},{"author":"indiehackers","authorData":{"_id":"65bbf3cc40bed843e1c5ac53","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/630bc25d4c0945d20b880e9a/rVbC8dtQpSGnhYG8UQPyK.jpeg","fullname":"Indic 
Verse","name":"indiehackers","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":3,"isUserFollowing":false},"downloads":0,"gated":false,"id":"indiehackers/mistral-tenglish-april5_2","availableInferenceProviders":[],"lastModified":"2024-04-06T01:20:20.000Z","likes":0,"private":false,"repoType":"model","isLikedByUser":false}],"paperPreviews":[],"spaces":[],"buckets":[],"numBuckets":0,"numDatasets":19,"numModels":5,"numSpaces":1,"lastOrgActivities":[],"acceptLanguages":["*"],"canReadRepos":false,"canReadSpaces":false,"blogPosts":[],"currentRepoPage":0,"filters":{},"paperView":false}">
datasets
19
Citation
\nIf you use our datasets or models in your research, please cite us as follows:
\n@misc{IndicVerse2024, \n author = {Nikhil Chowdary Paleti and Divi Eswar Chowdary}, \n title = {Indic Verse: Datasets and Models for Advancing Indic Languages in NLP}, \n year = {2024}, \n publisher = {Hugging Face}, \n url = {https://huggingface.co/IndicVerse} \n}\n\n\n","classNames":"hf-sanitized hf-sanitized-zSFid4v9KrnprAnVw8HVE"},"users":[{"_id":"630bc25d4c0945d20b880e9a","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/630bc25d4c0945d20b880e9a/CjDLfmCGcCkOS4E1t756M.jpeg","isPro":false,"fullname":"Divi Eswar Chowdary","user":"eswardivi","type":"user"},{"_id":"6274b2221c67dcb7144993a1","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/6274b2221c67dcb7144993a1/4NDu6MhAirfUtJeutzaky.png","isPro":false,"fullname":"Nikhil Chowdary Paleti","user":"LightFury9","type":"user"}],"userCount":2,"collections":[{"slug":"indiehackers/telugu-datasets-65d6e3bc56cb514b482200de","title":"Telugu Datasets","description":"Collections of publicly available datasets","gating":false,"lastUpdated":"2024-02-22T06:05:40.950Z","owner":{"_id":"65bbf3cc40bed843e1c5ac53","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/630bc25d4c0945d20b880e9a/rVbC8dtQpSGnhYG8UQPyK.jpeg","fullname":"Indic 
Verse","name":"indiehackers","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":3,"isUserFollowing":false},"items":[{"_id":"65d6e40d51bdab3cabc777ea","position":0,"type":"dataset","author":"indiehackers","downloads":13,"gated":false,"id":"indiehackers/telugu_dataset","lastModified":"2024-02-16T03:40:32.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":344539,"libraries":["datasets","dask","mlcroissant","polars"],"formats":["parquet"],"modalities":["text"]},"private":false,"repoType":"dataset","likes":0,"isLikedByUser":false,"isBenchmark":false},{"_id":"65d6e43490f11951bcf8660a","position":1,"type":"dataset","author":"indiehackers","downloads":27,"gated":false,"id":"indiehackers/telugu_instruction_dataset","lastModified":"2024-02-01T06:16:00.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":145048,"libraries":["datasets","pandas","mlcroissant","polars"],"formats":["parquet"],"modalities":["text"]},"private":false,"repoType":"dataset","likes":0,"isLikedByUser":false,"isBenchmark":false}],"position":0,"theme":"green","private":false,"shareUrl":"https://hf.co/collections/indiehackers/telugu-datasets","upvotes":1,"isUpvotedByUser":false},{"slug":"indiehackers/telugu-romanized-datasets-65d6e472c178e22ac89948ed","title":"Telugu Romanized Datasets","description":"Transliterated Telugu Dataset to English","gating":false,"lastUpdated":"2024-02-22T06:07:21.479Z","owner":{"_id":"65bbf3cc40bed843e1c5ac53","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/630bc25d4c0945d20b880e9a/rVbC8dtQpSGnhYG8UQPyK.jpeg","fullname":"Indic 
Verse","name":"indiehackers","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":3,"isUserFollowing":false},"items":[{"_id":"65d6e490550694a180fbb001","position":0,"type":"dataset","author":"indiehackers","downloads":11,"gated":false,"id":"indiehackers/tenglish_dataset","lastModified":"2024-02-16T19:12:24.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":344539,"libraries":["datasets","dask","mlcroissant","polars"],"formats":["parquet"],"modalities":["text"]},"private":false,"repoType":"dataset","likes":1,"isLikedByUser":false,"isBenchmark":false},{"_id":"65d6e4992eddc83926261ba8","position":1,"type":"dataset","author":"indiehackers","downloads":6,"gated":false,"id":"indiehackers/tenglish_wikipedia","lastModified":"2024-02-16T19:13:53.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":87854,"libraries":["datasets","pandas","mlcroissant","polars"],"formats":["parquet"],"modalities":["text"]},"private":false,"repoType":"dataset","likes":0,"isLikedByUser":false,"isBenchmark":false}],"position":1,"theme":"orange","private":false,"shareUrl":"https://hf.co/collections/indiehackers/telugu-romanized-datasets","upvotes":0,"isUpvotedByUser":false},{"slug":"indiehackers/telugu-instruction-dataset-65e3520d84e0784eecb2eb0e","title":"Telugu Instruction Dataset","description":"","gating":false,"lastUpdated":"2024-03-02T16:22:05.569Z","owner":{"_id":"65bbf3cc40bed843e1c5ac53","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/630bc25d4c0945d20b880e9a/rVbC8dtQpSGnhYG8UQPyK.jpeg","fullname":"Indic 
Verse","name":"indiehackers","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":3,"isUserFollowing":false},"items":[{"_id":"65e3522df70c00af960bc8b2","position":0,"type":"dataset","author":"indiehackers","downloads":27,"gated":false,"id":"indiehackers/telugu_instruction_dataset","lastModified":"2024-02-01T06:16:00.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":145048,"libraries":["datasets","pandas","mlcroissant","polars"],"formats":["parquet"],"modalities":["text"]},"private":false,"repoType":"dataset","likes":0,"isLikedByUser":false,"isBenchmark":false}],"position":2,"theme":"purple","private":false,"shareUrl":"https://hf.co/collections/indiehackers/telugu-instruction-dataset","upvotes":1,"isUpvotedByUser":false}],"datasets":[{"author":"indiehackers","downloads":6,"gated":false,"id":"indiehackers/hellaswag-telugu-custom-2k","lastModified":"2024-04-23T08:58:36.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":2009,"libraries":["datasets","pandas","mlcroissant","polars"],"formats":["parquet"],"modalities":["tabular","text"]},"private":false,"repoType":"dataset","likes":2,"isLikedByUser":false,"isBenchmark":false},{"author":"indiehackers","downloads":7,"gated":false,"id":"indiehackers/hellaswag-telugu-custom","lastModified":"2024-04-22T02:24:12.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":10042,"libraries":["datasets","pandas","mlcroissant","polars"],"formats":["parquet"],"modalities":["tabular","text"]},"private":false,"repoType":"dataset","likes":1,"isLikedByUser":false,"isBenchmark":false},{"author":"indiehackers","downloads":7,"gated":false,"id":"indiehackers/winogrande_debiased-telugu_filtered","lastModified":"2024-04-21T04:46:34.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":11672,"libraries":["datasets","pandas","mlcroissant","polars"],"formats":["parquet"],"modalities":["text"]},"private":false,"repoType":"dataset","likes":0,"isLikedByUser":false,"isBenchmark":false},{"author":"indiehackers","downloads
":5,"gated":false,"id":"indiehackers/databricks-dolly-15k-Telugu-romanized","lastModified":"2024-04-17T13:16:52.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":15011,"libraries":["datasets","pandas","mlcroissant","polars"],"formats":["parquet"],"modalities":["text"]},"private":false,"repoType":"dataset","likes":0,"isLikedByUser":false,"isBenchmark":false},{"author":"indiehackers","downloads":6,"gated":false,"id":"indiehackers/winogrande_debiased-telugu-romanized-nodict","lastModified":"2024-04-06T14:36:30.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":12282,"libraries":["datasets","pandas","mlcroissant","polars"],"formats":["parquet"],"modalities":["text"]},"private":false,"repoType":"dataset","likes":0,"isLikedByUser":false,"isBenchmark":false},{"author":"indiehackers","downloads":14,"gated":false,"id":"indiehackers/winogrande_debiased-telugu-romanized","lastModified":"2024-04-06T14:20:25.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":12282,"libraries":["datasets","pandas","mlcroissant","polars"],"formats":["parquet"],"modalities":["text"]},"private":false,"repoType":"dataset","likes":0,"isLikedByUser":false,"isBenchmark":false},{"author":"indiehackers","downloads":12,"gated":false,"id":"indiehackers/winogrande_debiased-telugu","lastModified":"2024-04-06T13:57:55.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":12282,"libraries":["datasets","pandas","mlcroissant","polars"],"formats":["parquet"],"modalities":["text"]},"private":false,"repoType":"dataset","likes":0,"isLikedByUser":false,"isBenchmark":false},{"author":"indiehackers","downloads":4,"gated":false,"id":"indiehackers/telugu_romanized_2000_mistral","lastModified":"2024-04-06T03:35:36.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":127416,"libraries":["datasets","pandas","mlcroissant","polars"],"formats":["parquet"],"modalities":["text"]},"private":false,"repoType":"dataset","likes":0,"isLikedByUser":false,"isBenchmark":false},{"author":"indiehackers","downloads":6,"g
ated":false,"id":"indiehackers/telugu_romanized_2048_mistral","lastModified":"2024-04-02T19:48:55.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":125414,"libraries":["datasets","pandas","mlcroissant","polars"],"formats":["parquet"],"modalities":["text"]},"private":false,"repoType":"dataset","likes":0,"isLikedByUser":false,"isBenchmark":false},{"author":"indiehackers","downloads":6,"gated":false,"id":"indiehackers/telugu_romanized","lastModified":"2024-04-02T07:08:54.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":87854,"libraries":["datasets","pandas","mlcroissant","polars"],"formats":["parquet"],"modalities":["text"]},"private":false,"repoType":"dataset","likes":0,"isLikedByUser":false,"isBenchmark":false}],"models":[{"author":"indiehackers","authorData":{"_id":"65bbf3cc40bed843e1c5ac53","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/630bc25d4c0945d20b880e9a/rVbC8dtQpSGnhYG8UQPyK.jpeg","fullname":"Indic Verse","name":"indiehackers","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":3,"isUserFollowing":false},"downloads":0,"gated":false,"id":"indiehackers/gemma7b-telugu-instruct","availableInferenceProviders":[],"lastModified":"2024-04-20T17:29:36.000Z","likes":0,"private":false,"repoType":"model","isLikedByUser":false},{"author":"indiehackers","authorData":{"_id":"65bbf3cc40bed843e1c5ac53","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/630bc25d4c0945d20b880e9a/rVbC8dtQpSGnhYG8UQPyK.jpeg","fullname":"Indic 
Verse","name":"indiehackers","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":3,"isUserFollowing":false},"downloads":0,"gated":false,"id":"indiehackers/gemma2b-telugu-instruct","availableInferenceProviders":[],"lastModified":"2024-04-20T12:52:53.000Z","likes":0,"private":false,"repoType":"model","isLikedByUser":false},{"author":"indiehackers","authorData":{"_id":"65bbf3cc40bed843e1c5ac53","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/630bc25d4c0945d20b880e9a/rVbC8dtQpSGnhYG8UQPyK.jpeg","fullname":"Indic Verse","name":"indiehackers","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":3,"isUserFollowing":false},"downloads":0,"gated":false,"id":"indiehackers/llama3-telugu-instruct","availableInferenceProviders":[],"lastModified":"2024-04-20T10:04:20.000Z","likes":0,"private":false,"repoType":"model","isLikedByUser":false},{"author":"indiehackers","authorData":{"_id":"65bbf3cc40bed843e1c5ac53","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/630bc25d4c0945d20b880e9a/rVbC8dtQpSGnhYG8UQPyK.jpeg","fullname":"Indic Verse","name":"indiehackers","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":3,"isUserFollowing":false},"downloads":0,"gated":false,"id":"indiehackers/gemma-telugu-instruct-test1","availableInferenceProviders":[],"lastModified":"2024-04-19T12:58:47.000Z","likes":0,"private":false,"repoType":"model","isLikedByUser":false},{"author":"indiehackers","authorData":{"_id":"65bbf3cc40bed843e1c5ac53","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/630bc25d4c0945d20b880e9a/rVbC8dtQpSGnhYG8UQPyK.jpeg","fullname":"Indic 
Verse","name":"indiehackers","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":3,"isUserFollowing":false},"downloads":0,"gated":false,"id":"indiehackers/mistral-tenglish-april5_2","availableInferenceProviders":[],"lastModified":"2024-04-06T01:20:20.000Z","likes":0,"private":false,"repoType":"model","isLikedByUser":false}],"paperPreviews":[],"spaces":[],"buckets":[],"numBuckets":0,"numDatasets":19,"numModels":5,"numSpaces":1,"lastOrgActivities":[],"acceptLanguages":["*"],"canReadRepos":false,"canReadSpaces":false,"blogPosts":[],"currentRepoPage":0,"filters":{},"paperView":false}">
AI & ML interests
None defined yet.
Organization Card
IndicVerse
IndicVerse is dedicated to advancing natural language processing (NLP) capabilities for Indic languages. Our mission is to bridge the gap in NLP research for low-resource Indic languages by providing high-quality datasets, pre-trained models, and tools tailored for diverse linguistic needs.
What We Do
- Datasets: Creation and publication of datasets for various NLP tasks, including translation, classification, and generation, with a focus on Indic languages.
- Models: Development of state-of-the-art NLP models fine-tuned for Indic languages, leveraging techniques like PEFT and LoRA.
- Research: Conducting and sharing research to solve key challenges in Indic NLP, including transliteration, low-resource learning, and domain-specific applications.
Featured Projects
- Hellaswag-Telugu: A Telugu version of the Hellaswag dataset for advanced evaluation.
- Indic Language Translation and Transliteration: Custom tools and APIs for translation and mixed transliteration (Telugu-English).
🛠️ How to Contribute
We welcome contributions! Whether you’re interested in annotating data, building models, or sharing insights, feel free to get in touch.
Links
Citation
If you use our datasets or models in your research, please cite us as follows:
@misc{IndicVerse2024,
author = {Nikhil Chowdary Paleti and Divi Eswar Chowdary},
title = {Indic Verse: Datasets and Models for Advancing Indic Languages in NLP},
year = {2024},
publisher = {Hugging Face},
url = {https://huggingface.co/IndicVerse}
}
datasets
19
indiehackers/hellaswag-telugu-custom-2k
Viewer
•
Updated
•
2.01k
•
6
•
2
indiehackers/hellaswag-telugu-custom
Viewer
•
Updated
•
10k
•
7
•
1
indiehackers/winogrande_debiased-telugu_filtered
Viewer
•
Updated
•
11.7k
•
7
indiehackers/databricks-dolly-15k-Telugu-romanized
Viewer
•
Updated
•
15k
•
5
indiehackers/winogrande_debiased-telugu-romanized-nodict
Viewer
•
Updated
•
12.3k
•
6
indiehackers/winogrande_debiased-telugu-romanized
Viewer
•
Updated
•
12.3k
•
14
indiehackers/winogrande_debiased-telugu
Viewer
•
Updated
•
12.3k
•
12
indiehackers/telugu_romanized_2000_mistral
Viewer
•
Updated
•
127k
•
4
indiehackers/telugu_romanized_2048_mistral
Viewer
•
Updated
•
125k
•
6
indiehackers/telugu_romanized
Viewer
•
Updated
•
87.9k
•
6