Deprecated: The each() function is deprecated. This message will be suppressed on further calls in /home/zhenxiangba/zhenxiangba.com/public_html/phproxy-improved-master/index.php on line 456
indiehackers (Indic Verse)
[go: Go Back, main page]

Hugging Face Hub\n\n

📜 Citation

\n

If you use our datasets or models in your research, please cite us as follows:

\n
@misc{IndicVerse2024,  \n  author = {Nikhil Chowdary Paleti and Divi Eswar Chowdary},  \n  title = {Indic Verse: Datasets and Models for Advancing Indic Languages in NLP},  \n  year = {2024},  \n  publisher = {Hugging Face},  \n  url = {https://huggingface.co/IndicVerse}  \n}\n
\n
\n","classNames":"hf-sanitized hf-sanitized-zSFid4v9KrnprAnVw8HVE"},"users":[{"_id":"630bc25d4c0945d20b880e9a","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/630bc25d4c0945d20b880e9a/CjDLfmCGcCkOS4E1t756M.jpeg","isPro":false,"fullname":"Divi Eswar Chowdary","user":"eswardivi","type":"user"},{"_id":"6274b2221c67dcb7144993a1","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/6274b2221c67dcb7144993a1/4NDu6MhAirfUtJeutzaky.png","isPro":false,"fullname":"Nikhil Chowdary Paleti","user":"LightFury9","type":"user"}],"userCount":2,"collections":[{"slug":"indiehackers/telugu-datasets-65d6e3bc56cb514b482200de","title":"Telugu Datasets","description":"Collections of publicly available datasets","gating":false,"lastUpdated":"2024-02-22T06:05:40.950Z","owner":{"_id":"65bbf3cc40bed843e1c5ac53","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/630bc25d4c0945d20b880e9a/rVbC8dtQpSGnhYG8UQPyK.jpeg","fullname":"Indic Verse","name":"indiehackers","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":3,"isUserFollowing":false},"items":[{"_id":"65d6e40d51bdab3cabc777ea","position":0,"type":"dataset","author":"indiehackers","downloads":13,"gated":false,"id":"indiehackers/telugu_dataset","lastModified":"2024-02-16T03:40:32.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":344539,"libraries":["datasets","dask","mlcroissant","polars"],"formats":["parquet"],"modalities":["text"]},"private":false,"repoType":"dataset","likes":0,"isLikedByUser":false,"isBenchmark":false},{"_id":"65d6e43490f11951bcf8660a","position":1,"type":"dataset","author":"indiehackers","downloads":27,"gated":false,"id":"indiehackers/telugu_instruction_dataset","lastModified":"2024-02-01T06:16:00.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":145048,"libraries":["datasets","pandas","mlcroissant","polars"],"formats":["parquet"],"modalities":["text"]},"private":false,"repoType":"dataset","likes":0,"isLikedByUser":false,"isBenchmark
":false}],"position":0,"theme":"green","private":false,"shareUrl":"https://hf.co/collections/indiehackers/telugu-datasets","upvotes":1,"isUpvotedByUser":false},{"slug":"indiehackers/telugu-romanized-datasets-65d6e472c178e22ac89948ed","title":"Telugu Romanized Datasets","description":"Transliterated Telugu Dataset to English","gating":false,"lastUpdated":"2024-02-22T06:07:21.479Z","owner":{"_id":"65bbf3cc40bed843e1c5ac53","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/630bc25d4c0945d20b880e9a/rVbC8dtQpSGnhYG8UQPyK.jpeg","fullname":"Indic Verse","name":"indiehackers","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":3,"isUserFollowing":false},"items":[{"_id":"65d6e490550694a180fbb001","position":0,"type":"dataset","author":"indiehackers","downloads":11,"gated":false,"id":"indiehackers/tenglish_dataset","lastModified":"2024-02-16T19:12:24.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":344539,"libraries":["datasets","dask","mlcroissant","polars"],"formats":["parquet"],"modalities":["text"]},"private":false,"repoType":"dataset","likes":1,"isLikedByUser":false,"isBenchmark":false},{"_id":"65d6e4992eddc83926261ba8","position":1,"type":"dataset","author":"indiehackers","downloads":6,"gated":false,"id":"indiehackers/tenglish_wikipedia","lastModified":"2024-02-16T19:13:53.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":87854,"libraries":["datasets","pandas","mlcroissant","polars"],"formats":["parquet"],"modalities":["text"]},"private":false,"repoType":"dataset","likes":0,"isLikedByUser":false,"isBenchmark":false}],"position":1,"theme":"orange","private":false,"shareUrl":"https://hf.co/collections/indiehackers/telugu-romanized-datasets","upvotes":0,"isUpvotedByUser":false},{"slug":"indiehackers/telugu-instruction-dataset-65e3520d84e0784eecb2eb0e","title":"Telugu Instruction 
Dataset","description":"","gating":false,"lastUpdated":"2024-03-02T16:22:05.569Z","owner":{"_id":"65bbf3cc40bed843e1c5ac53","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/630bc25d4c0945d20b880e9a/rVbC8dtQpSGnhYG8UQPyK.jpeg","fullname":"Indic Verse","name":"indiehackers","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":3,"isUserFollowing":false},"items":[{"_id":"65e3522df70c00af960bc8b2","position":0,"type":"dataset","author":"indiehackers","downloads":27,"gated":false,"id":"indiehackers/telugu_instruction_dataset","lastModified":"2024-02-01T06:16:00.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":145048,"libraries":["datasets","pandas","mlcroissant","polars"],"formats":["parquet"],"modalities":["text"]},"private":false,"repoType":"dataset","likes":0,"isLikedByUser":false,"isBenchmark":false}],"position":2,"theme":"purple","private":false,"shareUrl":"https://hf.co/collections/indiehackers/telugu-instruction-dataset","upvotes":1,"isUpvotedByUser":false}],"datasets":[{"author":"indiehackers","downloads":6,"gated":false,"id":"indiehackers/hellaswag-telugu-custom-2k","lastModified":"2024-04-23T08:58:36.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":2009,"libraries":["datasets","pandas","mlcroissant","polars"],"formats":["parquet"],"modalities":["tabular","text"]},"private":false,"repoType":"dataset","likes":2,"isLikedByUser":false,"isBenchmark":false},{"author":"indiehackers","downloads":7,"gated":false,"id":"indiehackers/hellaswag-telugu-custom","lastModified":"2024-04-22T02:24:12.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":10042,"libraries":["datasets","pandas","mlcroissant","polars"],"formats":["parquet"],"modalities":["tabular","text"]},"private":false,"repoType":"dataset","likes":1,"isLikedByUser":false,"isBenchmark":false},{"author":"indiehackers","downloads":7,"gated":false,"id":"indiehackers/winogrande_debiased-telugu_filtered","lastModified":"2024-04-21T04:46:34.000Z","datasetsServerInf
o":{"viewer":"viewer","numRows":11672,"libraries":["datasets","pandas","mlcroissant","polars"],"formats":["parquet"],"modalities":["text"]},"private":false,"repoType":"dataset","likes":0,"isLikedByUser":false,"isBenchmark":false},{"author":"indiehackers","downloads":5,"gated":false,"id":"indiehackers/databricks-dolly-15k-Telugu-romanized","lastModified":"2024-04-17T13:16:52.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":15011,"libraries":["datasets","pandas","mlcroissant","polars"],"formats":["parquet"],"modalities":["text"]},"private":false,"repoType":"dataset","likes":0,"isLikedByUser":false,"isBenchmark":false},{"author":"indiehackers","downloads":6,"gated":false,"id":"indiehackers/winogrande_debiased-telugu-romanized-nodict","lastModified":"2024-04-06T14:36:30.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":12282,"libraries":["datasets","pandas","mlcroissant","polars"],"formats":["parquet"],"modalities":["text"]},"private":false,"repoType":"dataset","likes":0,"isLikedByUser":false,"isBenchmark":false},{"author":"indiehackers","downloads":14,"gated":false,"id":"indiehackers/winogrande_debiased-telugu-romanized","lastModified":"2024-04-06T14:20:25.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":12282,"libraries":["datasets","pandas","mlcroissant","polars"],"formats":["parquet"],"modalities":["text"]},"private":false,"repoType":"dataset","likes":0,"isLikedByUser":false,"isBenchmark":false},{"author":"indiehackers","downloads":12,"gated":false,"id":"indiehackers/winogrande_debiased-telugu","lastModified":"2024-04-06T13:57:55.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":12282,"libraries":["datasets","pandas","mlcroissant","polars"],"formats":["parquet"],"modalities":["text"]},"private":false,"repoType":"dataset","likes":0,"isLikedByUser":false,"isBenchmark":false},{"author":"indiehackers","downloads":4,"gated":false,"id":"indiehackers/telugu_romanized_2000_mistral","lastModified":"2024-04-06T03:35:36.000Z","datasetsServerInfo":{"vi
ewer":"viewer","numRows":127416,"libraries":["datasets","pandas","mlcroissant","polars"],"formats":["parquet"],"modalities":["text"]},"private":false,"repoType":"dataset","likes":0,"isLikedByUser":false,"isBenchmark":false},{"author":"indiehackers","downloads":6,"gated":false,"id":"indiehackers/telugu_romanized_2048_mistral","lastModified":"2024-04-02T19:48:55.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":125414,"libraries":["datasets","pandas","mlcroissant","polars"],"formats":["parquet"],"modalities":["text"]},"private":false,"repoType":"dataset","likes":0,"isLikedByUser":false,"isBenchmark":false},{"author":"indiehackers","downloads":6,"gated":false,"id":"indiehackers/telugu_romanized","lastModified":"2024-04-02T07:08:54.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":87854,"libraries":["datasets","pandas","mlcroissant","polars"],"formats":["parquet"],"modalities":["text"]},"private":false,"repoType":"dataset","likes":0,"isLikedByUser":false,"isBenchmark":false}],"models":[{"author":"indiehackers","authorData":{"_id":"65bbf3cc40bed843e1c5ac53","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/630bc25d4c0945d20b880e9a/rVbC8dtQpSGnhYG8UQPyK.jpeg","fullname":"Indic Verse","name":"indiehackers","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":3,"isUserFollowing":false},"downloads":0,"gated":false,"id":"indiehackers/gemma7b-telugu-instruct","availableInferenceProviders":[],"lastModified":"2024-04-20T17:29:36.000Z","likes":0,"private":false,"repoType":"model","isLikedByUser":false},{"author":"indiehackers","authorData":{"_id":"65bbf3cc40bed843e1c5ac53","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/630bc25d4c0945d20b880e9a/rVbC8dtQpSGnhYG8UQPyK.jpeg","fullname":"Indic 
Verse","name":"indiehackers","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":3,"isUserFollowing":false},"downloads":0,"gated":false,"id":"indiehackers/gemma2b-telugu-instruct","availableInferenceProviders":[],"lastModified":"2024-04-20T12:52:53.000Z","likes":0,"private":false,"repoType":"model","isLikedByUser":false},{"author":"indiehackers","authorData":{"_id":"65bbf3cc40bed843e1c5ac53","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/630bc25d4c0945d20b880e9a/rVbC8dtQpSGnhYG8UQPyK.jpeg","fullname":"Indic Verse","name":"indiehackers","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":3,"isUserFollowing":false},"downloads":0,"gated":false,"id":"indiehackers/llama3-telugu-instruct","availableInferenceProviders":[],"lastModified":"2024-04-20T10:04:20.000Z","likes":0,"private":false,"repoType":"model","isLikedByUser":false},{"author":"indiehackers","authorData":{"_id":"65bbf3cc40bed843e1c5ac53","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/630bc25d4c0945d20b880e9a/rVbC8dtQpSGnhYG8UQPyK.jpeg","fullname":"Indic Verse","name":"indiehackers","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":3,"isUserFollowing":false},"downloads":0,"gated":false,"id":"indiehackers/gemma-telugu-instruct-test1","availableInferenceProviders":[],"lastModified":"2024-04-19T12:58:47.000Z","likes":0,"private":false,"repoType":"model","isLikedByUser":false},{"author":"indiehackers","authorData":{"_id":"65bbf3cc40bed843e1c5ac53","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/630bc25d4c0945d20b880e9a/rVbC8dtQpSGnhYG8UQPyK.jpeg","fullname":"Indic 
Verse","name":"indiehackers","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":3,"isUserFollowing":false},"downloads":0,"gated":false,"id":"indiehackers/mistral-tenglish-april5_2","availableInferenceProviders":[],"lastModified":"2024-04-06T01:20:20.000Z","likes":0,"private":false,"repoType":"model","isLikedByUser":false}],"paperPreviews":[],"spaces":[],"buckets":[],"numBuckets":0,"numDatasets":19,"numModels":5,"numSpaces":1,"lastOrgActivities":[],"acceptLanguages":["*"],"canReadRepos":false,"canReadSpaces":false,"blogPosts":[],"currentRepoPage":0,"filters":{},"paperView":false}">

AI & ML interests

None defined yet.

🌏 IndicVerse

IndicVerse is dedicated to advancing natural language processing (NLP) capabilities for Indic languages. Our mission is to bridge the gap in NLP research for low-resource Indic languages by providing high-quality datasets, pre-trained models, and tools tailored for diverse linguistic needs.

🚀 What We Do

  • Datasets: Creation and publication of datasets for various NLP tasks, including translation, classification, and generation, with a focus on Indic languages.
  • Models: Development of state-of-the-art NLP models fine-tuned for Indic languages, leveraging techniques like PEFT and LoRA.
  • Research: Conducting and sharing research to solve key challenges in Indic NLP, including transliteration, low-resource learning, and domain-specific applications.

📚 Featured Projects

  • Hellaswag-Telugu: A Telugu version of the Hellaswag dataset for advanced evaluation.
  • Indic Language Translation and Transliteration: Custom tools and APIs for translation and mixed transliteration (Telugu-English).

🛠️ How to Contribute

We welcome contributions! Whether you’re interested in annotating data, building models, or sharing insights, feel free to get in touch.

🌐 Links

📜 Citation

If you use our datasets or models in your research, please cite us as follows:

@misc{IndicVerse2024,  
  author = {Nikhil Chowdary Paleti and Divi Eswar Chowdary},  
  title = {Indic Verse: Datasets and Models for Advancing Indic Languages in NLP},  
  year = {2024},  
  publisher = {Hugging Face},  
  url = {https://huggingface.co/IndicVerse}  
}