Deprecated: The each() function is deprecated. This message will be suppressed on further calls in /home/zhenxiangba/zhenxiangba.com/public_html/phproxy-improved-master/index.php on line 456
MaLA-LM (MaLA-LM)
[go: Go Back, main page]

MaLA-LM (Massive Language Adaptation of Large Language Models)! 🌍

\n

MaLA-LM focuses on adapting large language models to support hundreds of languages, including many underrepresented ones. Our models are multilingual, scalable, and optimized for diverse linguistic tasks.

\n

Featured 🗣️

\n

Check out our multilingual LLM collections, featuring models trained to handle 500+ languages, ideal for global, multilingual applications.

\n

Dive into the collections: EMMA-500 | MaLA corpus | MaLA-500

\n

Join our Discord server 👋
https://discord.com/invite/F5mEb7U6we

\n

Happy building! 🚀

\n","classNames":"hf-sanitized hf-sanitized-NT4ZZOz2-wJKuzUeZeltC"},"users":[{"_id":"617a92e16f37340367d5d791","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/617a92e16f37340367d5d791/omgyzmaF90KBLa3YgFxhS.png","isPro":false,"fullname":"Shaoxiong","user":"jisx","type":"user"},{"_id":"6347e493e3f2de18545cbfe8","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/6347e493e3f2de18545cbfe8/_Y068r6Qh7QxqqntRDqC-.jpeg","isPro":false,"fullname":"Peiqin Lin","user":"lpq29743","type":"user"},{"_id":"6514ba89f95f39fd02a949da","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/noauth/3NqhopFY4bQIMxUKNN4es.jpeg","isPro":false,"fullname":"Zihao Li","user":"Zihao-Li","type":"user"},{"_id":"6611225516a9b10274a2ea98","avatarUrl":"/avatars/60b90a165673ba3fa0736d3c48108fb3.svg","isPro":false,"fullname":"Jaakko Paavola","user":"JaakkoP","type":"user"},{"_id":"641248d400634c4fe98589a8","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/641248d400634c4fe98589a8/HAo3C6NC0TiJmXGC_N4aU.jpeg","isPro":false,"fullname":"Pinzhen Chen","user":"pinzhenchen","type":"user"},{"_id":"62054c0b522e40b4a18d8744","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/62054c0b522e40b4a18d8744/e6bJyJCwEuOZI8BiKC0rx.jpeg","isPro":true,"fullname":"Indraneil Paul","user":"iNeil77","type":"user"},{"_id":"62da7114ef8ba975c91fb4c9","avatarUrl":"/avatars/7c0f6068d40a63300a66740e3eb00519.svg","isPro":false,"fullname":"Dayyán O'Brien","user":"Dayyyan","type":"user"},{"_id":"64de06e5a8b70ab6b35a7c89","avatarUrl":"/avatars/45f287a9c07d3fe04c0782a6a99e9743.svg","isPro":false,"fullname":"Hengyu Luo","user":"hengyu-luo","type":"user"},{"_id":"66f60e3413092aa61b68f408","avatarUrl":"/avatars/afacec14751ba6e8b16de45281a70118.svg","isPro":false,"fullname":"Tianxiang Wang","user":"TianxiangWang","type":"user"},{"_id":"65fed45b08d35929362dd651","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/65fed45b08d35929362dd651/KLMxsyRN6_HhCZP1iDw6K.png","isPro":false,"fullname":"FeiYuan","user":"FeYuan","type":"user"},{"_id":"62f41fccd6ba2ee26653a358","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/1660166064634-noauth.jpeg","isPro":false,"fullname":"Yilei Tu","user":"yileitu","type":"user"}],"userCount":11,"collections":[{"slug":"MaLA-LM/fineopus-69201e3593c3f3883203a4e9","title":"FineOPUS","description":"","gating":false,"lastUpdated":"2026-01-07T12:12:41.313Z","owner":{"_id":"651150db327d22455c5d1e28","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/617a92e16f37340367d5d791/ZTrhLcWPyiDTdELAMs13j.jpeg","fullname":"MaLA-LM","name":"MaLA-LM","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":35,"isUserFollowing":false},"items":[{"_id":"69201e3c91bc5b1c15588dcc","position":0,"type":"dataset","author":"MaLA-LM","downloads":60685,"gated":false,"id":"MaLA-LM/FineOPUS-Original","lastModified":"2025-11-29T11:40:39.000Z","datasetsServerInfo":{"viewer":"preview","numRows":0,"libraries":[],"formats":[],"modalities":[]},"private":false,"repoType":"dataset","likes":1,"isLikedByUser":false,"isBenchmark":false},{"_id":"6936eac33324835650b708a5","position":1,"type":"dataset","author":"MaLA-LM","downloads":16287,"gated":false,"id":"MaLA-LM/FineOPUS-ReLID","lastModified":"2025-12-27T19:38:40.000Z","datasetsServerInfo":{"viewer":"preview","numRows":0,"libraries":[],"formats":[],"modalities":[]},"private":false,"repoType":"dataset","likes":0,"isLikedByUser":false,"isBenchmark":false},{"_id":"695e4db97ad0bc58078a1d82","position":3,"type":"dataset","author":"MaLA-LM","downloads":6067,"gated":false,"id":"MaLA-LM/FineOPUS-Deduplicated","lastModified":"2026-01-05T21:25:37.000Z","datasetsServerInfo":{"viewer":"preview","numRows":0,"libraries":[],"formats":[],"modalities":[]},"private":false,"repoType":"dataset","likes":0,"isLikedByUser":false,"isBenchmark":false}],"position":1,"theme":"purple","private":false,"shareUrl":"https://hf.co/collections/MaLA-LM/fineopus","upvotes":1,"isUpvotedByUser":false},{"slug":"MaLA-LM/mala-corpus-66e05127641a51de34d39529","title":"MaLA corpus","description":"MaLA Corpus for Massive Language Adaptation of Large Language Models https://mala-lm.github.io","gating":false,"lastUpdated":"2025-11-21T08:08:26.391Z","owner":{"_id":"651150db327d22455c5d1e28","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/617a92e16f37340367d5d791/ZTrhLcWPyiDTdELAMs13j.jpeg","fullname":"MaLA-LM","name":"MaLA-LM","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":35,"isUserFollowing":false},"items":[{"_id":"66e05139b37ddb97cdf41a52","position":0,"type":"dataset","note":{"html":"The MaLA monolingual corpus's noisy version that integrates texts from different sources without cleaning.","text":"The MaLA monolingual corpus's noisy version that integrates texts from different sources without cleaning."},"author":"MaLA-LM","downloads":597,"gated":false,"id":"MaLA-LM/mala-monolingual-integration","lastModified":"2025-10-22T08:18:53.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":2135314310,"libraries":["datasets","dask","mlcroissant","polars"],"formats":["parquet"],"modalities":["text"]},"private":false,"repoType":"dataset","likes":2,"isLikedByUser":false,"isBenchmark":false},{"_id":"66e05145e1bfac4b46246acb","position":1,"type":"dataset","note":{"html":"The MaLA monolingual corpus's filtered version that performs further data filtering","text":"The MaLA monolingual corpus's filtered version that performs further data filtering"},"author":"MaLA-LM","downloads":1113,"gated":false,"id":"MaLA-LM/mala-monolingual-filter","lastModified":"2025-10-22T06:55:22.000Z","datasetsServerInfo":{"viewer":"viewer-partial","numRows":1420064392,"libraries":["datasets","mlcroissant"],"formats":["arrow"],"modalities":["text"]},"private":false,"repoType":"dataset","likes":2,"isLikedByUser":false,"isBenchmark":false},{"_id":"66e0514fd64de03c6dccc9f7","position":2,"type":"dataset","note":{"html":"The MaLA monolingual corpus's deduplicated version that removes repeated data points","text":"The MaLA monolingual corpus's deduplicated version that removes repeated data points"},"author":"MaLA-LM","downloads":1606,"gated":false,"id":"MaLA-LM/mala-monolingual-dedup","lastModified":"2025-10-22T06:54:48.000Z","datasetsServerInfo":{"viewer":"viewer-partial","numRows":969079711,"libraries":["datasets","mlcroissant"],"formats":["arrow"],"modalities":["text"]},"private":false,"repoType":"dataset","likes":2,"isLikedByUser":false,"isBenchmark":false},{"_id":"66eaa25dd60627ee1c1f2111","position":3,"type":"dataset","note":{"html":"The MaLA monolingual corpus's final version is processed by splitting the filtered and deduplicated version into training and test sets ","text":"The MaLA monolingual corpus's final version is processed by splitting the filtered and deduplicated version into training and test sets "},"author":"MaLA-LM","downloads":1619,"gated":false,"id":"MaLA-LM/mala-monolingual-split","lastModified":"2025-10-22T07:59:03.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":824745465,"libraries":["datasets","dask","mlcroissant","polars"],"formats":["parquet"],"modalities":["text"]},"private":false,"repoType":"dataset","likes":4,"isLikedByUser":false,"isBenchmark":false}],"position":2,"theme":"orange","private":false,"shareUrl":"https://hf.co/collections/MaLA-LM/mala-corpus","upvotes":7,"isUpvotedByUser":false},{"slug":"MaLA-LM/emma-500-66eaa9acf1f512c8915b7166","title":"EMMA-500","description":"Enhancing massively multilingual adaptation of LLMs on 500+ languages https://mala-lm.github.io","gating":false,"lastUpdated":"2025-11-21T08:08:26.397Z","owner":{"_id":"651150db327d22455c5d1e28","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/617a92e16f37340367d5d791/ZTrhLcWPyiDTdELAMs13j.jpeg","fullname":"MaLA-LM","name":"MaLA-LM","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":35,"isUserFollowing":false},"items":[{"_id":"683ea1701c7412719bfc1efc","position":0,"type":"paper","id":"2506.00469","title":"Massively Multilingual Adaptation of Large Language Models Using\n Bilingual Translation Data","thumbnailUrl":"https://cdn-thumbnails.huggingface.co/social-thumbnails/papers/2506.00469.png","upvotes":4,"publishedAt":"2025-05-31T08:37:17.000Z","isUpvotedByUser":false},{"_id":"681f0b29bf6f0ab482704bee","position":1,"type":"model","author":"MaLA-LM","authorData":{"_id":"651150db327d22455c5d1e28","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/617a92e16f37340367d5d791/ZTrhLcWPyiDTdELAMs13j.jpeg","fullname":"MaLA-LM","name":"MaLA-LM","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":35,"isUserFollowing":false},"downloads":5,"gated":false,"id":"MaLA-LM/emma-500-llama3-8b-mono","availableInferenceProviders":[],"lastModified":"2025-06-09T08:21:24.000Z","likes":0,"pipeline_tag":"text-generation","private":false,"repoType":"model","isLikedByUser":false,"widgetOutputUrls":[],"numParameters":8030261248},{"_id":"681f0b2f25638573da5451e7","position":2,"type":"model","author":"MaLA-LM","authorData":{"_id":"651150db327d22455c5d1e28","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/617a92e16f37340367d5d791/ZTrhLcWPyiDTdELAMs13j.jpeg","fullname":"MaLA-LM","name":"MaLA-LM","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":35,"isUserFollowing":false},"downloads":2306,"gated":false,"id":"MaLA-LM/emma-500-llama3-8b-bi","availableInferenceProviders":[],"lastModified":"2025-06-09T08:21:46.000Z","likes":0,"pipeline_tag":"text-generation","private":false,"repoType":"model","isLikedByUser":false,"widgetOutputUrls":[],"numParameters":8030261248},{"_id":"681f0b376645b9f7d112d706","position":3,"type":"model","author":"MaLA-LM","authorData":{"_id":"651150db327d22455c5d1e28","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/617a92e16f37340367d5d791/ZTrhLcWPyiDTdELAMs13j.jpeg","fullname":"MaLA-LM","name":"MaLA-LM","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":35,"isUserFollowing":false},"downloads":8,"gated":false,"id":"MaLA-LM/emma-500-llama3.1-8b-mono","availableInferenceProviders":[],"lastModified":"2025-06-09T08:20:53.000Z","likes":0,"pipeline_tag":"text-generation","private":false,"repoType":"model","isLikedByUser":false,"widgetOutputUrls":[],"numParameters":8030261248}],"position":3,"theme":"orange","private":false,"shareUrl":"https://hf.co/collections/MaLA-LM/emma-500","upvotes":4,"isUpvotedByUser":false},{"slug":"MaLA-LM/mala-500-660e57f8e53e3cc2ccd31cb9","title":"MaLA-500","description":"MaLA-500: Massive Language Adaptation of Large Language Models https://mala-lm.github.io","gating":false,"lastUpdated":"2025-11-21T08:08:26.400Z","owner":{"_id":"651150db327d22455c5d1e28","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/617a92e16f37340367d5d791/ZTrhLcWPyiDTdELAMs13j.jpeg","fullname":"MaLA-LM","name":"MaLA-LM","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":35,"isUserFollowing":false},"items":[{"_id":"660e583faf7a99f9fb8b206d","position":0,"type":"model","author":"MaLA-LM","authorData":{"_id":"651150db327d22455c5d1e28","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/617a92e16f37340367d5d791/ZTrhLcWPyiDTdELAMs13j.jpeg","fullname":"MaLA-LM","name":"MaLA-LM","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":35,"isUserFollowing":false},"downloads":0,"gated":false,"id":"MaLA-LM/mala-500-10b-v2","availableInferenceProviders":[],"lastModified":"2024-04-03T07:28:58.000Z","likes":6,"pipeline_tag":"text-generation","private":false,"repoType":"model","isLikedByUser":false},{"_id":"660e5834fa5d819e96944765","position":1,"type":"model","author":"MaLA-LM","authorData":{"_id":"651150db327d22455c5d1e28","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/617a92e16f37340367d5d791/ZTrhLcWPyiDTdELAMs13j.jpeg","fullname":"MaLA-LM","name":"MaLA-LM","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":35,"isUserFollowing":false},"downloads":0,"gated":false,"id":"MaLA-LM/mala-500-10b-v1","availableInferenceProviders":[],"lastModified":"2024-04-03T08:25:04.000Z","likes":59,"pipeline_tag":"text-generation","private":false,"repoType":"model","isLikedByUser":false},{"_id":"66db24b7b761ebc47d7562b1","position":2,"type":"model","author":"Zihao-Li","authorData":{"_id":"6514ba89f95f39fd02a949da","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/noauth/3NqhopFY4bQIMxUKNN4es.jpeg","fullname":"Zihao Li","name":"Zihao-Li","type":"user","isPro":false,"isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":6,"isUserFollowing":false},"downloads":5,"gated":false,"id":"Zihao-Li/mala-500-10b-v2-merged","availableInferenceProviders":[],"lastModified":"2024-08-31T20:20:19.000Z","likes":0,"pipeline_tag":"text-generation","private":false,"repoType":"model","isLikedByUser":false,"numParameters":8607535104},{"_id":"66db24c5ba8010cc01572914","position":3,"type":"model","author":"Zihao-Li","authorData":{"_id":"6514ba89f95f39fd02a949da","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/noauth/3NqhopFY4bQIMxUKNN4es.jpeg","fullname":"Zihao Li","name":"Zihao-Li","type":"user","isPro":false,"isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":6,"isUserFollowing":false},"downloads":4,"gated":false,"id":"Zihao-Li/mala-500-10b-v1-merged","availableInferenceProviders":[],"lastModified":"2024-08-31T20:19:49.000Z","likes":0,"pipeline_tag":"text-generation","private":false,"repoType":"model","isLikedByUser":false,"numParameters":8607535104}],"position":4,"theme":"indigo","private":false,"shareUrl":"https://hf.co/collections/MaLA-LM/mala-500","upvotes":0,"isUpvotedByUser":false},{"slug":"MaLA-LM/lucky52-660e5fd24a2ced4b334d63d6","title":"Lucky52","description":"Ji, S., & Chen, P. (2025). How Many Languages Make Good Multilingual Instruction Tuning? A Case Study on BLOOM. In Proceedings of COLING 2025.","gating":false,"lastUpdated":"2025-11-21T08:08:26.399Z","owner":{"_id":"651150db327d22455c5d1e28","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/617a92e16f37340367d5d791/ZTrhLcWPyiDTdELAMs13j.jpeg","fullname":"MaLA-LM","name":"MaLA-LM","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":35,"isUserFollowing":false},"items":[{"_id":"660e80a01b60c78affe0c629","position":0,"type":"model","author":"MaLA-LM","authorData":{"_id":"651150db327d22455c5d1e28","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/617a92e16f37340367d5d791/ZTrhLcWPyiDTdELAMs13j.jpeg","fullname":"MaLA-LM","name":"MaLA-LM","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":35,"isUserFollowing":false},"downloads":5,"gated":false,"id":"MaLA-LM/lucky52-bloom-7b1-no-1","availableInferenceProviders":[],"lastModified":"2024-12-10T09:05:31.000Z","likes":0,"pipeline_tag":"text-generation","private":false,"repoType":"model","isLikedByUser":false},{"_id":"66124fe5f21e83b68f0b372e","position":1,"type":"model","author":"MaLA-LM","authorData":{"_id":"651150db327d22455c5d1e28","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/617a92e16f37340367d5d791/ZTrhLcWPyiDTdELAMs13j.jpeg","fullname":"MaLA-LM","name":"MaLA-LM","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":35,"isUserFollowing":false},"downloads":3,"gated":false,"id":"MaLA-LM/lucky52-bloom-7b1-no-2","availableInferenceProviders":[],"lastModified":"2025-04-08T17:06:45.000Z","likes":0,"pipeline_tag":"text-generation","private":false,"repoType":"model","isLikedByUser":false,"numParameters":8096620544},{"_id":"66124fe5c89fb0188b9ac5a6","position":2,"type":"model","author":"MaLA-LM","authorData":{"_id":"651150db327d22455c5d1e28","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/617a92e16f37340367d5d791/ZTrhLcWPyiDTdELAMs13j.jpeg","fullname":"MaLA-LM","name":"MaLA-LM","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":35,"isUserFollowing":false},"downloads":4,"gated":false,"id":"MaLA-LM/lucky52-bloom-7b1-no-3","availableInferenceProviders":[],"lastModified":"2025-04-08T17:06:52.000Z","likes":0,"pipeline_tag":"text-generation","private":false,"repoType":"model","isLikedByUser":false,"numParameters":8096620544},{"_id":"66124fe5ceb89d45d6a2cc3e","position":3,"type":"model","author":"MaLA-LM","authorData":{"_id":"651150db327d22455c5d1e28","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/617a92e16f37340367d5d791/ZTrhLcWPyiDTdELAMs13j.jpeg","fullname":"MaLA-LM","name":"MaLA-LM","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":35,"isUserFollowing":false},"downloads":4,"gated":false,"id":"MaLA-LM/lucky52-bloom-7b1-no-4","availableInferenceProviders":[],"lastModified":"2025-04-08T17:06:39.000Z","likes":0,"pipeline_tag":"text-generation","private":false,"repoType":"model","isLikedByUser":false,"numParameters":8096620544}],"position":5,"theme":"green","private":false,"shareUrl":"https://hf.co/collections/MaLA-LM/lucky52","upvotes":0,"isUpvotedByUser":false},{"slug":"MaLA-LM/polybench-66f0008816bffdccd5145763","title":"PolyBench","description":"Benchmarks in many languages","gating":false,"lastUpdated":"2025-11-21T08:08:26.405Z","owner":{"_id":"651150db327d22455c5d1e28","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/617a92e16f37340367d5d791/ZTrhLcWPyiDTdELAMs13j.jpeg","fullname":"MaLA-LM","name":"MaLA-LM","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":35,"isUserFollowing":false},"items":[{"_id":"66f0009082d5de5715c4295f","position":0,"type":"dataset","author":"MaLA-LM","downloads":90,"gated":false,"id":"MaLA-LM/PolyWrite","lastModified":"2024-09-27T11:07:04.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":35751,"libraries":["datasets","dask","mlcroissant"],"formats":["json"],"modalities":["tabular","text"]},"private":false,"repoType":"dataset","likes":3,"isLikedByUser":false,"isBenchmark":false},{"_id":"66f140da76a8038cb40b3788","position":1,"type":"dataset","author":"Davlan","downloads":2193,"gated":false,"id":"Davlan/sib200","lastModified":"2024-02-19T16:34:23.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":205820,"libraries":[],"formats":[],"modalities":["text"]},"private":false,"repoType":"dataset","likes":18,"isLikedByUser":false,"isBenchmark":false},{"_id":"66f26297663677075d516763","position":2,"type":"dataset","author":"openai","downloads":8118,"gated":false,"id":"openai/MMMLU","lastModified":"2024-10-16T18:39:00.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":393176,"libraries":["datasets","dask","mlcroissant","polars"],"formats":["csv"],"modalities":["text"]},"private":false,"repoType":"dataset","likes":515,"isLikedByUser":false,"isBenchmark":false}],"position":6,"theme":"indigo","private":false,"shareUrl":"https://hf.co/collections/MaLA-LM/polybench","upvotes":0,"isUpvotedByUser":false}],"datasets":[{"author":"MaLA-LM","downloads":6067,"gated":false,"id":"MaLA-LM/FineOPUS-Deduplicated","lastModified":"2026-01-05T21:25:37.000Z","datasetsServerInfo":{"viewer":"preview","numRows":0,"libraries":[],"formats":[],"modalities":[]},"private":false,"repoType":"dataset","likes":0,"isLikedByUser":false,"isBenchmark":false},{"author":"MaLA-LM","downloads":16287,"gated":false,"id":"MaLA-LM/FineOPUS-ReLID","lastModified":"2025-12-27T19:38:40.000Z","datasetsServerInfo":{"viewer":"preview","numRows":0,"libraries":[],"formats":[],"modalities":[]},"private":false,"repoType":"dataset","likes":0,"isLikedByUser":false,"isBenchmark":false},{"author":"MaLA-LM","downloads":60685,"gated":false,"id":"MaLA-LM/FineOPUS-Original","lastModified":"2025-11-29T11:40:39.000Z","datasetsServerInfo":{"viewer":"preview","numRows":0,"libraries":[],"formats":[],"modalities":[]},"private":false,"repoType":"dataset","likes":1,"isLikedByUser":false,"isBenchmark":false},{"author":"MaLA-LM","downloads":382,"gated":false,"id":"MaLA-LM/mala-bilingual-translation-corpus","lastModified":"2025-10-24T11:41:02.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":16546569756,"libraries":["datasets","dask","mlcroissant","polars"],"formats":["parquet"],"modalities":["text"]},"private":false,"repoType":"dataset","likes":6,"isLikedByUser":false,"isBenchmark":false},{"author":"MaLA-LM","downloads":597,"gated":false,"id":"MaLA-LM/mala-monolingual-integration","lastModified":"2025-10-22T08:18:53.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":2135314310,"libraries":["datasets","dask","mlcroissant","polars"],"formats":["parquet"],"modalities":["text"]},"private":false,"repoType":"dataset","likes":2,"isLikedByUser":false,"isBenchmark":false},{"author":"MaLA-LM","downloads":1619,"gated":false,"id":"MaLA-LM/mala-monolingual-split","lastModified":"2025-10-22T07:59:03.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":824745465,"libraries":["datasets","dask","mlcroissant","polars"],"formats":["parquet"],"modalities":["text"]},"private":false,"repoType":"dataset","likes":4,"isLikedByUser":false,"isBenchmark":false},{"author":"MaLA-LM","downloads":1113,"gated":false,"id":"MaLA-LM/mala-monolingual-filter","lastModified":"2025-10-22T06:55:22.000Z","datasetsServerInfo":{"viewer":"viewer-partial","numRows":1420064392,"libraries":["datasets","mlcroissant"],"formats":["arrow"],"modalities":["text"]},"private":false,"repoType":"dataset","likes":2,"isLikedByUser":false,"isBenchmark":false},{"author":"MaLA-LM","downloads":1606,"gated":false,"id":"MaLA-LM/mala-monolingual-dedup","lastModified":"2025-10-22T06:54:48.000Z","datasetsServerInfo":{"viewer":"viewer-partial","numRows":969079711,"libraries":["datasets","mlcroissant"],"formats":["arrow"],"modalities":["text"]},"private":false,"repoType":"dataset","likes":2,"isLikedByUser":false,"isBenchmark":false},{"author":"MaLA-LM","downloads":466,"gated":false,"id":"MaLA-LM/mala-opus-dedup-2410-reLID","lastModified":"2025-10-21T16:01:28.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":62543304579,"libraries":["datasets","dask","mlcroissant","polars"],"formats":["parquet"],"modalities":["tabular","text"]},"private":false,"repoType":"dataset","likes":0,"isLikedByUser":false,"isBenchmark":false},{"author":"MaLA-LM","downloads":260,"gated":false,"id":"MaLA-LM/mala-opus-dedup-2410-sample","lastModified":"2025-10-21T15:47:44.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":9501683548,"libraries":["datasets","dask","polars","mlcroissant"],"formats":["parquet"],"modalities":["text"]},"private":false,"repoType":"dataset","likes":0,"isLikedByUser":false,"isBenchmark":false}],"models":[{"author":"MaLA-LM","authorData":{"_id":"651150db327d22455c5d1e28","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/617a92e16f37340367d5d791/ZTrhLcWPyiDTdELAMs13j.jpeg","fullname":"MaLA-LM","name":"MaLA-LM","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":35,"isUserFollowing":false},"downloads":2,"gated":false,"id":"MaLA-LM/lucky52-bloom-7b1-no-32","availableInferenceProviders":[],"lastModified":"2025-07-18T19:04:03.000Z","likes":0,"pipeline_tag":"text-generation","private":false,"repoType":"model","isLikedByUser":false,"numParameters":8096620544},{"author":"MaLA-LM","authorData":{"_id":"651150db327d22455c5d1e28","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/617a92e16f37340367d5d791/ZTrhLcWPyiDTdELAMs13j.jpeg","fullname":"MaLA-LM","name":"MaLA-LM","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":35,"isUserFollowing":false},"downloads":68,"gated":false,"id":"MaLA-LM/emma-500-llama3.1-8b-bi","availableInferenceProviders":[],"lastModified":"2025-06-09T08:22:10.000Z","likes":1,"pipeline_tag":"text-generation","private":false,"repoType":"model","isLikedByUser":false,"widgetOutputUrls":[],"numParameters":8030261248},{"author":"MaLA-LM","authorData":{"_id":"651150db327d22455c5d1e28","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/617a92e16f37340367d5d791/ZTrhLcWPyiDTdELAMs13j.jpeg","fullname":"MaLA-LM","name":"MaLA-LM","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":35,"isUserFollowing":false},"downloads":2306,"gated":false,"id":"MaLA-LM/emma-500-llama3-8b-bi","availableInferenceProviders":[],"lastModified":"2025-06-09T08:21:46.000Z","likes":0,"pipeline_tag":"text-generation","private":false,"repoType":"model","isLikedByUser":false,"widgetOutputUrls":[],"numParameters":8030261248},{"author":"MaLA-LM","authorData":{"_id":"651150db327d22455c5d1e28","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/617a92e16f37340367d5d791/ZTrhLcWPyiDTdELAMs13j.jpeg","fullname":"MaLA-LM","name":"MaLA-LM","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":35,"isUserFollowing":false},"downloads":5,"gated":false,"id":"MaLA-LM/emma-500-llama3-8b-mono","availableInferenceProviders":[],"lastModified":"2025-06-09T08:21:24.000Z","likes":0,"pipeline_tag":"text-generation","private":false,"repoType":"model","isLikedByUser":false,"widgetOutputUrls":[],"numParameters":8030261248},{"author":"MaLA-LM","authorData":{"_id":"651150db327d22455c5d1e28","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/617a92e16f37340367d5d791/ZTrhLcWPyiDTdELAMs13j.jpeg","fullname":"MaLA-LM","name":"MaLA-LM","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":35,"isUserFollowing":false},"downloads":8,"gated":false,"id":"MaLA-LM/emma-500-llama3.1-8b-mono","availableInferenceProviders":[],"lastModified":"2025-06-09T08:20:53.000Z","likes":0,"pipeline_tag":"text-generation","private":false,"repoType":"model","isLikedByUser":false,"widgetOutputUrls":[],"numParameters":8030261248},{"author":"MaLA-LM","authorData":{"_id":"651150db327d22455c5d1e28","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/617a92e16f37340367d5d791/ZTrhLcWPyiDTdELAMs13j.jpeg","fullname":"MaLA-LM","name":"MaLA-LM","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":35,"isUserFollowing":false},"downloads":4,"gated":false,"id":"MaLA-LM/lucky52-bloom-7b1-no-3","availableInferenceProviders":[],"lastModified":"2025-04-08T17:06:52.000Z","likes":0,"pipeline_tag":"text-generation","private":false,"repoType":"model","isLikedByUser":false,"numParameters":8096620544},{"author":"MaLA-LM","authorData":{"_id":"651150db327d22455c5d1e28","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/617a92e16f37340367d5d791/ZTrhLcWPyiDTdELAMs13j.jpeg","fullname":"MaLA-LM","name":"MaLA-LM","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":35,"isUserFollowing":false},"downloads":3,"gated":false,"id":"MaLA-LM/lucky52-bloom-7b1-no-2","availableInferenceProviders":[],"lastModified":"2025-04-08T17:06:45.000Z","likes":0,"pipeline_tag":"text-generation","private":false,"repoType":"model","isLikedByUser":false,"numParameters":8096620544},{"author":"MaLA-LM","authorData":{"_id":"651150db327d22455c5d1e28","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/617a92e16f37340367d5d791/ZTrhLcWPyiDTdELAMs13j.jpeg","fullname":"MaLA-LM","name":"MaLA-LM","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":35,"isUserFollowing":false},"downloads":4,"gated":false,"id":"MaLA-LM/lucky52-bloom-7b1-no-4","availableInferenceProviders":[],"lastModified":"2025-04-08T17:06:39.000Z","likes":0,"pipeline_tag":"text-generation","private":false,"repoType":"model","isLikedByUser":false,"numParameters":8096620544},{"author":"MaLA-LM","authorData":{"_id":"651150db327d22455c5d1e28","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/617a92e16f37340367d5d791/ZTrhLcWPyiDTdELAMs13j.jpeg","fullname":"MaLA-LM","name":"MaLA-LM","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":35,"isUserFollowing":false},"downloads":3,"gated":false,"id":"MaLA-LM/lucky52-bloom-7b1-no-5","availableInferenceProviders":[],"lastModified":"2025-04-08T17:06:33.000Z","likes":0,"pipeline_tag":"text-generation","private":false,"repoType":"model","isLikedByUser":false,"numParameters":8096620544},{"author":"MaLA-LM","authorData":{"_id":"651150db327d22455c5d1e28","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/617a92e16f37340367d5d791/ZTrhLcWPyiDTdELAMs13j.jpeg","fullname":"MaLA-LM","name":"MaLA-LM","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":35,"isUserFollowing":false},"downloads":4,"gated":false,"id":"MaLA-LM/lucky52-bloom-7b1-no-6","availableInferenceProviders":[],"lastModified":"2025-04-08T17:06:26.000Z","likes":0,"pipeline_tag":"text-generation","private":false,"repoType":"model","isLikedByUser":false,"numParameters":8096620544}],"paperPreviews":[],"spaces":[],"buckets":[],"numBuckets":0,"numDatasets":22,"numModels":59,"numSpaces":1,"lastOrgActivities":[{"time":"2026-01-21T12:06:11.787Z","user":"yileitu","userAvatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/1660166064634-noauth.jpeg","type":"paper","paper":{"id":"2410.00193","title":"Do Vision-Language Models Really Understand Visual Language?","publishedAt":"2024-09-30T19:45:11.000Z","upvotes":0,"isUpvotedByUser":false}},{"time":"2026-01-21T12:06:07.379Z","user":"yileitu","userAvatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/1660166064634-noauth.jpeg","type":"paper","paper":{"id":"2502.11364","title":"Blessing of Multilinguality: A Systematic Analysis of Multilingual In-Context Learning","publishedAt":"2025-02-17T02:27:35.000Z","upvotes":0,"isUpvotedByUser":false}},{"time":"2026-01-20T09:24:40.595Z","user":"jisx","userAvatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/617a92e16f37340367d5d791/omgyzmaF90KBLa3YgFxhS.png","orgAvatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/617a92e16f37340367d5d791/ZTrhLcWPyiDTdELAMs13j.jpeg","type":"publish","repoData":{"author":"MaLA-LM","downloads":23,"gated":false,"id":"MaLA-LM/mala-code-reasoning-v3","lastModified":"2025-05-26T07:15:10.000Z","datasetsServerInfo":{"viewer":"viewer-partial","numRows":168439231,"libraries":["datasets","dask","polars","mlcroissant"],"formats":["json"],"modalities":["text"]},"private":false,"repoType":"dataset","likes":0,"isLikedByUser":false,"isBenchmark":false},"repoId":"MaLA-LM/mala-code-reasoning-v3","repoType":"dataset","org":"MaLA-LM"}],"acceptLanguages":["*"],"canReadRepos":false,"canReadSpaces":false,"blogPosts":[],"currentRepoPage":0,"filters":{},"paperView":false}">

AI & ML interests

NLP & LLM

Recent Activity

Welcome to MaLA-LM (Massive Language Adaptation of Large Language Models)! 🌍

MaLA-LM focuses on adapting large language models to support hundreds of languages, including many underrepresented ones. Our models are multilingual, scalable, and optimized for diverse linguistic tasks.

Featured 🗣️

Check out our multilingual LLM collections, featuring models trained to handle 500+ languages, ideal for global, multilingual applications.

Dive into the collections: EMMA-500 | MaLA corpus | MaLA-500

Join our Discord server 👋
https://discord.com/invite/F5mEb7U6we

Happy building! 🚀