Deprecated: The each() function is deprecated. This message will be suppressed on further calls in /home/zhenxiangba/zhenxiangba.com/public_html/phproxy-improved-master/index.php on line 456
J-shang (Ning Shang)
[go: Go Back, main page]

https://huggingface.co/spaces/HuggingFaceFW/blogpost-fineweb-v1","text":"From CC 2013-20 ~ 2025-26 (continue updating)\n18.5T tokens, English only\nBlog: https://huggingface.co/spaces/HuggingFaceFW/blogpost-fineweb-v1"},"author":"HuggingFaceFW","downloads":197213,"gated":false,"id":"HuggingFaceFW/fineweb","lastModified":"2025-07-11T20:16:53.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":52453695892,"libraries":[],"formats":[],"modalities":["tabular","text"]},"private":false,"repoType":"dataset","likes":2666,"isLikedByUser":false,"isBenchmark":false},{"_id":"69365fbf810333893a0f349d","position":2,"type":"dataset","note":{"html":"From CC 2013-20 ~ 2025-26 (continue updating)\n1.3T tokens\nPaper: https://arxiv.org/abs/2406.17557","text":"From CC 2013-20 ~ 2025-26 (continue updating)\n1.3T tokens\nPaper: https://arxiv.org/abs/2406.17557"},"author":"HuggingFaceFW","downloads":262345,"gated":false,"id":"HuggingFaceFW/fineweb-edu","lastModified":"2025-07-11T20:16:53.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":3496736741,"libraries":["datasets","dask","polars","mlcroissant"],"formats":["parquet"],"modalities":["tabular","text"]},"private":false,"repoType":"dataset","likes":953,"isLikedByUser":false,"isBenchmark":false},{"_id":"69363f19a118d6b1afed2976","position":3,"type":"dataset","note":{"html":"From CC 2013-20 ~ 2024-18\n20TB disk (3T words), 1000+ languages\nBlog: https://huggingface.co/spaces/HuggingFaceFW/blogpost-fine-tasks","text":"From CC 2013-20 ~ 2024-18\n20TB disk (3T words), 1000+ languages\nBlog: https://huggingface.co/spaces/HuggingFaceFW/blogpost-fine-tasks"},"author":"HuggingFaceFW","downloads":74224,"gated":false,"id":"HuggingFaceFW/fineweb-2","lastModified":"2025-10-27T18:32:07.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":4484929995,"libraries":[],"formats":[],"modalities":["tabular","text"]},"private":false,"repoType":"dataset","likes":753,"isLikedByUser":false,"isBenchmark":false}],"position":0,"theme":"blue","private":false,"shareUrl":"https://hf.co/collections/J-shang/pt-datasets","upvotes":0,"isUpvotedByUser":false}],"datasets":[],"models":[],"buckets":[],"numBuckets":0,"numberLikes":1,"papers":[{"id":"2502.20082","title":"LongRoPE2: Near-Lossless LLM Context Window Scaling","thumbnailUrl":"https://cdn-thumbnails.huggingface.co/social-thumbnails/papers/2502.20082.png","upvotes":36,"publishedAt":"2025-02-27T13:41:07.000Z","isUpvotedByUser":false},{"id":"2501.04519","title":"rStar-Math: Small LLMs Can Master Math Reasoning with Self-Evolved Deep\n Thinking","thumbnailUrl":"https://cdn-thumbnails.huggingface.co/social-thumbnails/papers/2501.04519.png","upvotes":288,"publishedAt":"2025-01-08T14:12:57.000Z","isUpvotedByUser":false}],"posts":[],"totalPosts":0,"spaces":[],"u":{"avatarUrl":"/avatars/787553c73e9a96adc5219e67acd29c00.svg","isPro":false,"fullname":"Ning Shang","user":"J-shang","orgs":[],"signup":{},"isHf":false,"isMod":false,"type":"user","theme":"light"},"upvotes":4,"numFollowers":5,"numFollowingUsers":0,"numFollowingOrgs":0,"numModels":0,"numDatasets":0,"numSpaces":0,"isFollowing":false,"isFollower":false,"sampleFollowers":[{"user":"OldKingMeister","fullname":"Siyuan Wang","type":"user","_id":"6495b0b844bc2e9ce6cc849b","isPro":false,"avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/noauth/j6aucl_tefMHwtD-bdUAw.jpeg"},{"user":"21world","fullname":"www.minds.com/jelyazko/","type":"user","_id":"64548986cd09ceba0e1709cb","isPro":false,"avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/64548986cd09ceba0e1709cb/muGiatjmPfzxYb3Rjcqas.jpeg"},{"user":"Kseniase","fullname":"Ksenia Se","type":"user","_id":"64838b28c235ef76b63e4999","isPro":false,"avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/64838b28c235ef76b63e4999/ZhQCYoU3vps71Ag7Jezj6.jpeg"},{"user":"Tonic","fullname":"Joseph [open/acc] Pollack","type":"user","_id":"62a3bb1cd0d8c2c2169f0b88","isPro":true,"avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/62a3bb1cd0d8c2c2169f0b88/eT2TS0IlQbZtz-F_zHLz9.jpeg"}],"isWatching":false,"isIgnored":false,"acceptLanguages":["*"],"filters":{},"currentRepoPage":0}">