Deprecated: The each() function is deprecated. This message will be suppressed on further calls in /home/zhenxiangba/zhenxiangba.com/public_html/phproxy-improved-master/index.php on line 456
fineinstructions (FineInstructions)
[go: Go Back, main page]

FineInstructions

community
\"FineInstructionsCoverImage\"

\n

✨ Paper: https://arxiv.org/abs/2601.22146

\n

✨ Code: Coming soon

\n

✨ Datasets:

\n\n

✨ Models:

\n
  1. Query Genericizer (Query ⇒ Instruction Template): https://huggingface.co/fineinstructions/query_templatizer
  2. Document ⇔ Template Matching / Retrieval Embedding: https://huggingface.co/fineinstructions/instruction_template_retrieval_embedding
  3. Template Instantiator (Document + Template ⇒ Synthetic Instruction-Answer Pair): https://huggingface.co/fineinstructions/template_instantiator
\n

✨ Citation:

\n
@article{patel2026fineinstructions,
  title={FineInstructions: Scaling Synthetic Instructions to Pre-Training Scale},
  author={Patel, Ajay and Raffel, Colin and Callison-Burch, Chris},
  journal={arXiv preprint arXiv:2601.22146},
  year={2026},
  archivePrefix={arXiv},
  primaryClass={cs.CL},
  doi={10.48550/arXiv.2601.22146}
}
\n

✨ Built with DataDreamer: http://datadreamer.dev/

\n

✨ FineInstructions Pipeline:

\n

\"FineInstructionsPipeline\"

\n","classNames":"hf-sanitized hf-sanitized-E7Ba09oa2H5rwkxQYaaBF"},"users":[{"_id":"61c40eeb727d1257bf3cf5ba","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/61c40eeb727d1257bf3cf5ba/hVNbcFjsvwWqWarcGTOdI.jpeg","isPro":false,"fullname":"Ajay Patel","user":"AjayP13","type":"user"},{"_id":"6079c29765b9d0165cb18392","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/1618592397610-noauth.jpeg","isPro":false,"fullname":"Colin Raffel","user":"craffel","type":"user"},{"_id":"6303ce25fc783bfc744216af","avatarUrl":"/avatars/09f5e87c1f56a1b7f6ef9c5037682285.svg","isPro":false,"fullname":"Chris Callison-Burch","user":"CCB","type":"user"}],"userCount":3,"collections":[],"datasets":[{"author":"fineinstructions","downloads":264,"gated":false,"id":"fineinstructions/finetemplates","lastModified":"2026-01-30T04:10:14.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":18588204,"libraries":["datasets","dask","mlcroissant","polars"],"formats":["parquet"],"modalities":["tabular","text"]},"private":false,"repoType":"dataset","likes":2,"isLikedByUser":false,"isBenchmark":false},{"author":"fineinstructions","downloads":2221,"gated":false,"id":"fineinstructions/fineinstructions_nemotron","lastModified":"2026-01-30T04:08:23.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":1228476202,"libraries":["datasets","dask","polars","mlcroissant"],"formats":["parquet"],"modalities":["tabular","text"]},"private":false,"repoType":"dataset","likes":4,"isLikedByUser":false,"isBenchmark":false},{"author":"fineinstructions","downloads":54,"gated":false,"id":"fineinstructions/real_queries","lastModified":"2026-01-30T04:05:26.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":21454204,"libraries":["datasets","dask","mlcroissant","polars"],"formats":["parquet"],"modalities":["text"]},"private":false,"repoType":"dataset","likes":2,"isLikedByUser":false,"isBenchmark":false}],"models":[{"author":"fineinstructions","authorData":{"_id":"677fd99972d67fdcd1624
163","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/61c40eeb727d1257bf3cf5ba/PbZWCoc-IhhHGU4H7kitU.jpeg","fullname":"FineInstructions","name":"fineinstructions","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":8,"isUserFollowing":false},"downloads":24,"gated":false,"id":"fineinstructions/template_instantiator","availableInferenceProviders":[],"lastModified":"2026-01-30T04:05:55.000Z","likes":0,"pipeline_tag":"text-generation","private":false,"repoType":"model","isLikedByUser":false,"widgetOutputUrls":[],"numParameters":3212749824},{"author":"fineinstructions","authorData":{"_id":"677fd99972d67fdcd1624163","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/61c40eeb727d1257bf3cf5ba/PbZWCoc-IhhHGU4H7kitU.jpeg","fullname":"FineInstructions","name":"fineinstructions","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":8,"isUserFollowing":false},"downloads":23,"gated":false,"id":"fineinstructions/query_templatizer","availableInferenceProviders":[{"provider":"featherless-ai","modelStatus":"live","providerStatus":"live","providerId":"fineinstructions/query_templatizer","task":"conversational","isCheapestPricingOutput":false,"isFastestThroughput":false,"isModelAuthor":false}],"lastModified":"2026-01-30T04:05:27.000Z","likes":0,"pipeline_tag":"text-generation","private":false,"repoType":"model","isLikedByUser":false,"widgetOutputUrls":[],"numParameters":1235814400},{"author":"fineinstructions","authorData":{"_id":"677fd99972d67fdcd1624163","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/61c40eeb727d1257bf3cf5ba/PbZWCoc-IhhHGU4H7kitU.jpeg","fullname":"FineInstructions","name":"fineinstructions","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":8,"isUserFollowing":false},"downloads":17,"gated":false,"id":"fineinstructions/instruction_template_retrieval_embedding","availableInferenceProviders":[],"lastModified":"2026-01-30T04:05:27.000Z","likes":
0,"pipeline_tag":"sentence-similarity","private":false,"repoType":"model","isLikedByUser":false,"widgetOutputUrls":[],"numParameters":567754752},{"author":"fineinstructions","authorData":{"_id":"677fd99972d67fdcd1624163","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/61c40eeb727d1257bf3cf5ba/PbZWCoc-IhhHGU4H7kitU.jpeg","fullname":"FineInstructions","name":"fineinstructions","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":8,"isUserFollowing":false},"downloads":3,"gated":false,"id":"fineinstructions/pretraining_experiments","availableInferenceProviders":[],"lastModified":"2026-01-30T04:05:27.000Z","likes":0,"private":false,"repoType":"model","isLikedByUser":false}],"paperPreviews":[{"_id":"2601.22146","title":"FineInstructions: Scaling Synthetic Instructions to Pre-Training Scale","id":"2601.22146","thumbnailUrl":"https://cdn-thumbnails.huggingface.co/social-thumbnails/papers/2601.22146.png"}],"spaces":[],"buckets":[],"numBuckets":0,"numDatasets":3,"numModels":4,"numSpaces":1,"lastOrgActivities":[{"time":"2026-02-02T17:00:16.231Z","user":"AjayP13","userAvatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/61c40eeb727d1257bf3cf5ba/hVNbcFjsvwWqWarcGTOdI.jpeg","type":"paper","paper":{"id":"2601.22146","title":"FineInstructions: Scaling Synthetic Instructions to Pre-Training 
Scale","publishedAt":"2026-01-29T18:58:47.000Z","upvotes":9,"isUpvotedByUser":true}},{"time":"2026-01-30T04:05:56.231Z","user":"AjayP13","userAvatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/61c40eeb727d1257bf3cf5ba/hVNbcFjsvwWqWarcGTOdI.jpeg","orgAvatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/61c40eeb727d1257bf3cf5ba/PbZWCoc-IhhHGU4H7kitU.jpeg","type":"update","repoData":{"author":"fineinstructions","authorData":{"_id":"677fd99972d67fdcd1624163","avatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/61c40eeb727d1257bf3cf5ba/PbZWCoc-IhhHGU4H7kitU.jpeg","fullname":"FineInstructions","name":"fineinstructions","type":"org","isHf":false,"isHfAdmin":false,"isMod":false,"followerCount":8,"isUserFollowing":false},"downloads":24,"gated":false,"id":"fineinstructions/template_instantiator","availableInferenceProviders":[],"lastModified":"2026-01-30T04:05:55.000Z","likes":0,"pipeline_tag":"text-generation","private":false,"repoType":"model","isLikedByUser":false,"widgetOutputUrls":[],"numParameters":3212749824},"repoId":"fineinstructions/template_instantiator","repoType":"model","org":"fineinstructions"},{"time":"2026-01-30T04:05:30.128Z","user":"AjayP13","userAvatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/61c40eeb727d1257bf3cf5ba/hVNbcFjsvwWqWarcGTOdI.jpeg","orgAvatarUrl":"https://cdn-avatars.huggingface.co/v1/production/uploads/61c40eeb727d1257bf3cf5ba/PbZWCoc-IhhHGU4H7kitU.jpeg","type":"update","repoData":{"author":"fineinstructions","downloads":2221,"gated":false,"id":"fineinstructions/fineinstructions_nemotron","lastModified":"2026-01-30T04:08:23.000Z","datasetsServerInfo":{"viewer":"viewer","numRows":1228476202,"libraries":["datasets","dask","polars","mlcroissant"],"formats":["parquet"],"modalities":["tabular","text"]},"private":false,"repoType":"dataset","likes":4,"isLikedByUser":false,"isBenchmark":false},"repoId":"fineinstructions/fineinstructions_nemotron","repoType":"dataset","org":"finei
nstructions"}],"acceptLanguages":["*"],"canReadRepos":false,"canReadSpaces":false,"blogPosts":[],"currentRepoPage":0,"filters":{},"paperView":false}">

AI & ML interests

None defined yet.

Recent Activity

FineInstructionsCoverImage

✨ Paper: https://arxiv.org/abs/2601.22146

✨ Code: Coming soon

✨ Datasets:

✨ Models:

  1. Query Genericizer (Query ⇒ Instruction Template): https://huggingface.co/fineinstructions/query_templatizer
  2. Document ⇔ Template Matching / Retrieval Embedding: https://huggingface.co/fineinstructions/instruction_template_retrieval_embedding
  3. Template Instantiator (Document + Template ⇒ Synthetic Instruction-Answer Pair): https://huggingface.co/fineinstructions/template_instantiator

✨ Citation:

@article{patel2026fineinstructions,
  title={FineInstructions: Scaling Synthetic Instructions to Pre-Training Scale},
  author={Patel, Ajay and Raffel, Colin and Callison-Burch, Chris},
  journal={arXiv preprint arXiv:2601.22146},
  year={2026},
  archivePrefix={arXiv},
  primaryClass={cs.CL},
  doi={10.48550/arXiv.2601.22146}
}

✨ Built with DataDreamer: http://datadreamer.dev/

✨ FineInstructions Pipeline:

FineInstructionsPipeline