{"id":175,"slug":"m-a-p--finefineweb","name":"FineFineWeb","author":"m-a-p","description":"\n\t\n\t\t\n\t\tFineFineWeb: A Comprehensive Study on Fine-Grained Domain Web Corpus\n\t\n\narXiv: Coming Soon\nProject Page: Coming Soon\nBlog: Coming Soon\n\n\t\n\t\t\n\t\tData Statistics\n\t\n\n\n\t\n\t\t\nDomain (#tokens/#samples)\nIteration 1 Tokens\nIteration 2 Tokens\nIteration 3 Tokens\nTotal Tokens\nIteration 1 Count\nIteration 2 Count\nIteration 3 Count\nTotal Count\n\n\n\t\t\naerospace\n5.77B\n261.63M\n309.33M\n6.34B\n9100000\n688505\n611034\n10399539\n\n\nagronomy\n13.08B\n947.41M\n229.04M\n14.26B\n15752828\n2711790\n649404\n19114022\n\n\nartistic… See the full description on the dataset page: https://huggingface.co/datasets/m-a-p/FineFineWeb.","tags":"[\"Task_categories:text-Classification\",\"Task_categories:text-Generation\",\"Language:en\",\"Size_categories:1B<n<10B\",\"Modality:tabular\",\"Modality:text\"]","license":null,"framework":null,"parameters":null,"downloads":586140,"likes":130,"verified":1,"created_at":"2026-04-20 14:59:20","updated_at":"2026-05-08 14:17:34","source_url":"https://huggingface.co/datasets/m-a-p/FineFineWeb","source_platform":"huggingface","hf_repo_id":"m-a-p/FineFineWeb","ollama_name":"","category":"dataset","latest_version":"v1.0.0","version_count":1,"signature_count":2,"risk_level":null,"risk_score":null,"versions":[{"id":174,"model_id":175,"version":"v1.0.0","manifest_hash":"9acda62b2f517019f0543db3c6beb162603c1f0257e3252276c0552bb5029748","file_count":0,"total_size":0,"r2_manifest_key":"manifests/datasets/m-a-p--finefineweb/v1.0.0.json","created_at":"2026-04-20 14:59:20"}],"files":[],"signatures":[{"id":536,"version_id":174,"signer_did":"did:quantamrkt:registry:shield-v1","algorithm":"ML-DSA-65","signature_hex":"744afec93a7f09c0591aacbb5bea91e48ea0e68704c4a21d94f0167616d21e21","attestation_type":"registry","signed_at":"2026-04-20 14:59:20"},{"id":700,"version_id":174,"signer_did":"did:web:quantamrkt.com:chain:authority","algorithm":"ML-DSA-87","signature_hex":"e64954eb518d3566a75cfe641c9f82a917f8e44111d9babb26c4e805659f54a157680ac1de838aeda63586ececbecf4f918fe3bb87dd76e207f831c516d2d438571e0d582c5e84c8d5ad95326fa95d0edb261381513d8a3cf8192f0aa4101efcea3f3c8cb8e8a8784a8e01ec4c8620a3dc35528e4265aef1d707927d57cd76d0a273a3ed47676d823676912eeb8cb83549614dbe84d595428a2af93482199ddaff88476f6afd1641c730700028471482eea4b94a19c72a6630642f99a3e6b0c40fd2f31c830f0b6bf6648a3d62c42f3de61bdfe030e6e17f3d54135d9b9ce4e9d1bd15eb84d5c72ea11ecaa3fe5caf097b4309dbc52526a4ddc30f425e621757827673dc22f670eaaf6be461a72a96efe3dd6db887351867ea7668daee485c3654fc3f1754ba6e3951806f121cd77cd23554734056b4f1b5d856e3c5bcbbdc27a0b42b666769077f6be59b5a1ddec8243622f9e8bbf8c48c468883542fcb7e419ce1c23e6323848ce43a26e9baaa6475b53ba0df5fa97a158b76171707f28c951b3be1c12f92cf852c8f8ea370ee9aaafc32ffe273a7420cac0293f9c0732066d1ebdbb60027af7c23743dfd376d16d9e241b41c0346f0613d0eb4cde0c0f0afc8cd0ea5f32ca0c27ec88907804602b17fa1f4a3ca7f17c712912672e4da247e030e82f8f929c5e76a01ac8faebdf572c4c47b325a46aa6e7ef35ed093e6481f021940a35cc3935866e8f7e8487b1e416ac4973f41fd7589404ae2ce1e09abcecda5fa025aed584cde94bf91cd71627243ed9c6763f54cb9035b0f4dcd3f5e9c32e35d3fbaf8caeb99043954ec00dfa03562d3e4d8a765ad4be4c717f4c6617f5aa7ca29c8c8a58fd5ec6f799730d16c962fc07b7d6e26bba09baf79b833c115187188563a946db4e714cff0c5dad644300c6c544806e6cc7ceb4278e96d856e864a44e2de5725ae5074fda347ca53eaca05b9990a5b8d27850bc9b134fc1805aac0bc180dd9871f69d1fa1302fe1b29adb0aa790606c2315727f500d7635b792ff46a6625d398cfca54617f0ab6bff630c6956f1200f22e5836b45868fb59ca6c9c4a2a15fe9edee0434828962f90f7742fbc47b3e71fc5fafa1a78dbc8a9e871a3bf9314e8dfd8a3998bc43e616268c5af49e513883ebdd301f9acc44bb81bb75f2fe8862aae4f10398809940d2802db2f2d7aa7f4c687cb80fe789a945d728539e8f5fb934030c0dbe466c12935a98d90011b1a1a9f63e3f82bd4045265d28660487bd15541cce9b4a70b9283bb53c3c34bfe51c4320d1cddfd1f725d7366b94df7f2910732b240e37d9bf3108715b01467f8c1c6757def0f69be0ca9ce6ed9153c85576b8e77c4fc6795ecaedacf9c37bb53099270af0f2747bf8052779597dc023aa2121c9de7649f4ca6af0e298c9f862b6c1e51260d4d5bc57931e6191aadff4b71046576dbc2f2dbebee041263220e2138b4b7fded8c3db4eb2f60b70477a1e784c91a92e3b684111db50ecec09c321cb24aba5bb558a8667a03c622a9e96cad80017d497b58d6331e68bba2ba2c1d86d22baa0fb201437b9ee28fa8c5d3ca4a7c564d5250229dca8d96ebf926b09e5c7ab59333a127c73e25d16da788ed3448a6a954ef5c089111544ba0964e443272303633e96c58b5e41bb3ee0b36d41775314f1d2e5507c7fb6555a25ba0996d9ac4f40812b8ed45384d2e010be6c347a0395fb66dcc8d5f88b7a3e7e1ab5f7ca175d0d4579988bb925d3af656ccbb97cc87b58cd3f9a4ddfd7f280ee9b36d011e2bc8ed2dbb6a636a018fb8b017be954fc18f5e0c770a985ddd9f343e181c91028b24b0cae2cda3ba9f3c26303c5834075842caae2a7dbb75583b98140f3f21d27a6f11585ca0def3647a1d3b6d4647f0d0afdf1846910dd4fe47485ab6c53d271fc67e94f34b697398755b2c3196d0d276160faee7ef692205a5931f3679cabf38648c7b6e3790adaf9fdca37203cc27085f341b0890b9b552033e1752632976dce63ea36bf2479072f6a46ff8ec2707d7b0524945a6f4d072b3de6abe269a822ba7d0e48033bd6b0f2b4fbba9f3cadb47accc644bdc19de98f65fc76f2f9880d67a4d4cc7ce00da93ec32689ee2b9af207bd5094d75700861a8bdb38953d7d1f9f48f800ee374bd729757d9139bedfe73b9f31131454ce2a627ff51e7024be1cc18d4b40a7611dde0a81a634c6bdf776b5fb005d76c52bb4c68cac5a6977da28474cca590e4ff3c046bb0a1f449c4f98059bcba67d722739a0429c9703af66e0a5271d6cb18480766d1a5b09366b0b285796760f537b2196bbeed32a37e3fe71f6f3b440b6a842a52318452b6e8cf79095207625527d932f121b742c00022a59d3567010825710456613d0403c673131b389f17ea017723f1258bbc463769a397b48f613440522349dc4f6529ad45b34272ef4e0005a8ce6819d8a90c51b840235c86db7d4ea2435a161b5aa8a5ccec578d7ec5a1c728a0668c550249ea9032086bccd479b6aad28d060c5c54990f4172a11e4924a658526ddaca8356294d47e5cfd18fa28da4ce469e711713d5340a2430cc9256b46036c06779da3522d48f5e497b06c9256b526e8059efbaed5130c97450d39dcad740ec380a581a62ae17fb64ba0903c7cd32e8affba30e8d662db9ded9734e3c004963750a4831b3b53a162d12fe215b4e68a23fd8425ec6ca899b6c2855cb20b30745d632b9d8d8a248d59397e3daad6aa8c35878fc7ee33022a04089ede86edb40a0dad6024c533c0bce45eec63535ce0255d668e3170fcf6f561efc26946e9b741741d4c455b38299500f940f225bc4244bd47c75dc06406ee6f9712535967a8e66efe1179abfa54ed82c1bd63cb1e8d11af4e27c5799283f895c36a9726fe0b6aaeb3ccf886596ed1c22d3ed44880b58e623bd9cd1fe58e4b40b7182be5a3fa4de2211213342891771fabd2e19fd9420972a5ecc973ae34cc9890ac11680672427ffc8b35ec8453780b314e2e04f6f5ba23b6634777fd1ba637b6155c7c6218bf917cce806794c1e159a637d20e4ef08c6fd13df2f6f90eb790eee781a539bbffa44df073c16f84609ca202e2b8aa431d5b4e830031997336f5a767f560f3ced4bd2cd9cc1a1038b6a75d674437142cdd5387ae2d9958402fa444d64f6e1d110210c2f3fa58f990f926b5f7346f37185627cd3032e9ee2dd9af55cd2e243e381d86a11a2a9b528dbbd9b520b67933ef54bad2a48198599767b5f6b88fa4e74a96026bbf5a3a59e38c7c6f244241b534c60b1e3b3f915515e588918029e74897f4e060d9bcd9a13e96a91ee435a184b36e6dc97d26f2922205da3c9629305166dcae60e3a16c4dcb6f0b83f13e3de4ae9b6c5d625807b75159031c7ce5ef4938a11ef0306794bbf6c8acb5c8197bf9f731244dfd56c05ab4058d9e01c9939324a95d5d35dd6f4c910d301bad911e500c05fd26b0ee5a53fb322c39a41ca846159002c565ba083fb64b068dbe3dd72550181daf3c60c2b9d5811055c90fbab158e265c6c294be8b09297c8131ff90395b7fe2846dac0afb92cf03dfdb16f153dc7db85a61a94fdbc025931c92a65cfb4825df07b78600c966433653c89f478245eb8944821240dab20a2430d6e0542370bc904df947ce21458abc3b710bdc830d7eb45f927716e28031834031f34184f86d559263ed008a936626e42d7e0100517a4867557dc1fcf857cd086c38df64c5baa145f5e8655427a67ac054f0b7d5d8d6c2fbcbe22f7b2431768baeb9db56e6fdba22cb9da51e92d0cf40c2e010dabbb65046559e6ff1043fd2f8379a1cf7b91cf2c9757700c2f4a3eac9d8d9a46482cd366b2b30f26a9244b8a90475d9c55975e4f5e86c0fff567accad4cbfc60967667a9d74c061112ec02e3799b22eb31cbae9d6a54699a65b044f0454a57e55988783bed467523bfa0b2c10cce2813d35a6d89393de56bfc55baae4297414c044606660ec05735b199a156251db445fb24c6045499c9d7ea6bfb8c99b6e50d8a8815a06e6151457755552d2ba558e3f87db29b303bdd3bad35057e13dc4d590a233e1d9ae2d46e0eff78f3f752d25e8e0135eed4edfe2099b56114be670d1b2f54ac604ca69bfcdafc03c941a637a89356a29ce96511fece3d80b4c79414a621af94d244e96dbb4c5a0923848a70ec95a35dfd6a6fdcc7da1a0cf55fe5fa6f30a79dfe0d1fac38c3de3286c01414b973ce15c8e9e86ae3cd70df0887e7a51c2e62adb0d93ffcad607680e3b008360bf1ffc884d110984b2b7d72731f7000f06e88626fbedc9139d3f01ed71951dda7a404e1568f245cbcd0ff9c77862620588957260766ef6ca65be95ca0961dc8d45006d27f4135f28eb08005d5e4180c3bbb9725e8dfaa1a4490e0130b11f788edd010158a88cc2256d345842f2ecc3148f02ea4e567814752b2bed8e613d3183946e715cad6f833392d0276594dc6ff9a9e31920cc9a029a5cd5c076cd8239fa0a9e38b28a0590fc41af0c0ea0a2aa463148be669d0916da0f5044c78097a946dfefcd679761f7abac10334b4c0a36b2976f41e71aa7d2ff74c80e63a884d437bb004883d44adf4be87aea1430bf722c9cfa0749711a94015866cc56c28c22f250cefb19c21017d68c57e108baf4858beac7b293869486deee4786cab3fb16e7a0d5cfd022beaf819a63a8321630c4f5025d3a520326e2067f47fdf5ab182253e863e83f5bec120112057cb6f20961ee9fbfdc9b32bd8b51365b959d2f361dd3953eddcddce942214d7f53b3493acd2c4ab722a5306397aa14c20e36fca6b02068fd03fd9b772d1bb736941640c08d95ee0c3996b6f7398aed853155d681a24b38035b9e1b7cd28038ddf8d246942c6dfe1daa4aa603afad963da5117a16b561f8b28a4a61f63b8473f6d5e0d5549b8027b7583db66bef132a4c6676fe98c99f5d40e37e11b8e8c198eff0dc7182cd95f7199488970efce41840ad3f1f88b499969c33d9031730e61bfc2043757b90f8380732fc490afc97ed9a12ba0215c06e807d5ac4fefa53bde9a2aadc53fe68d0ee7bc15f48f4620d5f85e5e377cc30036739ac17182fa48274e742f403ba70c6c4bd4a2395f11a0bf97660d4bfa1852dab88850070c3809ee1561e39ba5aee1363627f2406a1e013917c0f5b055a4ff33c5c1a9b7cbee5c829471dd7d9afb05d2ac756e50346f07ce6afa61679e72988cac651aa431141cab96581aec2923ea36473a26e0f960c80d34052cbcd45bf26afec5cc3e59deca9bd0663ef563c0ad29951718c3434e829dd7ca456356cc6dc967458db364d9d5c7c95c62bd1c4a3142778bd89cb855fd0e0834e326ffe0fa929376904dee204111fcb2218dd34c5911b9b4d30eb52e68d02a2dec9ec0c382b9ab58af1e3b19a1fa65fd3ec9e1a32e8a765075c50538e28de6fcd038873a5ddb7dfd9f8f92db88a5d4a6ae9d3e76f8841ade1d2ac7b93cfb9523961e3316236fc396fa182daed4477ebfa593079e4d332440f6bfea78fe9bb6eb514492005e9d0f8375ca0aa518240cab5bfb80f063bb2b6646767783227cc6fa2595386849b9c4cbd72e0ab19a7dd1e1674c653df5778e19281608ee233d86c5ca81e9da830d255941ca342856e4cb033b859931dd5cc9da4d6501b51e7673b3a56428987055196da8e49eebd1c30b572b5b775f83ddbf3732ef678cc800631feec5b0c6edf0a7424a53055e466dce0e6c3a085ae1e80dfe2f37098888809b5ff7f7dc65a57dda836f4ce941f43efee5622577cea85f00b825ba8f85333dfce40143285c13b0b38577df397f11f5d94f506d42e04fea0241785e0ee09d23ce6b74f87821e11d0ecd6b119b2ed746461bb06f82787326a2197a4bb0853ad085fbfd8868ce917e87d67d6aff647d15fc518400e0e16211873a49e909a4b197f9222f17fbaf3bafc1ea4509da70ce23ca7537d1b4a1575b5feb21886c05ae469ca8ce8364dcf8c8a00f0fdbc484fd1ffe35346a80c3e19565f20a8018ba857a8077c598ee96e0acbe50532c4ff2af66dc01a30214126b30e4a481a3820f24d2a9bfb6b92aea160559ec39120d961d6742cfbf290349c393fa9b6e801718e4007df95f79e5c02b71f50af4e3c823c44cbd97b0a02702a09564793b9a6690fc38d26cd2e2e02046e358f091fc3f2c7bf142db543af2527f036bb781706bb34dcba450e5c92fdfc67560bf67a44c6328dbdd12a57555ebf715cac9a890bc2ccbee3afad2f01177638717eb7dded07f250f069972d67d66131bbf5a405deb42986deecce5e0464b0fe0f2cb9b4799078fab92447c69a8f93fba16cc70b0d13545524a204197c507f4c9f3690c3e76a3b9a8b9a98aa97db8e0f356a2d8a23d8a61bf656165df3cca99db51e6cea9bf7f044c5674a3a8fb085077798a99a3bccad9eaf2fb73a4c2c7196893101c414e94aec9e0f5141a4a5e61b6182dec0206070b163669737c879fb0b6b9cc0000000000000000000000000000000714181b242a2d3c","attestation_type":"pqc_registry","signed_at":"2026-04-20 19:44:39"}],"hndl":null}