{"id":234,"slug":"allenai--madlad-400","name":"MADLAD-400","author":"allenai","description":"\n\t\n\t\t\n\t\tMADLAD-400\n\t\n\n\n\t\n\t\t\n\t\tDataset and Introduction\n\t\n\nMADLAD-400 (Multilingual Audited Dataset: Low-resource And Document-level) is\na document-level multilingual dataset based on Common Crawl, covering 419\nlanguages in total. This uses all snapshots of CommonCrawl available as of August\n1, 2022. The primary advantage of this dataset over similar datasets is that it\nis more multilingual (419 languages), it is audited and more highly filtered,\nand it is document-level. The main disadvantage… See the full description on the dataset page: https://huggingface.co/datasets/allenai/MADLAD-400.","tags":"[\"Task_categories:text-Generation\",\"Size_categories:n>1T\"]","license":null,"framework":null,"parameters":null,"downloads":165545,"likes":168,"verified":1,"created_at":"2026-04-20 18:22:11","updated_at":"2026-04-23 00:03:31","source_url":"https://huggingface.co/datasets/allenai/MADLAD-400","source_platform":"huggingface","hf_repo_id":"allenai/MADLAD-400","ollama_name":"","category":"dataset","latest_version":"v1.0.0","version_count":1,"signature_count":2,"risk_level":null,"risk_score":null,"versions":[{"id":233,"model_id":234,"version":"v1.0.0","manifest_hash":"303933acf4d21970e3ae723f228478b280fa37b6dc0c01298e513eda71a0785b","file_count":0,"total_size":0,"r2_manifest_key":"manifests/datasets/allenai--madlad-400/v1.0.0.json","created_at":"2026-04-20 18:22:11"}],"files":[],"signatures":[{"id":595,"version_id":233,"signer_did":"did:quantamrkt:registry:shield-v1","algorithm":"ML-DSA-65","signature_hex":"97abe22e5bce4f2aa31b88f43f06717d7a5af7830efbe99b2be59cfd4cb19719","attestation_type":"registry","signed_at":"2026-04-20 18:22:11"},{"id":717,"version_id":233,"signer_did":"did:web:quantamrkt.com:chain:authority","algorithm":"ML-DSA-87","signature_hex":"cd5780cc0c17ca386e48007097c356513a2409769920582a94d96423ed3dd43d8cca7fb563e71bec4e329127ea307d7ed43d3dc1cf60660ea0c7dd694e8b94086a0f784c7c859734cbb47289e534410db0b3b8ab1d8b01d12b052286488e24c0a348b696141291f566cd843660d755496f3f098bace35efe72348f477427035f4495f9fa09990397c0cb23d67fd1db306cc92e9d4f48e08a157accae79e4a72be4009e2e8e76294c29e8eb28dc2b211aa9d28d2ce9af184c6323af588d39f40083f8ba29597c3c3a93ef4f7ac24386bb4219bc3fa5768561ea42dee36720c9df169aef34f94f77aaa192ca358906409fef6a0a0cb5b65f1d0a6f43c0b6c64004de954f460c6c1adf009307a59714ff1d145f202bf66959969e0cbf0620af17086ee82aad0a9021278e4c50e5716e5686c507f761e55ddf24a1a9a60e4d8dd9a24feb371ad8e252328490f8fc443272961a62cd4c1889dddda3b3b3ce73674497575deadb61bdec92a096dde39961e2dd48b6868e758383dd9c47139f8938817708c49b28f088666ee402ca8567f83e535ff29a5f734e54f12a1c564043e1b818d15be66bac9eca2f6126d9c179e1e8f70d90bea0621efe5a076fee0285b12a9f09cb2da6f68e4b42cd81a9c7bfa791e9636fb970f127c7ac0ba4c529d756257298ad87c00f3b978f056123ea41943a690b1610590fa666ed93654561cacfa083a5d254f0707d1762768901a40322941a601a9e3e8d0c6ab44a199f2f6533b3f259ecb9e71e178f963309fa402d85168b484d0f6d6e866972571a599cddd22cae205246b8e3a1aff16468c3ca8a2bd27cd9865219a36e918bdb8b6555b83de8cce223aafc9d27072f951188ca45a104cd3d7b8414b0dd8c5ec6da5ef503825af64c694aa7ab13d8955112590b7b2aff0f2dab169de19bb88a9d535315fb9697c47c64cef858c33b8b52b6464c720bf6ce9ac66f5ae2ec5a32ffcd170070b14ff99acfed2d1d58cdd6893d010f405755c3f6afdc6b356ea9323e1e5245fd03e9419a955a806b8d7aaf7427486dd2934d8638bbc1623c0a13de278f857119d30e11beb0676c2f306de523139192190abfa4a3095f9a50735a6e266cc150bf7267beac79005346b02c5723e08c301218763e568c31f06731b947b227c65bb41bb97ca73c0e65b1bff1be89adbc4cd73850c764e37b8f090b38dc6d3e7374aef8d13d4cc9ef7209841f6f326a03e00efe9fa75055e0a33919c20f09a26fd3505230fbda6c411a13c598ec3c20b949820b8a1044f8eac4de51f5bca403dc08ea2ca65cfdecabddaa3d79532f8febe5da150442785fad4dd75cf40d5fe02e478a1ee05b00d6ac835eda4a603564dcd83b8806b56be4b402f1489819af150f4376ec6ef1bfbfbe880218958cfd09ebfa118da1d80145959cde7fd3c545d049c2f1372dda357bd3be408b89f43f7578ea4822503ca2fa1e60204487be15816247f5f0e7f3fc0fbc90062d8e2eb1d07930d67750e1e8e484a229fc34222272a7c2dd55795584f410d3526ba6580d9c8dd46e0e962c8953416ddbbff5ff19beeaf8575e0a14fd6c9843b8c256eec6a8b2970b4b040be9e1d23ae06a8bf03c71e2c38fc924426b696ef12582c3784abbb36a1f06d5a4ca8ef3af299647c1a264067666d10e55f63def956f1eb40de8bfaeb2687c82efe9f9181025485de3110eb4a07485265417fe26ac2997ac69330293ed3e1bfda736bd73889e8106566671df41e993465ee38014dc87d03e4b164f1a159897b80f1cfff6694f247bda233d00cd38cf1a439d5e87ac40e387bf3e4f616f6ddc13eac2d20a3d00ba4ecccbaae04517b2ed6b5859a81514d906bad132816a54f9433aafad46d407074eb40f8c068a1a20b2587b13a9f2f518107861f53da777b5f10f8be57867c91d0c84eb48491643017d7b41829ddf0cc75eef2a8503cb7f3cc46c90da35a36e45a495faef859cc2840be15525e764058aefe7f10efefa938a199be937577fbb2bc122b6f15b42c5b80821e82cb969b3440d3666e7b16cd68800f7c847b2279376213ab9a611dcf618636f3365b3683a60e513132560e4b307c3609eb40f163d86b8835804c35056cf187b67a28971c84f0aca3fc89c822df3ab49a4587300044fcc768b65c58b03e6523b6649b93e4aca1a9d71a1d8d3335361bffbaca5c203ba1c95935117baa2c0cacd2115be94e9a48f1f083e447a09fcf8a1022fc82d91275e7514cfceaab33589a960c0879ff7887c022c3a20d410b72f1964c2844e5789b4eaabd624b788fbe2b1f563dc33e587b4ecd52265b04c20e86f89e32f6906db71592b0097f1628ff2eda53f19049bc11fca9edf43f34c0bef30052d75efacad8e4120dbe37a6592099f8c5213a65e9142a951ab5e42cf84beae1d7b290a62ea4b9a9ad37ac9beca444fdd2ea6f91c2cfd9574cc5f4ca99f2278bf24227a349346f62eecba7f153050260df0346a799a0d374d127fb70f1e17e10556240738e74382a9665ae747aaafeb1cdd8bec02303ffc13c60cfe7ad8ae947d728970e6f4d76e1d23765237b27d9047b8828b9996d24db608a8e8a2279b7cc25bc4d127616368b9f403fffb8cccf4578e226f029582095f4de8a0ea6fd3cf9bd73dfe39c878fc4d11e61dab01442a67060cb9f44933b19e6f269ce4129b59d64a862fc0775ca5d284be6358c1a5a37ac447ec64799b2338e693e3b12ba06756b8fe1caded61325e01eea822b86f71e27268d3e471f8e5cf352906f41617875d26f2cda338de6c7fe829824381147172189fe42e23a488b0fc3dad1cc36cd0860c01da83bbf10163e789bdd719a04de4c299f4c9e64e81fef76f01934b3b4a4d95b7f905d6b248b3cfa9e7d1cccf10d1c54a807f1c79b5a7f419683f5070f806f5da13ff88a32bbde6b02a4cde49421cbcd7f376f3164c94c8c5b923ba12217f066f20560917d34c10a2cac0e8e5fb823a34f676d03462c737527491397a04c2dd14cb8e2af374063aa6fd2ee0989530ea6e423989a758b6782f14387461e4d8b8c1968f3079fea2daacb7c14651f0e8bd5a66976f18e99b16d79557b2616cc92847c1eadf1420a298bdbda2409594d853ad032fdb44e83be1f4471132fb87f9dc934481d4776e5f6237ebb2f4f2a8c2ef57253f0ee2478a909700138c91d2de5d97e6d8d34d5d796be1a0e3c8f176bf27c15b7b3b4ff02e2b669b345c6bc4901998b2214967632414fd623d7c6709441db41d0a251a991bc2af1320bd9657266395782699079566763ec189a52a8f719208eea41508a752a3037acc2c2227155f6119b59c5b8e8acafb5d0de226e509231380dfcfab2b4cea0c8157df37959dd0ff6a940954af820796d77049f2351c79323ee9d5b356cd7052789a20e5ee70cbd99717d076821e6e196c35121dd2fbd8967e19c6cb8114a18cf330b90f33196e2dd8fc000a8f26abb53b8ccd436a28ad331328075c84bb1b86d2a6e4067859bb71b10931a8df5f6d112427f1016432812d6a1e9322a97d789c06cb9e72df67890fb4176b6e2a45efdefc291627b7bd22511924ffbe055de6125c1d9feb0a5f6bca8f628decebac4f24830bcdc6edccbfe0cafe4467239d46bff889b52fe765d40ad40e38af4652b8119a80af8e2d4c40cd9930635a8e49224c4be67dde6284283c78821f765b8f62fe9286ca2ba1f7c5650fddbe4a8f7567e5f19d736c426d510f3792bbd0c543554c218b2b1dd51f549d19931d75af4146ff0334932f802c6bb582df684b99d4ab5419d34b1b36a473b55e95eadd5f9a16f641af796aeeabfc0ad5e89134bef0b11cb78588ba7e29e7814981ac1d50dd23e4aa3da0e462e1926813b3c2bc6a350fc8e855f8420a706164d9ac8c7fff75fa229cbfa157c6461d04a00671efdba5527594619cb188c02ee340ef05520e91598f662dd60310528036ed5067559e160441b8d42c12cb52ee3fe68f421620e3e855f09249fa6054964aa34a39385ec17099c2517a619d4eb39751231af499c163902a36bf97f8b792d815b7dc381574008c8996f3a61f50f87fd2660db711eb55930d557f334cfcecb8b73a350fda0395da298adbdd0f3c397700c2a989ecb32770f7ba9e95787d2dcc551c17ab569e192884830de1c192c8ce2a30bf4a1c9b14950b9f9275aa4a9432bf3617e2861b09bf848a389046ac544fe803616fbf30a8a4f6c69ba5b75e443fec3614954a5d50426f5d3869d344f31d230f2682fc6b4d595787d6dd4909179b84c4c025026b66983cd4f3cca4de1af5ae26e2fc98cdb6c7635721297ca74cf9e9cba6c09370f3bfad411a05d798485c57f5bf67d849761fc6734bf49a397bc14705f7d3f79901adb557228eae1c5c98615dc88c39b0d8041f18ea641cc11ec6c753f87aea294ff551a5530bc3d485e15c68ed02f27f71b53373f7141da918757e4e98329bb241652b0ff725bd0cdf7a539c00aa313a99ef8e35e2e75b62ac96f7e16e83c090146bf3202e31516cde6541005d45b879f56a5689d5c07326db9d646aabb3532c21786c783ad7160992bf2c295353577ff05dd09b780ba1181f0cc6a153b675a9943dbcbc91e8d8b2994f18603702c8080c8c406f6a55360c80128516475a63ac425670a8ea1f12f29959521fedf8490b1b7121af0bc30d898788a737c8de6220329e30b652d492f7509c11ee0b9b0d3f71d46d6c0ee86e97237a9bb7935ab715a76a8aa89e9ee078723478da55c6812b137aedef906affb672950d604640fef5bf350f603ed256bc90d03147b7dcfaeac59546e918111b60cec135368fe6833002b84b7e562a06ae8954ad3fe4ff19fdda4ff529eb0893eeadf4314564f2cf06b73f57ded2827f5fa5430e2608685ee5213bdb45bf4995c6b2beabdf053ee26d4ed60a2b302b9ec92ee97cd3668545dd3a8ae108fa1ebb1e0a6f300ca2d76f831343bb3027c23fcb228ec2a385f9cc669afcbd47f42cce55cba8c6f34cfcea56c76e17ac5bebefdb59d1419ba1ac74bab6e876fb29f16e6d02e288b316289ef7ea735e77321a426ed1eeac549d228a387d39342df0ae3d2513e18f2f2c2dabf1214cb83d5b8b2c328561caf27bb1b04dc244c9f60d054bef5b7a4e4ae04140cfe3b36752c50b6d84cb412ae9dc7c494864cc0478bff8665c90d99e28f5308cd5ccff3d9f2d54428eb647c68b7a060d73f25d1e380b432f6e2082581de880e61089295ab8eb36ebc34775ee6e4c41e1908ef4418c86dae5be3dde141c0d0c2dcc7adecb4d43066b87bb59b694e1c22d90cfe6ebe54518adaf61088b308e31bd4bc6721287a0b73393777386fbf481f832eaddde699e67d76ac0291a46513d8476162726427e8202335fabea6d7dc0005351d0fda362adfb281b96396d2731837ee61ab76e525d4394791057565992ba5b1a6f00353c2a8eabba29a25696ade61f80b924cd9bff4c9c548ee5e2530f24e962235803aeed9d4da5374d95d71dd42ad50ac252717b0b978dcf96c8b83eaafc4cdb48d8293e975be67da904d36906c742e6d8b9a82e00a3f7a17e398e92a9389536447c92c4a0f5f987bc92f763fdc1e8be10b324dd838b444136e9a5b7d28828929666db0756a1e46ffca0c01a9caa25a543320420a8d70d799a94c1c090586311a2beb434b5fb45ed4d409f152a83abd72c5397f7aea9b487419335fc074bc491f1b69a997b8756568321ae5433ee2cfc7f76a4c136341f24def064c327c2912639616cc2edd492060991af94ced34cc331e083da398d129dedce91bf1819455d7f09766ce26239b70a8db48f0b5faa1f8d05fd264bc561449e86dcbcec1a47bc29f6ff838056658b3027a7fcb9d1866112a932db3583608a8b31e77bd87e8919ca2c081c8bbb03f5f7f813e6fb8e3451a4cf3acf1a072d657ee69a47d27bceaa475bcb2a75029ff7f0aa1caf513c592430d823555861075e22102c6c0487a1e049b5e9b6e64834a955c5f313c6ae5ae3a7b30524715aeeaab756823b7035d94db6f4eee0e56ab58859337d2f780d481bbc44fff4ac78720f0e35bfd7d0513cdb919bc57be5869c37d0a9885d72707a377fece2f521b2e660fc9746e93441c7d20864c71b2a040e3e52433786b7e1df2abd6ef68ce66c2ed21debc15667eb7fb1fcbe3b4ee486dcba50722e7df4a5bb7b7cf6214a98cabb028b374f5dccce985f46ab2b73a8b3cdf062a487fb09f09f08e53ee0377b22ae818d252a6d1959a8f438161e163b566a5918bd6874ebfbd7034f1f5e9259d9785675161d5ee6fc27250a7e8c379a35884b5789aea5961ef7ef22ecda962315775f720d65568734bb57b589391d8b4b6e78daed8c28ffaed31a4207b1ea79aa99c5adb921f128168ccca01163679ac33b36a853dce22614437fd261f759e7072a447685b0c4e2666bb4dadb0b426582a2c6d7e4252c4b607aa9b7b8e31c2c383f494e646a8d0e295870b2dffb08193133a6a9dbe1f71434446280838a8f95afcdf20000000000000000080d151e272e3743","attestation_type":"pqc_registry","signed_at":"2026-04-20 19:44:53"}],"hndl":null}