diff --git a/cache_ds/AI4Code/dataset.arrow b/cache_ds/AI4Code/dataset.arrow new file mode 100644 index 0000000000000000000000000000000000000000..a0165052c2466264ee41016d498ccc23f958ce6b --- /dev/null +++ b/cache_ds/AI4Code/dataset.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92c42590d27fd3fc17ffac61f974fb802d167991444ef453241945fc3a6a0986 +size 12750888 diff --git a/cache_ds/AI4Code/dataset_info.json b/cache_ds/AI4Code/dataset_info.json new file mode 100644 index 0000000000000000000000000000000000000000..2ec6375dbaea368ab84c6386fb15865be3092fa6 --- /dev/null +++ b/cache_ds/AI4Code/dataset_info.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6dff5b1670183e549008fc4c203e05b1303d1a7c3b8903933bdc9a4d9d0e2a1b +size 1006 diff --git a/cache_ds/AI4Code/state.json b/cache_ds/AI4Code/state.json new file mode 100644 index 0000000000000000000000000000000000000000..6f2329bc33aab722582a31d0a4c4f4ca9bbdaf5b --- /dev/null +++ b/cache_ds/AI4Code/state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed3fe19f0108316dab636138c17ede9692522d7efbaf165163d159ed12fa48ec +size 256 diff --git a/cache_ds/AMPS/dataset.arrow b/cache_ds/AMPS/dataset.arrow new file mode 100644 index 0000000000000000000000000000000000000000..1074fa45b89e3a86ccfd1f515f228ba169aac668 --- /dev/null +++ b/cache_ds/AMPS/dataset.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c9785a7a4badb3414fcf4d435e533f28eb9db2fca06c9cb5b52a89deb852aa2 +size 30492496 diff --git a/cache_ds/AMPS/dataset_info.json b/cache_ds/AMPS/dataset_info.json new file mode 100644 index 0000000000000000000000000000000000000000..37421c10f8ef32879e9d797ac9715c8947e6647e --- /dev/null +++ b/cache_ds/AMPS/dataset_info.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55f7084be1d3c57c8640137527f3af9cab7cccdb3b5af46e4d92cbc097f99595 +size 1003 diff --git a/cache_ds/AMPS/state.json b/cache_ds/AMPS/state.json new file mode 100644 index 0000000000000000000000000000000000000000..789e087299afd5fb30c0ca971a4f7f27267b6521 --- /dev/null +++ b/cache_ds/AMPS/state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f209c188efcdfa0a8b0aeee42be2af070df211bf4206680591008e20d345f498 +size 256 diff --git a/cache_ds/ASFPublicMail/dataset.arrow b/cache_ds/ASFPublicMail/dataset.arrow new file mode 100644 index 0000000000000000000000000000000000000000..d5fcac932d143809fd77adc5867818bd9776210d --- /dev/null +++ b/cache_ds/ASFPublicMail/dataset.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8bfd39b0a095a2f427014bfd74ce5a3eec0494067885961272d33a58e04bed8 +size 51545416 diff --git a/cache_ds/ASFPublicMail/dataset_info.json b/cache_ds/ASFPublicMail/dataset_info.json new file mode 100644 index 0000000000000000000000000000000000000000..3aa62ec4a98082ca41f16f6e22685962c87ef4ec --- /dev/null +++ b/cache_ds/ASFPublicMail/dataset_info.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22e838247ba626c837a0e2f9e5441eacf21596bdedf8acef97e46b826b482d00 +size 1013 diff --git a/cache_ds/ASFPublicMail/state.json b/cache_ds/ASFPublicMail/state.json new file mode 100644 index 0000000000000000000000000000000000000000..d45a546cfdb2700985a6191f2e7353f7512d54fd --- /dev/null +++ b/cache_ds/ASFPublicMail/state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17504c5e156c41e3fe80610f5687e0ae5d4c6497fde5561bfa322fc9016490ff +size 256 diff --git a/cache_ds/Bible/dataset.arrow b/cache_ds/Bible/dataset.arrow new file mode 100644 index 0000000000000000000000000000000000000000..e4d54619d6edf2b0bc3d9d3d4d327c3a31185116 --- /dev/null +++ b/cache_ds/Bible/dataset.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:185e23e2270d439307ee061fe0d1b5d97ebb59b5b5bc0f21b914becd7101e042 +size 760 diff --git a/cache_ds/Bible/dataset_info.json b/cache_ds/Bible/dataset_info.json new file mode 100644 index 0000000000000000000000000000000000000000..b5937f6352a8e929ddc56807d0f5fb121b304a78 --- /dev/null +++ b/cache_ds/Bible/dataset_info.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8328c9f8f981001bc6a7fb6c0570948f269d1c633bd5e4ab531a856e9c0b52bc +size 970 diff --git a/cache_ds/Bible/state.json b/cache_ds/Bible/state.json new file mode 100644 index 0000000000000000000000000000000000000000..1f8b3adc68bba75941824c38cd4bc363697b2e5b --- /dev/null +++ b/cache_ds/Bible/state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c8eeceb4d4b7abf6db30e0685f9115324faed05ce987688bd2b8a466f594810 +size 256 diff --git a/cache_ds/CodePilePosts/dataset.arrow b/cache_ds/CodePilePosts/dataset.arrow new file mode 100644 index 0000000000000000000000000000000000000000..801ca2323fa14a437e57b0f1411e721f2879e385 --- /dev/null +++ b/cache_ds/CodePilePosts/dataset.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17f51092bc240a8c996b4e3c42a9d3ed78955df698c0b2956df9387a42fd8ab3 +size 2057816 diff --git a/cache_ds/CodePilePosts/dataset_info.json b/cache_ds/CodePilePosts/dataset_info.json new file mode 100644 index 0000000000000000000000000000000000000000..6639a714e3d43f7a1226a9465d1f1e8b8dd51f24 --- /dev/null +++ b/cache_ds/CodePilePosts/dataset_info.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2378735ce55818c4bf7317bd8a37c468d484e3296cd48d5ad6645c0de0cc71a +size 1007 diff --git a/cache_ds/CodePilePosts/state.json b/cache_ds/CodePilePosts/state.json new file mode 100644 index 0000000000000000000000000000000000000000..24b473f83b315f311306d87e1f373a546943bcf4 --- /dev/null +++ b/cache_ds/CodePilePosts/state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a31cce52efe0f137af3577da478eb99600731e7260e63fb2af08ebb95431851c +size 256 diff --git a/cache_ds/CodePileReddit2019/dataset.arrow b/cache_ds/CodePileReddit2019/dataset.arrow new file mode 100644 index 0000000000000000000000000000000000000000..d21f1798c14b9fe9a0485426b65a0ed6ea94aa4d --- /dev/null +++ b/cache_ds/CodePileReddit2019/dataset.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78e8a89da87bdcd690c716f4d7628e91972b18b0a1a679319e428b982f44fd9c +size 1951576 diff --git a/cache_ds/CodePileReddit2019/dataset_info.json b/cache_ds/CodePileReddit2019/dataset_info.json new file mode 100644 index 0000000000000000000000000000000000000000..df13b0a3da33ed9e850a997e9e6acdf57c8a8e95 --- /dev/null +++ b/cache_ds/CodePileReddit2019/dataset_info.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1426f28c5b35c2371a9fffc720bf9c9bdcd3e46ca64e3a025b57e7156c38d27a +size 1297 diff --git a/cache_ds/CodePileReddit2019/state.json b/cache_ds/CodePileReddit2019/state.json new file mode 100644 index 0000000000000000000000000000000000000000..009c9603ec3157d4a5eecd2da5d29d9086742832 --- /dev/null +++ b/cache_ds/CodePileReddit2019/state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b19494b9b0ba5743bba9403c20f553f166e42f38dbc4bad8193fbd92ba447d81 +size 256 diff --git a/cache_ds/CodePileReddit2020/dataset.arrow b/cache_ds/CodePileReddit2020/dataset.arrow new file mode 100644 index 0000000000000000000000000000000000000000..da97d27dae35ca363499c86bcc4e29b97766d817 --- /dev/null +++ b/cache_ds/CodePileReddit2020/dataset.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1d55ca02de76eb7827af50a124fbcdd234a1379173145e32370c4bb289e1aec +size 2791192 diff --git a/cache_ds/CodePileReddit2020/dataset_info.json b/cache_ds/CodePileReddit2020/dataset_info.json new file mode 100644 index 0000000000000000000000000000000000000000..81bab12eb2bd446c811e44e7db4b4ebc4b1c73bc --- /dev/null +++ b/cache_ds/CodePileReddit2020/dataset_info.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8fdd5fcd593e06c9180f4d3149638efe9247dce9e83ff46ad7d59f288f76e8e +size 1012 diff --git a/cache_ds/CodePileReddit2020/state.json b/cache_ds/CodePileReddit2020/state.json new file mode 100644 index 0000000000000000000000000000000000000000..34d7f0f308a8ef8b64391b69ca609cc4cbf04ef9 --- /dev/null +++ b/cache_ds/CodePileReddit2020/state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b0a9e7114140594bb0680b816e25f41a89fa72b84a60b5d32fb4fa96abdaed4 +size 256 diff --git a/cache_ds/CodePileReddit2021/dataset.arrow b/cache_ds/CodePileReddit2021/dataset.arrow new file mode 100644 index 0000000000000000000000000000000000000000..1daa6ff6cd4fbab69d7fa753be5cd7eb366c11d6 --- /dev/null +++ b/cache_ds/CodePileReddit2021/dataset.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23a51641095deb88dda76a4a02bf1f39c25da6012f22ed742057d3d76ffdab25 +size 2890600 diff --git a/cache_ds/CodePileReddit2021/dataset_info.json b/cache_ds/CodePileReddit2021/dataset_info.json new file mode 100644 index 0000000000000000000000000000000000000000..a9fb69eed24385b8e08b768bb779c343f548c96f --- /dev/null +++ b/cache_ds/CodePileReddit2021/dataset_info.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5a912a712710a305ceb72fd7b5de07ea0805e82bf1d89dfa5f02072eeac8eeb +size 1012 diff --git a/cache_ds/CodePileReddit2021/state.json b/cache_ds/CodePileReddit2021/state.json new file mode 100644 index 0000000000000000000000000000000000000000..d106b7bbcd5d410ae1015d9543ff8182afc15f17 --- /dev/null +++ b/cache_ds/CodePileReddit2021/state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8b97e19828cd10006c6e1be44d5aafc8cfef80e4a2e3dd00b51e938d8c0313e +size 256 diff --git a/cache_ds/CodePileReddit2022/dataset.arrow b/cache_ds/CodePileReddit2022/dataset.arrow new file mode 100644 index 0000000000000000000000000000000000000000..563a83725a085a1304d69173fc86adcbfcb0fe81 --- /dev/null +++ b/cache_ds/CodePileReddit2022/dataset.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:344320145afce19cadfe51c69ebb95d3d83a71185d6e3554901043b615272934 +size 2859528 diff --git a/cache_ds/CodePileReddit2022/dataset_info.json b/cache_ds/CodePileReddit2022/dataset_info.json new file mode 100644 index 0000000000000000000000000000000000000000..dff927cf496390bb5b32fa45f6bb02e6a7cd4b52 --- /dev/null +++ b/cache_ds/CodePileReddit2022/dataset_info.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c415fdba7f94bfdf850a6450cfba7a96a63d46981857abfe33ea79b2ae4eb408 +size 1012 diff --git a/cache_ds/CodePileReddit2022/state.json b/cache_ds/CodePileReddit2022/state.json new file mode 100644 index 0000000000000000000000000000000000000000..bacbc889445d9d59fc45e5dbaccbb3e3f9a443b0 --- /dev/null +++ b/cache_ds/CodePileReddit2022/state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6822abdae07333c3854380639898c2f0e4eb1c90ff9d20fdd74890c29687e5e6 +size 256 diff --git a/cache_ds/CodePileRedditPosts/dataset.arrow b/cache_ds/CodePileRedditPosts/dataset.arrow new file mode 100644 index 0000000000000000000000000000000000000000..b129e77aacd031cc6fc1dfc50cf70918007afe8e --- /dev/null +++ b/cache_ds/CodePileRedditPosts/dataset.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f85e7b0763c733479fa500b7f5287650d5ccd35b7f6beead7f34dc3064c8e383 +size 1978976 diff --git a/cache_ds/CodePileRedditPosts/dataset_info.json b/cache_ds/CodePileRedditPosts/dataset_info.json new file mode 100644 index 0000000000000000000000000000000000000000..06ffd4c4f2bd11af556b40224cdb3b5f8eac05bc --- /dev/null +++ b/cache_ds/CodePileRedditPosts/dataset_info.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd01c338a78c9785cc6f9b8cd9246b7c9ca8cb3c1858b3b6ec2aee6f080747e1 +size 1013 diff --git a/cache_ds/CodePileRedditPosts/state.json b/cache_ds/CodePileRedditPosts/state.json new file mode 100644 index 0000000000000000000000000000000000000000..3d0a63a5d43aec0025c99b808cc70bd087b466f5 --- /dev/null +++ b/cache_ds/CodePileRedditPosts/state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:805a46afb1d48b0e9784043e25dbd8c4615973afa51a6050e73a1306e20ecb1c +size 256 diff --git a/cache_ds/DMMath/dataset.arrow b/cache_ds/DMMath/dataset.arrow new file mode 100644 index 0000000000000000000000000000000000000000..aac9d13f1a97bda88696bb1b4171fc17686657ca --- /dev/null +++ b/cache_ds/DMMath/dataset.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab234ef58bb959767c341538f0c38813f52c82466bf8f90ddb7348b5db1213ab +size 8561208 diff --git a/cache_ds/DMMath/dataset_info.json b/cache_ds/DMMath/dataset_info.json new file mode 100644 index 0000000000000000000000000000000000000000..845bc8d09aef09c1521d8ea61b82e8be698624c3 --- /dev/null +++ b/cache_ds/DMMath/dataset_info.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40be88e06831383d4361dc57e753e43840005f5aed5d41e552d053714660f40d +size 1001 diff --git a/cache_ds/DMMath/state.json b/cache_ds/DMMath/state.json new file mode 100644 index 0000000000000000000000000000000000000000..f2566c443bda6aa07b46a2a476fc1cc5dcaa48bf --- /dev/null +++ b/cache_ds/DMMath/state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef6bba045471e35eea94d9c2dc24477e1bb398a7e04aac23aec7ca7f01cf4750 +size 256 diff --git a/cache_ds/DevDocs/dataset.arrow b/cache_ds/DevDocs/dataset.arrow new file mode 100644 index 0000000000000000000000000000000000000000..23c5fbb51e731a974933bb593f667f53a4bdbcd5 --- /dev/null +++ b/cache_ds/DevDocs/dataset.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ec849e09303c65b06166b4c4551e77fbb34ca9e35da2ae1866e4d6b7cb6a164 +size 4080160 diff --git a/cache_ds/DevDocs/dataset_info.json b/cache_ds/DevDocs/dataset_info.json new file mode 100644 index 0000000000000000000000000000000000000000..09ce4c7eb8ab0df1b45baf05f404a50e1a38f309 --- /dev/null +++ b/cache_ds/DevDocs/dataset_info.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2daf81786c74f43e428fd2d9e6a5076b9786bb7c25189366c943da85cb2f748 +size 1001 diff --git a/cache_ds/DevDocs/state.json b/cache_ds/DevDocs/state.json new file mode 100644 index 0000000000000000000000000000000000000000..3a373aa4fcb68af4602cec8787f5a582638d403f --- /dev/null +++ b/cache_ds/DevDocs/state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f117c06a7e5f98a8b918b9fbde296d2043bcbd4f4e4a96d1f047cea91b77800a +size 256 diff --git a/cache_ds/Discourse/dataset.arrow b/cache_ds/Discourse/dataset.arrow new file mode 100644 index 0000000000000000000000000000000000000000..601afa07244b680428fe2085fdc080ac69e4e71f --- /dev/null +++ b/cache_ds/Discourse/dataset.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea797075fbf7a451a69f379766da75d43ddb85d7247fba85cc28b8618ed0e38e +size 6841312 diff --git a/cache_ds/Discourse/dataset_info.json b/cache_ds/Discourse/dataset_info.json new file mode 100644 index 0000000000000000000000000000000000000000..9a6ca6dd4d4698cd86ea6119890caaf6b34da7f8 --- /dev/null +++ b/cache_ds/Discourse/dataset_info.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfdf65b3c0e5e33c110ef660ba0bc54eedd887b17bbe24b23f52513b66dc72c7 +size 1004 diff --git a/cache_ds/Discourse/state.json b/cache_ds/Discourse/state.json new file mode 100644 index 0000000000000000000000000000000000000000..211c708411a676c46119e4157e112f9a4929dedf --- /dev/null +++ b/cache_ds/Discourse/state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a10c5171d3ceadcb750b5871076ce6d69ca4bc78b1eb4d316218efc88f4d3ad +size 256 diff --git a/cache_ds/Enwiki/dataset.arrow b/cache_ds/Enwiki/dataset.arrow new file mode 100644 index 0000000000000000000000000000000000000000..dc15907aa3e54c0a2db55303cd5015af25ac1db9 --- /dev/null +++ b/cache_ds/Enwiki/dataset.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:845c55e4e7a0759f32fbd5ec0a66273cc59968d7ad974bd879a777a0f2aa969d +size 2445648 diff --git a/cache_ds/Enwiki/dataset_info.json b/cache_ds/Enwiki/dataset_info.json new file mode 100644 index 0000000000000000000000000000000000000000..b54af2d02ac3ced85252ba3e236be0af4e7cb179 --- /dev/null +++ b/cache_ds/Enwiki/dataset_info.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d5ad2eafc8d6d03178715863063e8bee284f68e55b4619721184712f66defef +size 1000 diff --git a/cache_ds/Enwiki/state.json b/cache_ds/Enwiki/state.json new file mode 100644 index 0000000000000000000000000000000000000000..61e31a867d8cf5b4c5d3356be1e19e2f8cf8784a --- /dev/null +++ b/cache_ds/Enwiki/state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04f0263d5a50edc3d3083d7124b1fbada22c4c25154d65ceff2af0de31e77d40 +size 256 diff --git a/cache_ds/EuroParliamentProceedings/dataset.arrow b/cache_ds/EuroParliamentProceedings/dataset.arrow new file mode 100644 index 0000000000000000000000000000000000000000..6e667e7d4791f0eb0e01a0082509dc8b9e398917 --- /dev/null +++ b/cache_ds/EuroParliamentProceedings/dataset.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad267f2e9913ced7cc7d1d50e0096733f3bb48b47c1e14fed51397c1f14aa58f +size 29868496 diff --git a/cache_ds/EuroParliamentProceedings/dataset_info.json b/cache_ds/EuroParliamentProceedings/dataset_info.json new file mode 100644 index 0000000000000000000000000000000000000000..02c0067d2211d62def46813917273d2b8d2303d7 --- /dev/null +++ b/cache_ds/EuroParliamentProceedings/dataset_info.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:441bb346ecb9991ffacded023fe293b8c8a2015c8ecb84ea5f7b5c65c5518f47 +size 1024 diff --git a/cache_ds/EuroParliamentProceedings/state.json b/cache_ds/EuroParliamentProceedings/state.json new file mode 100644 index 0000000000000000000000000000000000000000..e61dc7d7f6618cb47385f87f9435d5c64d578c2a --- /dev/null +++ b/cache_ds/EuroParliamentProceedings/state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b26b3202b90e72bef983b784dcfc7b893091c58574a9b4b9a972a619d8c57a6 +size 256 diff --git a/cache_ds/FreeLaw_Options/dataset.arrow b/cache_ds/FreeLaw_Options/dataset.arrow new file mode 100644 index 0000000000000000000000000000000000000000..92af03348158e726b09d7c8eb5e282c0a32e5bc1 --- /dev/null +++ b/cache_ds/FreeLaw_Options/dataset.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9df0f8c2a96e2037cfce464abade39022d83d82b27d13e8951dcd7e200e91264 +size 13041200 diff --git a/cache_ds/FreeLaw_Options/dataset_info.json b/cache_ds/FreeLaw_Options/dataset_info.json new file mode 100644 index 0000000000000000000000000000000000000000..de4bcdd4ba7b9fc1f2779f581c789e37eee08582 --- /dev/null +++ b/cache_ds/FreeLaw_Options/dataset_info.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63f043f1aef3043126a5499816fa872561326cf66fca6816a80fcc1899e66f3f +size 1014 diff --git a/cache_ds/FreeLaw_Options/state.json b/cache_ds/FreeLaw_Options/state.json new file mode 100644 index 0000000000000000000000000000000000000000..9f3fc18883b4e8aa498ff40661f0995e32ba8d12 --- /dev/null +++ b/cache_ds/FreeLaw_Options/state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1059b2512bf2e2ba4dae915fcb0da6de21ceae829ae0f6c7caf951573996fab2 +size 256 diff --git a/cache_ds/GNOME/dataset.arrow b/cache_ds/GNOME/dataset.arrow new file mode 100644 index 0000000000000000000000000000000000000000..e4d54619d6edf2b0bc3d9d3d4d327c3a31185116 --- /dev/null +++ b/cache_ds/GNOME/dataset.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:185e23e2270d439307ee061fe0d1b5d97ebb59b5b5bc0f21b914becd7101e042 +size 760 diff --git a/cache_ds/GNOME/dataset_info.json b/cache_ds/GNOME/dataset_info.json new file mode 100644 index 0000000000000000000000000000000000000000..fdee22fc8d2dfa59061b9319474acb538d5cfa0f --- /dev/null +++ b/cache_ds/GNOME/dataset_info.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcd536943d56b0b42677bf4d237f458ebacbdd78aa32d11d4105b90eb0035be0 +size 970 diff --git a/cache_ds/GNOME/state.json b/cache_ds/GNOME/state.json new file mode 100644 index 0000000000000000000000000000000000000000..5dabe3b46f7a9d1e41bf0864a41565d5cfaac96d --- /dev/null +++ b/cache_ds/GNOME/state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9226e7c9f9112c93f76e43f7cbeb47bbb23170bca2b208be6ed8b59ed3aa68ad +size 256 diff --git a/cache_ds/GithubDiff/dataset.arrow b/cache_ds/GithubDiff/dataset.arrow new file mode 100644 index 0000000000000000000000000000000000000000..8d7d85d31c773615fc99fc707b54bf694f19346c --- /dev/null +++ b/cache_ds/GithubDiff/dataset.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac60f9d36eec995ebbba86024bea30c533aa0cc237344f47dae1e97f9f207e08 +size 99582144 diff --git a/cache_ds/GithubDiff/dataset_info.json b/cache_ds/GithubDiff/dataset_info.json new file mode 100644 index 0000000000000000000000000000000000000000..7e8a47bdd334a383364311d3308fac02a8c46912 --- /dev/null +++ b/cache_ds/GithubDiff/dataset_info.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:957884d1d165eabcc2d9a629ea10551cf3409bd9d1ff808b929e0ef86bbaae79 +size 1012 diff --git a/cache_ds/GithubDiff/state.json b/cache_ds/GithubDiff/state.json new file mode 100644 index 0000000000000000000000000000000000000000..335c3ff3f9dc47f950411ad7429ae28a82625b28 --- /dev/null +++ b/cache_ds/GithubDiff/state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0003ba065c3f42d5d778f7763f23749e5f2dcfeebc988a349e15393b614a80c4 +size 256 diff --git a/cache_ds/GithubDiff_ver2/dataset.arrow b/cache_ds/GithubDiff_ver2/dataset.arrow new file mode 100644 index 0000000000000000000000000000000000000000..a7393de219d4877386cac6ada0f8c9b6f0db9434 --- /dev/null +++ b/cache_ds/GithubDiff_ver2/dataset.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a36e8cc807d5db92e5981a3e4b99a25479e2ec11aa3e8b23546082f9a2ee7366 +size 21428048 diff --git a/cache_ds/GithubDiff_ver2/dataset_info.json b/cache_ds/GithubDiff_ver2/dataset_info.json new file mode 100644 index 0000000000000000000000000000000000000000..f741cb32e495bda8ca53f16594bab63abb7e8124 --- /dev/null +++ b/cache_ds/GithubDiff_ver2/dataset_info.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4944b73bd5cda9d4c5c1b51b874cedaa22fcdf713af2e11363f6d12d542ebe59 +size 1014 diff --git a/cache_ds/GithubDiff_ver2/state.json b/cache_ds/GithubDiff_ver2/state.json new file mode 100644 index 0000000000000000000000000000000000000000..e97be2e86ba5bc6fab21d89bf60316ca17b77cf8 --- /dev/null +++ b/cache_ds/GithubDiff_ver2/state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d68ec129ecb4bc80505b594d4fd3be8b9f4ff031c4eb76961f3608b8493070c +size 256 diff --git a/cache_ds/GithubIssues/dataset.arrow b/cache_ds/GithubIssues/dataset.arrow new file mode 100644 index 0000000000000000000000000000000000000000..cf3f8a75e1306bc74afbdda3ec433bf71925f590 --- /dev/null +++ b/cache_ds/GithubIssues/dataset.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6703183af39ec699f5980c9987026bcc3a6be8d759674cec923598dc5e2b01f +size 3185008 diff --git a/cache_ds/GithubIssues/dataset_info.json b/cache_ds/GithubIssues/dataset_info.json new file mode 100644 index 0000000000000000000000000000000000000000..1b9314b566fd42db3c8ec1b4cf60418ec26f7b09 --- /dev/null +++ b/cache_ds/GithubIssues/dataset_info.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:093a49858acb3b0e77108214a92c1cbe5afd0d32007bd77a7a7eaadddd953eaa +size 1006 diff --git a/cache_ds/GithubIssues/state.json b/cache_ds/GithubIssues/state.json new file mode 100644 index 0000000000000000000000000000000000000000..4ec3ac9fc4f9f9d27d1cee9def76ff22631de02a --- /dev/null +++ b/cache_ds/GithubIssues/state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64ff0d11850de11fc978643c1fb4334cf8ecb895df5695605ff67cd69b9f9d8b +size 256 diff --git a/cache_ds/Gutenberg/dataset.arrow b/cache_ds/Gutenberg/dataset.arrow new file mode 100644 index 0000000000000000000000000000000000000000..df2723821b2bc95384cb3046659952706e2325fc --- /dev/null +++ b/cache_ds/Gutenberg/dataset.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee57d8c91476e7c2d5adb3e6c8d86279b13dce5f2f8f413f120adc87b163a497 +size 44924064 diff --git a/cache_ds/Gutenberg/dataset_info.json b/cache_ds/Gutenberg/dataset_info.json new file mode 100644 index 0000000000000000000000000000000000000000..4c9607b9a1835abeb3d3ea4f83b82fa09f71fcc6 --- /dev/null +++ b/cache_ds/Gutenberg/dataset_info.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd2ef42b2590f741e80b169ba268f2089e90c4521c6cfad09a28e7a51bfed931 +size 1008 diff --git a/cache_ds/Gutenberg/state.json b/cache_ds/Gutenberg/state.json new file mode 100644 index 0000000000000000000000000000000000000000..2dce03b2e7da10d50b0e6dcae8165024b5fcab86 --- /dev/null +++ b/cache_ds/Gutenberg/state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc8e3dea2f34ca86aea526181f7937e6df651935bc0eae4e35a36b1030a482b6 +size 256 diff --git a/cache_ds/Opensubtitles/dataset.arrow b/cache_ds/Opensubtitles/dataset.arrow new file mode 100644 index 0000000000000000000000000000000000000000..fc504bc90cb951d2c5ef6cfda072251e41199546 --- /dev/null +++ b/cache_ds/Opensubtitles/dataset.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47dac631808c6c3b3de20ae291395d6c5ed07f973b6d3286d4b6b71f656edd64 +size 869440 diff --git a/cache_ds/Opensubtitles/dataset_info.json b/cache_ds/Opensubtitles/dataset_info.json new file mode 100644 index 0000000000000000000000000000000000000000..ec0b88a4cebad013690b7d35b1de3075508da199 --- /dev/null +++ b/cache_ds/Opensubtitles/dataset_info.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69828cad5434b7a305815dd18855925a1d9b05affd54c7841a52f3a40832ccd8 +size 1291 diff --git a/cache_ds/Opensubtitles/state.json b/cache_ds/Opensubtitles/state.json new file mode 100644 index 0000000000000000000000000000000000000000..461141eceeb77c38f45b06916b05c783026b7623 --- /dev/null +++ b/cache_ds/Opensubtitles/state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d418495ec9a4008735793b118e4a6fb9c13b1df0586bebf269d7a88bcc267012 +size 256 diff --git a/cache_ds/OtherWiki/dataset.arrow b/cache_ds/OtherWiki/dataset.arrow new file mode 100644 index 0000000000000000000000000000000000000000..0541053cabb26d53654d9f4b04914493c519527c --- /dev/null +++ b/cache_ds/OtherWiki/dataset.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:507e8106a7e72b63d0a5b929bcd1c160ff93a770e1ade0486edf203fffb88f4c +size 7824848 diff --git a/cache_ds/OtherWiki/dataset_info.json b/cache_ds/OtherWiki/dataset_info.json new file mode 100644 index 0000000000000000000000000000000000000000..75e2e1a05f8b0dfbbd2018c8682df615e2744b6a --- /dev/null +++ b/cache_ds/OtherWiki/dataset_info.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2c4f41afd79ab58a3af3da9137ed1285c30cb9898911c1b38deaa793add7c75 +size 1004 diff --git a/cache_ds/OtherWiki/state.json b/cache_ds/OtherWiki/state.json new file mode 100644 index 0000000000000000000000000000000000000000..200502d0e861d55b4b51762a443b4efc62c1150e --- /dev/null +++ b/cache_ds/OtherWiki/state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6763eda09fa4f9551b3296e18abd9e3f66caf733105aaec59375586c898adce +size 256 diff --git a/cache_ds/PileOfLaw/dataset.arrow b/cache_ds/PileOfLaw/dataset.arrow new file mode 100644 index 0000000000000000000000000000000000000000..a199f47f61f33272f0d867efd2a01aea5cce5475 --- /dev/null +++ b/cache_ds/PileOfLaw/dataset.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f791d494aec576262f9a357f7714b8a6f325efa336e1ea04c1e06f223d803b06 +size 15476168 diff --git a/cache_ds/PileOfLaw/dataset_info.json b/cache_ds/PileOfLaw/dataset_info.json new file mode 100644 index 0000000000000000000000000000000000000000..78e88992c37fd35c6b9d2bbf288e7d084bb172be --- /dev/null +++ b/cache_ds/PileOfLaw/dataset_info.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2aa700a492b2b449acfa0b18a9e7f44a22b84c7da4bfcb23339a9c0f44afc99 +size 1008 diff --git a/cache_ds/PileOfLaw/state.json b/cache_ds/PileOfLaw/state.json new file mode 100644 index 0000000000000000000000000000000000000000..dc0a5f88f9017162cc6e6dda8135f711a6ae61e4 --- /dev/null +++ b/cache_ds/PileOfLaw/state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f9d96c88d1af5ac5d59582dd7aadc14d7cbb32ce10142056cc96497e7fc5ccb +size 256 diff --git a/cache_ds/PileV2Posts/dataset.arrow b/cache_ds/PileV2Posts/dataset.arrow new file mode 100644 index 0000000000000000000000000000000000000000..7bd5190fcf522111b937291db588b97209777621 --- /dev/null +++ b/cache_ds/PileV2Posts/dataset.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4110658f565855757e07f5a60425bfdd2c20f0192141f3852de1a1d11efca6e6 +size 2144448 diff --git a/cache_ds/PileV2Posts/dataset_info.json b/cache_ds/PileV2Posts/dataset_info.json new file mode 100644 index 0000000000000000000000000000000000000000..7680b5a556747cf2511714a6346134f06110d6ab --- /dev/null +++ b/cache_ds/PileV2Posts/dataset_info.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:723f43a71cb0e4f74c9e12480ad504988d7618ba5edae687670440af833cce10 +size 1291 diff --git a/cache_ds/PileV2Posts/state.json b/cache_ds/PileV2Posts/state.json new file mode 100644 index 0000000000000000000000000000000000000000..9b9e731cbfddc40d8c76362b465844b458d78b22 --- /dev/null +++ b/cache_ds/PileV2Posts/state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8851e6ec8ca6f0e84c1ecec5085be2ba234ad81a72b1b92b47ce11525fa8bdc9 +size 256 diff --git a/cache_ds/PileV2Reddit2020/dataset.arrow b/cache_ds/PileV2Reddit2020/dataset.arrow new file mode 100644 index 0000000000000000000000000000000000000000..90307e3c625a7267fe143a5b6255e7ace35ba3a0 --- /dev/null +++ b/cache_ds/PileV2Reddit2020/dataset.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4632a85c30ddcec05a3cc4647b9ceae3401461efec868c9c56113e9740fd710d +size 2463856 diff --git a/cache_ds/PileV2Reddit2020/dataset_info.json b/cache_ds/PileV2Reddit2020/dataset_info.json new file mode 100644 index 0000000000000000000000000000000000000000..ef901211130c5d1c5c724769855053adee680288 --- /dev/null +++ b/cache_ds/PileV2Reddit2020/dataset_info.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2bc72faac4dcd61e2ccdb9348c30b11203bfdb4bc5f14c98954bce63aa0ca3c +size 1296 diff --git a/cache_ds/PileV2Reddit2020/state.json b/cache_ds/PileV2Reddit2020/state.json new file mode 100644 index 0000000000000000000000000000000000000000..c7f7fac30d56af66ad34ad5edd8775266a0f0bb1 --- /dev/null +++ b/cache_ds/PileV2Reddit2020/state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e109d2c6e7e3ca744c10cd7594ce69f7805523d2684378001b14034b171a051c +size 256 diff --git a/cache_ds/PileV2RedditPosts/dataset.arrow b/cache_ds/PileV2RedditPosts/dataset.arrow new file mode 100644 index 0000000000000000000000000000000000000000..5e8a07d0d840ea1574a39bd0dec884e81cfc81fb --- /dev/null +++ b/cache_ds/PileV2RedditPosts/dataset.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d40dd26be58cdfa0333b1e6e7184b5819c268e0cd175d9204b54c625f709cd9 +size 2096712 diff --git a/cache_ds/PileV2RedditPosts/dataset_info.json b/cache_ds/PileV2RedditPosts/dataset_info.json new file mode 100644 index 0000000000000000000000000000000000000000..1f3182c15d2a8af6abf89a96546bb9dff16b9fbe --- /dev/null +++ b/cache_ds/PileV2RedditPosts/dataset_info.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f4db79404e92104e7af5ff2959bccff396877b7177a30164c4150d9eac1e84c +size 1297 diff --git a/cache_ds/PileV2RedditPosts/state.json b/cache_ds/PileV2RedditPosts/state.json new file mode 100644 index 0000000000000000000000000000000000000000..52c302bfa9d96477144750f654acf5613080598b --- /dev/null +++ b/cache_ds/PileV2RedditPosts/state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd76909416c2285069061c6eb2404f103f395b80ff7d45fae914685805877fd5 +size 256 diff --git a/cache_ds/PubMed/dataset.arrow b/cache_ds/PubMed/dataset.arrow new file mode 100644 index 0000000000000000000000000000000000000000..16b8e3a0b0ece8ea69cc2deabcdc91e1f28c1cb5 --- /dev/null +++ b/cache_ds/PubMed/dataset.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33e9e755bd71dc7cfb7b0eb8329c623d3598e6bfa51712d11d122997583ed9e4 +size 39676496 diff --git a/cache_ds/PubMed/dataset_info.json b/cache_ds/PubMed/dataset_info.json new file mode 100644 index 0000000000000000000000000000000000000000..30970e97a4b5052cb3d8b52243f730b33e042d44 --- /dev/null +++ b/cache_ds/PubMed/dataset_info.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73abcfdb03446c70eca19815cd3fba8f7733e695414e7240ad234944f8246989 +size 1005 diff --git a/cache_ds/PubMed/state.json b/cache_ds/PubMed/state.json new file mode 100644 index 0000000000000000000000000000000000000000..50bf6c8ddd71dcf535113e5f4931d52188d53bb4 --- /dev/null +++ b/cache_ds/PubMed/state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48febc8f75a87ee8bef533d6e3037f09928c015cfc0ab854266cde1ab02103ea +size 256 diff --git a/cache_ds/S2ORC/dataset.arrow b/cache_ds/S2ORC/dataset.arrow new file mode 100644 index 0000000000000000000000000000000000000000..e834121498ec56a376c9ab3ba6b50fc4e936dd9b --- /dev/null +++ b/cache_ds/S2ORC/dataset.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f5064044004532d8fa25910f6fbe1a6a711ce4ceb29b024e4d22cae53ba62a1 +size 23768264 diff --git a/cache_ds/S2ORC/dataset_info.json b/cache_ds/S2ORC/dataset_info.json new file mode 100644 index 0000000000000000000000000000000000000000..6bccb8f287a1014c43601f6dd6cde375b60fbbd6 --- /dev/null +++ b/cache_ds/S2ORC/dataset_info.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1db10aa9fde63269f934107726d81da673f7c8f6b22c38ae3c51ee487eafe08 +size 1004 diff --git a/cache_ds/S2ORC/state.json b/cache_ds/S2ORC/state.json new file mode 100644 index 0000000000000000000000000000000000000000..4903b0bdb0afa5ffe8f3058fe502a68afdcf42c4 --- /dev/null +++ b/cache_ds/S2ORC/state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cd97be215c198172494a3e8be251b905944504a6931a15160bbcc2008802d37 +size 256 diff --git a/cache_ds/StackExchange_ver2/dataset.arrow b/cache_ds/StackExchange_ver2/dataset.arrow new file mode 100644 index 0000000000000000000000000000000000000000..66b1bae3a5026a40e7c65f19f1abf13efab6c729 --- /dev/null +++ b/cache_ds/StackExchange_ver2/dataset.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e1fe7a891b19c1d752643f0b85bf995b3f10a8ccfada56bbdb96fb1aa8a2616 +size 3775744 diff --git a/cache_ds/StackExchange_ver2/dataset_info.json b/cache_ds/StackExchange_ver2/dataset_info.json new file mode 100644 index 0000000000000000000000000000000000000000..70cae3422c13810a00355ab4ce3071fe820fceea --- /dev/null +++ b/cache_ds/StackExchange_ver2/dataset_info.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e9c5f28169c51495ea2f025e568e3c94d84f799062e35423c3504d2a85fa2f1 +size 1298 diff --git a/cache_ds/StackExchange_ver2/state.json b/cache_ds/StackExchange_ver2/state.json new file mode 100644 index 0000000000000000000000000000000000000000..269580829d2bb4e93982b042aaadcbffb87ed610 --- /dev/null +++ b/cache_ds/StackExchange_ver2/state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27278cb749f7b0c117d49d8cb952e5d9c3eb22f5411be68f9c02f87f7b52fc78 +size 256 diff --git a/cache_ds/TED2020/dataset.arrow b/cache_ds/TED2020/dataset.arrow new file mode 100644 index 0000000000000000000000000000000000000000..3fa950a7007c62f42adf4ba7c852c6a039394221 --- /dev/null +++ b/cache_ds/TED2020/dataset.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7312df0ff9bcfe40568fd310747f229f93cb481d0852c15788914d8977b76a38 +size 14256544 diff --git a/cache_ds/TED2020/dataset_info.json b/cache_ds/TED2020/dataset_info.json new file mode 100644 index 0000000000000000000000000000000000000000..cb2fb407ce92d4045a1af8399b97f6be74174c98 --- /dev/null +++ b/cache_ds/TED2020/dataset_info.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06dc1850cbbe3335361e9f8a5d2ac1db12154f71af6d250ba970cfee5188bd88 +size 1006 diff --git a/cache_ds/TED2020/state.json b/cache_ds/TED2020/state.json new file mode 100644 index 0000000000000000000000000000000000000000..9a11031e356ac85eddd018cee059cc8f8edf12b8 --- /dev/null +++ b/cache_ds/TED2020/state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7df0b87c86723d29c65dcbf8d24d775cbd3e61a3b04831e177803adf80343fd5 +size 256 diff --git a/cache_ds/Tanzil/dataset.arrow b/cache_ds/Tanzil/dataset.arrow new file mode 100644 index 0000000000000000000000000000000000000000..e4d54619d6edf2b0bc3d9d3d4d327c3a31185116 --- /dev/null +++ b/cache_ds/Tanzil/dataset.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:185e23e2270d439307ee061fe0d1b5d97ebb59b5b5bc0f21b914becd7101e042 +size 760 diff --git a/cache_ds/Tanzil/dataset_info.json b/cache_ds/Tanzil/dataset_info.json new file mode 100644 index 0000000000000000000000000000000000000000..1b1de9a6e739ad0642cd953331bccf9f89e891e4 --- /dev/null +++ b/cache_ds/Tanzil/dataset_info.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1c2aca3c4a3647a2ee02ce66c0f0564345be98723217592f4403c9514ee75e5 +size 971 diff --git a/cache_ds/Tanzil/state.json b/cache_ds/Tanzil/state.json new file mode 100644 index 0000000000000000000000000000000000000000..deb01abf2e30532e9660ecc3a97fa88108b82ee9 --- /dev/null +++ b/cache_ds/Tanzil/state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f931fe58cef47710b1d9eb3281ce98395a210fa0bbd8175a0fa4967e71ea5d0 +size 256 diff --git a/cache_ds/TheStack/dataset.arrow b/cache_ds/TheStack/dataset.arrow new file mode 100644 index 0000000000000000000000000000000000000000..e203e575f55dbc68b36b9e14cc90c579f1158729 --- /dev/null +++ b/cache_ds/TheStack/dataset.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffbebe6df11fcb850a61ab70e12fac9eeb913cef094b509c1322e3259713916b +size 4640240 diff --git a/cache_ds/TheStack/dataset_info.json b/cache_ds/TheStack/dataset_info.json new file mode 100644 index 0000000000000000000000000000000000000000..4c540552600c02f517f2364756c7b7c27fae01ac --- /dev/null +++ b/cache_ds/TheStack/dataset_info.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4367a7e292a60606e8a01a3e38af7041529737cacb4e1295835e52c67b086f6 +size 1002 diff --git a/cache_ds/TheStack/state.json b/cache_ds/TheStack/state.json new file mode 100644 index 0000000000000000000000000000000000000000..99bc20d38b28a40dbb78a7726f3c972ea47b0adf --- /dev/null +++ b/cache_ds/TheStack/state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dfc6a621dbb0a51e2f06b25dbdd7c2e615dc8f73754aa0aca9135febea5593a +size 256 diff --git a/cache_ds/USENET/dataset.arrow b/cache_ds/USENET/dataset.arrow new file mode 100644 index 0000000000000000000000000000000000000000..e9771c1b9b40162bc27560166dcf2db44087c939 --- /dev/null +++ b/cache_ds/USENET/dataset.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83dc13bb9f86c9ada1e3708e38cae054a94f0ab2c567189e24fb4bcf48b53d35 +size 4133928 diff --git a/cache_ds/USENET/dataset_info.json b/cache_ds/USENET/dataset_info.json new file mode 100644 index 0000000000000000000000000000000000000000..24254693309e509c3b88ffd0f8dd7825ca6c22e5 --- /dev/null +++ b/cache_ds/USENET/dataset_info.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea8764bbcf96e6d82e38d665685696e93ef3a15f17424cb608ca233e5cd14720 +size 1000 diff --git a/cache_ds/USENET/state.json b/cache_ds/USENET/state.json new file mode 100644 index 0000000000000000000000000000000000000000..0690da7a0fae718373a0557446c931779860b0d6 --- /dev/null +++ b/cache_ds/USENET/state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66d769df83eaffca62a74d7e589f2d01ccc1f314a5d1db1a69674bc3f46a2893 +size 256 diff --git a/cache_ds/USPTO/dataset.arrow b/cache_ds/USPTO/dataset.arrow new file mode 100644 index 0000000000000000000000000000000000000000..3a5de691c69ddeae3f704ea2c454c929e19d282b --- /dev/null +++ b/cache_ds/USPTO/dataset.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14c2956936195e33711a582f546cbb0e9ad699860f9eecf415cb254e22cc5aa9 +size 37034288 diff --git a/cache_ds/USPTO/dataset_info.json b/cache_ds/USPTO/dataset_info.json new file mode 100644 index 0000000000000000000000000000000000000000..731b90429044a4a9f8523569f1b704b0fd7bb806 --- /dev/null +++ b/cache_ds/USPTO/dataset_info.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71620c24a5e4708f005b8eceac16d50182a8e089103ea6912878c4af73721200 +size 1290 diff --git a/cache_ds/USPTO/state.json b/cache_ds/USPTO/state.json new file mode 100644 index 0000000000000000000000000000000000000000..89fc030cfddae098c787aa5139098f6f98cda6dc --- /dev/null +++ b/cache_ds/USPTO/state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:875882d78dc1159797b4b3c574009a11ef32eb499b58e3095a9d4b6fcbedf2fa +size 256 diff --git a/cache_ds/UbuntuIRC/dataset.arrow b/cache_ds/UbuntuIRC/dataset.arrow new file mode 100644 index 0000000000000000000000000000000000000000..f61f9ef21b4d6a20eac90178f52fe9e4f0f5259b --- /dev/null +++ b/cache_ds/UbuntuIRC/dataset.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e5dc37b6a0bfbddfce895d5cd65581fedbb504ca0d4449fdd66da08fb8e991e +size 39899832 diff --git a/cache_ds/UbuntuIRC/dataset_info.json b/cache_ds/UbuntuIRC/dataset_info.json new file mode 100644 index 0000000000000000000000000000000000000000..322197d83fd050a0a71a1622bd14152f42f73f37 --- /dev/null +++ b/cache_ds/UbuntuIRC/dataset_info.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:826ab400e5b1b8916fefd93f7c4e68113f85ab5e0befa9a17cf301e8123b3fd6 +size 1008 diff --git a/cache_ds/UbuntuIRC/state.json b/cache_ds/UbuntuIRC/state.json new file mode 100644 index 0000000000000000000000000000000000000000..1c36f862445bd74f7b37e90641710c71d9389a0d --- /dev/null +++ b/cache_ds/UbuntuIRC/state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35fde071843194f5b699ad7ea3d6a29e58923d0617cc49918e8bba67d1f517c8 +size 256 diff --git a/cache_ds/arXiv/dataset.arrow b/cache_ds/arXiv/dataset.arrow new file mode 100644 index 0000000000000000000000000000000000000000..1d18cbca36abe83d632e83727afdb735b7a2f933 --- /dev/null +++ b/cache_ds/arXiv/dataset.arrow @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60a225f5315baa957484b6bb7a0e21686bf8f3d1fe1fa33f82045ccda0f6fded +size 38759384 diff --git a/cache_ds/arXiv/dataset_info.json b/cache_ds/arXiv/dataset_info.json new file mode 100644 index 0000000000000000000000000000000000000000..920bddd991ac4f3b9b6e32774909e5dac7462792 --- /dev/null +++ b/cache_ds/arXiv/dataset_info.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2891b8a270766224fa4c304a98bf762523187f01693888a12ddb62c1a7321ec5 +size 1004 diff --git a/cache_ds/arXiv/state.json b/cache_ds/arXiv/state.json new file mode 100644 index 0000000000000000000000000000000000000000..abfef67bac5496e78089a781507ea02931991544 --- /dev/null +++ b/cache_ds/arXiv/state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af4772c6a5baf3150c819416d55b1dd392462448a0b7da3cc8e2e5e06fca6e96 +size 256 diff --git a/load_dataset.py b/load_dataset.py new file mode 100644 index 0000000000000000000000000000000000000000..d0ccf215e088976dfae4fe409d1d0ba43d8aac3b --- /dev/null +++ b/load_dataset.py @@ -0,0 +1,17 @@ +import datasets +import logging +import os +from tqdm import tqdm +PATH = "/Users/reshinthadithyan/master/research/code-research/carperai/pile-v2-small-filtered/data" +dataset_subs = os.listdir(PATH) + +print(dataset_subs) + + +for ds in tqdm(dataset_subs): + try: + print(ds) + dataset = datasets.load_dataset("CarperAI/pile-v2-small-filtered",data_files=f"data/{ds}/data.json", split="train") + dataset.save_to_disk(f"cache_ds/{ds}") + except: + print(f"Error at {ds}") \ No newline at end of file