diff --git a/ibis/examples/gen_registry.py b/ibis/examples/gen_registry.py index 4cdb7df802e0..51dd20fe2fcd 100755 --- a/ibis/examples/gen_registry.py +++ b/ibis/examples/gen_registry.py @@ -9,7 +9,7 @@ import subprocess import tempfile import zipfile -from collections import defaultdict +from collections import Counter, defaultdict from pathlib import Path from typing import Iterable, Mapping @@ -224,7 +224,9 @@ def download_file(base: str, outdir: Path) -> None: convert_to_parquet(con, path, description=meta[path.name]) -def main(args): +def main(parser): + args = parser.parse_args() + bucket = args.bucket clean = args.clean @@ -255,6 +257,8 @@ def main(args): # generate data from R subprocess.check_call(["Rscript", str(EXAMPLES_DIRECTORY / "gen_examples.R")]) + verify_case(parser, data_path) + if not args.dry_run: # rsync data and descriptions with the bucket subprocess.check_call( @@ -273,37 +277,48 @@ def main(args): f.write("\n") +def verify_case(parser: argparse.ArgumentParser, data_path: Path) -> None: + keys = (p.name[: -sum(map(len, p.suffixes))] for p in data_path.glob("*")) + counter = Counter(map(str.lower, keys)) + + invalid_keys = [key for key, count in counter.items() if count > 1] + if invalid_keys: + parser.error( + f"keys {invalid_keys} are incompatible with case-insensitive file systems" + ) + + if __name__ == "__main__": import argparse - p = argparse.ArgumentParser( + parser = argparse.ArgumentParser( description="Set up the pooch registry from a GCS bucket.", formatter_class=argparse.ArgumentDefaultsHelpFormatter, ) - p.add_argument( + parser.add_argument( "-b", "--bucket", default="ibis-examples", help="GCS bucket to rsync example data to", ) - p.add_argument( + parser.add_argument( "-C", "--clean", action="store_true", help="Remove data and descriptions directories before generating examples", ) - p.add_argument( + parser.add_argument( "-I", "--imdb-source-dir", help="Directory containing imdb source data", default=None, type=str, ) - p.add_argument( + parser.add_argument( "-d", "--dry-run", action="store_true", help="Avoid executing any code that writes to the example data bucket", ) - main(p.parse_args()) + main(parser) diff --git a/ibis/examples/metadata.json b/ibis/examples/metadata.json index 3eac6d2f5c87..ed99619c265d 100644 --- a/ibis/examples/metadata.json +++ b/ibis/examples/metadata.json @@ -910,14 +910,6 @@ "description": "Number of Flaws in Cloth", "key": "cloth.csv.gz" }, - "cms_patient_care": { - "description": "Data from the Centers for Medicare & Medicaid Services", - "key": "cms_patient_care.csv.gz" - }, - "cms_patient_experience": { - "description": "Data from the Centers for Medicare & Medicaid Services", - "key": "cms_patient_experience.csv.gz" - }, "co_transfer": { "description": "Carbon Monoxide Transfer", "key": "co_transfer.csv.gz" @@ -1139,10 +1131,6 @@ "description": "Failure Time of PET Film", "key": "hirose.csv.gz" }, - "household": { - "description": "Household data", - "key": "household.csv.gz" - }, "housing": { "description": "Frequency Table from a Copenhagen Housing Conditions Survey", "key": "housing.csv.gz" @@ -1681,10 +1669,6 @@ "description": "World Health Organization TB data", "key": "who.csv.gz" }, - "who2": { - "description": "World Health Organization TB data", - "key": "who2.csv.gz" - }, "women": { "description": "Average Heights and Weights for American Women", "key": "women.csv.gz" diff --git a/ibis/examples/registry.txt b/ibis/examples/registry.txt index a018acbbed2f..45af72a17537 100644 --- a/ibis/examples/registry.txt +++ b/ibis/examples/registry.txt @@ -2,10 +2,11 @@ Aids2.csv.gz 7314938f1c7fac1b27186bc0fb4e1c746163ebc239f8bce747ed847d5394d658 Aids2_raw.csv.gz ae385214f334ccdddd94c818406bc423419ee248aad9a8ae6cc7c6d0aa3dd7a4 Alfalfa.csv.gz 049d5f31676aab22f5ded9842aa323bf2c87e31b9e33c20a527e98c371951d3d Alfalfa_raw.csv.gz 936fd85b42609584bc4d891ef638183428bb32c06b1f23e89353b7797a057639 -AllstarFull.csv.gz fbf0d30ad6d8b3a3a1a61dad624c54039a35585c5c6e7558a38ae9c7368b9d32 -AllstarFull_raw.csv.gz 500267975cbbaadb6aa2b9714dc99c2249e6964133451d037e94c09a1c737608 -Appearances.csv.gz 091321a2e3e358a3203a0bedb4bc0087ef46f2977a435be7d21f96eb1b04c4ad -Appearances_raw.csv.gz 17c81c0a2dd8b4032a4e9875539a85717b71e0757badad15ba43056ae881e805 +AllstarFull.csv.gz 206f73e2783745c772ec4f69cec512f913c360f2c54043dcc49d7c55bdb46f44 +AllstarFull_raw.csv.gz cede55d2b3f5cbf6dc874834d4a510d9f406137dd8121b9f68ff9085e16c4a38 +Animals.csv.gz 22043d50626fa221a7ed33afb2336f7a39f49165ea80bf81312c84af221fb1cc +Appearances.csv.gz df5e83d7b8daef99e60e9d726bbe338f45c159fe7776d0157cfe375ef6d9bdc9 +Appearances_raw.csv.gz 40adfd1564501b39014d0875aab23ee9c09e1892ec24d404956db14f2b79f5db Assay.csv.gz 254bdd4061b61ba37d0eb444851eec6c29431be0d0e37de3c09f8d97ab525c5f Assay_raw.csv.gz 5555e9b5a0ec998f93af7b9b956c7391cd5bebd750279ff795fd5d098aa5cbd0 AwardsManagers.csv.gz 23bb2fb85af23c9aadefec5c30d711d1e8b0d4ffe2c388149edf26f3769a6302 @@ -18,10 +19,10 @@ AwardsSharePlayers.csv.gz 040a6b8451120e2159ec1a9480c79614c50428199447f2569b1315 AwardsSharePlayers_raw.csv.gz debf95f7084bb5a504df2790ae895f4c833616f55efb01c1c6face3761522c78 BOD.csv.gz eb90d6e7bb5b640be4fe765085a998fd66eb0bbd32a6f4e0ad5f70950c5057f7 BOD_raw.csv.gz bd16d28eecc4754516c92c2a48ccafab61907e0129e894c524bbe6c6f2b9b050 -Batting.csv.gz 276f36a4c9cefe6bc293e46308f4107c85164b1f3fa455d825dc5a04bcdbc287 -BattingPost.csv.gz cac8ca5fc5d6941e1a4b80faa1722b2ecdd9bcaf02f574236b4e72804b4f7678 -BattingPost_raw.csv.gz 6e99fa22d28ed8fdbeeebb878246e23f4c6d98ae67f287b73507a16e965e8511 -Batting_raw.csv.gz 55ac8d6c7ef52bdef6017f6850cc99169eac184fa961b11444235eb89279f4c5 +Batting.csv.gz a77446da4b80b8b3c2e59b3aa93cae7e362b3fb738173f8ee719d11a5928c12b +BattingPost.csv.gz 5bf70a75d6ac48a5c0a5e8502164c5e2e3572a0d6e6ed4806c9a36784c3e9060 +BattingPost_raw.csv.gz ad901a301114cdbb1021158c5975808b17ddf6ce6e156640c609eb54b41f14da +Batting_raw.csv.gz be4f3ad733f137adab55ca793224f770c2b2311c41a57b77f68a4f0ae20060b9 BodyWeight.csv.gz 1ba52100e8f81d82e0ea56cd52ddb97bd3af596d7b1596f04e80ed37ab8cd2fe BodyWeight_raw.csv.gz 6a9f60b338796accd71a5960230d2cada164a8abf7c05b0c18dc52ad33f06ad3 Boston.csv.gz 78c2b3e413b5274ad48079126739493185e222d4a7766e98e6359324a7d2892a @@ -45,14 +46,14 @@ Earthquake.csv.gz abac894c4ec6ecdc26432c0bb920e34def2f7e221a056f427fc1224f410fa4 Earthquake_raw.csv.gz b87858c3c359e207c702e6ad54dcfa2034f89a608fcaf9666c4c3ce5da41f4e2 Fatigue.csv.gz b8f37b5e7ae8e60a215b6431de415d206515cd85817c5026c66ed3d2186a5c73 Fatigue_raw.csv.gz 5e6d4ee653ed03ae60c67413e0b9c316e52dfb6541ed06d199c477d5fc1ff0fd -Fielding.csv.gz 3710a8dac26d1ca5f25c53140aa0ef1bc838e1b15c7f381c58a51ad63717d76e +Fielding.csv.gz 41148ceca5977c66928a09f5bb6ce80843c075aff2c609f0fe6973cc7e38f069 FieldingOF.csv.gz 1c72242516e0748216df28ae1e25cf67b71e8379ca7cc98687e35f39bae0479d FieldingOF_raw.csv.gz cc2a4cc82b63a9a3ec7677c89c5697cfc08694029c8827ae7141d5af57881124 -FieldingOFsplit.csv.gz 965d656a34eb52c05b026a9676d240f9feed03e3eed5feac8e30ec1979b5b095 -FieldingOFsplit_raw.csv.gz 8027f8792866826a26b483797a473960d7bdfd2fad1bcb5264324a3458daa736 -FieldingPost.csv.gz 51a92ccc7ff2722f50776e1d718ced04ba5daf971c91d9230de521a6f87c4201 -FieldingPost_raw.csv.gz 1b1e8fc51e8e1192fef11d5ec08e54cb0fca4d6e694d9960d19c63d449f2fa27 -Fielding_raw.csv.gz 1d15867f56b05fcd0ec2440b546a78c443abb263329af4a2ae14f0af6ed69590 +FieldingOFsplit.csv.gz 8eb2136051d13e082085d750a4da240107bb99457396b373cafc9d4b94067c84 +FieldingOFsplit_raw.csv.gz 09b80abcf20c7eaaadb69b260b4195dfbaa3e9fafd90b0550c8f71369e4547cd +FieldingPost.csv.gz 90065f301aaae8087f1fccc8794e7f76eb4dda792143c7357f23315bcc2fd537 +FieldingPost_raw.csv.gz 39461d119ee77b1d82f6deff31e72237e09c8c8585420bf6f8b670dcbbea5e00 +Fielding_raw.csv.gz 3a1bdc216a5848cdffab43a7264da27183bdcf386884c516fad58a2315e68838 Formaldehyde.csv.gz dbd4cabced8862b0b2676f54bbabee93491cb7c3ce38aeb7e030963605b775cf GAGurine.csv.gz dbe4772b67e8652ce2c3cb1788f3f0d5d9dfec06d71c064e35865177122af7fd GAGurine_raw.csv.gz e0f7e916ce73f6aa2cd058367b4b199c6df7011e4781ed0c89a8d1a8e2199343 @@ -64,10 +65,10 @@ Glucose2_raw.csv.gz 306e32f46c1928003832a2ccb6ad45107a91c7e031d22a8c29617223f7b7 Glucose_raw.csv.gz 9f845abc8172ef62f2c081da52ff7d00ce2f5ddb23b285c2a6e4ebd00a1f52c2 Gun.csv.gz 735efee1fd2590f2bc1c5ee9da1795505b1162c402276279c0de00340a156467 Gun_raw.csv.gz 50800a9821345c5ac1526cf633ead0c0598f06e496ec9ea0d448008123661d9e -HallOfFame.csv.gz 7b34f955cf6069ba19267a4773b4c2527e262147617ef4e9d7b46ff4ae3c5988 -HallOfFame_raw.csv.gz 61a8570cd8d25ea7d9fa659255c80d3930d8bb2a2acfdfb5cabf4c059a8fc8d0 -HomeGames.csv.gz 045327e6ff756eefd7350e71063fce576dd2b13238a398449b6685555dff2483 -HomeGames_raw.csv.gz 36ec08268e7c1dce00b8524d0bc97147469d40db20ffc2ef4224b9ef83be3e9e +HallOfFame.csv.gz 26e1e82cfd4cc3595a8b76afff103f3320727cb48d42b7aa9a77d412c92e11ae +HallOfFame_raw.csv.gz 77865d2d836500674d3140f8eb7f9aa5ceb2ae9d15a0e60a22809f065303fbd0 +HomeGames.csv.gz bddaaa8f5611181e4e9b565bedb7067e02693983a090dfd77bc3ada0165d28ed +HomeGames_raw.csv.gz 60455b99bfe61181a466cc751fce0f750d378dd99896cd5e0db92af160cf0d69 IGF.csv.gz 9be00089c779e12577f20f648129843330efe875a4cd0f116539ea51a2b72670 IGF_raw.csv.gz cf064654611311b1c50102b2ea3e4138453ace4ec60ed7f50ca8dd136109549f Indometh.csv.gz 64e60e876f984a80a34cd1c5cd76cf8466036cd7df2e9888108cbf2c94799f77 @@ -81,10 +82,10 @@ Loblolly.csv.gz f5f8700843631d366cbbc00af0ffab3952a3d81e18e18539a4010d130840c6f4 Loblolly_raw.csv.gz a677f5067a00fbf42ddccfd604a259b9940a05a5b799ef1d3832958778764acf Machines.csv.gz d01aa1b3607056211fdb042c30364900342d87b7eb311b65c585533150abe9e1 Machines_raw.csv.gz fe25b33f6d599eda3994d280ba3b7c69f1f95360b539e736c531a938661b3f94 -Managers.csv.gz c163caf38063a8427f3a16cf64e05e228d0d8dd4a807b601bf30d05353f89b1c +Managers.csv.gz 44c8d5d0aa0f3b4fd83bd7f4ab47c12e45df49d014b9178417ad1c7da6dbd742 ManagersHalf.csv.gz e38b58485115a01ba4d3c0b5fbe86f3930dddb96877e336b0f0503b078b13b20 ManagersHalf_raw.csv.gz 4ed450785bdc1a1acd70e277abecfe420f1e22ac6efbb18994d2d162f3a27b97 -Managers_raw.csv.gz 7b912e7f8e6ed53dbc8aa5280114fd9efb0e75112d727c18a9464e761ad20a25 +Managers_raw.csv.gz 7de9521ea37e2f646f6049cdf64a05e81b2cf4f13beed5b1ecc53b22f961903b MathAchSchool.csv.gz 7fcb2238c218381f807f6651bdaec05c5a778b5cedb7934488626e5ea48143e5 MathAchSchool_raw.csv.gz 3a12c39a759213fa7139129f5d79a27e6f8638ff1351c0609de394d7179e2684 MathAchieve.csv.gz 037fc9c4158c3aa5fc0524811eeacd3ea894c713f5d2870d1a8c04f5f1526ead @@ -112,17 +113,17 @@ PBG.csv.gz 5cf8c700b79e9eec8adfa1c43fd155769347421079544165e201f63e993f69bc PBG_raw.csv.gz 3dc98791c3f74246c737fa5ef886786a4b24e0bf87f0e9f9da905fb231353e7a Parks.csv.gz 07cd2d1914ab93a2cd7363ce230f154cc0fe0f4a2a05564505a48305621a9725 Parks_raw.csv.gz 3fb07db562b7a364ca66251a0c0f4cf5067d72d1c846dbd32a6fcc4a46a1e50c -People.csv.gz a463c00a19803a862a6f306b02214bb5fc5e7fbf0b511a34c3a66f8e2b2b3833 -People_raw.csv.gz a64425fd67ebf73f563f5663d39cd621c139e97c9ef4237c4ef33b94a78615f7 +People.csv.gz e6b37b22fcf8a0b42f698e682c197ec8beebe8af3a8d48dd9d5f0869fc2f6727 +People_raw.csv.gz 61722d4f21af3c5b8a88f7e18c07401f4281d40a0d8368e980d0ca658b55dcdb Phenobarb.csv.gz b732fd9cbe462aef99ab004aca7391cb18d40f9dfa7d5208e156f4bfb927ac6d Phenobarb_raw.csv.gz 09e951f6bd50f3e4365caf4602bc1d893648cfb5640d93d9ccd7581805f611c9 Pima_te.csv.gz a969bd9f6b5831b876025ede24c9656a3de1b88e6bb26a1fd45ae950072d9ecb Pima_tr.csv.gz 06180f7477b216cddf21f1b9329da7ce691fb54f47156c1469411b18cebef344 Pima_tr2.csv.gz eee121a8088e45fbfc1b6746a3d209f5619b482a0fc685779ee13430402be6ff -Pitching.csv.gz 9d1931108e1cad36da187c5d78ac6123c11edd57304e2974b8e987ac55f7fd6e -PitchingPost.csv.gz 8a11351720bc5dae23b6b0f441eab20f4fa365f27c02907817c1023a288acf67 -PitchingPost_raw.csv.gz 88dc86f8339930216ad4583f17d59c6efaab033facdffb565e4c585e130ce647 -Pitching_raw.csv.gz e2e0aee0c3fb4fc60547d6948886ccc4b0e1e8aebb5fd5682f82f59e068e63af +Pitching.csv.gz 58f3ea23440a7dddb99566e3f19f22e7551f2920a802e073d10f755629889fe9 +PitchingPost.csv.gz 097b354dc834930e17b8dae81954014fc5211aeca63a3205902aadede99a85cd +PitchingPost_raw.csv.gz 214037d8a01b39c6fbd4bd600d535a446d154d437c79ecb8972c30a914c5697f +Pitching_raw.csv.gz 8792dbb9b7ae9f07ffff4e812e5062928bb072020628c2ce750867d99a09bc0a Pixel.csv.gz 677b11037aa3b840178676c209feed2a276669adbe870f50bd82df2286e84a3b Pixel_raw.csv.gz 7f77b9d3034d02f0b272dbaa7309b9c201142b405a7f2f30ef7eeab34927c3d2 PlantGrowth.csv.gz 2a55d1e66b0bc42dd8bdb93118c5d1870edc887cdf33602db95a03b0ea410747 @@ -144,8 +145,8 @@ Salaries.csv.gz ee70cccfadf7706255a1fd46e70ab1222565c72fb0c878e417bad53be5654d74 Salaries_raw.csv.gz 282828941abbd0209d3cc0c60e64ab766e4f5471b2ea178607247d55dcbbb664 Schools.csv.gz e4f6b01dc8d866f75ea05d3ba814facaff59206e547f26760309c252e0130c7a Schools_raw.csv.gz 4cc709ce68edc42abd4ef067bb8e622553bc2231c423a5127eeac4c041b9909e -SeriesPost.csv.gz 50786b543c06079f412eb7285961e31c8e03efab93c4599cc68bf31ee5178a68 -SeriesPost_raw.csv.gz 91475ca90a76e2d6db0c4393db17f971a019083a7b0e3815e19a80d9b1d52e63 +SeriesPost.csv.gz 6e9697fb2ab55e3119b5c3d4b170b5baa092448112da6eb2f8780700c3907d63 +SeriesPost_raw.csv.gz 9ba972be89525045091e240dff8cd6f405090344ace31fb8f55922038a1546a7 Sitka.csv.gz c9436af635eec61de73aeb8dc88a436ccb826af0982c543d4953a111aa993402 Sitka89.csv.gz 01c5157a4269c39d57719989dcca5386d4f231c6bc0edd202ad0e304484292d1 Sitka89_raw.csv.gz 5d69cb9819dfb8446c112985096345fa2f46612a0eedec9e5c00aa7afd02da31 @@ -156,12 +157,12 @@ Soybean.csv.gz 1cfbc8765f1358d077ab045cc8b2cc7f28e5eff9bab3abce8a3036e6de604e48 Soybean_raw.csv.gz 64de748f0bfe0985fef23178f4c142fa6baa85b4c71291f34fb75aeeee7cbf74 Spruce.csv.gz 6618b9c6b54463d44d14cffee4a3b7f10c83fef6917e62b705b0f19bdd25665c Spruce_raw.csv.gz b9f15dd959ab743c056194b2346edbb2ce51a50d58dcf3c48b74245d8675d3f5 -Teams.csv.gz 3ee98d36316ad6b34cf6a37f71f4d69e13e351ff92e1245deee8ed8d98d2b19e +Teams.csv.gz dfb757e130fee1c28bc6f950202905ec0cbe36ad214fd3249c3af8283494cac1 TeamsFranchises.csv.gz 6bf9ce1bec00702ec6d8620e32edd03605f142178d01d803d8c73c2d42588226 TeamsFranchises_raw.csv.gz 64803fb658818a026649e2077041a1cc00465ae36f661d5b8dcb33ecf45ba739 TeamsHalf.csv.gz 812af540ce44f9b96e153d4c3d78f1b133d26268c368648f58ea9424ebdff77a TeamsHalf_raw.csv.gz 81d9aa9c593942689370d15de00f4fa7a58158ba6d61e8bd6090fe451bc1a89c -Teams_raw.csv.gz 5a1b094ecf9320b123fba789ab66142ca6c74f987ef3fc36ffad14026f7ba789 +Teams_raw.csv.gz d45f4448ba2bd4ef47ed0d8bd07ceb2b8177e5131581cc1e49ea4f6dc28b470c Tetracycline1.csv.gz 402b0c7430774da928744e251bb6263b622c5b340e51b856066c55d1b17e38b5 Tetracycline1_raw.csv.gz dc9e76fa3ec076b8de44ccb26d7e8aac395bf499713c4d7721df3b76ba8f4431 Tetracycline2.csv.gz 252709a73252bd365796b8b504a3b523f257a01e43f0943409021e0ad7fd372e @@ -251,8 +252,6 @@ chickwts.csv.gz 7f382b1d28211fbeee5c68a82d2b9992aebba081b311c0bb62424a667fa42ea4 city.csv.gz e6d827233daba45bc656b38c084d55af00c5a422860234db3828d96cc6c33f3b claridge.csv.gz 3b49d1bb8e375d5839c54900ffe2cbfa83d3d895b06ef58df92c67ff936f346f cloth.csv.gz 34b271a52de1c711b89020786b591caa28f10d70d9d6b4258679008e8ab7ef2f -cms_patient_care.csv.gz 051ab06d5e2755bae9142d29843a75b1bff4d9b63dc00aacb8b75bbc2d23b490 -cms_patient_experience.csv.gz 84ed730c9ec4859de9001eb0b4be16cf381090853c015147c4250eb7b078b312 co_transfer.csv.gz d7e585664aa700e94e78d616d25655bec09af657426e67c52daeed79f4524afa coal.csv.gz eb4ec2fb8b55e647cd32fcc6ccd5f1ba04a3b85539f89977330f21f13d4dd516 construction.csv.gz 5ce0f2b1670ba71622bfbbbabc35072eb69494392bc1345a64cd81161fdff109 @@ -312,16 +311,15 @@ heart.csv.gz 9ec19e71d12209d639fc48292fc90f169444f4983b47bb6811a57b7cd42e2bf8 heights.csv.gz ca416bb92e8a894c3967696fb45a8431bf205bd0d1bb6cb8f409347d9ce83c4f hills.csv.gz d02e3dbdc4490c7cd58afda5c70a0a841cc01f85f49b2ad5ae1c1a89f563b112 hirose.csv.gz 105332bf4e6acb7d753827dedb4f4a5bd9165cb06fbd5f3f57006fcdd79aa6f6 -household.csv.gz e98c29f98954d36f817763db95f8df93aad1365d99e574b9e3eb185fe7abf3b7 housing.csv.gz 3fb0af8e99716bff26cecb80a98ecf87162a4ccc6d609c8f467a10a1e643c490 housing_raw.csv.gz ddb3232c1b949bfeef75329dda7a7601998eb0d4faca4d2070e974d2eb163e21 -imdb_name_basics.parquet 4787a1cdb3cb5816f6833c291eda6b93e79331720855700791f6a692ee67b044 -imdb_title_akas.parquet ae520e1d54f707b6e592fdc3e3723ae2797ad3b7f79e1bee38beb2535334680d -imdb_title_basics.parquet 8e8a5d9abf957d332113df4e253a6bfb0bebf3a131fdfd9f9b8a12f531357959 -imdb_title_crew.parquet c84de2e4f754bd6acf711c127f9cdbc5146220a5ee15ef73058011a922e21131 -imdb_title_episode.parquet 45c54309fd1bef0fd4fb12831dc31b1807c0c178077af4945a1d73a60ae8998a -imdb_title_principals.parquet a030ebe04a904187aaa136058302b23f3efa7e9e2c9b4ff71afe7d21ddebda40 -imdb_title_ratings.parquet b9447957b7a6eac8c907cac424d3da6ead50e1a7aaf256c30ceba26dfa021e27 +imdb_name_basics.parquet 70aa1eb191919996e22e6e883114c1a7767d845faae5e6a6b31ad1dd0e0ca468 +imdb_title_akas.parquet 5ef0237bc565b372aa5f722364dc811c9863455406b5ad285451d87317b1e9c4 +imdb_title_basics.parquet 5c4fb0dcadc34caf5db31b95da8515b4255059e01ec0a60f1d5ce50363275a50 +imdb_title_crew.parquet d62832460bb436322db0e824fb716417c4a0b1df54a0644bd63215ff2b13a894 +imdb_title_episode.parquet da4cd0f0a0055a6dc9985fc7d2a8b3e24957b2d04f22426d72f6877b1c8a8604 +imdb_title_principals.parquet e476441a9b9f30f4d2a706a416dbd81d9a87357aa644c482ae9b1fc397175c40 +imdb_title_ratings.parquet 03d41c8c6eca419beda41be6f3851e42b9f9878702f49425df14ae60037b8ff2 immer.csv.gz 2236a5d11381e806e90760e3e6a4b0379feb8e733bbf1c1c065c17887da4ef6f immer_raw.csv.gz 5ad18f5b2cad0f637cdc8ee8f3470e4e87e4148830fe20fb69a1d922202dd37c infert.csv.gz 729b92024164c08fd4f866ac90c7d85fb0d3a0323a6240f72c748db99e785ab9 @@ -430,7 +428,7 @@ steam.csv.gz 4441eb0b1478ca530c387d46a00beefff35190411ecdbde2c91fa467274534aa steam_raw.csv.gz c81183a41c49be896d853b4f76d27d54f7164207b980b5ed25dd185849b6a940 stormer.csv.gz d469aef33edea2731163aaf9076d3374c557f127d289749c0c48db28e94d2cf2 stormer_raw.csv.gz 7f31b0dd1b14dd2aa1662917b584c76b099e76389ca4b9e7881f8d123dcb9203 -storms.csv.gz b5b61ada20e87e7cb97284f9581fd17c0839ff732e24ceb4892243681e9fc014 +storms.csv.gz 76c1330e5a64a91c8a994f99a5db3aebcb4f96acacf85884ee0602e387a5c877 survey.csv.gz 5b7a559fbf0580cfadf29c4c825dfce508f77609fbe8c26ce2c32b57fe140d3a survey_raw.csv.gz aaab0825af4231fd07800169cacc37faba911cf6ea7575e9cde7f65e154eeb23 survival.csv.gz bf144536f62209aed50589f543d681a7949b443ff7f62618f94d4e5667e35df8 @@ -458,11 +456,10 @@ waders_raw.csv.gz 8037f1df678aee53a1f6932088d8ec1609b75f1521b5e058593d68c44bf7b5 warpbreaks.csv.gz e5faa819c0767a4637a9c658d9649b944ade8cadbaf316cd4f5674162b1c5d1d whiteside.csv.gz 9e84fffeab18647228c38e2032b0ad3fbe2bbc02082b0c4f7d4e76289e892b4c whiteside_raw.csv.gz 34c9d357c74b162b2af76f348c73684452548c35e9718357d468c93373e92cc2 -who.csv.gz 7670246d45d693728ad616811fb8f9c3b45a06fe505b5876ed36dd6a1bc639e6 -who2.csv.gz 28c37130ce982c8668281e72ef69e7dcff50e7ee2a90daa3e2c16cf2fb187c28 +who.csv.gz 8029ce0f85b439248ea1c1139c55f5c094238c284be3c7b2cdc168a2af9068ec women.csv.gz 408ae762679ca5bdd788e518ebeb40d890ae5ba6ec7bb5b37020283dc2b36713 -world_bank_pop.csv.gz ca5e984f2ee675787c44f0cc9eb43fe6b53120ba57ff259301be2583ef10cbe0 -world_bank_pop_raw.csv.gz e905f4de65670a666b1978770926ac40b82ac8bd885f6dbc9ac1fa47814fa5fd +world_bank_pop.csv.gz a3ab09a979f8c9cb3be78c57e5f75a1b2286a48f6e36d5d30cdb0fd1e4d5626c +world_bank_pop_raw.csv.gz 468d39593bffc8d458cbbc8d8727224a2be9a0468e01f4a8d10531a7ef9b8486 wowah_data_raw.parquet 527f6ac558afad0c1ed328f3adf13390e0d5cf1d0858bed037ac9db24e48ec69 wowah_location_coords_raw.parquet da7bf6cae6cb997d7bc581da5d1fd46e273f8d001b5b5fc369a0f561679a1334 wowah_locations_raw.parquet f3cea5527072cce8e4666425a2dcce878132f2cf93918596d490d39de018c356