[ Info: sorted string unique (nrow(df1), nrow(df2)) = (1000000, 20000000) 0.404470 seconds (159 allocations: 22.900 MiB) (nrow(df1), nrow(df2)) = (1000000, 20000000) 0.403119 seconds (159 allocations: 22.900 MiB) [ Info: shuffled string unique 8.952677 seconds (172 allocations: 56.901 MiB) 8.973337 seconds (172 allocations: 56.901 MiB) [ Info: sorted string duplicates (nrow(df1), nrow(df2)) = (1000000, 20000000) 0.506894 seconds (161 allocations: 38.160 MiB) (nrow(df1), nrow(df2)) = (1000000, 20000000) 0.494741 seconds (161 allocations: 38.160 MiB) [ Info: sorted string duplicates many (nrow(df1), nrow(df2)) = (1000000, 20000000) 3.210424 seconds (177 allocations: 2.455 GiB, 0.14% gc time) (nrow(df1), nrow(df2)) = (1000000, 20000000) 3.218442 seconds (177 allocations: 2.455 GiB, 0.14% gc time) [ Info: shuffled string duplicates (nrow(df1), nrow(df2)) = (1000000, 20000000) 7.044917 seconds (181 allocations: 97.076 MiB, 0.32% gc time) (nrow(df1), nrow(df2)) = (1000000, 20000000) 7.106402 seconds (181 allocations: 97.076 MiB, 0.32% gc time) [ Info: shuffled string duplicates many (nrow(df1), nrow(df2)) = (1000000, 20000000) 35.486817 seconds (197 allocations: 2.501 GiB, 80.21% gc time) (nrow(df1), nrow(df2)) = (1000000, 20000000) 33.465506 seconds (197 allocations: 2.501 GiB, 82.04% gc time) [ Info: sorted int unique (nrow(df1), nrow(df2)) = (1000000, 20000000) 0.073927 seconds (159 allocations: 22.900 MiB) (nrow(df1), nrow(df2)) = (1000000, 20000000) 0.073743 seconds (159 allocations: 22.900 MiB) [ Info: shuffled int unique (nrow(df1), nrow(df2)) = (1000000, 20000000) 0.161250 seconds (183 allocations: 30.531 MiB) (nrow(df1), nrow(df2)) = (1000000, 20000000) 0.175935 seconds (183 allocations: 30.531 MiB) [ Info: sorted int duplicates (nrow(df1), nrow(df2)) = (1000000, 20000000) 0.080433 seconds (159 allocations: 22.887 MiB) (nrow(df1), nrow(df2)) = (1000000, 20000000) 0.080351 seconds (159 allocations: 22.887 MiB) [ Info: sorted int duplicates many (nrow(df1), nrow(df2)) = (1000000, 20000000) 30.304874 seconds (177 allocations: 2.453 GiB, 90.36% gc time) (nrow(df1), nrow(df2)) = (1000000, 20000000) 30.328002 seconds (177 allocations: 2.453 GiB, 90.28% gc time) [ Info: shuffled int duplicates (nrow(df1), nrow(df2)) = (1000000, 20000000) 0.321306 seconds (190 allocations: 55.421 MiB, 1.08% gc time) (nrow(df1), nrow(df2)) = (1000000, 20000000) 0.302525 seconds (190 allocations: 55.421 MiB, 1.08% gc time) [ Info: shuffled int duplicates many (nrow(df1), nrow(df2)) = (1000000, 20000000) 31.146174 seconds (208 allocations: 2.469 GiB, 87.74% gc time) (nrow(df1), nrow(df2)) = (1000000, 20000000) 30.496350 seconds (208 allocations: 2.469 GiB, 89.63% gc time) [ Info: sorted PooledArray duplicates (nrow(df1), nrow(df2)) = (1000000, 20000000) 8.410814 seconds (214 allocations: 336.468 MiB, 87.90% gc time) (nrow(df1), nrow(df2)) = (1000000, 20000000) 8.433220 seconds (214 allocations: 385.906 MiB, 87.46% gc time) [ Info: sorted PooledArray duplicates many (nrow(df1), nrow(df2)) = (1000000, 2000000) 0.653836 seconds (214 allocations: 301.883 MiB, 57.12% gc time) (nrow(df1), nrow(df2)) = (1000000, 2000000) 0.647200 seconds (214 allocations: 309.630 MiB, 57.81% gc time) [ Info: shuffled PooledArray duplicates (nrow(df1), nrow(df2)) = (1000000, 20000000) 10.178405 seconds (222 allocations: 348.865 MiB, 74.68% gc time) (nrow(df1), nrow(df2)) = (1000000, 20000000) 10.506988 seconds (222 allocations: 398.303 MiB, 75.17% gc time) [ Info: shuffled PooledArray duplicates many (nrow(df1), nrow(df2)) = (1000000, 20000000) 37.699361 seconds (224 allocations: 2.101 GiB, 89.36% gc time) (nrow(df1), nrow(df2)) = (1000000, 20000000) 37.268210 seconds (224 allocations: 2.109 GiB, 90.08% gc time) [ Info: sorted CategoricalArray duplicates (nrow(df1), nrow(df2)) = (1000000, 20000000) 9.058517 seconds (632.71 k allocations: 368.238 MiB, 83.59% gc time) (nrow(df1), nrow(df2)) = (1000000, 20000000) 8.867881 seconds (2.00 M allocations: 469.838 MiB, 83.52% gc time) [ Info: sorted CategoricalArray duplicates many (nrow(df1), nrow(df2)) = (1000000, 2000000) 0.652793 seconds (10.22 k allocations: 303.714 MiB, 52.87% gc time) (nrow(df1), nrow(df2)) = (1000000, 2000000) 7.730151 seconds (200.22 k allocations: 318.709 MiB, 96.05% gc time) [ Info: shuffled CategoricalArray duplicates (nrow(df1), nrow(df2)) = (1000000, 20000000) 10.619555 seconds (632.20 k allocations: 372.970 MiB, 72.62% gc time) (nrow(df1), nrow(df2)) = (1000000, 20000000) 10.800947 seconds (2.00 M allocations: 474.588 MiB, 72.35% gc time) [ Info: shuffled CategoricalArray duplicates many (nrow(df1), nrow(df2)) = (1000000, 20000000) 42.441216 seconds (10.23 k allocations: 2.102 GiB, 89.44% gc time) (nrow(df1), nrow(df2)) = (1000000, 20000000) 42.184494 seconds (200.23 k allocations: 2.117 GiB, 90.64% gc time)