diff --git a/dev/.documenter-siteinfo.json b/dev/.documenter-siteinfo.json
index 29854cf58..341f6b0dc 100644
--- a/dev/.documenter-siteinfo.json
+++ b/dev/.documenter-siteinfo.json
@@ -1 +1 @@
-{"documenter":{"julia_version":"1.10.5","generation_timestamp":"2024-09-07T11:00:40","documenter_version":"1.7.0"}}
\ No newline at end of file
+{"documenter":{"julia_version":"1.10.5","generation_timestamp":"2024-09-08T08:54:13","documenter_version":"1.7.0"}}
\ No newline at end of file
diff --git a/dev/assets/README/index.html b/dev/assets/README/index.html
index 52c09ce2e..b240f3cc7 100644
--- a/dev/assets/README/index.html
+++ b/dev/assets/README/index.html
@@ -1,2 +1,2 @@
 <!DOCTYPE html>
-<html lang="en"><head><meta charset="UTF-8"/><meta name="viewport" content="width=device-width, initial-scale=1.0"/><title>Introduction · DataFrames.jl</title><meta name="title" content="Introduction · DataFrames.jl"/><meta property="og:title" content="Introduction · DataFrames.jl"/><meta property="twitter:title" content="Introduction · DataFrames.jl"/><meta name="description" content="Documentation for DataFrames.jl."/><meta property="og:description" content="Documentation for DataFrames.jl."/><meta property="twitter:description" content="Documentation for DataFrames.jl."/><meta property="og:url" content="https://juliadata.github.io/DataFrames.jl/stable/assets/README/"/><meta property="twitter:url" content="https://juliadata.github.io/DataFrames.jl/stable/assets/README/"/><link rel="canonical" href="https://juliadata.github.io/DataFrames.jl/stable/assets/README/"/><script data-outdated-warner src="../warner.js"></script><link href="https://cdnjs.cloudflare.com/ajax/libs/lato-font/3.0.0/css/lato-font.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/juliamono/0.050/juliamono.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/fontawesome.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/solid.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/brands.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/KaTeX/0.16.8/katex.min.css" rel="stylesheet" type="text/css"/><script>documenterBaseURL="../.."</script><script src="https://cdnjs.cloudflare.com/ajax/libs/require.js/2.3.6/require.min.js" data-main="../documenter.js"></script><script src="../../search_index.js"></script><script src="../../siteinfo.js"></script><script src="../../../versions.js"></script><link class="docs-theme-link" 
rel="stylesheet" type="text/css" href="../themes/catppuccin-mocha.css" data-theme-name="catppuccin-mocha"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../themes/catppuccin-macchiato.css" data-theme-name="catppuccin-macchiato"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../themes/catppuccin-frappe.css" data-theme-name="catppuccin-frappe"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../themes/catppuccin-latte.css" data-theme-name="catppuccin-latte"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../themes/documenter-dark.css" data-theme-name="documenter-dark" data-theme-primary-dark/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../themes/documenter-light.css" data-theme-name="documenter-light" data-theme-primary/><script src="../themeswap.js"></script><link href="../favicon.ico" rel="icon" type="image/x-icon"/></head><body><div id="documenter"><nav class="docs-sidebar"><a class="docs-logo" href="../../"><img src="../logo.png" alt="DataFrames.jl logo"/></a><div class="docs-package-name"><span class="docs-autofit"><a href="../../">DataFrames.jl</a></span></div><button class="docs-search-query input is-rounded is-small is-clickable my-2 mx-auto py-1 px-2" id="documenter-search-query">Search docs (Ctrl + /)</button><ul class="docs-menu"><li><a class="tocitem" href="../../">Introduction</a></li><li><a class="tocitem" href="../../man/basics/">First Steps with DataFrames.jl</a></li><li><span class="tocitem">User Guide</span><ul><li><a class="tocitem" href="../../man/getting_started/">Getting Started</a></li><li><a class="tocitem" href="../../man/working_with_dataframes/">Working with DataFrames</a></li><li><a class="tocitem" href="../../man/importing_and_exporting/">Importing and Exporting Data (I/O)</a></li><li><a class="tocitem" href="../../man/joins/">Joins</a></li><li><a class="tocitem" 
href="../../man/split_apply_combine/">Split-apply-combine</a></li><li><a class="tocitem" href="../../man/reshaping_and_pivoting/">Reshaping</a></li><li><a class="tocitem" href="../../man/sorting/">Sorting</a></li><li><a class="tocitem" href="../../man/categorical/">Categorical Data</a></li><li><a class="tocitem" href="../../man/missing/">Missing Data</a></li><li><a class="tocitem" href="../../man/querying_frameworks/">Data manipulation frameworks</a></li><li><a class="tocitem" href="../../man/comparisons/">Comparison with Python/R/Stata</a></li></ul></li><li><span class="tocitem">API</span><ul><li><a class="tocitem" href="../../lib/types/">Types</a></li><li><a class="tocitem" href="../../lib/functions/">Functions</a></li><li><a class="tocitem" href="../../lib/indexing/">Indexing</a></li><li><a class="tocitem" href="../../lib/metadata/">Metadata</a></li></ul></li></ul><div class="docs-version-selector field has-addons"><div class="control"><span class="docs-label button is-static is-size-7">Version</span></div><div class="docs-selector control is-expanded"><div class="select is-fullwidth is-size-7"><select id="documenter-version-selector"></select></div></div></div></nav><div class="docs-main"><header class="docs-navbar"><a class="docs-sidebar-button docs-navbar-link fa-solid fa-bars is-hidden-desktop" id="documenter-sidebar-button" href="#"></a><nav class="breadcrumb"><ul class="is-hidden-mobile"><li class="is-active"><a href>Introduction</a></li></ul><ul class="is-hidden-tablet"><li class="is-active"><a href>Introduction</a></li></ul></nav><div class="docs-right"><a class="docs-navbar-link" href="https://github.com/JuliaData/DataFrames.jl" title="View the repository on GitHub"><span class="docs-icon fa-brands"></span><span class="docs-label is-hidden-touch">GitHub</span></a><a class="docs-navbar-link" href="https://github.com/JuliaData/DataFrames.jl/blob/main/docs/src/assets/README.md" title="Edit source on GitHub"><span class="docs-icon fa-solid"></span></a><a 
class="docs-settings-button docs-navbar-link fa-solid fa-gear" id="documenter-settings-button" href="#" title="Settings"></a><a class="docs-article-toggle-button fa-solid fa-chevron-up" id="documenter-article-toggle-button" href="javascript:;" title="Collapse all docstrings"></a></div></header><article class="content" id="documenter-page"><h1 id="Introduction"><a class="docs-heading-anchor" href="#Introduction">Introduction</a><a id="Introduction-1"></a><a class="docs-heading-anchor-permalink" href="#Introduction" title="Permalink"></a></h1><p>In this folder we store the following data sets:</p><ul><li>german_credit.csv</li><li>iris.csv</li></ul><h1 id="German-Credit-data-set"><a class="docs-heading-anchor" href="#German-Credit-data-set">German Credit data set</a><a id="German-Credit-data-set-1"></a><a class="docs-heading-anchor-permalink" href="#German-Credit-data-set" title="Permalink"></a></h1><h2 id="License:"><a class="docs-heading-anchor" href="#License:">License:</a><a id="License:-1"></a><a class="docs-heading-anchor-permalink" href="#License:" title="Permalink"></a></h2><p>https://opendatacommons.org/licenses/dbcl/1-0/</p><h2 id="Source:"><a class="docs-heading-anchor" href="#Source:">Source:</a><a id="Source:-1"></a><a class="docs-heading-anchor-permalink" href="#Source:" title="Permalink"></a></h2><p>https://archive.ics.uci.edu/ml/datasets/statlog+(german+credit+data) Professor Dr. 
Hans Hofmann Institut für Statistik und Ökonometrie Universität Hamburg FB Wirtschaftswissenschaften Von-Melle-Park 5 2000 Hamburg 13</p><p>The original data is from <a href="https://archive.ics.uci.edu/ml/datasets/statlog+(german+credit+data)">UCI</a>, and the file stored here is from <a href="https://www.kaggle.com/uciml/german-credit">Kaggle</a></p><h1 id="Iris-data-set"><a class="docs-heading-anchor" href="#Iris-data-set">Iris data set</a><a id="Iris-data-set-1"></a><a class="docs-heading-anchor-permalink" href="#Iris-data-set" title="Permalink"></a></h1><h2 id="License"><a class="docs-heading-anchor" href="#License">License</a><a id="License-1"></a><a class="docs-heading-anchor-permalink" href="#License" title="Permalink"></a></h2><p>https://creativecommons.org/publicdomain/zero/1.0/</p><h2 id="Source:-2"><a class="docs-heading-anchor" href="#Source:-2">Source:</a><a class="docs-heading-anchor-permalink" href="#Source:-2" title="Permalink"></a></h2><p>https://archive.ics.uci.edu/ml/datasets/Iris Creator: R.A. 
Fisher</p></article><nav class="docs-footer"><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.7.0 on <span class="colophon-date" title="Saturday 7 September 2024 11:00">Saturday 7 September 2024</span>. Using Julia version 1.10.5.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
+<html lang="en"><head><meta charset="UTF-8"/><meta name="viewport" content="width=device-width, initial-scale=1.0"/><title>Introduction · DataFrames.jl</title><meta name="title" content="Introduction · DataFrames.jl"/><meta property="og:title" content="Introduction · DataFrames.jl"/><meta property="twitter:title" content="Introduction · DataFrames.jl"/><meta name="description" content="Documentation for DataFrames.jl."/><meta property="og:description" content="Documentation for DataFrames.jl."/><meta property="twitter:description" content="Documentation for DataFrames.jl."/><meta property="og:url" content="https://juliadata.github.io/DataFrames.jl/stable/assets/README/"/><meta property="twitter:url" content="https://juliadata.github.io/DataFrames.jl/stable/assets/README/"/><link rel="canonical" href="https://juliadata.github.io/DataFrames.jl/stable/assets/README/"/><script data-outdated-warner src="../warner.js"></script><link href="https://cdnjs.cloudflare.com/ajax/libs/lato-font/3.0.0/css/lato-font.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/juliamono/0.050/juliamono.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/fontawesome.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/solid.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/brands.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/KaTeX/0.16.8/katex.min.css" rel="stylesheet" type="text/css"/><script>documenterBaseURL="../.."</script><script src="https://cdnjs.cloudflare.com/ajax/libs/require.js/2.3.6/require.min.js" data-main="../documenter.js"></script><script src="../../search_index.js"></script><script src="../../siteinfo.js"></script><script src="../../../versions.js"></script><link class="docs-theme-link" 
rel="stylesheet" type="text/css" href="../themes/catppuccin-mocha.css" data-theme-name="catppuccin-mocha"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../themes/catppuccin-macchiato.css" data-theme-name="catppuccin-macchiato"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../themes/catppuccin-frappe.css" data-theme-name="catppuccin-frappe"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../themes/catppuccin-latte.css" data-theme-name="catppuccin-latte"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../themes/documenter-dark.css" data-theme-name="documenter-dark" data-theme-primary-dark/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../themes/documenter-light.css" data-theme-name="documenter-light" data-theme-primary/><script src="../themeswap.js"></script><link href="../favicon.ico" rel="icon" type="image/x-icon"/></head><body><div id="documenter"><nav class="docs-sidebar"><a class="docs-logo" href="../../"><img src="../logo.png" alt="DataFrames.jl logo"/></a><div class="docs-package-name"><span class="docs-autofit"><a href="../../">DataFrames.jl</a></span></div><button class="docs-search-query input is-rounded is-small is-clickable my-2 mx-auto py-1 px-2" id="documenter-search-query">Search docs (Ctrl + /)</button><ul class="docs-menu"><li><a class="tocitem" href="../../">Introduction</a></li><li><a class="tocitem" href="../../man/basics/">First Steps with DataFrames.jl</a></li><li><span class="tocitem">User Guide</span><ul><li><a class="tocitem" href="../../man/getting_started/">Getting Started</a></li><li><a class="tocitem" href="../../man/working_with_dataframes/">Working with DataFrames</a></li><li><a class="tocitem" href="../../man/importing_and_exporting/">Importing and Exporting Data (I/O)</a></li><li><a class="tocitem" href="../../man/joins/">Joins</a></li><li><a class="tocitem" 
href="../../man/split_apply_combine/">Split-apply-combine</a></li><li><a class="tocitem" href="../../man/reshaping_and_pivoting/">Reshaping</a></li><li><a class="tocitem" href="../../man/sorting/">Sorting</a></li><li><a class="tocitem" href="../../man/categorical/">Categorical Data</a></li><li><a class="tocitem" href="../../man/missing/">Missing Data</a></li><li><a class="tocitem" href="../../man/querying_frameworks/">Data manipulation frameworks</a></li><li><a class="tocitem" href="../../man/comparisons/">Comparison with Python/R/Stata</a></li></ul></li><li><span class="tocitem">API</span><ul><li><a class="tocitem" href="../../lib/types/">Types</a></li><li><a class="tocitem" href="../../lib/functions/">Functions</a></li><li><a class="tocitem" href="../../lib/indexing/">Indexing</a></li><li><a class="tocitem" href="../../lib/metadata/">Metadata</a></li></ul></li></ul><div class="docs-version-selector field has-addons"><div class="control"><span class="docs-label button is-static is-size-7">Version</span></div><div class="docs-selector control is-expanded"><div class="select is-fullwidth is-size-7"><select id="documenter-version-selector"></select></div></div></div></nav><div class="docs-main"><header class="docs-navbar"><a class="docs-sidebar-button docs-navbar-link fa-solid fa-bars is-hidden-desktop" id="documenter-sidebar-button" href="#"></a><nav class="breadcrumb"><ul class="is-hidden-mobile"><li class="is-active"><a href>Introduction</a></li></ul><ul class="is-hidden-tablet"><li class="is-active"><a href>Introduction</a></li></ul></nav><div class="docs-right"><a class="docs-navbar-link" href="https://github.com/JuliaData/DataFrames.jl" title="View the repository on GitHub"><span class="docs-icon fa-brands"></span><span class="docs-label is-hidden-touch">GitHub</span></a><a class="docs-navbar-link" href="https://github.com/JuliaData/DataFrames.jl/blob/main/docs/src/assets/README.md" title="Edit source on GitHub"><span class="docs-icon fa-solid"></span></a><a 
class="docs-settings-button docs-navbar-link fa-solid fa-gear" id="documenter-settings-button" href="#" title="Settings"></a><a class="docs-article-toggle-button fa-solid fa-chevron-up" id="documenter-article-toggle-button" href="javascript:;" title="Collapse all docstrings"></a></div></header><article class="content" id="documenter-page"><h1 id="Introduction"><a class="docs-heading-anchor" href="#Introduction">Introduction</a><a id="Introduction-1"></a><a class="docs-heading-anchor-permalink" href="#Introduction" title="Permalink"></a></h1><p>In this folder we store the following data sets:</p><ul><li>german_credit.csv</li><li>iris.csv</li></ul><h1 id="German-Credit-data-set"><a class="docs-heading-anchor" href="#German-Credit-data-set">German Credit data set</a><a id="German-Credit-data-set-1"></a><a class="docs-heading-anchor-permalink" href="#German-Credit-data-set" title="Permalink"></a></h1><h2 id="License:"><a class="docs-heading-anchor" href="#License:">License:</a><a id="License:-1"></a><a class="docs-heading-anchor-permalink" href="#License:" title="Permalink"></a></h2><p>https://opendatacommons.org/licenses/dbcl/1-0/</p><h2 id="Source:"><a class="docs-heading-anchor" href="#Source:">Source:</a><a id="Source:-1"></a><a class="docs-heading-anchor-permalink" href="#Source:" title="Permalink"></a></h2><p>https://archive.ics.uci.edu/ml/datasets/statlog+(german+credit+data) Professor Dr. 
Hans Hofmann Institut für Statistik und Ökonometrie Universität Hamburg FB Wirtschaftswissenschaften Von-Melle-Park 5 2000 Hamburg 13</p><p>The original data is from <a href="https://archive.ics.uci.edu/ml/datasets/statlog+(german+credit+data)">UCI</a>, and the file stored here is from <a href="https://www.kaggle.com/uciml/german-credit">Kaggle</a></p><h1 id="Iris-data-set"><a class="docs-heading-anchor" href="#Iris-data-set">Iris data set</a><a id="Iris-data-set-1"></a><a class="docs-heading-anchor-permalink" href="#Iris-data-set" title="Permalink"></a></h1><h2 id="License"><a class="docs-heading-anchor" href="#License">License</a><a id="License-1"></a><a class="docs-heading-anchor-permalink" href="#License" title="Permalink"></a></h2><p>https://creativecommons.org/publicdomain/zero/1.0/</p><h2 id="Source:-2"><a class="docs-heading-anchor" href="#Source:-2">Source:</a><a class="docs-heading-anchor-permalink" href="#Source:-2" title="Permalink"></a></h2><p>https://archive.ics.uci.edu/ml/datasets/Iris Creator: R.A. 
Fisher</p></article><nav class="docs-footer"><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.7.0 on <span class="colophon-date" title="Sunday 8 September 2024 08:54">Sunday 8 September 2024</span>. Using Julia version 1.10.5.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
diff --git a/dev/index.html b/dev/index.html
index 57deb7272..63d9e8eeb 100644
--- a/dev/index.html
+++ b/dev/index.html
@@ -1,2 +1,2 @@
 <!DOCTYPE html>
-<html lang="en"><head><meta charset="UTF-8"/><meta name="viewport" content="width=device-width, initial-scale=1.0"/><title>Introduction · DataFrames.jl</title><meta name="title" content="Introduction · DataFrames.jl"/><meta property="og:title" content="Introduction · DataFrames.jl"/><meta property="twitter:title" content="Introduction · DataFrames.jl"/><meta name="description" content="Documentation for DataFrames.jl."/><meta property="og:description" content="Documentation for DataFrames.jl."/><meta property="twitter:description" content="Documentation for DataFrames.jl."/><meta property="og:url" content="https://juliadata.github.io/DataFrames.jl/stable/"/><meta property="twitter:url" content="https://juliadata.github.io/DataFrames.jl/stable/"/><link rel="canonical" href="https://juliadata.github.io/DataFrames.jl/stable/"/><script data-outdated-warner src="assets/warner.js"></script><link href="https://cdnjs.cloudflare.com/ajax/libs/lato-font/3.0.0/css/lato-font.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/juliamono/0.050/juliamono.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/fontawesome.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/solid.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/brands.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/KaTeX/0.16.8/katex.min.css" rel="stylesheet" type="text/css"/><script>documenterBaseURL="."</script><script src="https://cdnjs.cloudflare.com/ajax/libs/require.js/2.3.6/require.min.js" data-main="assets/documenter.js"></script><script src="search_index.js"></script><script src="siteinfo.js"></script><script src="../versions.js"></script><link class="docs-theme-link" rel="stylesheet" type="text/css" 
href="assets/themes/catppuccin-mocha.css" data-theme-name="catppuccin-mocha"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="assets/themes/catppuccin-macchiato.css" data-theme-name="catppuccin-macchiato"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="assets/themes/catppuccin-frappe.css" data-theme-name="catppuccin-frappe"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="assets/themes/catppuccin-latte.css" data-theme-name="catppuccin-latte"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="assets/themes/documenter-dark.css" data-theme-name="documenter-dark" data-theme-primary-dark/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="assets/themes/documenter-light.css" data-theme-name="documenter-light" data-theme-primary/><script src="assets/themeswap.js"></script><link href="assets/favicon.ico" rel="icon" type="image/x-icon"/></head><body><div id="documenter"><nav class="docs-sidebar"><a class="docs-logo" href><img src="assets/logo.png" alt="DataFrames.jl logo"/></a><div class="docs-package-name"><span class="docs-autofit"><a href>DataFrames.jl</a></span></div><button class="docs-search-query input is-rounded is-small is-clickable my-2 mx-auto py-1 px-2" id="documenter-search-query">Search docs (Ctrl + /)</button><ul class="docs-menu"><li class="is-active"><a class="tocitem" href>Introduction</a><ul class="internal"><li><a class="tocitem" href="#What-is-DataFrames.jl?"><span>What is DataFrames.jl?</span></a></li><li><a class="tocitem" href="#DataFrames.jl-and-the-Julia-Data-Ecosystem"><span>DataFrames.jl and the Julia Data Ecosystem</span></a></li><li><a class="tocitem" href="#Questions?"><span>Questions?</span></a></li><li><a class="tocitem" href="#Package-Manual"><span>Package Manual</span></a></li><li><a class="tocitem" href="#API"><span>API</span></a></li><li><a class="tocitem" href="#Index"><span>Index</span></a></li></ul></li><li><a class="tocitem" 
href="man/basics/">First Steps with DataFrames.jl</a></li><li><span class="tocitem">User Guide</span><ul><li><a class="tocitem" href="man/getting_started/">Getting Started</a></li><li><a class="tocitem" href="man/working_with_dataframes/">Working with DataFrames</a></li><li><a class="tocitem" href="man/importing_and_exporting/">Importing and Exporting Data (I/O)</a></li><li><a class="tocitem" href="man/joins/">Joins</a></li><li><a class="tocitem" href="man/split_apply_combine/">Split-apply-combine</a></li><li><a class="tocitem" href="man/reshaping_and_pivoting/">Reshaping</a></li><li><a class="tocitem" href="man/sorting/">Sorting</a></li><li><a class="tocitem" href="man/categorical/">Categorical Data</a></li><li><a class="tocitem" href="man/missing/">Missing Data</a></li><li><a class="tocitem" href="man/querying_frameworks/">Data manipulation frameworks</a></li><li><a class="tocitem" href="man/comparisons/">Comparison with Python/R/Stata</a></li></ul></li><li><span class="tocitem">API</span><ul><li><a class="tocitem" href="lib/types/">Types</a></li><li><a class="tocitem" href="lib/functions/">Functions</a></li><li><a class="tocitem" href="lib/indexing/">Indexing</a></li><li><a class="tocitem" href="lib/metadata/">Metadata</a></li></ul></li></ul><div class="docs-version-selector field has-addons"><div class="control"><span class="docs-label button is-static is-size-7">Version</span></div><div class="docs-selector control is-expanded"><div class="select is-fullwidth is-size-7"><select id="documenter-version-selector"></select></div></div></div></nav><div class="docs-main"><header class="docs-navbar"><a class="docs-sidebar-button docs-navbar-link fa-solid fa-bars is-hidden-desktop" id="documenter-sidebar-button" href="#"></a><nav class="breadcrumb"><ul class="is-hidden-mobile"><li class="is-active"><a href>Introduction</a></li></ul><ul class="is-hidden-tablet"><li class="is-active"><a href>Introduction</a></li></ul></nav><div class="docs-right"><a 
class="docs-navbar-link" href="https://github.com/JuliaData/DataFrames.jl" title="View the repository on GitHub"><span class="docs-icon fa-brands"></span><span class="docs-label is-hidden-touch">GitHub</span></a><a class="docs-navbar-link" href="https://github.com/JuliaData/DataFrames.jl/blob/main/docs/src/index.md" title="Edit source on GitHub"><span class="docs-icon fa-solid"></span></a><a class="docs-settings-button docs-navbar-link fa-solid fa-gear" id="documenter-settings-button" href="#" title="Settings"></a><a class="docs-article-toggle-button fa-solid fa-chevron-up" id="documenter-article-toggle-button" href="javascript:;" title="Collapse all docstrings"></a></div></header><article class="content" id="documenter-page"><h1 id="DataFrames.jl"><a class="docs-heading-anchor" href="#DataFrames.jl">DataFrames.jl</a><a id="DataFrames.jl-1"></a><a class="docs-heading-anchor-permalink" href="#DataFrames.jl" title="Permalink"></a></h1><p>Welcome to the DataFrames.jl documentation!</p><p>This resource aims to teach you everything you need to know to get up and running with tabular data manipulation using the DataFrames.jl package.</p><p>For more illustrations of DataFrames.jl usage, in particular in conjunction with other packages you can check-out the following resources (they are kept up to date with the released version of DataFrames.jl):</p><ul><li><a href="https://www.jstatsoft.org/article/view/v107i04">DataFrames.jl: Flexible and Fast Tabular Data in Julia</a> article published in the <em>Journal of Statistical Software</em></li><li><a href="https://www.ahsmart.com/pub/data-wrangling-with-data-frames-jl-cheat-sheet/">Data Wrangling with DataFrames.jl Cheat Sheet</a></li><li><a href="https://github.com/bkamins/Julia-DataFrames-Tutorial/">DataFrames Tutorial using Jupyter Notebooks</a></li><li><a href="https://github.com/JuliaAcademy/DataFrames">Julia Academy DataFrames.jl tutorial</a></li><li><a href="https://github.com/bkamins/JuliaCon2023-Tutorial">JuliaCon 
2023</a>, <a href="https://github.com/bkamins/JuliaCon2022-DataFrames-Tutorial">JuliaCon 2022</a>, <a href="https://github.com/bkamins/JuliaCon2021-DataFrames-Tutorial">JuliaCon 2021</a>, <a href="https://github.com/bkamins/JuliaCon2020-DataFrames-Tutorial">JuliaCon 2020</a>, <a href="https://github.com/bkamins/JuliaCon2019-DataFrames-Tutorial">JuliaCon 2019</a>, <a href="https://github.com/bkamins/ODSC-EUROPE-2021">ODSC Europe 2021</a> tutorials, and <a href="https://github.com/bkamins/PyDataGlobal2020">PyData Global 2020</a></li><li><a href="https://github.com/bkamins/DataFrames-Showcase">DataFrames.jl showcase</a></li></ul><p>If you prefer to learn DataFrames.jl from a book you can consider reading:</p><ul><li><a href="https://github.com/bkamins/JuliaForDataAnalysis">Julia for Data Analysis</a>;</li><li><a href="https://juliadatascience.io/">Julia Data Science</a>.</li></ul><h2 id="What-is-DataFrames.jl?"><a class="docs-heading-anchor" href="#What-is-DataFrames.jl?">What is DataFrames.jl?</a><a id="What-is-DataFrames.jl?-1"></a><a class="docs-heading-anchor-permalink" href="#What-is-DataFrames.jl?" title="Permalink"></a></h2><p>DataFrames.jl provides a set of tools for working with tabular data in Julia. Its design and functionality are similar to those of <a href="https://pandas.pydata.org/">pandas</a> (in Python) and <code>data.frame</code>, <a href="https://rdatatable.gitlab.io/data.table/"><code>data.table</code></a> and <a href="https://dplyr.tidyverse.org/">dplyr</a> (in R), making it  a great general purpose data science tool.</p><p>DataFrames.jl plays a central role in the Julia Data ecosystem, and has tight integrations with a range of different libraries. 
DataFrames.jl isn&#39;t the only tool for working with tabular data in Julia – as noted below, there are some other great libraries for certain use-cases – but it provides great data wrangling functionality through a familiar interface.</p><p>To understand the toolchain in more detail, have a look at the tutorials in this manual. New users can start with the <a href="man/basics/#First-Steps-with-DataFrames.jl">First Steps with DataFrames.jl</a> section.</p><p>You may find the <a href="https://juliadata.github.io/DataFramesMeta.jl/stable/">DataFramesMeta.jl</a> package or one of the other convenience packages discussed in the <a href="man/querying_frameworks/#Data-manipulation-frameworks">Data manipulation frameworks</a> section of this manual helpful when writing more advanced data transformations, especially if you do not have significant programming experience. These packages provide convenience syntax similar to <a href="https://dplyr.tidyverse.org/">dplyr</a> in R.</p><p>If you use metadata when working with DataFrames.jl you might find the <a href="https://github.com/JuliaData/TableMetadataTools.jl">TableMetadataTools.jl</a> package useful. This package defines several convenience functions for performing typical metadata operations.</p><h2 id="DataFrames.jl-and-the-Julia-Data-Ecosystem"><a class="docs-heading-anchor" href="#DataFrames.jl-and-the-Julia-Data-Ecosystem">DataFrames.jl and the Julia Data Ecosystem</a><a id="DataFrames.jl-and-the-Julia-Data-Ecosystem-1"></a><a class="docs-heading-anchor-permalink" href="#DataFrames.jl-and-the-Julia-Data-Ecosystem" title="Permalink"></a></h2><p>The Julia data ecosystem can be a difficult space for new users to navigate, in part because the Julia ecosystem tends to distribute functionality across different libraries more than some other languages. 
Because many people coming to DataFrames.jl are just starting to explore the Julia data ecosystem, below is a list of well-supported libraries that provide different data science tools, along with a few notes about what makes each library special, and how well integrated they are with DataFrames.jl.</p><ul><li><strong>Statistics</strong><ul><li><a href="https://github.com/JuliaStats/StatsKit.jl">StatsKit.jl</a>: A convenience meta-package which loads a set of essential packages for statistics, including those mentioned below in this section and DataFrames.jl itself.</li><li><a href="https://docs.julialang.org/en/v1/stdlib/Statistics/">Statistics</a>: The Julia standard library comes with a wide range of statistics functionality, but to gain access to these functions you must call <code>using Statistics</code>.</li><li><a href="https://docs.julialang.org/en/v1/stdlib/LinearAlgebra/">LinearAlgebra</a>: Like <code>Statistics</code>, many linear algebra features (factorizations, inversions, etc.) live in a library you have to load to use.</li><li><a href="https://docs.julialang.org/en/v1/stdlib/SparseArrays/">SparseArrays</a> are also in the standard library but must be loaded to be used.</li><li><a href="https://github.com/nalimilan/FreqTables.jl">FreqTables.jl</a>: Create frequency tables / cross-tabulations. Tightly integrated with DataFrames.jl.</li><li><a href="https://juliastats.org/HypothesisTests.jl/stable/">HypothesisTests.jl</a>: A range of hypothesis testing tools.</li><li><a href="https://juliastats.org/GLM.jl/stable/manual/">GLM.jl</a>: Tools for estimating linear and generalized linear models. Tightly integrated with DataFrames.jl.</li><li><a href="https://juliastats.org/StatsModels.jl/stable/">StatsModels.jl</a>: For converting heterogeneous <code>DataFrame</code> into homogeneous matrices for use with linear algebra libraries or machine learning applications that don&#39;t directly support <code>DataFrame</code>s. 
Will do things like convert categorical variables into indicators/one-hot-encodings, create interaction terms, etc.</li><li><a href="https://multivariatestatsjl.readthedocs.io/en/stable/index.html">MultivariateStats.jl</a>: linear regression, ridge regression, PCA, component analyses tools. Not well integrated with DataFrames.jl, but easily used in combination with <code>StatsModels</code>.</li></ul></li><li><strong>Machine Learning</strong><ul><li><a href="https://github.com/alan-turing-institute/MLJ.jl">MLJ.jl</a>: if you&#39;re more of an applied user, there is a single package that pulls from all these different libraries and provides a single, scikit-learn inspired API: MLJ.jl. MLJ.jl provides a common interface for a wide range of machine learning algorithms.</li><li><a href="https://cstjean.github.io/ScikitLearn.jl/stable/">ScikitLearn.jl</a>: A Julia wrapper around the full Python scikit-learn machine learning library. Not well integrated with DataFrames.jl, but can be combined using StatsModels.jl.</li><li><a href="https://github.com/IBM/AutoMLPipeline.jl">AutoMLPipeline</a>: A package that makes it trivial to create complex ML pipeline structures using simple expressions. It leverages the built-in macro programming features of Julia to symbolically process, manipulate pipeline expressions, and makes it easy to discover optimal structures for machine learning regression and classification.</li><li>Deep learning: <a href="https://denizyuret.github.io/Knet.jl/stable/tutorial/#Introduction-to-Knet-1">KNet.jl</a> and <a href="https://github.com/FluxML/Flux.jl">Flux.jl</a>.</li></ul></li><li><strong>Plotting</strong><ul><li><a href="http://docs.juliaplots.org/latest/">Plots.jl</a>: Powerful, modern plotting library with a syntax akin to that of <a href="https://matplotlib.org/">matplotlib</a> (in Python) or <code>plot</code> (in R). 
<a href="http://docs.juliaplots.org/latest/tutorial/#Using-Plot-Recipes-1">StatsPlots.jl</a> provides Plots.jl with recipes for many standard statistical plots.</li><li><a href="http://gadflyjl.org/stable/">Gadfly.jl</a>: High-level plotting library with a &quot;grammar of graphics&quot; syntax akin to that of <a href="https://ggplot2.tidyverse.org/reference/ggplot.html">ggplot</a> (in R).</li><li><a href="http://juliaplots.org/AlgebraOfGraphics.jl/stable/">AlgebraOfGraphics.jl</a>: A &quot;grammar of graphics&quot; library built upon <a href="https://docs.makie.org/stable/">Makie.jl</a>.</li><li><a href="https://www.queryverse.org/VegaLite.jl/stable/">VegaLite.jl</a>: High-level plotting library that uses a different &quot;grammar of graphics&quot; syntax and has an emphasis on interactive graphics.</li></ul></li><li><strong>Data Wrangling</strong>:<ul><li><a href="https://github.com/invenia/Impute.jl">Impute.jl</a>: various methods for handling missing data in vectors, matrices and tables.</li><li><a href="https://github.com/JuliaData/DataFramesMeta.jl">DataFramesMeta.jl</a>: A range of convenience functions for DataFrames.jl that augment <code>select</code> and <code>transform</code> to provide a user experience similar to that provided by <a href="https://dplyr.tidyverse.org/">dplyr</a> in R.</li><li><a href="https://github.com/jkrumbiegel/DataFrameMacros.jl">DataFrameMacros.jl</a>: Provides macro versions of the common DataFrames.jl functions similar to DataFramesMeta.jl, with convenient syntax for the manipulation of multiple columns at once.</li><li><a href="https://github.com/queryverse/Query.jl">Query.jl</a>: Query.jl provides a single framework for data wrangling that works with a range of libraries, including DataFrames.jl, other tabular data libraries (more on those below), and even non-tabular data. 
Provides many convenience functions analogous to those in dplyr in R or <a href="https://en.wikipedia.org/wiki/Language_Integrated_Query">LINQ</a>.</li><li>You can find more information on these packages in the <a href="man/querying_frameworks/#Data-manipulation-frameworks">Data manipulation frameworks</a> section of this manual.</li></ul></li><li><strong>And More!</strong><ul><li><a href="https://github.com/JuliaGraphs/Graphs.jl">Graphs.jl</a>: A pure-Julia, high performance network analysis library. Edgelists in <code>DataFrame</code>s can be easily converted into graphs using the <a href="https://github.com/JuliaGraphs/GraphDataFrameBridge.jl">GraphDataFrameBridge.jl</a> package.</li></ul></li><li><strong>IO</strong>:<ul><li>DataFrames.jl works well with a range of formats, including:<ul><li>CSV files (using <a href="https://github.com/JuliaData/CSV.jl">CSV.jl</a>),</li><li>Apache Arrow (using <a href="https://github.com/JuliaData/Arrow.jl">Arrow.jl</a>)</li><li>reading Stata, SAS and SPSS files (using <a href="https://github.com/junyuan-chen/ReadStatTables.jl">ReadStatTables.jl</a>; alternatively <a href="https://www.queryverse.org/">Queryverse</a> users can choose <a href="https://github.com/queryverse/StatFiles.jl">StatFiles.jl</a>),</li><li>Parquet files (using <a href="https://gitlab.com/ExpandingMan/Parquet2.jl">Parquet2.jl</a>),</li><li>reading R data files (.rda, .RData) (using <a href="https://github.com/JuliaData/RData.jl">RData.jl</a>).</li></ul></li></ul></li></ul><p>While not all of these libraries are tightly integrated with DataFrames.jl, because <code>DataFrame</code>s are essentially collections of aligned Julia vectors, it is easy to (a) pull out a vector for use with a non-DataFrames-integrated library, or (b) convert your table into a homogeneously-typed matrix using the <code>Matrix</code> constructor or StatsModels.jl.</p><h3 id="Other-Julia-Tabular-Libraries"><a class="docs-heading-anchor" href="#Other-Julia-Tabular-Libraries">Other 
Julia Tabular Libraries</a><a id="Other-Julia-Tabular-Libraries-1"></a><a class="docs-heading-anchor-permalink" href="#Other-Julia-Tabular-Libraries" title="Permalink"></a></h3><p>DataFrames.jl is a great general purpose tool for data manipulation and wrangling, but it&#39;s not ideal for all applications. For users with more specialized needs, consider using:</p><ul><li><a href="https://juliadata.github.io/TypedTables.jl/stable/">TypedTables.jl</a>: Type-stable heterogeneous tables. Useful for improved performance when the structure of your table is relatively stable and does not feature thousands of columns.</li><li><a href="https://juliadata.github.io/JuliaDB.jl/stable/">JuliaDB.jl</a>: For users working with data that is too large to fit in memory, we suggest JuliaDB.jl, which offers better performance for large datasets, and can handle out-of-core data manipulations (Python users can think of JuliaDB.jl as the Julia version of <a href="https://dask.org/">dask</a>).</li></ul><p>Note that most tabular data libraries in the Julia ecosystem (including DataFrames.jl) support a common interface (defined in the <a href="https://github.com/JuliaData/Tables.jl">Tables.jl</a> package). As a result, some libraries are capable of working with a range of tabular data structures, making it easy to move between tabular libraries as your needs change. A user of <a href="https://github.com/queryverse/Query.jl">Query.jl</a>, for example, can use the same code to manipulate data in a <code>DataFrame</code>, a <code>Table</code> (defined by TypedTables.jl), or a JuliaDB table.</p><h2 id="Questions?"><a class="docs-heading-anchor" href="#Questions?">Questions?</a><a id="Questions?-1"></a><a class="docs-heading-anchor-permalink" href="#Questions?" 
title="Permalink"></a></h2><p>If there is something you expect DataFrames to be capable of, but cannot figure out how to do, please reach out with questions in Domains/Data on <a href="https://discourse.julialang.org/new-topic?title=[DataFrames%20Question]:%20&amp;body=%23%20Question:%0A%0A%23%20Dataset%20(if%20applicable):%0A%0A%23%20Minimal%20Working%20Example%20(if%20applicable):%0A&amp;category=Domains/Data&amp;tags=question">Discourse</a>. Additionally you might want to listen to an introduction to DataFrames.jl on <a href="https://juliaacademy.com/p/introduction-to-dataframes-jl">JuliaAcademy</a>.</p><p>Please report bugs by <a href="https://github.com/JuliaData/DataFrames.jl/issues/new">opening an issue</a>.</p><p>You can follow the <strong>source</strong> links throughout the documentation to jump right to the source files on GitHub to make pull requests for improving the documentation and function capabilities.</p><p>Please review <a href="https://github.com/JuliaData/DataFrames.jl/blob/main/CONTRIBUTING.md">DataFrames contributing guidelines</a> before submitting your first PR!</p><p>Information on specific versions can be found on the <a href="https://github.com/JuliaData/DataFrames.jl/releases">Release page</a>.</p><h2 id="Package-Manual"><a class="docs-heading-anchor" href="#Package-Manual">Package Manual</a><a id="Package-Manual-1"></a><a class="docs-heading-anchor-permalink" href="#Package-Manual" title="Permalink"></a></h2><ul><li><a href="man/basics/#First-Steps-with-DataFrames.jl">First Steps with DataFrames.jl</a></li><li class="no-marker"><ul><li><a href="man/basics/#Setting-up-the-Environment">Setting up the Environment</a></li><li><a href="man/basics/#Constructors-and-Basic-Utility-Functions">Constructors and Basic Utility Functions</a></li><li><a href="man/basics/#Getting-and-Setting-Data-in-a-Data-Frame">Getting and Setting Data in a Data Frame</a></li><li><a href="man/basics/#Basic-Usage-of-Transformation-Functions">Basic Usage of 
Transformation Functions</a></li></ul></li><li><a href="man/getting_started/#Getting-Started">Getting Started</a></li><li class="no-marker"><ul><li><a href="man/getting_started/#Installation">Installation</a></li><li><a href="man/getting_started/#The-DataFrame-Type">The <code>DataFrame</code> Type</a></li></ul></li><li><a href="man/joins/#Database-Style-Joins">Database-Style Joins</a></li><li class="no-marker"><ul><li><a href="man/joins/#Introduction-to-joins">Introduction to joins</a></li><li><a href="man/joins/#Key-value-comparisons-and-floating-point-values">Key value comparisons and floating point values</a></li><li><a href="man/joins/#Joining-on-key-columns-with-different-names">Joining on key columns with different names</a></li><li><a href="man/joins/#Handling-of-duplicate-keys-and-tracking-source-data-frame">Handling of duplicate keys and tracking source data frame</a></li><li><a href="man/joins/#Renaming-joined-columns">Renaming joined columns</a></li><li><a href="man/joins/#Matching-missing-values-in-joins">Matching missing values in joins</a></li><li><a href="man/joins/#Specifying-row-order-in-the-join-result">Specifying row order in the join result</a></li><li><a href="man/joins/#In-place-left-join">In-place left join</a></li></ul></li><li><a href="man/split_apply_combine/#The-Split-Apply-Combine-Strategy">The Split-Apply-Combine Strategy</a></li><li class="no-marker"><ul><li><a href="man/split_apply_combine/#Design-of-the-split-apply-combine-support">Design of the split-apply-combine support</a></li><li><a href="man/split_apply_combine/#Examples-of-the-split-apply-combine-operations">Examples of the split-apply-combine operations</a></li><li><a href="man/split_apply_combine/#Using-GroupedDataFrame-as-an-iterable-and-indexable-object">Using <code>GroupedDataFrame</code> as an iterable and indexable object</a></li><li><a href="man/split_apply_combine/#Simulating-the-SQL-where-clause">Simulating the SQL <code>where</code> clause</a></li><li><a 
href="man/split_apply_combine/#Column-independent-operations">Column-independent operations</a></li><li><a href="man/split_apply_combine/#Column-independent-operations-versus-functions">Column-independent operations versus functions</a></li><li><a href="man/split_apply_combine/#Specifying-group-order-in-groupby">Specifying group order in <code>groupby</code></a></li></ul></li><li><a href="man/reshaping_and_pivoting/#Reshaping-and-Pivoting-Data">Reshaping and Pivoting Data</a></li><li><a href="man/sorting/#Sorting">Sorting</a></li><li><a href="man/categorical/#man-categorical">Categorical Data</a></li><li><a href="man/missing/#Missing-Data">Missing Data</a></li><li><a href="man/comparisons/#Comparisons">Comparisons</a></li><li class="no-marker"><ul><li><a href="man/comparisons/#Comparison-with-the-Python-package-pandas">Comparison with the Python package pandas</a></li><li><a href="man/comparisons/#Comparison-with-the-R-package-dplyr">Comparison with the R package dplyr</a></li><li><a href="man/comparisons/#Comparison-with-the-R-package-data.table">Comparison with the R package data.table</a></li><li><a href="man/comparisons/#Comparison-with-Stata-(version-8-and-above)">Comparison with Stata (version 8 and above)</a></li></ul></li><li><a href="man/querying_frameworks/#Data-manipulation-frameworks">Data manipulation frameworks</a></li><li class="no-marker"><ul><li><a href="man/querying_frameworks/#TidierData.jl">TidierData.jl</a></li><li><a href="man/querying_frameworks/#DataFramesMeta.jl">DataFramesMeta.jl</a></li><li><a href="man/querying_frameworks/#DataFrameMacros.jl">DataFrameMacros.jl</a></li><li><a href="man/querying_frameworks/#Query.jl">Query.jl</a></li></ul></li></ul><h2 id="API"><a class="docs-heading-anchor" href="#API">API</a><a id="API-1"></a><a class="docs-heading-anchor-permalink" href="#API" title="Permalink"></a></h2><p>Only exported (i.e. 
available for use without <code>DataFrames.</code> qualifier after loading the DataFrames.jl package with <code>using DataFrames</code>) types and functions are considered a part of the public API of the DataFrames.jl package. In general all such objects are documented in this manual (in case some documentation is missing please kindly report an issue <a href="https://github.com/JuliaData/DataFrames.jl/issues/new">here</a>).</p><div class="admonition is-info"><header class="admonition-header">Note</header><div class="admonition-body"><p>Breaking changes to public and documented API are avoided in DataFrames.jl where possible.</p><p>The following changes are not considered breaking:</p><ul><li>specific floating point values computed by operations may change at any time; users should rely only on approximate accuracy;</li><li>in functions that use the default random number generator provided by Base Julia the specific random numbers computed may change across Julia versions;</li><li>if the changed functionality is classified as a bug;</li><li>if the changed behavior was not documented; two major cases are:<ol><li>in its implementation some function accepted a wider range of arguments than it was documented to handle - changes in handling of undocumented arguments are not considered as breaking;</li><li>the type of the value returned by a function changes, but it still follows the contract specified in the documentation; for example if a function is documented to return a vector then changing its type from <code>Vector</code> to <code>PooledVector</code> is not considered as breaking;</li></ol></li><li>error behavior: code that threw an exception can change exception type thrown or stop throwing an exception;</li><li>changes in display (how objects are printed);</li><li>changes to the state of global objects from Base Julia whose state normally is considered volatile (e.g. 
state of global random number generator).</li></ul><p>All types and functions that are part of public API are guaranteed to go through a deprecation period before a breaking change is made to them or they would be removed.</p><p>The standard practice is that breaking changes are implemented when a major release of DataFrames.jl is made (e.g. functionalities deprecated in a 1.x release would be changed in the 2.0 release).</p><p>In rare cases a breaking change might be introduced in a minor release. In such a case the changed behavior still goes through one minor release during which it is deprecated. The situations where such a breaking change might be allowed are (still such breaking changes will be avoided if possible):</p><ul><li>the affected functionality was previously clearly identified in the documentation as being subject to changes (for example in DataFrames.jl 1.4 release propagation rules of <code>:note</code>-style metadata are documented as such);</li><li>the change is on the border of being classified as a bug (in rare cases even if a behavior of some function was documented its consequences for certain argument combinations could be decided to be unintended and not wanted);</li><li>the change is needed to adjust DataFrames.jl functionality to changes in Base Julia.</li></ul></div></div><p>Please be warned that while Julia allows you to access internal functions or types of DataFrames.jl these can change without warning between versions of DataFrames.jl. In particular it is not safe to directly access fields of types that are a part of public API of the DataFrames.jl package using e.g. the <code>getfield</code> function. 
Whenever some operation on fields of defined types is considered allowed an appropriate exported function should be used instead.</p><ul><li><a href="lib/types/#Types">Types</a></li><li class="no-marker"><ul><li><a href="lib/types/#Type-hierarchy-design">Type hierarchy design</a></li><li><a href="lib/types/#man-columnhandling">The design of handling of columns of a <code>DataFrame</code></a></li><li><a href="lib/types/#Types-specification">Types specification</a></li></ul></li><li><a href="lib/functions/#Functions">Functions</a></li><li class="no-marker"><ul><li><a href="lib/functions/#Multithreading-support">Multithreading support</a></li><li><a href="lib/functions/#Index">Index</a></li><li><a href="lib/functions/#Constructing-data-frames">Constructing data frames</a></li><li><a href="lib/functions/#Summary-information">Summary information</a></li><li><a href="lib/functions/#Working-with-column-names">Working with column names</a></li><li><a href="lib/functions/#Mutating-and-transforming-data-frames-and-grouped-data-frames">Mutating and transforming data frames and grouped data frames</a></li><li><a href="lib/functions/#Reshaping-data-frames-between-tall-and-wide-formats">Reshaping data frames between tall and wide formats</a></li><li><a href="lib/functions/#Sorting">Sorting</a></li><li><a href="lib/functions/#Joining">Joining</a></li><li><a href="lib/functions/#Grouping">Grouping</a></li><li><a href="lib/functions/#Filtering-rows">Filtering rows</a></li><li><a href="lib/functions/#Working-with-missing-values">Working with missing values</a></li><li><a href="lib/functions/#Iteration">Iteration</a></li><li><a href="lib/functions/#Equality">Equality</a></li><li><a href="lib/functions/#Metadata">Metadata</a></li></ul></li><li><a href="lib/indexing/#Indexing">Indexing</a></li><li class="no-marker"><ul><li><a href="lib/indexing/#General-rules">General rules</a></li><li><a href="lib/indexing/#getindex-and-view"><code>getindex</code> and <code>view</code></a></li><li><a 
href="lib/indexing/#setindex!"><code>setindex!</code></a></li><li><a href="lib/indexing/#Broadcasting">Broadcasting</a></li><li><a href="lib/indexing/#Indexing-GroupedDataFrames">Indexing <code>GroupedDataFrame</code>s</a></li></ul></li><li><a href="lib/indexing/#Common-API-for-types-defined-in-DataFrames.jl">Common API for types defined in DataFrames.jl</a></li></ul><h2 id="Index"><a class="docs-heading-anchor" href="#Index">Index</a><a id="Index-1"></a><a class="docs-heading-anchor-permalink" href="#Index" title="Permalink"></a></h2><ul><li><a href="lib/types/#DataFrames.AbstractDataFrame"><code>DataFrames.AbstractDataFrame</code></a></li><li><a href="lib/types/#DataFrames.AsTable"><code>DataFrames.AsTable</code></a></li><li><a href="lib/types/#DataFrames.DataFrame"><code>DataFrames.DataFrame</code></a></li><li><a href="lib/types/#DataFrames.DataFrameColumns"><code>DataFrames.DataFrameColumns</code></a></li><li><a href="lib/types/#DataFrames.DataFrameRow"><code>DataFrames.DataFrameRow</code></a></li><li><a href="lib/types/#DataFrames.DataFrameRows"><code>DataFrames.DataFrameRows</code></a></li><li><a href="lib/types/#DataFrames.GroupKey"><code>DataFrames.GroupKey</code></a></li><li><a href="lib/types/#DataFrames.GroupKeys"><code>DataFrames.GroupKeys</code></a></li><li><a href="lib/types/#DataFrames.GroupedDataFrame"><code>DataFrames.GroupedDataFrame</code></a></li><li><a href="lib/types/#DataFrames.RepeatedVector"><code>DataFrames.RepeatedVector</code></a></li><li><a href="lib/types/#DataFrames.StackedVector"><code>DataFrames.StackedVector</code></a></li><li><a href="lib/types/#DataFrames.SubDataFrame"><code>DataFrames.SubDataFrame</code></a></li><li><a href="lib/functions/#Base.Iterators.only"><code>Base.Iterators.only</code></a></li><li><a href="lib/functions/#Base.Iterators.partition"><code>Base.Iterators.partition</code></a></li><li><a href="lib/functions/#Base.allunique"><code>Base.allunique</code></a></li><li><a 
href="lib/functions/#Base.append!"><code>Base.append!</code></a></li><li><a href="lib/functions/#Base.copy"><code>Base.copy</code></a></li><li><a href="lib/functions/#Base.deleteat!"><code>Base.deleteat!</code></a></li><li><a href="lib/functions/#Base.eachcol"><code>Base.eachcol</code></a></li><li><a href="lib/functions/#Base.eachrow"><code>Base.eachrow</code></a></li><li><a href="lib/functions/#Base.empty"><code>Base.empty</code></a></li><li><a href="lib/functions/#Base.empty!"><code>Base.empty!</code></a></li><li><a href="lib/functions/#Base.filter"><code>Base.filter</code></a></li><li><a href="lib/functions/#Base.filter!"><code>Base.filter!</code></a></li><li><a href="lib/functions/#Base.first"><code>Base.first</code></a></li><li><a href="lib/functions/#Base.get"><code>Base.get</code></a></li><li><a href="lib/functions/#Base.hcat"><code>Base.hcat</code></a></li><li><a href="lib/functions/#Base.insert!"><code>Base.insert!</code></a></li><li><a href="lib/functions/#Base.invpermute!"><code>Base.invpermute!</code></a></li><li><a href="lib/functions/#Base.isapprox"><code>Base.isapprox</code></a></li><li><a href="lib/functions/#Base.isempty"><code>Base.isempty</code></a></li><li><a href="lib/functions/#Base.issorted"><code>Base.issorted</code></a></li><li><a href="lib/functions/#Base.keepat!"><code>Base.keepat!</code></a></li><li><a href="lib/functions/#Base.keys"><code>Base.keys</code></a></li><li><a href="lib/functions/#Base.last"><code>Base.last</code></a></li><li><a href="lib/functions/#Base.length"><code>Base.length</code></a></li><li><a href="lib/functions/#Base.names"><code>Base.names</code></a></li><li><a href="lib/functions/#Base.ndims"><code>Base.ndims</code></a></li><li><a href="lib/functions/#Base.pairs"><code>Base.pairs</code></a></li><li><a href="lib/functions/#Base.parent"><code>Base.parent</code></a></li><li><a href="lib/functions/#Base.permute!"><code>Base.permute!</code></a></li><li><a 
href="lib/functions/#Base.permutedims"><code>Base.permutedims</code></a></li><li><a href="lib/functions/#Base.pop!"><code>Base.pop!</code></a></li><li><a href="lib/functions/#Base.popat!"><code>Base.popat!</code></a></li><li><a href="lib/functions/#Base.popfirst!"><code>Base.popfirst!</code></a></li><li><a href="lib/functions/#Base.prepend!"><code>Base.prepend!</code></a></li><li><a href="lib/functions/#Base.propertynames"><code>Base.propertynames</code></a></li><li><a href="lib/functions/#Base.push!"><code>Base.push!</code></a></li><li><a href="lib/functions/#Base.pushfirst!"><code>Base.pushfirst!</code></a></li><li><a href="lib/functions/#Base.reduce"><code>Base.reduce</code></a></li><li><a href="lib/functions/#Base.repeat"><code>Base.repeat</code></a></li><li><a href="lib/functions/#Base.resize!"><code>Base.resize!</code></a></li><li><a href="lib/functions/#Base.reverse"><code>Base.reverse</code></a></li><li><a href="lib/functions/#Base.reverse!"><code>Base.reverse!</code></a></li><li><a href="lib/functions/#Base.show"><code>Base.show</code></a></li><li><a href="lib/functions/#Base.similar"><code>Base.similar</code></a></li><li><a href="lib/functions/#Base.size"><code>Base.size</code></a></li><li><a href="lib/functions/#Base.sort"><code>Base.sort</code></a></li><li><a href="lib/functions/#Base.sort!"><code>Base.sort!</code></a></li><li><a href="lib/functions/#Base.sortperm"><code>Base.sortperm</code></a></li><li><a href="lib/functions/#Base.stack"><code>Base.stack</code></a></li><li><a href="lib/functions/#Base.unique"><code>Base.unique</code></a></li><li><a href="lib/functions/#Base.unique!"><code>Base.unique!</code></a></li><li><a href="lib/functions/#Base.values"><code>Base.values</code></a></li><li><a href="lib/functions/#Base.vcat"><code>Base.vcat</code></a></li><li><a href="lib/functions/#DataAPI.allcombinations"><code>DataAPI.allcombinations</code></a></li><li><a href="lib/functions/#DataAPI.antijoin"><code>DataAPI.antijoin</code></a></li><li><a 
href="lib/functions/#DataAPI.colmetadata"><code>DataAPI.colmetadata</code></a></li><li><a href="lib/functions/#DataAPI.colmetadata!"><code>DataAPI.colmetadata!</code></a></li><li><a href="lib/functions/#DataAPI.colmetadatakeys"><code>DataAPI.colmetadatakeys</code></a></li><li><a href="lib/functions/#DataAPI.crossjoin"><code>DataAPI.crossjoin</code></a></li><li><a href="lib/functions/#DataAPI.deletecolmetadata!"><code>DataAPI.deletecolmetadata!</code></a></li><li><a href="lib/functions/#DataAPI.deletemetadata!"><code>DataAPI.deletemetadata!</code></a></li><li><a href="lib/functions/#DataAPI.describe"><code>DataAPI.describe</code></a></li><li><a href="lib/functions/#DataAPI.emptycolmetadata!"><code>DataAPI.emptycolmetadata!</code></a></li><li><a href="lib/functions/#DataAPI.emptymetadata!"><code>DataAPI.emptymetadata!</code></a></li><li><a href="lib/functions/#DataAPI.groupby"><code>DataAPI.groupby</code></a></li><li><a href="lib/functions/#DataAPI.innerjoin"><code>DataAPI.innerjoin</code></a></li><li><a href="lib/functions/#DataAPI.leftjoin"><code>DataAPI.leftjoin</code></a></li><li><a href="lib/functions/#DataAPI.metadata"><code>DataAPI.metadata</code></a></li><li><a href="lib/functions/#DataAPI.metadata!"><code>DataAPI.metadata!</code></a></li><li><a href="lib/functions/#DataAPI.metadatakeys"><code>DataAPI.metadatakeys</code></a></li><li><a href="lib/functions/#DataAPI.ncol"><code>DataAPI.ncol</code></a></li><li><a href="lib/functions/#DataAPI.nrow"><code>DataAPI.nrow</code></a></li><li><a href="lib/functions/#DataAPI.outerjoin"><code>DataAPI.outerjoin</code></a></li><li><a href="lib/functions/#DataAPI.rightjoin"><code>DataAPI.rightjoin</code></a></li><li><a href="lib/functions/#DataAPI.rownumber"><code>DataAPI.rownumber</code></a></li><li><a href="lib/functions/#DataAPI.semijoin"><code>DataAPI.semijoin</code></a></li><li><a href="lib/functions/#DataFrames.allowmissing!"><code>DataFrames.allowmissing!</code></a></li><li><a 
href="lib/functions/#DataFrames.combine"><code>DataFrames.combine</code></a></li><li><a href="lib/functions/#DataFrames.completecases"><code>DataFrames.completecases</code></a></li><li><a href="lib/functions/#DataFrames.disallowmissing!"><code>DataFrames.disallowmissing!</code></a></li><li><a href="lib/functions/#DataFrames.dropmissing"><code>DataFrames.dropmissing</code></a></li><li><a href="lib/functions/#DataFrames.dropmissing!"><code>DataFrames.dropmissing!</code></a></li><li><a href="lib/functions/#DataFrames.fillcombinations"><code>DataFrames.fillcombinations</code></a></li><li><a href="lib/functions/#DataFrames.flatten"><code>DataFrames.flatten</code></a></li><li><a href="lib/functions/#DataFrames.groupcols"><code>DataFrames.groupcols</code></a></li><li><a href="lib/functions/#DataFrames.groupindices"><code>DataFrames.groupindices</code></a></li><li><a href="lib/functions/#DataFrames.insertcols"><code>DataFrames.insertcols</code></a></li><li><a href="lib/functions/#DataFrames.insertcols!"><code>DataFrames.insertcols!</code></a></li><li><a href="lib/functions/#DataFrames.leftjoin!"><code>DataFrames.leftjoin!</code></a></li><li><a href="lib/functions/#DataFrames.mapcols"><code>DataFrames.mapcols</code></a></li><li><a href="lib/functions/#DataFrames.mapcols!"><code>DataFrames.mapcols!</code></a></li><li><a href="lib/functions/#DataFrames.nonunique"><code>DataFrames.nonunique</code></a></li><li><a href="lib/functions/#DataFrames.order"><code>DataFrames.order</code></a></li><li><a href="lib/functions/#DataFrames.proprow"><code>DataFrames.proprow</code></a></li><li><a href="lib/functions/#DataFrames.rename"><code>DataFrames.rename</code></a></li><li><a href="lib/functions/#DataFrames.rename!"><code>DataFrames.rename!</code></a></li><li><a href="lib/functions/#DataFrames.repeat!"><code>DataFrames.repeat!</code></a></li><li><a href="lib/functions/#DataFrames.select"><code>DataFrames.select</code></a></li><li><a 
href="lib/functions/#DataFrames.select!"><code>DataFrames.select!</code></a></li><li><a href="lib/functions/#DataFrames.subset"><code>DataFrames.subset</code></a></li><li><a href="lib/functions/#DataFrames.subset!"><code>DataFrames.subset!</code></a></li><li><a href="lib/functions/#DataFrames.table_transformation"><code>DataFrames.table_transformation</code></a></li><li><a href="lib/functions/#DataFrames.transform"><code>DataFrames.transform</code></a></li><li><a href="lib/functions/#DataFrames.transform!"><code>DataFrames.transform!</code></a></li><li><a href="lib/functions/#DataFrames.unstack"><code>DataFrames.unstack</code></a></li><li><a href="lib/functions/#DataFrames.valuecols"><code>DataFrames.valuecols</code></a></li><li><a href="lib/functions/#Missings.allowmissing"><code>Missings.allowmissing</code></a></li><li><a href="lib/functions/#Missings.disallowmissing"><code>Missings.disallowmissing</code></a></li><li><a href="lib/functions/#Random.shuffle"><code>Random.shuffle</code></a></li><li><a href="lib/functions/#Random.shuffle!"><code>Random.shuffle!</code></a></li></ul></article><nav class="docs-footer"><a class="docs-footer-nextpage" href="man/basics/">First Steps with DataFrames.jl »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option 
value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.7.0 on <span class="colophon-date" title="Saturday 7 September 2024 11:00">Saturday 7 September 2024</span>. Using Julia version 1.10.5.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
+<html lang="en"><head><meta charset="UTF-8"/><meta name="viewport" content="width=device-width, initial-scale=1.0"/><title>Introduction · DataFrames.jl</title><meta name="title" content="Introduction · DataFrames.jl"/><meta property="og:title" content="Introduction · DataFrames.jl"/><meta property="twitter:title" content="Introduction · DataFrames.jl"/><meta name="description" content="Documentation for DataFrames.jl."/><meta property="og:description" content="Documentation for DataFrames.jl."/><meta property="twitter:description" content="Documentation for DataFrames.jl."/><meta property="og:url" content="https://juliadata.github.io/DataFrames.jl/stable/"/><meta property="twitter:url" content="https://juliadata.github.io/DataFrames.jl/stable/"/><link rel="canonical" href="https://juliadata.github.io/DataFrames.jl/stable/"/><script data-outdated-warner src="assets/warner.js"></script><link href="https://cdnjs.cloudflare.com/ajax/libs/lato-font/3.0.0/css/lato-font.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/juliamono/0.050/juliamono.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/fontawesome.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/solid.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/brands.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/KaTeX/0.16.8/katex.min.css" rel="stylesheet" type="text/css"/><script>documenterBaseURL="."</script><script src="https://cdnjs.cloudflare.com/ajax/libs/require.js/2.3.6/require.min.js" data-main="assets/documenter.js"></script><script src="search_index.js"></script><script src="siteinfo.js"></script><script src="../versions.js"></script><link class="docs-theme-link" rel="stylesheet" type="text/css" 
href="assets/themes/catppuccin-mocha.css" data-theme-name="catppuccin-mocha"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="assets/themes/catppuccin-macchiato.css" data-theme-name="catppuccin-macchiato"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="assets/themes/catppuccin-frappe.css" data-theme-name="catppuccin-frappe"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="assets/themes/catppuccin-latte.css" data-theme-name="catppuccin-latte"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="assets/themes/documenter-dark.css" data-theme-name="documenter-dark" data-theme-primary-dark/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="assets/themes/documenter-light.css" data-theme-name="documenter-light" data-theme-primary/><script src="assets/themeswap.js"></script><link href="assets/favicon.ico" rel="icon" type="image/x-icon"/></head><body><div id="documenter"><nav class="docs-sidebar"><a class="docs-logo" href><img src="assets/logo.png" alt="DataFrames.jl logo"/></a><div class="docs-package-name"><span class="docs-autofit"><a href>DataFrames.jl</a></span></div><button class="docs-search-query input is-rounded is-small is-clickable my-2 mx-auto py-1 px-2" id="documenter-search-query">Search docs (Ctrl + /)</button><ul class="docs-menu"><li class="is-active"><a class="tocitem" href>Introduction</a><ul class="internal"><li><a class="tocitem" href="#What-is-DataFrames.jl?"><span>What is DataFrames.jl?</span></a></li><li><a class="tocitem" href="#DataFrames.jl-and-the-Julia-Data-Ecosystem"><span>DataFrames.jl and the Julia Data Ecosystem</span></a></li><li><a class="tocitem" href="#Questions?"><span>Questions?</span></a></li><li><a class="tocitem" href="#Package-Manual"><span>Package Manual</span></a></li><li><a class="tocitem" href="#API"><span>API</span></a></li><li><a class="tocitem" href="#Index"><span>Index</span></a></li></ul></li><li><a class="tocitem" 
href="man/basics/">First Steps with DataFrames.jl</a></li><li><span class="tocitem">User Guide</span><ul><li><a class="tocitem" href="man/getting_started/">Getting Started</a></li><li><a class="tocitem" href="man/working_with_dataframes/">Working with DataFrames</a></li><li><a class="tocitem" href="man/importing_and_exporting/">Importing and Exporting Data (I/O)</a></li><li><a class="tocitem" href="man/joins/">Joins</a></li><li><a class="tocitem" href="man/split_apply_combine/">Split-apply-combine</a></li><li><a class="tocitem" href="man/reshaping_and_pivoting/">Reshaping</a></li><li><a class="tocitem" href="man/sorting/">Sorting</a></li><li><a class="tocitem" href="man/categorical/">Categorical Data</a></li><li><a class="tocitem" href="man/missing/">Missing Data</a></li><li><a class="tocitem" href="man/querying_frameworks/">Data manipulation frameworks</a></li><li><a class="tocitem" href="man/comparisons/">Comparison with Python/R/Stata</a></li></ul></li><li><span class="tocitem">API</span><ul><li><a class="tocitem" href="lib/types/">Types</a></li><li><a class="tocitem" href="lib/functions/">Functions</a></li><li><a class="tocitem" href="lib/indexing/">Indexing</a></li><li><a class="tocitem" href="lib/metadata/">Metadata</a></li></ul></li></ul><div class="docs-version-selector field has-addons"><div class="control"><span class="docs-label button is-static is-size-7">Version</span></div><div class="docs-selector control is-expanded"><div class="select is-fullwidth is-size-7"><select id="documenter-version-selector"></select></div></div></div></nav><div class="docs-main"><header class="docs-navbar"><a class="docs-sidebar-button docs-navbar-link fa-solid fa-bars is-hidden-desktop" id="documenter-sidebar-button" href="#"></a><nav class="breadcrumb"><ul class="is-hidden-mobile"><li class="is-active"><a href>Introduction</a></li></ul><ul class="is-hidden-tablet"><li class="is-active"><a href>Introduction</a></li></ul></nav><div class="docs-right"><a 
class="docs-navbar-link" href="https://github.com/JuliaData/DataFrames.jl" title="View the repository on GitHub"><span class="docs-icon fa-brands"></span><span class="docs-label is-hidden-touch">GitHub</span></a><a class="docs-navbar-link" href="https://github.com/JuliaData/DataFrames.jl/blob/main/docs/src/index.md" title="Edit source on GitHub"><span class="docs-icon fa-solid"></span></a><a class="docs-settings-button docs-navbar-link fa-solid fa-gear" id="documenter-settings-button" href="#" title="Settings"></a><a class="docs-article-toggle-button fa-solid fa-chevron-up" id="documenter-article-toggle-button" href="javascript:;" title="Collapse all docstrings"></a></div></header><article class="content" id="documenter-page"><h1 id="DataFrames.jl"><a class="docs-heading-anchor" href="#DataFrames.jl">DataFrames.jl</a><a id="DataFrames.jl-1"></a><a class="docs-heading-anchor-permalink" href="#DataFrames.jl" title="Permalink"></a></h1><p>Welcome to the DataFrames.jl documentation!</p><p>This resource aims to teach you everything you need to know to get up and running with tabular data manipulation using the DataFrames.jl package.</p><p>For more illustrations of DataFrames.jl usage, in particular in conjunction with other packages you can check-out the following resources (they are kept up to date with the released version of DataFrames.jl):</p><ul><li><a href="https://www.jstatsoft.org/article/view/v107i04">DataFrames.jl: Flexible and Fast Tabular Data in Julia</a> article published in the <em>Journal of Statistical Software</em></li><li><a href="https://www.ahsmart.com/pub/data-wrangling-with-data-frames-jl-cheat-sheet/">Data Wrangling with DataFrames.jl Cheat Sheet</a></li><li><a href="https://github.com/bkamins/Julia-DataFrames-Tutorial/">DataFrames Tutorial using Jupyter Notebooks</a></li><li><a href="https://github.com/JuliaAcademy/DataFrames">Julia Academy DataFrames.jl tutorial</a></li><li><a href="https://github.com/bkamins/JuliaCon2023-Tutorial">JuliaCon 
2023</a>, <a href="https://github.com/bkamins/JuliaCon2022-DataFrames-Tutorial">JuliaCon 2022</a>, <a href="https://github.com/bkamins/JuliaCon2021-DataFrames-Tutorial">JuliaCon 2021</a>, <a href="https://github.com/bkamins/JuliaCon2020-DataFrames-Tutorial">JuliaCon 2020</a>, <a href="https://github.com/bkamins/JuliaCon2019-DataFrames-Tutorial">JuliaCon 2019</a>, <a href="https://github.com/bkamins/ODSC-EUROPE-2021">ODSC Europe 2021</a> tutorials, and <a href="https://github.com/bkamins/PyDataGlobal2020">PyData Global 2020</a></li><li><a href="https://github.com/bkamins/DataFrames-Showcase">DataFrames.jl showcase</a></li></ul><p>If you prefer to learn DataFrames.jl from a book you can consider reading:</p><ul><li><a href="https://github.com/bkamins/JuliaForDataAnalysis">Julia for Data Analysis</a>;</li><li><a href="https://juliadatascience.io/">Julia Data Science</a>.</li></ul><h2 id="What-is-DataFrames.jl?"><a class="docs-heading-anchor" href="#What-is-DataFrames.jl?">What is DataFrames.jl?</a><a id="What-is-DataFrames.jl?-1"></a><a class="docs-heading-anchor-permalink" href="#What-is-DataFrames.jl?" title="Permalink"></a></h2><p>DataFrames.jl provides a set of tools for working with tabular data in Julia. Its design and functionality are similar to those of <a href="https://pandas.pydata.org/">pandas</a> (in Python) and <code>data.frame</code>, <a href="https://rdatatable.gitlab.io/data.table/"><code>data.table</code></a> and <a href="https://dplyr.tidyverse.org/">dplyr</a> (in R), making it  a great general purpose data science tool.</p><p>DataFrames.jl plays a central role in the Julia Data ecosystem, and has tight integrations with a range of different libraries. 
DataFrames.jl isn&#39;t the only tool for working with tabular data in Julia – as noted below, there are some other great libraries for certain use-cases – but it provides great data wrangling functionality through a familiar interface.</p><p>To understand the toolchain in more detail, have a look at the tutorials in this manual. New users can start with the <a href="man/basics/#First-Steps-with-DataFrames.jl">First Steps with DataFrames.jl</a> section.</p><p>You may find the <a href="https://juliadata.github.io/DataFramesMeta.jl/stable/">DataFramesMeta.jl</a> package or one of the other convenience packages discussed in the <a href="man/querying_frameworks/#Data-manipulation-frameworks">Data manipulation frameworks</a> section of this manual helpful when writing more advanced data transformations, especially if you do not have a significant programming experience. These packages provide convenience syntax similar to <a href="https://dplyr.tidyverse.org/">dplyr</a> in R.</p><p>If you use metadata when working with DataFrames.jl you might find the <a href="https://github.com/JuliaData/TableMetadataTools.jl">TableMetadataTools.jl</a> package useful. This package defines several convenience functions for performing typical metadata operations.</p><h2 id="DataFrames.jl-and-the-Julia-Data-Ecosystem"><a class="docs-heading-anchor" href="#DataFrames.jl-and-the-Julia-Data-Ecosystem">DataFrames.jl and the Julia Data Ecosystem</a><a id="DataFrames.jl-and-the-Julia-Data-Ecosystem-1"></a><a class="docs-heading-anchor-permalink" href="#DataFrames.jl-and-the-Julia-Data-Ecosystem" title="Permalink"></a></h2><p>The Julia data ecosystem can be a difficult space for new users to navigate, in part because the Julia ecosystem tends to distribute functionality across different libraries more than some other languages. 
Because many people coming to DataFrames.jl are just starting to explore the Julia data ecosystem, below is a list of well-supported libraries that provide different data science tools, along with a few notes about what makes each library special, and how well integrated they are with DataFrames.jl.</p><ul><li><strong>Statistics</strong><ul><li><a href="https://github.com/JuliaStats/StatsKit.jl">StatsKit.jl</a>: A convenience meta-package which loads a set of essential packages for statistics, including those mentioned below in this section and DataFrames.jl itself.</li><li><a href="https://docs.julialang.org/en/v1/stdlib/Statistics/">Statistics</a>: The Julia standard library comes with a wide range of statistics functionality, but to gain access to these functions you must call <code>using Statistics</code>.</li><li><a href="https://docs.julialang.org/en/v1/stdlib/LinearAlgebra/">LinearAlgebra</a>: Like <code>Statistics</code>, many linear algebra features (factorizations, inversions, etc.) live in a library you have to load to use.</li><li><a href="https://docs.julialang.org/en/v1/stdlib/SparseArrays/">SparseArrays</a> are also in the standard library but must be loaded to be used.</li><li><a href="https://github.com/nalimilan/FreqTables.jl">FreqTables.jl</a>: Create frequency tables / cross-tabulations. Tightly integrated with DataFrames.jl.</li><li><a href="https://juliastats.org/HypothesisTests.jl/stable/">HypothesisTests.jl</a>: A range of hypothesis testing tools.</li><li><a href="https://juliastats.org/GLM.jl/stable/manual/">GLM.jl</a>: Tools for estimating linear and generalized linear models. Tightly integrated with DataFrames.jl.</li><li><a href="https://juliastats.org/StatsModels.jl/stable/">StatsModels.jl</a>: For converting heterogeneous <code>DataFrame</code> into homogeneous matrices for use with linear algebra libraries or machine learning applications that don&#39;t directly support <code>DataFrame</code>s. 
Will do things like convert categorical variables into indicators/one-hot-encodings, create interaction terms, etc.</li><li><a href="https://multivariatestatsjl.readthedocs.io/en/stable/index.html">MultivariateStats.jl</a>: linear regression, ridge regression, PCA, component analyses tools. Not well integrated with DataFrames.jl, but easily used in combination with <code>StatsModels</code>.</li></ul></li><li><strong>Machine Learning</strong><ul><li><a href="https://github.com/alan-turing-institute/MLJ.jl">MLJ.jl</a>: if you&#39;re more of an applied user, there is a single package that pulls from all these different libraries and provides a single, scikit-learn inspired API: MLJ.jl. MLJ.jl provides a common interface for a wide range of machine learning algorithms.</li><li><a href="https://cstjean.github.io/ScikitLearn.jl/stable/">ScikitLearn.jl</a>: A Julia wrapper around the full Python scikit-learn machine learning library. Not well integrated with DataFrames.jl, but can be combined using StatsModels.jl.</li><li><a href="https://github.com/IBM/AutoMLPipeline.jl">AutoMLPipeline</a>: A package that makes it trivial to create complex ML pipeline structures using simple expressions. It leverages the built-in macro programming features of Julia to symbolically process and manipulate pipeline expressions, and makes it easy to discover optimal structures for machine learning regression and classification.</li><li>Deep learning: <a href="https://denizyuret.github.io/Knet.jl/stable/tutorial/#Introduction-to-Knet-1">KNet.jl</a> and <a href="https://github.com/FluxML/Flux.jl">Flux.jl</a>.</li></ul></li><li><strong>Plotting</strong><ul><li><a href="http://docs.juliaplots.org/latest/">Plots.jl</a>: Powerful, modern plotting library with a syntax akin to that of <a href="https://matplotlib.org/">matplotlib</a> (in Python) or <code>plot</code> (in R). 
<a href="http://docs.juliaplots.org/latest/tutorial/#Using-Plot-Recipes-1">StatsPlots.jl</a> provides Plots.jl with recipes for many standard statistical plots.</li><li><a href="http://gadflyjl.org/stable/">Gadfly.jl</a>: High-level plotting library with a &quot;grammar of graphics&quot; syntax akin to that of <a href="https://ggplot2.tidyverse.org/reference/ggplot.html">ggplot</a> (in R).</li><li><a href="http://juliaplots.org/AlgebraOfGraphics.jl/stable/">AlgebraOfGraphics.jl</a>: A &quot;grammar of graphics&quot; library built upon <a href="https://docs.makie.org/stable/">Makie.jl</a>.</li><li><a href="https://www.queryverse.org/VegaLite.jl/stable/">VegaLite.jl</a>: High-level plotting library that uses a different &quot;grammar of graphics&quot; syntax and has an emphasis on interactive graphics.</li></ul></li><li><strong>Data Wrangling</strong>:<ul><li><a href="https://github.com/invenia/Impute.jl">Impute.jl</a>: various methods for handling missing data in vectors, matrices and tables.</li><li><a href="https://github.com/JuliaData/DataFramesMeta.jl">DataFramesMeta.jl</a>: A range of convenience functions for DataFrames.jl that augment <code>select</code> and <code>transform</code> to provide a user experience similar to that provided by <a href="https://dplyr.tidyverse.org/">dplyr</a> in R.</li><li><a href="https://github.com/jkrumbiegel/DataFrameMacros.jl">DataFrameMacros.jl</a>: Provides macro versions of the common DataFrames.jl functions similar to DataFramesMeta.jl, with convenient syntax for the manipulation of multiple columns at once.</li><li><a href="https://github.com/queryverse/Query.jl">Query.jl</a>: Query.jl provides a single framework for data wrangling that works with a range of libraries, including DataFrames.jl, other tabular data libraries (more on those below), and even non-tabular data. 
Provides many convenience functions analogous to those in dplyr in R or <a href="https://en.wikipedia.org/wiki/Language_Integrated_Query">LINQ</a>.</li><li>You can find more information on these packages in the <a href="man/querying_frameworks/#Data-manipulation-frameworks">Data manipulation frameworks</a> section of this manual.</li></ul></li><li><strong>And More!</strong><ul><li><a href="https://github.com/JuliaGraphs/Graphs.jl">Graphs.jl</a>: A pure-Julia, high performance network analysis library. Edgelists in <code>DataFrame</code>s can be easily converted into graphs using the <a href="https://github.com/JuliaGraphs/GraphDataFrameBridge.jl">GraphDataFrameBridge.jl</a> package.</li></ul></li><li><strong>IO</strong>:<ul><li>DataFrames.jl works well with a range of formats, including:<ul><li>CSV files (using <a href="https://github.com/JuliaData/CSV.jl">CSV.jl</a>),</li><li>Apache Arrow (using <a href="https://github.com/JuliaData/Arrow.jl">Arrow.jl</a>)</li><li>reading Stata, SAS and SPSS files (using <a href="https://github.com/junyuan-chen/ReadStatTables.jl">ReadStatTables.jl</a>; alternatively <a href="https://www.queryverse.org/">Queryverse</a> users can choose <a href="https://github.com/queryverse/StatFiles.jl">StatFiles.jl</a>),</li><li>Parquet files (using <a href="https://gitlab.com/ExpandingMan/Parquet2.jl">Parquet2.jl</a>),</li><li>reading R data files (.rda, .RData) (using <a href="https://github.com/JuliaData/RData.jl">RData.jl</a>).</li></ul></li></ul></li></ul><p>While not all of these libraries are tightly integrated with DataFrames.jl, because <code>DataFrame</code>s are essentially collections of aligned Julia vectors, it is easy to (a) pull out a vector for use with a non-DataFrames-integrated library, or (b) convert your table into a homogeneously-typed matrix using the <code>Matrix</code> constructor or StatsModels.jl.</p><h3 id="Other-Julia-Tabular-Libraries"><a class="docs-heading-anchor" href="#Other-Julia-Tabular-Libraries">Other 
Julia Tabular Libraries</a><a id="Other-Julia-Tabular-Libraries-1"></a><a class="docs-heading-anchor-permalink" href="#Other-Julia-Tabular-Libraries" title="Permalink"></a></h3><p>DataFrames.jl is a great general purpose tool for data manipulation and wrangling, but it&#39;s not ideal for all applications. For users with more specialized needs, consider using:</p><ul><li><a href="https://juliadata.github.io/TypedTables.jl/stable/">TypedTables.jl</a>: Type-stable heterogeneous tables. Useful for improved performance when the structure of your table is relatively stable and does not feature thousands of columns.</li><li><a href="https://juliadata.github.io/JuliaDB.jl/stable/">JuliaDB.jl</a>: For users working with data that is too large to fit in memory, we suggest JuliaDB.jl, which offers better performance for large datasets, and can handle out-of-core data manipulations (Python users can think of JuliaDB.jl as the Julia version of <a href="https://dask.org/">dask</a>).</li></ul><p>Note that most tabular data libraries in the Julia ecosystem (including DataFrames.jl) support a common interface (defined in the <a href="https://github.com/JuliaData/Tables.jl">Tables.jl</a> package). As a result, some libraries are capable of working with a range of tabular data structures, making it easy to move between tabular libraries as your needs change. A user of <a href="https://github.com/queryverse/Query.jl">Query.jl</a>, for example, can use the same code to manipulate data in a <code>DataFrame</code>, a <code>Table</code> (defined by TypedTables.jl), or a JuliaDB table.</p><h2 id="Questions?"><a class="docs-heading-anchor" href="#Questions?">Questions?</a><a id="Questions?-1"></a><a class="docs-heading-anchor-permalink" href="#Questions?" 
title="Permalink"></a></h2><p>If there is something you expect DataFrames to be capable of, but cannot figure out how to do, please reach out with questions in Domains/Data on <a href="https://discourse.julialang.org/new-topic?title=[DataFrames%20Question]:%20&amp;body=%23%20Question:%0A%0A%23%20Dataset%20(if%20applicable):%0A%0A%23%20Minimal%20Working%20Example%20(if%20applicable):%0A&amp;category=Domains/Data&amp;tags=question">Discourse</a>. Additionally you might want to listen to an introduction to DataFrames.jl on <a href="https://juliaacademy.com/p/introduction-to-dataframes-jl">JuliaAcademy</a>.</p><p>Please report bugs by <a href="https://github.com/JuliaData/DataFrames.jl/issues/new">opening an issue</a>.</p><p>You can follow the <strong>source</strong> links throughout the documentation to jump right to the source files on GitHub to make pull requests for improving the documentation and function capabilities.</p><p>Please review <a href="https://github.com/JuliaData/DataFrames.jl/blob/main/CONTRIBUTING.md">DataFrames contributing guidelines</a> before submitting your first PR!</p><p>Information on specific versions can be found on the <a href="https://github.com/JuliaData/DataFrames.jl/releases">Release page</a>.</p><h2 id="Package-Manual"><a class="docs-heading-anchor" href="#Package-Manual">Package Manual</a><a id="Package-Manual-1"></a><a class="docs-heading-anchor-permalink" href="#Package-Manual" title="Permalink"></a></h2><ul><li><a href="man/basics/#First-Steps-with-DataFrames.jl">First Steps with DataFrames.jl</a></li><li class="no-marker"><ul><li><a href="man/basics/#Setting-up-the-Environment">Setting up the Environment</a></li><li><a href="man/basics/#Constructors-and-Basic-Utility-Functions">Constructors and Basic Utility Functions</a></li><li><a href="man/basics/#Getting-and-Setting-Data-in-a-Data-Frame">Getting and Setting Data in a Data Frame</a></li><li><a href="man/basics/#Basic-Usage-of-Transformation-Functions">Basic Usage of 
Transformation Functions</a></li></ul></li><li><a href="man/getting_started/#Getting-Started">Getting Started</a></li><li class="no-marker"><ul><li><a href="man/getting_started/#Installation">Installation</a></li><li><a href="man/getting_started/#The-DataFrame-Type">The <code>DataFrame</code> Type</a></li></ul></li><li><a href="man/joins/#Database-Style-Joins">Database-Style Joins</a></li><li class="no-marker"><ul><li><a href="man/joins/#Introduction-to-joins">Introduction to joins</a></li><li><a href="man/joins/#Key-value-comparisons-and-floating-point-values">Key value comparisons and floating point values</a></li><li><a href="man/joins/#Joining-on-key-columns-with-different-names">Joining on key columns with different names</a></li><li><a href="man/joins/#Handling-of-duplicate-keys-and-tracking-source-data-frame">Handling of duplicate keys and tracking source data frame</a></li><li><a href="man/joins/#Renaming-joined-columns">Renaming joined columns</a></li><li><a href="man/joins/#Matching-missing-values-in-joins">Matching missing values in joins</a></li><li><a href="man/joins/#Specifying-row-order-in-the-join-result">Specifying row order in the join result</a></li><li><a href="man/joins/#In-place-left-join">In-place left join</a></li></ul></li><li><a href="man/split_apply_combine/#The-Split-Apply-Combine-Strategy">The Split-Apply-Combine Strategy</a></li><li class="no-marker"><ul><li><a href="man/split_apply_combine/#Design-of-the-split-apply-combine-support">Design of the split-apply-combine support</a></li><li><a href="man/split_apply_combine/#Examples-of-the-split-apply-combine-operations">Examples of the split-apply-combine operations</a></li><li><a href="man/split_apply_combine/#Using-GroupedDataFrame-as-an-iterable-and-indexable-object">Using <code>GroupedDataFrame</code> as an iterable and indexable object</a></li><li><a href="man/split_apply_combine/#Simulating-the-SQL-where-clause">Simulating the SQL <code>where</code> clause</a></li><li><a 
href="man/split_apply_combine/#Column-independent-operations">Column-independent operations</a></li><li><a href="man/split_apply_combine/#Column-independent-operations-versus-functions">Column-independent operations versus functions</a></li><li><a href="man/split_apply_combine/#Specifying-group-order-in-groupby">Specifying group order in <code>groupby</code></a></li></ul></li><li><a href="man/reshaping_and_pivoting/#Reshaping-and-Pivoting-Data">Reshaping and Pivoting Data</a></li><li><a href="man/sorting/#Sorting">Sorting</a></li><li><a href="man/categorical/#man-categorical">Categorical Data</a></li><li><a href="man/missing/#Missing-Data">Missing Data</a></li><li><a href="man/comparisons/#Comparisons">Comparisons</a></li><li class="no-marker"><ul><li><a href="man/comparisons/#Comparison-with-the-Python-package-pandas">Comparison with the Python package pandas</a></li><li><a href="man/comparisons/#Comparison-with-the-R-package-dplyr">Comparison with the R package dplyr</a></li><li><a href="man/comparisons/#Comparison-with-the-R-package-data.table">Comparison with the R package data.table</a></li><li><a href="man/comparisons/#Comparison-with-Stata-(version-8-and-above)">Comparison with Stata (version 8 and above)</a></li></ul></li><li><a href="man/querying_frameworks/#Data-manipulation-frameworks">Data manipulation frameworks</a></li><li class="no-marker"><ul><li><a href="man/querying_frameworks/#TidierData.jl">TidierData.jl</a></li><li><a href="man/querying_frameworks/#DataFramesMeta.jl">DataFramesMeta.jl</a></li><li><a href="man/querying_frameworks/#DataFrameMacros.jl">DataFrameMacros.jl</a></li><li><a href="man/querying_frameworks/#Query.jl">Query.jl</a></li></ul></li></ul><h2 id="API"><a class="docs-heading-anchor" href="#API">API</a><a id="API-1"></a><a class="docs-heading-anchor-permalink" href="#API" title="Permalink"></a></h2><p>Only exported (i.e. 
available for use without <code>DataFrames.</code> qualifier after loading the DataFrames.jl package with <code>using DataFrames</code>) types and functions are considered a part of the public API of the DataFrames.jl package. In general all such objects are documented in this manual (in case some documentation is missing please kindly report an issue <a href="https://github.com/JuliaData/DataFrames.jl/issues/new">here</a>).</p><div class="admonition is-info"><header class="admonition-header">Note</header><div class="admonition-body"><p>Breaking changes to public and documented API are avoided in DataFrames.jl where possible.</p><p>The following changes are not considered breaking:</p><ul><li>specific floating point values computed by operations may change at any time; users should rely only on approximate accuracy;</li><li>in functions that use the default random number generator provided by Base Julia the specific random numbers computed may change across Julia versions;</li><li>if the changed functionality is classified as a bug;</li><li>if the changed behavior was not documented; two major cases are:<ol><li>in its implementation some function accepted a wider range of arguments than it was documented to handle - changes in handling of undocumented arguments are not considered as breaking;</li><li>the type of the value returned by a function changes, but it still follows the contract specified in the documentation; for example if a function is documented to return a vector then changing its type from <code>Vector</code> to <code>PooledVector</code> is not considered as breaking;</li></ol></li><li>error behavior: code that threw an exception can change exception type thrown or stop throwing an exception;</li><li>changes in display (how objects are printed);</li><li>changes to the state of global objects from Base Julia whose state normally is considered volatile (e.g. 
state of global random number generator).</li></ul><p>All types and functions that are part of public API are guaranteed to go through a deprecation period before a breaking change is made to them or they are removed.</p><p>The standard practice is that breaking changes are implemented when a major release of DataFrames.jl is made (e.g. functionalities deprecated in a 1.x release would be changed in the 2.0 release).</p><p>In rare cases a breaking change might be introduced in a minor release. In such a case the changed behavior still goes through one minor release during which it is deprecated. The situations where such a breaking change might be allowed are (still such breaking changes will be avoided if possible):</p><ul><li>the affected functionality was previously clearly identified in the documentation as being subject to changes (for example in DataFrames.jl 1.4 release propagation rules of <code>:note</code>-style metadata are documented as such);</li><li>the change is on the border of being classified as a bug (in rare cases even if a behavior of some function was documented its consequences for certain argument combinations could be decided to be unintended and not wanted);</li><li>the change is needed to adjust DataFrames.jl functionality to changes in Base Julia.</li></ul></div></div><p>Please be warned that while Julia allows you to access internal functions or types of DataFrames.jl these can change without warning between versions of DataFrames.jl. In particular it is not safe to directly access fields of types that are a part of public API of the DataFrames.jl package using e.g. the <code>getfield</code> function. 
Whenever some operation on fields of defined types is considered allowed an appropriate exported function should be used instead.</p><ul><li><a href="lib/types/#Types">Types</a></li><li class="no-marker"><ul><li><a href="lib/types/#Type-hierarchy-design">Type hierarchy design</a></li><li><a href="lib/types/#man-columnhandling">The design of handling of columns of a <code>DataFrame</code></a></li><li><a href="lib/types/#Types-specification">Types specification</a></li></ul></li><li><a href="lib/functions/#Functions">Functions</a></li><li class="no-marker"><ul><li><a href="lib/functions/#Multithreading-support">Multithreading support</a></li><li><a href="lib/functions/#Index">Index</a></li><li><a href="lib/functions/#Constructing-data-frames">Constructing data frames</a></li><li><a href="lib/functions/#Summary-information">Summary information</a></li><li><a href="lib/functions/#Working-with-column-names">Working with column names</a></li><li><a href="lib/functions/#Mutating-and-transforming-data-frames-and-grouped-data-frames">Mutating and transforming data frames and grouped data frames</a></li><li><a href="lib/functions/#Reshaping-data-frames-between-tall-and-wide-formats">Reshaping data frames between tall and wide formats</a></li><li><a href="lib/functions/#Sorting">Sorting</a></li><li><a href="lib/functions/#Joining">Joining</a></li><li><a href="lib/functions/#Grouping">Grouping</a></li><li><a href="lib/functions/#Filtering-rows">Filtering rows</a></li><li><a href="lib/functions/#Working-with-missing-values">Working with missing values</a></li><li><a href="lib/functions/#Iteration">Iteration</a></li><li><a href="lib/functions/#Equality">Equality</a></li><li><a href="lib/functions/#Metadata">Metadata</a></li></ul></li><li><a href="lib/indexing/#Indexing">Indexing</a></li><li class="no-marker"><ul><li><a href="lib/indexing/#General-rules">General rules</a></li><li><a href="lib/indexing/#getindex-and-view"><code>getindex</code> and <code>view</code></a></li><li><a 
href="lib/indexing/#setindex!"><code>setindex!</code></a></li><li><a href="lib/indexing/#Broadcasting">Broadcasting</a></li><li><a href="lib/indexing/#Indexing-GroupedDataFrames">Indexing <code>GroupedDataFrame</code>s</a></li></ul></li><li><a href="lib/indexing/#Common-API-for-types-defined-in-DataFrames.jl">Common API for types defined in DataFrames.jl</a></li></ul><h2 id="Index"><a class="docs-heading-anchor" href="#Index">Index</a><a id="Index-1"></a><a class="docs-heading-anchor-permalink" href="#Index" title="Permalink"></a></h2><ul><li><a href="lib/types/#DataFrames.AbstractDataFrame"><code>DataFrames.AbstractDataFrame</code></a></li><li><a href="lib/types/#DataFrames.AsTable"><code>DataFrames.AsTable</code></a></li><li><a href="lib/types/#DataFrames.DataFrame"><code>DataFrames.DataFrame</code></a></li><li><a href="lib/types/#DataFrames.DataFrameColumns"><code>DataFrames.DataFrameColumns</code></a></li><li><a href="lib/types/#DataFrames.DataFrameRow"><code>DataFrames.DataFrameRow</code></a></li><li><a href="lib/types/#DataFrames.DataFrameRows"><code>DataFrames.DataFrameRows</code></a></li><li><a href="lib/types/#DataFrames.GroupKey"><code>DataFrames.GroupKey</code></a></li><li><a href="lib/types/#DataFrames.GroupKeys"><code>DataFrames.GroupKeys</code></a></li><li><a href="lib/types/#DataFrames.GroupedDataFrame"><code>DataFrames.GroupedDataFrame</code></a></li><li><a href="lib/types/#DataFrames.RepeatedVector"><code>DataFrames.RepeatedVector</code></a></li><li><a href="lib/types/#DataFrames.StackedVector"><code>DataFrames.StackedVector</code></a></li><li><a href="lib/types/#DataFrames.SubDataFrame"><code>DataFrames.SubDataFrame</code></a></li><li><a href="lib/functions/#Base.Iterators.only"><code>Base.Iterators.only</code></a></li><li><a href="lib/functions/#Base.Iterators.partition"><code>Base.Iterators.partition</code></a></li><li><a href="lib/functions/#Base.allunique"><code>Base.allunique</code></a></li><li><a 
href="lib/functions/#Base.append!"><code>Base.append!</code></a></li><li><a href="lib/functions/#Base.copy"><code>Base.copy</code></a></li><li><a href="lib/functions/#Base.deleteat!"><code>Base.deleteat!</code></a></li><li><a href="lib/functions/#Base.eachcol"><code>Base.eachcol</code></a></li><li><a href="lib/functions/#Base.eachrow"><code>Base.eachrow</code></a></li><li><a href="lib/functions/#Base.empty"><code>Base.empty</code></a></li><li><a href="lib/functions/#Base.empty!"><code>Base.empty!</code></a></li><li><a href="lib/functions/#Base.filter"><code>Base.filter</code></a></li><li><a href="lib/functions/#Base.filter!"><code>Base.filter!</code></a></li><li><a href="lib/functions/#Base.first"><code>Base.first</code></a></li><li><a href="lib/functions/#Base.get"><code>Base.get</code></a></li><li><a href="lib/functions/#Base.hcat"><code>Base.hcat</code></a></li><li><a href="lib/functions/#Base.insert!"><code>Base.insert!</code></a></li><li><a href="lib/functions/#Base.invpermute!"><code>Base.invpermute!</code></a></li><li><a href="lib/functions/#Base.isapprox"><code>Base.isapprox</code></a></li><li><a href="lib/functions/#Base.isempty"><code>Base.isempty</code></a></li><li><a href="lib/functions/#Base.issorted"><code>Base.issorted</code></a></li><li><a href="lib/functions/#Base.keepat!"><code>Base.keepat!</code></a></li><li><a href="lib/functions/#Base.keys"><code>Base.keys</code></a></li><li><a href="lib/functions/#Base.last"><code>Base.last</code></a></li><li><a href="lib/functions/#Base.length"><code>Base.length</code></a></li><li><a href="lib/functions/#Base.names"><code>Base.names</code></a></li><li><a href="lib/functions/#Base.ndims"><code>Base.ndims</code></a></li><li><a href="lib/functions/#Base.pairs"><code>Base.pairs</code></a></li><li><a href="lib/functions/#Base.parent"><code>Base.parent</code></a></li><li><a href="lib/functions/#Base.permute!"><code>Base.permute!</code></a></li><li><a 
href="lib/functions/#Base.permutedims"><code>Base.permutedims</code></a></li><li><a href="lib/functions/#Base.pop!"><code>Base.pop!</code></a></li><li><a href="lib/functions/#Base.popat!"><code>Base.popat!</code></a></li><li><a href="lib/functions/#Base.popfirst!"><code>Base.popfirst!</code></a></li><li><a href="lib/functions/#Base.prepend!"><code>Base.prepend!</code></a></li><li><a href="lib/functions/#Base.propertynames"><code>Base.propertynames</code></a></li><li><a href="lib/functions/#Base.push!"><code>Base.push!</code></a></li><li><a href="lib/functions/#Base.pushfirst!"><code>Base.pushfirst!</code></a></li><li><a href="lib/functions/#Base.reduce"><code>Base.reduce</code></a></li><li><a href="lib/functions/#Base.repeat"><code>Base.repeat</code></a></li><li><a href="lib/functions/#Base.resize!"><code>Base.resize!</code></a></li><li><a href="lib/functions/#Base.reverse"><code>Base.reverse</code></a></li><li><a href="lib/functions/#Base.reverse!"><code>Base.reverse!</code></a></li><li><a href="lib/functions/#Base.show"><code>Base.show</code></a></li><li><a href="lib/functions/#Base.similar"><code>Base.similar</code></a></li><li><a href="lib/functions/#Base.size"><code>Base.size</code></a></li><li><a href="lib/functions/#Base.sort"><code>Base.sort</code></a></li><li><a href="lib/functions/#Base.sort!"><code>Base.sort!</code></a></li><li><a href="lib/functions/#Base.sortperm"><code>Base.sortperm</code></a></li><li><a href="lib/functions/#Base.stack"><code>Base.stack</code></a></li><li><a href="lib/functions/#Base.unique"><code>Base.unique</code></a></li><li><a href="lib/functions/#Base.unique!"><code>Base.unique!</code></a></li><li><a href="lib/functions/#Base.values"><code>Base.values</code></a></li><li><a href="lib/functions/#Base.vcat"><code>Base.vcat</code></a></li><li><a href="lib/functions/#DataAPI.allcombinations"><code>DataAPI.allcombinations</code></a></li><li><a href="lib/functions/#DataAPI.antijoin"><code>DataAPI.antijoin</code></a></li><li><a 
href="lib/functions/#DataAPI.colmetadata"><code>DataAPI.colmetadata</code></a></li><li><a href="lib/functions/#DataAPI.colmetadata!"><code>DataAPI.colmetadata!</code></a></li><li><a href="lib/functions/#DataAPI.colmetadatakeys"><code>DataAPI.colmetadatakeys</code></a></li><li><a href="lib/functions/#DataAPI.crossjoin"><code>DataAPI.crossjoin</code></a></li><li><a href="lib/functions/#DataAPI.deletecolmetadata!"><code>DataAPI.deletecolmetadata!</code></a></li><li><a href="lib/functions/#DataAPI.deletemetadata!"><code>DataAPI.deletemetadata!</code></a></li><li><a href="lib/functions/#DataAPI.describe"><code>DataAPI.describe</code></a></li><li><a href="lib/functions/#DataAPI.emptycolmetadata!"><code>DataAPI.emptycolmetadata!</code></a></li><li><a href="lib/functions/#DataAPI.emptymetadata!"><code>DataAPI.emptymetadata!</code></a></li><li><a href="lib/functions/#DataAPI.groupby"><code>DataAPI.groupby</code></a></li><li><a href="lib/functions/#DataAPI.innerjoin"><code>DataAPI.innerjoin</code></a></li><li><a href="lib/functions/#DataAPI.leftjoin"><code>DataAPI.leftjoin</code></a></li><li><a href="lib/functions/#DataAPI.metadata"><code>DataAPI.metadata</code></a></li><li><a href="lib/functions/#DataAPI.metadata!"><code>DataAPI.metadata!</code></a></li><li><a href="lib/functions/#DataAPI.metadatakeys"><code>DataAPI.metadatakeys</code></a></li><li><a href="lib/functions/#DataAPI.ncol"><code>DataAPI.ncol</code></a></li><li><a href="lib/functions/#DataAPI.nrow"><code>DataAPI.nrow</code></a></li><li><a href="lib/functions/#DataAPI.outerjoin"><code>DataAPI.outerjoin</code></a></li><li><a href="lib/functions/#DataAPI.rightjoin"><code>DataAPI.rightjoin</code></a></li><li><a href="lib/functions/#DataAPI.rownumber"><code>DataAPI.rownumber</code></a></li><li><a href="lib/functions/#DataAPI.semijoin"><code>DataAPI.semijoin</code></a></li><li><a href="lib/functions/#DataFrames.allowmissing!"><code>DataFrames.allowmissing!</code></a></li><li><a 
href="lib/functions/#DataFrames.combine"><code>DataFrames.combine</code></a></li><li><a href="lib/functions/#DataFrames.completecases"><code>DataFrames.completecases</code></a></li><li><a href="lib/functions/#DataFrames.disallowmissing!"><code>DataFrames.disallowmissing!</code></a></li><li><a href="lib/functions/#DataFrames.dropmissing"><code>DataFrames.dropmissing</code></a></li><li><a href="lib/functions/#DataFrames.dropmissing!"><code>DataFrames.dropmissing!</code></a></li><li><a href="lib/functions/#DataFrames.fillcombinations"><code>DataFrames.fillcombinations</code></a></li><li><a href="lib/functions/#DataFrames.flatten"><code>DataFrames.flatten</code></a></li><li><a href="lib/functions/#DataFrames.groupcols"><code>DataFrames.groupcols</code></a></li><li><a href="lib/functions/#DataFrames.groupindices"><code>DataFrames.groupindices</code></a></li><li><a href="lib/functions/#DataFrames.insertcols"><code>DataFrames.insertcols</code></a></li><li><a href="lib/functions/#DataFrames.insertcols!"><code>DataFrames.insertcols!</code></a></li><li><a href="lib/functions/#DataFrames.leftjoin!"><code>DataFrames.leftjoin!</code></a></li><li><a href="lib/functions/#DataFrames.mapcols"><code>DataFrames.mapcols</code></a></li><li><a href="lib/functions/#DataFrames.mapcols!"><code>DataFrames.mapcols!</code></a></li><li><a href="lib/functions/#DataFrames.nonunique"><code>DataFrames.nonunique</code></a></li><li><a href="lib/functions/#DataFrames.order"><code>DataFrames.order</code></a></li><li><a href="lib/functions/#DataFrames.proprow"><code>DataFrames.proprow</code></a></li><li><a href="lib/functions/#DataFrames.rename"><code>DataFrames.rename</code></a></li><li><a href="lib/functions/#DataFrames.rename!"><code>DataFrames.rename!</code></a></li><li><a href="lib/functions/#DataFrames.repeat!"><code>DataFrames.repeat!</code></a></li><li><a href="lib/functions/#DataFrames.select"><code>DataFrames.select</code></a></li><li><a 
href="lib/functions/#DataFrames.select!"><code>DataFrames.select!</code></a></li><li><a href="lib/functions/#DataFrames.subset"><code>DataFrames.subset</code></a></li><li><a href="lib/functions/#DataFrames.subset!"><code>DataFrames.subset!</code></a></li><li><a href="lib/functions/#DataFrames.table_transformation"><code>DataFrames.table_transformation</code></a></li><li><a href="lib/functions/#DataFrames.transform"><code>DataFrames.transform</code></a></li><li><a href="lib/functions/#DataFrames.transform!"><code>DataFrames.transform!</code></a></li><li><a href="lib/functions/#DataFrames.unstack"><code>DataFrames.unstack</code></a></li><li><a href="lib/functions/#DataFrames.valuecols"><code>DataFrames.valuecols</code></a></li><li><a href="lib/functions/#Missings.allowmissing"><code>Missings.allowmissing</code></a></li><li><a href="lib/functions/#Missings.disallowmissing"><code>Missings.disallowmissing</code></a></li><li><a href="lib/functions/#Random.shuffle"><code>Random.shuffle</code></a></li><li><a href="lib/functions/#Random.shuffle!"><code>Random.shuffle!</code></a></li></ul></article><nav class="docs-footer"><a class="docs-footer-nextpage" href="man/basics/">First Steps with DataFrames.jl »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option 
value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.7.0 on <span class="colophon-date" title="Sunday 8 September 2024 08:54">Sunday 8 September 2024</span>. Using Julia version 1.10.5.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
diff --git a/dev/lib/functions/index.html b/dev/lib/functions/index.html
index 916d950d4..2aef46abc 100644
--- a/dev/lib/functions/index.html
+++ b/dev/lib/functions/index.html
@@ -22,7 +22,7 @@
    3 │     1  b     const
    4 │     2  b     const
    5 │     1  c     const
-   6 │     2  c     const</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/dataframe/dataframe.jl#L1480-L1526">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.copy" href="#Base.copy"><code>Base.copy</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">copy(df::DataFrame; copycols::Bool=true)</code></pre><p>Copy data frame <code>df</code>. If <code>copycols=true</code> (the default), return a new  <code>DataFrame</code> holding copies of column vectors in <code>df</code>. If <code>copycols=false</code>, return a new <code>DataFrame</code> sharing column vectors with <code>df</code>.</p><p>Metadata: this function preserves all table-level and column-level metadata.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/dataframe/dataframe.jl#L795-L804">source</a></section><section><div><pre><code class="language-julia hljs">copy(dfr::DataFrameRow)</code></pre><p>Construct a <code>NamedTuple</code> with the same contents as the <a href="../types/#DataFrames.DataFrameRow"><code>DataFrameRow</code></a>. 
This method returns a <code>NamedTuple</code> so that the returned object is not affected by changes to the parent data frame of which <code>dfr</code> is a view.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/dataframerow/dataframerow.jl#L433-L440">source</a></section><section><div><pre><code class="language-julia hljs">copy(key::GroupKey)</code></pre><p>Construct a <code>NamedTuple</code> with the same contents as the <a href="../types/#DataFrames.GroupKey"><code>GroupKey</code></a>.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/groupeddataframe/groupeddataframe.jl#L740-L744">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.similar" href="#Base.similar"><code>Base.similar</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">similar(df::AbstractDataFrame, rows::Integer=nrow(df))</code></pre><p>Create a new <code>DataFrame</code> with the same column names and column element types as <code>df</code>. 
An optional second argument can be provided to request a number of rows that is different than the number of rows present in <code>df</code>.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/abstractdataframe.jl#L464-L472">source</a></section></article><h2 id="Summary-information"><a class="docs-heading-anchor" href="#Summary-information">Summary information</a><a id="Summary-information-1"></a><a class="docs-heading-anchor-permalink" href="#Summary-information" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataAPI.describe" href="#DataAPI.describe"><code>DataAPI.describe</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">describe(df::AbstractDataFrame; cols=:)
+   6 │     2  c     const</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/dataframe/dataframe.jl#L1480-L1526">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.copy" href="#Base.copy"><code>Base.copy</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">copy(df::DataFrame; copycols::Bool=true)</code></pre><p>Copy data frame <code>df</code>. If <code>copycols=true</code> (the default), return a new  <code>DataFrame</code> holding copies of column vectors in <code>df</code>. If <code>copycols=false</code>, return a new <code>DataFrame</code> sharing column vectors with <code>df</code>.</p><p>Metadata: this function preserves all table-level and column-level metadata.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/dataframe/dataframe.jl#L795-L804">source</a></section><section><div><pre><code class="language-julia hljs">copy(dfr::DataFrameRow)</code></pre><p>Construct a <code>NamedTuple</code> with the same contents as the <a href="../types/#DataFrames.DataFrameRow"><code>DataFrameRow</code></a>. 
This method returns a <code>NamedTuple</code> so that the returned object is not affected by changes to the parent data frame of which <code>dfr</code> is a view.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/dataframerow/dataframerow.jl#L433-L440">source</a></section><section><div><pre><code class="language-julia hljs">copy(key::GroupKey)</code></pre><p>Construct a <code>NamedTuple</code> with the same contents as the <a href="../types/#DataFrames.GroupKey"><code>GroupKey</code></a>.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/groupeddataframe/groupeddataframe.jl#L740-L744">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.similar" href="#Base.similar"><code>Base.similar</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">similar(df::AbstractDataFrame, rows::Integer=nrow(df))</code></pre><p>Create a new <code>DataFrame</code> with the same column names and column element types as <code>df</code>. 
An optional second argument can be provided to request a number of rows that is different than the number of rows present in <code>df</code>.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/abstractdataframe.jl#L464-L472">source</a></section></article><h2 id="Summary-information"><a class="docs-heading-anchor" href="#Summary-information">Summary information</a><a id="Summary-information-1"></a><a class="docs-heading-anchor-permalink" href="#Summary-information" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataAPI.describe" href="#DataAPI.describe"><code>DataAPI.describe</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">describe(df::AbstractDataFrame; cols=:)
 describe(df::AbstractDataFrame, stats::Union{Symbol, Pair}...; cols=:)</code></pre><p>Return descriptive statistics for a data frame as a new <code>DataFrame</code> where each row represents a variable and each column a summary statistic.</p><p><strong>Arguments</strong></p><ul><li><code>df</code> : the <code>AbstractDataFrame</code></li><li><code>stats::Union{Symbol, Pair}...</code> : the summary statistics to report. Arguments can be:<ul><li>A symbol from the list <code>:mean</code>, <code>:std</code>, <code>:min</code>, <code>:q25</code>, <code>:median</code>, <code>:q75</code>, <code>:max</code>, <code>:sum</code>, <code>:eltype</code>, <code>:nunique</code>, <code>:nuniqueall</code>, <code>:first</code>, <code>:last</code>, <code>:nnonmissing</code>, and <code>:nmissing</code>. The default statistics used are <code>:mean</code>, <code>:min</code>, <code>:median</code>, <code>:max</code>, <code>:nmissing</code>, and <code>:eltype</code>.</li><li><code>:detailed</code> as the only <code>Symbol</code> argument to return all statistics except <code>:first</code>, <code>:last</code>, <code>:sum</code>, <code>:nuniqueall</code>, and <code>:nnonmissing</code>.</li><li><code>:all</code> as the only <code>Symbol</code> argument to return all statistics.</li><li>A <code>function =&gt; name</code> pair where <code>name</code> is a <code>Symbol</code> or string. This will create a column of summary statistics with the provided name.</li></ul></li><li><code>cols</code> : a keyword argument allowing to select only a subset or transformation of columns from <code>df</code> to describe. Can be any column selector or transformation accepted by <a href="#DataFrames.select"><code>select</code></a>.</li></ul><p><strong>Details</strong></p><p>For <code>Real</code> columns, compute the mean, standard deviation, minimum, first quantile, median, third quantile, and maximum. 
If a column does not derive from <code>Real</code>, <code>describe</code> will attempt to calculate all statistics, using <code>nothing</code> as a fall-back in the case of an error.</p><p>When <code>stats</code> contains <code>:nunique</code>, <code>describe</code> will report the number of unique values in a column. If a column&#39;s base type derives from <code>Real</code>, <code>:nunique</code> will return <code>nothing</code>s. Use <code>:nuniqueall</code> to report the number of unique values in all columns.</p><p>Missing values are filtered in the calculation of all statistics, however the column <code>:nmissing</code> will report the number of missing values of that variable and <code>:nnonmissing</code> the number of non-missing values.</p><p>If custom functions are provided, they are called repeatedly with the vector corresponding to each column as the only argument. For columns allowing for missing values, the vector is wrapped in a call to <code>skipmissing</code>: custom functions must therefore support such objects (and not only vectors), and cannot access missing values.</p><p>Metadata: this function drops all metadata.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(i=1:10, x=0.1:0.1:1.0, y=&#39;a&#39;:&#39;j&#39;);
 
 julia&gt; describe(df)
@@ -57,7 +57,7 @@
  Row │ variable  min      sum
      │ Symbol    Float64  Float64
 ─────┼────────────────────────────
-   1 │ x             0.1      5.5</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/abstractdataframe.jl#L602-L688">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.isempty" href="#Base.isempty"><code>Base.isempty</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">isempty(df::AbstractDataFrame)</code></pre><p>Return <code>true</code> if data frame <code>df</code> has zero rows, and <code>false</code> otherwise.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/abstractdataframe.jl#L428-L432">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.length" href="#Base.length"><code>Base.length</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">length(dfr::DataFrameRow)</code></pre><p>Return the number of elements of <code>dfr</code>.</p><p>See also: <a href="#Base.size"><code>size</code></a></p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; dfr = DataFrame(a=1:3, b=&#39;a&#39;:&#39;c&#39;)[1, :]
+   1 │ x             0.1      5.5</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/abstractdataframe.jl#L602-L688">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.isempty" href="#Base.isempty"><code>Base.isempty</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">isempty(df::AbstractDataFrame)</code></pre><p>Return <code>true</code> if data frame <code>df</code> has zero rows, and <code>false</code> otherwise.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/abstractdataframe.jl#L428-L432">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.length" href="#Base.length"><code>Base.length</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">length(dfr::DataFrameRow)</code></pre><p>Return the number of elements of <code>dfr</code>.</p><p>See also: <a href="#Base.size"><code>size</code></a></p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; dfr = DataFrame(a=1:3, b=&#39;a&#39;:&#39;c&#39;)[1, :]
 DataFrameRow
  Row │ a      b
      │ Int64  Char
@@ -65,15 +65,15 @@
    1 │     1  a
 
 julia&gt; length(dfr)
-2</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/dataframerow/dataframerow.jl#L355-L374">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataAPI.ncol" href="#DataAPI.ncol"><code>DataAPI.ncol</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">ncol(df::AbstractDataFrame)</code></pre><p>Return the number of columns in an <code>AbstractDataFrame</code> <code>df</code>.</p><p>See also <a href="#DataAPI.nrow"><code>nrow</code></a>, <a href="#Base.size"><code>size</code></a>.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(i=1:10, x=rand(10), y=rand([&quot;a&quot;, &quot;b&quot;, &quot;c&quot;], 10));
+2</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/dataframerow/dataframerow.jl#L355-L374">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataAPI.ncol" href="#DataAPI.ncol"><code>DataAPI.ncol</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">ncol(df::AbstractDataFrame)</code></pre><p>Return the number of columns in an <code>AbstractDataFrame</code> <code>df</code>.</p><p>See also <a href="#DataAPI.nrow"><code>nrow</code></a>, <a href="#Base.size"><code>size</code></a>.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(i=1:10, x=rand(10), y=rand([&quot;a&quot;, &quot;b&quot;, &quot;c&quot;], 10));
 
 julia&gt; ncol(df)
-3</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/abstractdataframe.jl#L410-L425">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.ndims" href="#Base.ndims"><code>Base.ndims</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">ndims(::AbstractDataFrame)
-ndims(::Type{&lt;:AbstractDataFrame})</code></pre><p>Return the number of dimensions of a data frame, which is always <code>2</code>.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/abstractdataframe.jl#L437-L442">source</a></section><section><div><pre><code class="language-julia hljs">ndims(::DataFrameRow)
-ndims(::Type{&lt;:DataFrameRow})</code></pre><p>Return the number of dimensions of a data frame row, which is always <code>1</code>.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/dataframerow/dataframerow.jl#L377-L382">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataAPI.nrow" href="#DataAPI.nrow"><code>DataAPI.nrow</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">nrow(df::AbstractDataFrame)</code></pre><p>Return the number of rows in an <code>AbstractDataFrame</code> <code>df</code>.</p><p>See also: <a href="#DataAPI.ncol"><code>ncol</code></a>, <a href="#Base.size"><code>size</code></a>.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(i=1:10, x=rand(10), y=rand([&quot;a&quot;, &quot;b&quot;, &quot;c&quot;], 10));
+3</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/abstractdataframe.jl#L410-L425">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.ndims" href="#Base.ndims"><code>Base.ndims</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">ndims(::AbstractDataFrame)
+ndims(::Type{&lt;:AbstractDataFrame})</code></pre><p>Return the number of dimensions of a data frame, which is always <code>2</code>.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/abstractdataframe.jl#L437-L442">source</a></section><section><div><pre><code class="language-julia hljs">ndims(::DataFrameRow)
+ndims(::Type{&lt;:DataFrameRow})</code></pre><p>Return the number of dimensions of a data frame row, which is always <code>1</code>.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/dataframerow/dataframerow.jl#L377-L382">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataAPI.nrow" href="#DataAPI.nrow"><code>DataAPI.nrow</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">nrow(df::AbstractDataFrame)</code></pre><p>Return the number of rows in an <code>AbstractDataFrame</code> <code>df</code>.</p><p>See also: <a href="#DataAPI.ncol"><code>ncol</code></a>, <a href="#Base.size"><code>size</code></a>.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(i=1:10, x=rand(10), y=rand([&quot;a&quot;, &quot;b&quot;, &quot;c&quot;], 10));
 
 julia&gt; nrow(df)
-10</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/dataframe/dataframe.jl#L449-L464">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataAPI.rownumber" href="#DataAPI.rownumber"><code>DataAPI.rownumber</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">rownumber(dfr::DataFrameRow)</code></pre><p>Return a row number in the <code>AbstractDataFrame</code> that <code>dfr</code> was created from.</p><p>Note that this differs from the first element in the tuple returned by <code>parentindices</code>. The latter gives the row number in the <code>parent(dfr)</code>, which is the source <code>DataFrame</code> where data that <code>dfr</code> gives access to is stored.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(reshape(1:12, 3, 4), :auto)
+10</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/dataframe/dataframe.jl#L449-L464">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataAPI.rownumber" href="#DataAPI.rownumber"><code>DataAPI.rownumber</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">rownumber(dfr::DataFrameRow)</code></pre><p>Return a row number in the <code>AbstractDataFrame</code> that <code>dfr</code> was created from.</p><p>Note that this differs from the first element in the tuple returned by <code>parentindices</code>. The latter gives the row number in the <code>parent(dfr)</code>, which is the source <code>DataFrame</code> where data that <code>dfr</code> gives access to is stored.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(reshape(1:12, 3, 4), :auto)
 3×4 DataFrame
  Row │ x1     x2     x3     x4
      │ Int64  Int64  Int64  Int64
@@ -132,7 +132,7 @@
 ─────┼────────────────────────────
    1 │     1      4      7     10
    2 │     2      5      8     11
-   3 │     3      6      9     12</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/dataframerow/dataframerow.jl#L121-L193">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.show" href="#Base.show"><code>Base.show</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">show([io::IO, ]df::AbstractDataFrame;
+   3 │     3      6      9     12</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/dataframerow/dataframerow.jl#L121-L193">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.show" href="#Base.show"><code>Base.show</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">show([io::IO, ]df::AbstractDataFrame;
      allrows::Bool = !get(io, :limit, false),
      allcols::Bool = !get(io, :limit, false),
      allgroups::Bool = !get(io, :limit, false),
@@ -151,7 +151,7 @@
 ───────────────
      1  x
      2  y
-     3  z</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/show.jl#L284-L338">source</a></section><section><div><pre><code class="language-julia hljs">show(io::IO, mime::MIME, df::AbstractDataFrame)</code></pre><p>Render a data frame to an I/O stream in MIME type <code>mime</code>.</p><p><strong>Arguments</strong></p><ul><li><code>io::IO</code>: The I/O stream to which <code>df</code> will be printed.</li><li><code>mime::MIME</code>: supported MIME types are: <code>&quot;text/plain&quot;</code>, <code>&quot;text/html&quot;</code>, <code>&quot;text/latex&quot;</code>, <code>&quot;text/csv&quot;</code>, <code>&quot;text/tab-separated-values&quot;</code> (the last two MIME types do not support  showing <code>#undef</code> values)</li><li><code>df::AbstractDataFrame</code>: The data frame to print.</li></ul><p>Additionally selected MIME types support passing the following keyword arguments:</p><ul><li>MIME type <code>&quot;text/plain&quot;</code> accepts all listed keyword arguments and their behavior is identical as for <code>show(::IO, ::AbstractDataFrame)</code></li><li>MIME type <code>&quot;text/html&quot;</code> accepts the following keyword arguments:<ul><li><code>eltypes::Bool = true</code>: Whether to print the column types under column names.</li><li><code>summary::Bool = true</code>: Whether to print a brief string summary of the data frame.</li><li><code>max_column_width::AbstractString = &quot;&quot;</code>: The maximum column width. It must     be a string containing a valid CSS length. For example, passing     &quot;100px&quot; will limit the width of all columns to 100 pixels. 
If empty,     the columns will be rendered without limits.</li><li><code>kwargs...</code>: Any keyword argument supported by the function <code>pretty_table</code> of PrettyTables.jl can be passed here to customize the output.</li></ul></li></ul><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; show(stdout, MIME(&quot;text/latex&quot;), DataFrame(A=1:3, B=[&quot;x&quot;, &quot;y&quot;, &quot;z&quot;]))
+     3  z</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/show.jl#L284-L338">source</a></section><section><div><pre><code class="language-julia hljs">show(io::IO, mime::MIME, df::AbstractDataFrame)</code></pre><p>Render a data frame to an I/O stream in MIME type <code>mime</code>.</p><p><strong>Arguments</strong></p><ul><li><code>io::IO</code>: The I/O stream to which <code>df</code> will be printed.</li><li><code>mime::MIME</code>: supported MIME types are: <code>&quot;text/plain&quot;</code>, <code>&quot;text/html&quot;</code>, <code>&quot;text/latex&quot;</code>, <code>&quot;text/csv&quot;</code>, <code>&quot;text/tab-separated-values&quot;</code> (the last two MIME types do not support  showing <code>#undef</code> values)</li><li><code>df::AbstractDataFrame</code>: The data frame to print.</li></ul><p>Additionally selected MIME types support passing the following keyword arguments:</p><ul><li>MIME type <code>&quot;text/plain&quot;</code> accepts all listed keyword arguments and their behavior is identical as for <code>show(::IO, ::AbstractDataFrame)</code></li><li>MIME type <code>&quot;text/html&quot;</code> accepts the following keyword arguments:<ul><li><code>eltypes::Bool = true</code>: Whether to print the column types under column names.</li><li><code>summary::Bool = true</code>: Whether to print a brief string summary of the data frame.</li><li><code>max_column_width::AbstractString = &quot;&quot;</code>: The maximum column width. It must     be a string containing a valid CSS length. For example, passing     &quot;100px&quot; will limit the width of all columns to 100 pixels. 
If empty,     the columns will be rendered without limits.</li><li><code>kwargs...</code>: Any keyword argument supported by the function <code>pretty_table</code> of PrettyTables.jl can be passed here to customize the output.</li></ul></li></ul><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; show(stdout, MIME(&quot;text/latex&quot;), DataFrame(A=1:3, B=[&quot;x&quot;, &quot;y&quot;, &quot;z&quot;]))
 \begin{tabular}{r|cc}
 	&amp; A &amp; B\\
 	\hline
@@ -167,13 +167,13 @@
 &quot;A&quot;,&quot;B&quot;
 1,&quot;x&quot;
 2,&quot;y&quot;
-3,&quot;z&quot;</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/io.jl#L89-L134">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.size" href="#Base.size"><code>Base.size</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">size(df::AbstractDataFrame[, dim])</code></pre><p>Return a tuple containing the number of rows and columns of <code>df</code>. Optionally a dimension <code>dim</code> can be specified, where <code>1</code> corresponds to rows and <code>2</code> corresponds to columns.</p><p>See also: <a href="#DataAPI.nrow"><code>nrow</code></a>, <a href="#DataAPI.ncol"><code>ncol</code></a></p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=1:3, b=&#39;a&#39;:&#39;c&#39;);
+3,&quot;z&quot;</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/io.jl#L89-L134">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.size" href="#Base.size"><code>Base.size</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">size(df::AbstractDataFrame[, dim])</code></pre><p>Return a tuple containing the number of rows and columns of <code>df</code>. Optionally a dimension <code>dim</code> can be specified, where <code>1</code> corresponds to rows and <code>2</code> corresponds to columns.</p><p>See also: <a href="#DataAPI.nrow"><code>nrow</code></a>, <a href="#DataAPI.ncol"><code>ncol</code></a></p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=1:3, b=&#39;a&#39;:&#39;c&#39;);
 
 julia&gt; size(df)
 (3, 2)
 
 julia&gt; size(df, 1)
-3</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/abstractdataframe.jl#L378-L398">source</a></section><section><div><pre><code class="language-julia hljs">size(dfr::DataFrameRow[, dim])</code></pre><p>Return a 1-tuple containing the number of elements of <code>dfr</code>. If an optional dimension <code>dim</code> is specified, it must be <code>1</code>, and the number of elements is returned directly as a number.</p><p>See also: <a href="#Base.length"><code>length</code></a></p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; dfr = DataFrame(a=1:3, b=&#39;a&#39;:&#39;c&#39;)[1, :]
+3</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/abstractdataframe.jl#L378-L398">source</a></section><section><div><pre><code class="language-julia hljs">size(dfr::DataFrameRow[, dim])</code></pre><p>Return a 1-tuple containing the number of elements of <code>dfr</code>. If an optional dimension <code>dim</code> is specified, it must be <code>1</code>, and the number of elements is returned directly as a number.</p><p>See also: <a href="#Base.length"><code>length</code></a></p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; dfr = DataFrame(a=1:3, b=&#39;a&#39;:&#39;c&#39;)[1, :]
 DataFrameRow
  Row │ a      b
      │ Int64  Char
@@ -184,7 +184,7 @@
 (2,)
 
 julia&gt; size(dfr, 1)
-2</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/dataframerow/dataframerow.jl#L327-L351">source</a></section></article><h2 id="Working-with-column-names"><a class="docs-heading-anchor" href="#Working-with-column-names">Working with column names</a><a id="Working-with-column-names-1"></a><a class="docs-heading-anchor-permalink" href="#Working-with-column-names" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.names" href="#Base.names"><code>Base.names</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">names(df::AbstractDataFrame, cols=:)
+2</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/dataframerow/dataframerow.jl#L327-L351">source</a></section></article><h2 id="Working-with-column-names"><a class="docs-heading-anchor" href="#Working-with-column-names">Working with column names</a><a id="Working-with-column-names-1"></a><a class="docs-heading-anchor-permalink" href="#Working-with-column-names" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.names" href="#Base.names"><code>Base.names</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">names(df::AbstractDataFrame, cols=:)
 names(df::DataFrameRow, cols=:)
 names(df::GroupedDataFrame, cols=:)
 names(df::DataFrameRows, cols=:)
@@ -229,7 +229,7 @@
 julia&gt; names(df, any.(ismissing, eachcol(df))) # pick columns that contain missing values
 2-element Vector{String}:
  &quot;x1&quot;
- &quot;x3&quot;</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/abstractdataframe.jl#L29-L97">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.propertynames" href="#Base.propertynames"><code>Base.propertynames</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">propertynames(df::AbstractDataFrame)</code></pre><p>Return a freshly allocated <code>Vector{Symbol}</code> of names of columns contained in <code>df</code>.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/abstractdataframe.jl#L451-L455">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.rename" href="#DataFrames.rename"><code>DataFrames.rename</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">rename(df::AbstractDataFrame, vals::AbstractVector{Symbol};
+ &quot;x3&quot;</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/abstractdataframe.jl#L29-L97">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.propertynames" href="#Base.propertynames"><code>Base.propertynames</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">propertynames(df::AbstractDataFrame)</code></pre><p>Return a freshly allocated <code>Vector{Symbol}</code> of names of columns contained in <code>df</code>.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/abstractdataframe.jl#L451-L455">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.rename" href="#DataFrames.rename"><code>DataFrames.rename</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">rename(df::AbstractDataFrame, vals::AbstractVector{Symbol};
        makeunique::Bool=false)
 rename(df::AbstractDataFrame, vals::AbstractVector{&lt;:AbstractString};
        makeunique::Bool=false)
@@ -291,7 +291,7 @@
      │ Int64  Int64  Int64
 ─────┼─────────────────────
    1 │     1      2      3
-</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/abstractdataframe.jl#L268-L370">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.rename!" href="#DataFrames.rename!"><code>DataFrames.rename!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">rename!(df::AbstractDataFrame, vals::AbstractVector{Symbol};
+</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/abstractdataframe.jl#L268-L370">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.rename!" href="#DataFrames.rename!"><code>DataFrames.rename!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">rename!(df::AbstractDataFrame, vals::AbstractVector{Symbol};
         makeunique::Bool=false)
 rename!(df::AbstractDataFrame, vals::AbstractVector{&lt;:AbstractString};
         makeunique::Bool=false)
@@ -342,7 +342,7 @@
      │ Int64  Int64  Int64
 ─────┼─────────────────────
    1 │     1      2      3
-</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/abstractdataframe.jl#L118-L208">source</a></section></article><h2 id="Mutating-and-transforming-data-frames-and-grouped-data-frames"><a class="docs-heading-anchor" href="#Mutating-and-transforming-data-frames-and-grouped-data-frames">Mutating and transforming data frames and grouped data frames</a><a id="Mutating-and-transforming-data-frames-and-grouped-data-frames-1"></a><a class="docs-heading-anchor-permalink" href="#Mutating-and-transforming-data-frames-and-grouped-data-frames" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.append!" href="#Base.append!"><code>Base.append!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">append!(df::DataFrame, tables...; cols::Symbol=:setequal,
+</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/abstractdataframe.jl#L118-L208">source</a></section></article><h2 id="Mutating-and-transforming-data-frames-and-grouped-data-frames"><a class="docs-heading-anchor" href="#Mutating-and-transforming-data-frames-and-grouped-data-frames">Mutating and transforming data frames and grouped data frames</a><a id="Mutating-and-transforming-data-frames-and-grouped-data-frames-1"></a><a class="docs-heading-anchor-permalink" href="#Mutating-and-transforming-data-frames-and-grouped-data-frames" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.append!" href="#Base.append!"><code>Base.append!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">append!(df::DataFrame, tables...; cols::Symbol=:setequal,
         promote::Bool=(cols in [:union, :subset]))</code></pre><p>Add the rows of tables passed as <code>tables</code> to the end of <code>df</code>. If the table is not an <code>AbstractDataFrame</code> then it is converted using <code>DataFrame(table, copycols=false)</code> before being appended.</p><p>The exact behavior of <code>append!</code> depends on the <code>cols</code> argument:</p><ul><li>If <code>cols == :setequal</code> (this is the default) then <code>df2</code> must contain exactly the same columns as <code>df</code> (but possibly in a different order).</li><li>If <code>cols == :orderequal</code> then <code>df2</code> must contain the same columns in the same order (for <code>AbstractDict</code> this option requires that <code>keys(row)</code> matches <code>propertynames(df)</code> to allow for support of ordered dicts; however, if <code>df2</code> is a <code>Dict</code> an error is thrown as it is an unordered collection).</li><li>If <code>cols == :intersect</code> then <code>df2</code> may contain more columns than <code>df</code>, but all column names that are present in <code>df</code> must be present in <code>df2</code> and only these are used.</li><li>If <code>cols == :subset</code> then <code>append!</code> behaves like for <code>:intersect</code> but if some column is missing in <code>df2</code> then a <code>missing</code> value is pushed to <code>df</code>.</li><li>If <code>cols == :union</code> then <code>append!</code> adds columns missing in <code>df</code> that are present in <code>df2</code>, for columns present in <code>df</code> but missing in <code>df2</code> a <code>missing</code> value is pushed.</li></ul><p>If <code>promote=true</code> and element type of a column present in <code>df</code> does not allow the type of a pushed argument then a new column with a promoted element type allowing it is freshly allocated and stored in <code>df</code>. 
If <code>promote=false</code> an error is thrown.</p><p>The above rule has the following exceptions:</p><ul><li>If <code>df</code> has no columns then copies of columns from <code>df2</code> are added to it.</li><li>If <code>df2</code> has no columns then calling <code>append!</code> leaves <code>df</code> unchanged.</li></ul><p>Please note that <code>append!</code> must not be used on a <code>DataFrame</code> that contains columns that are aliases (equal when compared with <code>===</code>).</p><p>Metadata: table-level <code>:note</code>-style metadata and column-level <code>:note</code>-style metadata for columns present in <code>df</code> are preserved. If new columns are added their <code>:note</code>-style metadata is copied from the appended table. Other metadata is dropped.</p><p>See also: use <a href="#Base.push!"><code>push!</code></a> to add individual rows to a data frame, <a href="#Base.prepend!"><code>prepend!</code></a> to add a table at the beginning, and <a href="#Base.vcat"><code>vcat</code></a> to vertically concatenate data frames.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df1 = DataFrame(A=1:3, B=1:3)
 3×2 DataFrame
  Row │ A      B
@@ -385,7 +385,7 @@
    3 │       6.0        6  missing
    4 │       1.0  missing  missing
    5 │ missing    missing        1
-   6 │ missing    missing        2</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/dataframe/insertion.jl#L1-L92">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.combine" href="#DataFrames.combine"><code>DataFrames.combine</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">combine(df::AbstractDataFrame, args...;
+   6 │ missing    missing        2</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/dataframe/insertion.jl#L1-L92">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.combine" href="#DataFrames.combine"><code>DataFrames.combine</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">combine(df::AbstractDataFrame, args...;
         renamecols::Bool=true, threads::Bool=true)
 combine(f::Callable, df::AbstractDataFrame;
         renamecols::Bool=true, threads::Bool=true)
@@ -625,7 +625,7 @@
    5 │     3      2      3      5
    6 │     3      2      7      9
    7 │     4      1      4      5
-   8 │     4      1      8      9</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/selection.jl#L1396-L1673">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.fillcombinations" href="#DataFrames.fillcombinations"><code>DataFrames.fillcombinations</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">fillcombinations(df::AbstractDataFrame, indexcols;
+   8 │     4      1      8      9</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/selection.jl#L1396-L1673">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.fillcombinations" href="#DataFrames.fillcombinations"><code>DataFrames.fillcombinations</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">fillcombinations(df::AbstractDataFrame, indexcols;
                      allowduplicates::Bool=false,
                      fill=missing)</code></pre><p>Generate all combinations of levels of column(s) <code>indexcols</code> in data frame <code>df</code>. Levels and their order are determined by the <code>levels</code> function (i.e. unique values sorted lexicographically by default, or a custom set of levels for e.g. <code>CategoricalArray</code> columns), in addition to <code>missing</code> if present.</p><p>For combinations of <code>indexcols</code> not present in <code>df</code> these columns are filled with the <code>fill</code> value (<code>missing</code> by default).</p><p>If <code>allowduplicates=false</code> (the default) <code>indexcols</code> may only contain unique combinations of <code>indexcols</code> values. If <code>allowduplicates=true</code> duplicates are allowed.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(x=1:2, y=&#39;a&#39;:&#39;b&#39;, z=[&quot;x&quot;, &quot;y&quot;])
 2×3 DataFrame
@@ -653,7 +653,7 @@
    1 │      1  a     x
    2 │      0  b     x
    3 │      0  a     y
-   4 │      2  b     y</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/abstractdataframe.jl#L1420-L1470">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.flatten" href="#DataFrames.flatten"><code>DataFrames.flatten</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">flatten(df::AbstractDataFrame, cols; scalar::Type=Union{})</code></pre><p>When columns <code>cols</code> of data frame <code>df</code> have iterable elements that define <code>length</code> (for example a <code>Vector</code> of <code>Vector</code>s), return a <code>DataFrame</code> where each element of each <code>col</code> in <code>cols</code> is flattened, meaning the column corresponding to <code>col</code> becomes a longer vector where the original entries are concatenated. Elements of row <code>i</code> of <code>df</code> in columns other than <code>cols</code> will be repeated according to the length of <code>df[i, col]</code>. These lengths must therefore be the same for each <code>col</code> in <code>cols</code>, or else an error is raised. 
Note that these elements are not copied, and thus if they are mutable changing them in the returned <code>DataFrame</code> will affect <code>df</code>.</p><p><code>cols</code> can be any column selector (<code>Symbol</code>, string or integer; <code>:</code>, <code>Cols</code>, <code>All</code>, <code>Between</code>, <code>Not</code>, a regular expression, or a vector of <code>Symbol</code>s, strings or integers).</p><p>If <code>scalar</code> is passed then values that have this type in flattened columns are treated as scalars and broadcasted as many times as is needed to match lengths of values stored in other columns. If all values in a row are scalars, a single row is produced.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df1 = DataFrame(a=[1, 2], b=[[1, 2], [3, 4]], c=[[5, 6], [7, 8]])
+   4 │      2  b     y</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/abstractdataframe.jl#L1420-L1470">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.flatten" href="#DataFrames.flatten"><code>DataFrames.flatten</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">flatten(df::AbstractDataFrame, cols; scalar::Type=Union{})</code></pre><p>When columns <code>cols</code> of data frame <code>df</code> have iterable elements that define <code>length</code> (for example a <code>Vector</code> of <code>Vector</code>s), return a <code>DataFrame</code> where each element of each <code>col</code> in <code>cols</code> is flattened, meaning the column corresponding to <code>col</code> becomes a longer vector where the original entries are concatenated. Elements of row <code>i</code> of <code>df</code> in columns other than <code>cols</code> will be repeated according to the length of <code>df[i, col]</code>. These lengths must therefore be the same for each <code>col</code> in <code>cols</code>, or else an error is raised. 
Note that these elements are not copied, and thus if they are mutable changing them in the returned <code>DataFrame</code> will affect <code>df</code>.</p><p><code>cols</code> can be any column selector (<code>Symbol</code>, string or integer; <code>:</code>, <code>Cols</code>, <code>All</code>, <code>Between</code>, <code>Not</code>, a regular expression, or a vector of <code>Symbol</code>s, strings or integers).</p><p>If <code>scalar</code> is passed then values that have this type in flattened columns are treated as scalars and broadcasted as many times as is needed to match lengths of values stored in other columns. If all values in a row are scalars, a single row is produced.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df1 = DataFrame(a=[1, 2], b=[[1, 2], [3, 4]], c=[[5, 6], [7, 8]])
 2×3 DataFrame
  Row │ a      b       c
      │ Int64  Array…  Array…
@@ -730,7 +730,7 @@
    2 │     1        2        6
    3 │     2  missing  missing
    4 │     3  missing        7
-   5 │     3  missing        8</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/abstractdataframe.jl#L2335-L2439">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.hcat" href="#Base.hcat"><code>Base.hcat</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">hcat(df::AbstractDataFrame...;
+   5 │     3  missing        8</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/abstractdataframe.jl#L2335-L2439">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.hcat" href="#Base.hcat"><code>Base.hcat</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">hcat(df::AbstractDataFrame...;
      makeunique::Bool=false, copycols::Bool=true)</code></pre><p>Horizontally concatenate data frames.</p><p>If <code>makeunique=false</code> (the default) column names of passed objects must be unique. If <code>makeunique=true</code> then duplicate column names will be suffixed with <code>_i</code> (<code>i</code> starting at 1 for the first duplicate).</p><p>If <code>copycols=true</code> (the default) then the <code>DataFrame</code> returned by <code>hcat</code> will contain copied columns from the source data frames. If <code>copycols=false</code> then it will contain columns as they are stored in the source (without copying). This option should be used with caution as mutating either the columns in sources or in the returned <code>DataFrame</code> might lead to the corruption of the other object.</p><p>Metadata: <code>hcat</code> propagates table-level <code>:note</code>-style metadata for keys that are present in all passed data frames and have the same value; it propagates column-level <code>:note</code>-style metadata.</p><p><strong>Example</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df1 = DataFrame(A=1:3, B=1:3)
 3×2 DataFrame
  Row │ A      B
@@ -764,7 +764,7 @@
 julia&gt; df3 = hcat(df1, df2, makeunique=true, copycols=false);
 
 julia&gt; df3.A === df1.A
-true</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/abstractdataframe.jl#L1573-L1631">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.insert!" href="#Base.insert!"><code>Base.insert!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">insert!(df::DataFrame, index::Integer, row::Union{Tuple, AbstractArray};
+true</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/abstractdataframe.jl#L1573-L1631">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.insert!" href="#Base.insert!"><code>Base.insert!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">insert!(df::DataFrame, index::Integer, row::Union{Tuple, AbstractArray};
         cols::Symbol=:setequal, promote::Bool=false)
 insert!(df::DataFrame, index::Integer, row::Union{DataFrameRow, NamedTuple,
                                                   AbstractDict, Tables.AbstractRow};
@@ -835,7 +835,7 @@
    5 │ b              2  missing
    6 │ c              3  missing
    7 │ a              1  missing
-   8 │ 1.0      missing        1.0</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/dataframe/insertion.jl#L653-L738">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.insertcols" href="#DataFrames.insertcols"><code>DataFrames.insertcols</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">insertcols(df::AbstractDataFrame[, col], (name=&gt;val)::Pair...;
+   8 │ 1.0      missing        1.0</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/dataframe/insertion.jl#L653-L738">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.insertcols" href="#DataFrames.insertcols"><code>DataFrames.insertcols</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">insertcols(df::AbstractDataFrame[, col], (name=&gt;val)::Pair...;
            after::Bool=false, makeunique::Bool=false, copycols::Bool=true)</code></pre><p>Insert a column into a copy of <code>df</code> data frame using the <a href="#DataFrames.insertcols!"><code>insertcols!</code></a> function and return the newly created data frame.</p><p>If <code>col</code> is omitted it is set to <code>ncol(df)+1</code> (the column is inserted as the last column).</p><p><strong>Arguments</strong></p><ul><li><code>df</code> : the data frame to which we want to add columns</li><li><code>col</code> : a position at which we want to insert a column, passed as an integer or a column name (a string or a <code>Symbol</code>); the column selected with <code>col</code> and columns following it are shifted to the right in <code>df</code> after the operation</li><li><code>name</code> : the name of the new column</li><li><code>val</code> : an <code>AbstractVector</code> giving the contents of the new column or a value of any type other than <code>AbstractArray</code> which will be repeated to fill a new vector; As a particular rule, values stored in a <code>Ref</code> or a <code>0</code>-dimensional <code>AbstractArray</code> are unwrapped and treated in the same way</li><li><code>after</code> : if <code>true</code> columns are inserted after <code>col</code></li><li><code>makeunique</code> : defines what to do if <code>name</code> already exists in <code>df</code>; if it is <code>false</code> an error will be thrown; if it is <code>true</code> a new unique name will be generated by adding a suffix</li><li><code>copycols</code> : whether vectors passed as columns should be copied</li></ul><p>If <code>val</code> is an <code>AbstractRange</code> then the result of <code>collect(val)</code> is inserted.</p><p>If <code>df</code> is a <code>SubDataFrame</code> then it must have been created with <code>:</code> as column selector (otherwise an error is thrown). In this case the <code>copycols</code> keyword argument is ignored (i.e. 
the added column is always copied) and the parent data frame&#39;s column is filled with <code>missing</code> in rows that are filtered out by <code>df</code>.</p><p>If <code>df</code> isa <code>DataFrame</code> that has no columns and only values other than <code>AbstractVector</code> are passed then it is used to create a one-element column. If <code>df</code> isa <code>DataFrame</code> that has no columns and at least one <code>AbstractVector</code> is passed then its length is used to determine the number of elements in all created columns. In all other cases the number of rows in all created columns must match <code>nrow(df)</code>.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p>See also <a href="#DataFrames.insertcols!"><code>insertcols!</code></a>.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=1:3)
 3×1 DataFrame
  Row │ a
@@ -870,7 +870,7 @@
 ─────┼──────────────
    1 │     1      7
    2 │     2      8
-   3 │     3      9</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/abstractdataframe.jl#L2928-L2979">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.insertcols!" href="#DataFrames.insertcols!"><code>DataFrames.insertcols!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">insertcols!(df::AbstractDataFrame[, col], (name=&gt;val)::Pair...;
+   3 │     3      9</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/abstractdataframe.jl#L2928-L2979">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.insertcols!" href="#DataFrames.insertcols!"><code>DataFrames.insertcols!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">insertcols!(df::AbstractDataFrame[, col], (name=&gt;val)::Pair...;
             after::Bool=false, makeunique::Bool=false, copycols::Bool=true)</code></pre><p>Insert a column into a data frame in place. Return the updated data frame.</p><p>If <code>col</code> is omitted it is set to <code>ncol(df)+1</code> (the column is inserted as the last column).</p><p><strong>Arguments</strong></p><ul><li><code>df</code> : the data frame to which we want to add columns</li><li><code>col</code> : a position at which we want to insert a column, passed as an integer or a column name (a string or a <code>Symbol</code>); the column selected with <code>col</code> and columns following it are shifted to the right in <code>df</code> after the operation</li><li><code>name</code> : the name of the new column</li><li><code>val</code> : an <code>AbstractVector</code> giving the contents of the new column or a value of any type other than <code>AbstractArray</code> which will be repeated to fill a new vector; As a particular rule, values stored in a <code>Ref</code> or a <code>0</code>-dimensional <code>AbstractArray</code> are unwrapped and treated in the same way</li><li><code>after</code> : if <code>true</code> columns are inserted after <code>col</code></li><li><code>makeunique</code> : defines what to do if <code>name</code> already exists in <code>df</code>; if it is <code>false</code> an error will be thrown; if it is <code>true</code> a new unique name will be generated by adding a suffix</li><li><code>copycols</code> : whether vectors passed as columns should be copied</li></ul><p>If <code>val</code> is an <code>AbstractRange</code> then the result of <code>collect(val)</code> is inserted.</p><p>If <code>df</code> is a <code>SubDataFrame</code> then it must have been created with <code>:</code> as column selector (otherwise an error is thrown). In this case the <code>copycols</code> keyword argument is ignored (i.e. 
the added column is always copied) and the parent data frame&#39;s column is filled with <code>missing</code> in rows that are filtered out by <code>df</code>.</p><p>If <code>df</code> isa <code>DataFrame</code> that has no columns and only values other than <code>AbstractVector</code> are passed then it is used to create a one-element column. If <code>df</code> isa <code>DataFrame</code> that has no columns and at least one <code>AbstractVector</code> is passed then its length is used to determine the number of elements in all created columns. In all other cases the number of rows in all created columns must match <code>nrow(df)</code>.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p>Metadata having other styles is dropped (from parent data frame when <code>df</code> is a <code>SubDataFrame</code>).</p><p>See also <a href="#DataFrames.insertcols"><code>insertcols</code></a>.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=1:3)
 3×1 DataFrame
  Row │ a
@@ -905,7 +905,7 @@
 ─────┼──────────────────────────────────
    1 │ a         7      2      3      1
    2 │ b         8      3      4      2
-   3 │ c         9      4      5      3</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/abstractdataframe.jl#L2985-L3036">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.invpermute!" href="#Base.invpermute!"><code>Base.invpermute!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">invpermute!(df::AbstractDataFrame, p)</code></pre><p>Like <a href="#Base.permute!"><code>permute!</code></a>, but the inverse of the given permutation is applied.</p><p><code>invpermute!</code> will produce a correct result even if some columns of passed data frame or permutation <code>p</code> are identical (checked with <code>===</code>). Otherwise, if two columns share some part of memory but are not identical (e.g. are different views of the same parent vector) then <code>invpermute!</code> result might be incorrect.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p>Metadata having other styles is dropped (from parent data frame when <code>df</code> is a <code>SubDataFrame</code>).</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=1:5, b=6:10, c=11:15)
+   3 │ c         9      4      5      3</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/abstractdataframe.jl#L2985-L3036">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.invpermute!" href="#Base.invpermute!"><code>Base.invpermute!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">invpermute!(df::AbstractDataFrame, p)</code></pre><p>Like <a href="#Base.permute!"><code>permute!</code></a>, but the inverse of the given permutation is applied.</p><p><code>invpermute!</code> will produce a correct result even if some columns of passed data frame or permutation <code>p</code> are identical (checked with <code>===</code>). Otherwise, if two columns share some part of memory but are not identical (e.g. are different views of the same parent vector) then <code>invpermute!</code> result might be incorrect.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p>Metadata having other styles is dropped (from parent data frame when <code>df</code> is a <code>SubDataFrame</code>).</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=1:5, b=6:10, c=11:15)
 5×3 DataFrame
  Row │ a      b      c
      │ Int64  Int64  Int64
@@ -936,7 +936,7 @@
    2 │     2      7     12
    3 │     3      8     13
    4 │     4      9     14
-   5 │     5     10     15</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/abstractdataframe.jl#L2767-L2816">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.mapcols" href="#DataFrames.mapcols"><code>DataFrames.mapcols</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">mapcols(f::Union{Function, Type}, df::AbstractDataFrame; cols=All())</code></pre><p>Return a <code>DataFrame</code> where each column of <code>df</code> selected by <code>cols</code> (by default, all columns) is transformed using function <code>f</code>. Columns not selected by <code>cols</code> are copied.</p><p><code>f</code> must return <code>AbstractVector</code> objects all with the same length or scalars (all values other than <code>AbstractVector</code> are considered to be a scalar).</p><p>The <code>cols</code> column selector can be any value accepted as column selector by the <code>names</code> function.</p><p>Note that <code>mapcols</code> guarantees not to reuse the columns from <code>df</code> in the returned <code>DataFrame</code>. If <code>f</code> returns its argument then it gets copied before being stored.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(x=1:4, y=11:14)
+   5 │     5     10     15</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/abstractdataframe.jl#L2767-L2816">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.mapcols" href="#DataFrames.mapcols"><code>DataFrames.mapcols</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">mapcols(f::Union{Function, Type}, df::AbstractDataFrame; cols=All())</code></pre><p>Return a <code>DataFrame</code> where each column of <code>df</code> selected by <code>cols</code> (by default, all columns) is transformed using function <code>f</code>. Columns not selected by <code>cols</code> are copied.</p><p><code>f</code> must return <code>AbstractVector</code> objects all with the same length or scalars (all values other than <code>AbstractVector</code> are considered to be a scalar).</p><p>The <code>cols</code> column selector can be any value accepted as column selector by the <code>names</code> function.</p><p>Note that <code>mapcols</code> guarantees not to reuse the columns from <code>df</code> in the returned <code>DataFrame</code>. If <code>f</code> returns its argument then it gets copied before being stored.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(x=1:4, y=11:14)
 4×2 DataFrame
  Row │ x      y
      │ Int64  Int64
@@ -964,7 +964,7 @@
    1 │     1    121
    2 │     2    144
    3 │     3    169
-   4 │     4    196</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/iteration.jl#L413-L462">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.mapcols!" href="#DataFrames.mapcols!"><code>DataFrames.mapcols!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">mapcols!(f::Union{Function, Type}, df::DataFrame; cols=All())</code></pre><p>Update a <code>DataFrame</code> in-place where each column of <code>df</code> selected by <code>cols</code> (by default, all columns) is transformed using function <code>f</code>. Columns not selected by <code>cols</code> are left unchanged.</p><p><code>f</code> must return <code>AbstractVector</code> objects all with the same length or scalars (all values other than <code>AbstractVector</code> are considered to be a scalar).</p><p>Note that <code>mapcols!</code> reuses the columns from <code>df</code> if they are returned by <code>f</code>.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(x=1:4, y=11:14)
+   4 │     4    196</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/iteration.jl#L413-L462">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.mapcols!" href="#DataFrames.mapcols!"><code>DataFrames.mapcols!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">mapcols!(f::Union{Function, Type}, df::DataFrame; cols=All())</code></pre><p>Update a <code>DataFrame</code> in-place where each column of <code>df</code> selected by <code>cols</code> (by default, all columns) is transformed using function <code>f</code>. Columns not selected by <code>cols</code> are left unchanged.</p><p><code>f</code> must return <code>AbstractVector</code> objects all with the same length or scalars (all values other than <code>AbstractVector</code> are considered to be a scalar).</p><p>Note that <code>mapcols!</code> reuses the columns from <code>df</code> if they are returned by <code>f</code>.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(x=1:4, y=11:14)
 4×2 DataFrame
  Row │ x      y
      │ Int64  Int64
@@ -996,7 +996,7 @@
    1 │     2    121
    2 │     8    144
    3 │    18    169
-   4 │    32    196</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/iteration.jl#L497-L547">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.permute!" href="#Base.permute!"><code>Base.permute!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">permute!(df::AbstractDataFrame, p)</code></pre><p>Permute data frame <code>df</code> in-place, according to permutation <code>p</code>. Throws <code>ArgumentError</code> if <code>p</code> is not a permutation.</p><p>To return a new data frame instead of permuting <code>df</code> in-place, use <code>df[p, :]</code>.</p><p><code>permute!</code> will produce a correct result even if some columns of passed data frame or permutation <code>p</code> are identical (checked with <code>===</code>). Otherwise, if two columns share some part of memory but are not identical (e.g. are different views of the same parent vector) then <code>permute!</code> result might be incorrect.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p>Metadata having other styles is dropped (from parent data frame when <code>df</code> is a <code>SubDataFrame</code>).</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=1:5, b=6:10, c=11:15)
+   4 │    32    196</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/iteration.jl#L497-L547">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.permute!" href="#Base.permute!"><code>Base.permute!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">permute!(df::AbstractDataFrame, p)</code></pre><p>Permute data frame <code>df</code> in-place, according to permutation <code>p</code>. Throws <code>ArgumentError</code> if <code>p</code> is not a permutation.</p><p>To return a new data frame instead of permuting <code>df</code> in-place, use <code>df[p, :]</code>.</p><p><code>permute!</code> will produce a correct result even if some columns of passed data frame or permutation <code>p</code> are identical (checked with <code>===</code>). Otherwise, if two columns share some part of memory but are not identical (e.g. are different views of the same parent vector) then <code>permute!</code> result might be incorrect.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p>Metadata having other styles is dropped (from parent data frame when <code>df</code> is a <code>SubDataFrame</code>).</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=1:5, b=6:10, c=11:15)
 5×3 DataFrame
  Row │ a      b      c
      │ Int64  Int64  Int64
@@ -1016,7 +1016,7 @@
    2 │     3      8     13
    3 │     1      6     11
    4 │     2      7     12
-   5 │     4      9     14</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/abstractdataframe.jl#L2722-L2763">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.prepend!" href="#Base.prepend!"><code>Base.prepend!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">prepend!(df::DataFrame, tables...; cols::Symbol=:setequal,
+   5 │     4      9     14</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/abstractdataframe.jl#L2722-L2763">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.prepend!" href="#Base.prepend!"><code>Base.prepend!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">prepend!(df::DataFrame, tables...; cols::Symbol=:setequal,
          promote::Bool=(cols in [:union, :subset]))</code></pre><p>Add the rows of tables passed as <code>tables</code> to the beginning of <code>df</code>. If the table is not an <code>AbstractDataFrame</code> then it is converted using <code>DataFrame(table, copycols=false)</code> before being prepended.</p><p>Add the rows of <code>df2</code> to the beginning of <code>df</code>. If the second argument <code>table</code> is not an <code>AbstractDataFrame</code> then it is converted using <code>DataFrame(table, copycols=false)</code> before being prepended.</p><p>The exact behavior of <code>prepend!</code> depends on the <code>cols</code> argument:</p><ul><li>If <code>cols == :setequal</code> (this is the default) then <code>df2</code> must contain exactly the same columns as <code>df</code> (but possibly in a different order).</li><li>If <code>cols == :orderequal</code> then <code>df2</code> must contain the same columns in the same order (for <code>AbstractDict</code> this option requires that <code>keys(row)</code> matches <code>propertynames(df)</code> to allow for support of ordered dicts; however, if <code>df2</code> is a <code>Dict</code> an error is thrown as it is an unordered collection).</li><li>If <code>cols == :intersect</code> then <code>df2</code> may contain more columns than <code>df</code>, but all column names that are present in <code>df</code> must be present in <code>df2</code> and only these are used.</li><li>If <code>cols == :subset</code> then <code>prepend!</code> behaves like for <code>:intersect</code> but if some column is missing in <code>df2</code> then a <code>missing</code> value is pushed to <code>df</code>.</li><li>If <code>cols == :union</code> then <code>prepend!</code> adds columns missing in <code>df</code> that are present in <code>df2</code>, for columns present in <code>df</code> but missing in <code>df2</code> a <code>missing</code> value is pushed.</li></ul><p>If <code>promote=true</code> and element type of a column 
present in <code>df</code> does not allow the type of a pushed argument then a new column with a promoted element type allowing it is freshly allocated and stored in <code>df</code>. If <code>promote=false</code> an error is thrown.</p><p>The above rule has the following exceptions:</p><ul><li>If <code>df</code> has no columns then copies of columns from <code>df2</code> are added to it.</li><li>If <code>df2</code> has no columns then calling <code>prepend!</code> leaves <code>df</code> unchanged.</li></ul><p>Please note that <code>prepend!</code> must not be used on a <code>DataFrame</code> that contains columns that are aliases (equal when compared with <code>===</code>).</p><p>Metadata: table-level <code>:note</code>-style metadata and column-level <code>:note</code>-style metadata for columns present in <code>df</code> are preserved. If new columns are added their <code>:note</code>-style metadata is copied from the prepended table. Other metadata is dropped.</p><p>See also: use <a href="#Base.pushfirst!"><code>pushfirst!</code></a> to add individual rows at the beginning of a data frame, <a href="#Base.append!"><code>append!</code></a> to add a table at the end, and <a href="#Base.vcat"><code>vcat</code></a> to vertically concatenate data frames.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df1 = DataFrame(A=1:3, B=1:3)
 3×2 DataFrame
  Row │ A      B
@@ -1059,7 +1059,7 @@
    3 │ missing    missing        2
    4 │       4.0        4  missing
    5 │       5.0        5  missing
-   6 │       6.0        6  missing</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/dataframe/insertion.jl#L118-L213">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.push!" href="#Base.push!"><code>Base.push!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">push!(df::DataFrame, row::Union{Tuple, AbstractArray}...;
+   6 │       6.0        6  missing</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/dataframe/insertion.jl#L118-L213">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.push!" href="#Base.push!"><code>Base.push!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">push!(df::DataFrame, row::Union{Tuple, AbstractArray}...;
       cols::Symbol=:setequal, promote::Bool=false)
 push!(df::DataFrame, row::Union{DataFrameRow, NamedTuple, AbstractDict,
                                 Tables.AbstractRow}...;
@@ -1139,7 +1139,7 @@
 ─────┼──────────────
    1 │     1      2
    2 │     3      4
-   3 │     5      6</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/dataframe/insertion.jl#L443-L537">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.pushfirst!" href="#Base.pushfirst!"><code>Base.pushfirst!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">pushfirst!(df::DataFrame, row::Union{Tuple, AbstractArray}...;
+   3 │     5      6</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/dataframe/insertion.jl#L443-L537">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.pushfirst!" href="#Base.pushfirst!"><code>Base.pushfirst!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">pushfirst!(df::DataFrame, row::Union{Tuple, AbstractArray}...;
            cols::Symbol=:setequal, promote::Bool=false)
 pushfirst!(df::DataFrame, row::Union{DataFrameRow, NamedTuple, AbstractDict,
                                      Tables.AbstractRow}...;
@@ -1219,7 +1219,7 @@
 ─────┼──────────────
    1 │     3      4
    2 │     5      6
-   3 │     1      2</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/dataframe/insertion.jl#L548-L642">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.reduce" href="#Base.reduce"><code>Base.reduce</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">reduce(::typeof(vcat),
+   3 │     1      2</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/dataframe/insertion.jl#L548-L642">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.reduce" href="#Base.reduce"><code>Base.reduce</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">reduce(::typeof(vcat),
        dfs::Union{AbstractVector{&lt;:AbstractDataFrame},
                   Tuple{AbstractDataFrame, Vararg{AbstractDataFrame}}};
        cols::Union{Symbol, AbstractVector{Symbol},
@@ -1278,7 +1278,7 @@
    6 │     6        6  missing       2
    7 │     7  missing        7       3
    8 │     8  missing        8       3
-   9 │     9  missing        9       3</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/abstractdataframe.jl#L1817-L1903">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.repeat" href="#Base.repeat"><code>Base.repeat</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">repeat(df::AbstractDataFrame; inner::Integer = 1, outer::Integer = 1)</code></pre><p>Construct a data frame by repeating rows in <code>df</code>. <code>inner</code> specifies how many times each row is repeated, and <code>outer</code> specifies how many times the full set of rows is repeated.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p><strong>Example</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=1:2, b=3:4)
+   9 │     9  missing        9       3</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/abstractdataframe.jl#L1817-L1903">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.repeat" href="#Base.repeat"><code>Base.repeat</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">repeat(df::AbstractDataFrame; inner::Integer = 1, outer::Integer = 1)</code></pre><p>Construct a data frame by repeating rows in <code>df</code>. <code>inner</code> specifies how many times each row is repeated, and <code>outer</code> specifies how many times the full set of rows is repeated.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p><strong>Example</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=1:2, b=3:4)
 2×2 DataFrame
  Row │ a      b
      │ Int64  Int64
@@ -1302,7 +1302,7 @@
    9 │     1      3
   10 │     1      3
   11 │     2      4
-  12 │     2      4</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/abstractdataframe.jl#L2099-L2136">source</a></section><section><div><pre><code class="language-julia hljs">repeat(df::AbstractDataFrame, count::Integer)</code></pre><p>Construct a data frame by repeating each row in <code>df</code> the number of times specified by <code>count</code>.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p><strong>Example</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=1:2, b=3:4)
+  12 │     2      4</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/abstractdataframe.jl#L2099-L2136">source</a></section><section><div><pre><code class="language-julia hljs">repeat(df::AbstractDataFrame, count::Integer)</code></pre><p>Construct a data frame by repeating each row in <code>df</code> the number of times specified by <code>count</code>.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p><strong>Example</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=1:2, b=3:4)
 2×2 DataFrame
  Row │ a      b
      │ Int64  Int64
@@ -1318,7 +1318,7 @@
    1 │     1      3
    2 │     2      4
    3 │     1      3
-   4 │     2      4</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/abstractdataframe.jl#L2143-L2171">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.repeat!" href="#DataFrames.repeat!"><code>DataFrames.repeat!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">repeat!(df::DataFrame; inner::Integer=1, outer::Integer=1)</code></pre><p>Update a data frame <code>df</code> in-place by repeating its rows. <code>inner</code> specifies how many times each row is repeated, and <code>outer</code> specifies how many times the full set of rows is repeated. Columns of <code>df</code> are freshly allocated.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p><strong>Example</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=1:2, b=3:4)
+   4 │     2      4</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/abstractdataframe.jl#L2143-L2171">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.repeat!" href="#DataFrames.repeat!"><code>DataFrames.repeat!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">repeat!(df::DataFrame; inner::Integer=1, outer::Integer=1)</code></pre><p>Update a data frame <code>df</code> in-place by repeating its rows. <code>inner</code> specifies how many times each row is repeated, and <code>outer</code> specifies how many times the full set of rows is repeated. Columns of <code>df</code> are freshly allocated.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p><strong>Example</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=1:2, b=3:4)
 2×2 DataFrame
  Row │ a      b
      │ Int64  Int64
@@ -1344,7 +1344,7 @@
    9 │     1      3
   10 │     1      3
   11 │     2      4
-  12 │     2      4</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/dataframe/dataframe.jl#L1356-L1395">source</a></section><section><div><pre><code class="language-julia hljs">repeat!(df::DataFrame, count::Integer)</code></pre><p>Update a data frame <code>df</code> in-place by repeating its rows the number of times specified by <code>count</code>. Columns of <code>df</code> are freshly allocated.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p><strong>Example</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=1:2, b=3:4)
+  12 │     2      4</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/dataframe/dataframe.jl#L1356-L1395">source</a></section><section><div><pre><code class="language-julia hljs">repeat!(df::DataFrame, count::Integer)</code></pre><p>Update a data frame <code>df</code> in-place by repeating its rows the number of times specified by <code>count</code>. Columns of <code>df</code> are freshly allocated.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p><strong>Example</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=1:2, b=3:4)
 2×2 DataFrame
  Row │ a      b
      │ Int64  Int64
@@ -1360,7 +1360,7 @@
    1 │     1      3
    2 │     2      4
    3 │     1      3
-   4 │     2      4</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/dataframe/dataframe.jl#L1409-L1437">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.reverse" href="#Base.reverse"><code>Base.reverse</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">reverse(df::AbstractDataFrame, start=1, stop=nrow(df))</code></pre><p>Return a data frame containing the rows in <code>df</code> in reversed order. If <code>start</code> and <code>stop</code> are provided, only rows in the <code>start:stop</code> range are affected.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=1:5, b=6:10, c=11:15)
+   4 │     2      4</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/dataframe/dataframe.jl#L1409-L1437">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.reverse" href="#Base.reverse"><code>Base.reverse</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">reverse(df::AbstractDataFrame, start=1, stop=nrow(df))</code></pre><p>Return a data frame containing the rows in <code>df</code> in reversed order. If <code>start</code> and <code>stop</code> are provided, only rows in the <code>start:stop</code> range are affected.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=1:5, b=6:10, c=11:15)
 5×3 DataFrame
  Row │ a      b      c
      │ Int64  Int64  Int64
@@ -1391,7 +1391,7 @@
    2 │     3      8     13
    3 │     2      7     12
    4 │     4      9     14
-   5 │     5     10     15</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/abstractdataframe.jl#L2522-L2566">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.reverse!" href="#Base.reverse!"><code>Base.reverse!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">reverse!(df::AbstractDataFrame, start=1, stop=nrow(df))</code></pre><p>Mutate data frame in-place to reverse its row order. If <code>start</code> and <code>stop</code> are provided, only rows in the <code>start:stop</code> range are affected.</p><p><code>reverse!</code> will produce a correct result even if some columns of passed data frame are identical (checked with <code>===</code>). Otherwise, if two columns share some part of memory but are not identical (e.g. are different views of the same parent vector) then <code>reverse!</code> result might be incorrect.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p>Metadata having other styles is dropped (from parent data frame when <code>df</code> is a <code>SubDataFrame</code>).</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=1:5, b=6:10, c=11:15)
+   5 │     5     10     15</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/abstractdataframe.jl#L2522-L2566">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.reverse!" href="#Base.reverse!"><code>Base.reverse!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">reverse!(df::AbstractDataFrame, start=1, stop=nrow(df))</code></pre><p>Mutate data frame in-place to reverse its row order. If <code>start</code> and <code>stop</code> are provided, only rows in the <code>start:stop</code> range are affected.</p><p><code>reverse!</code> will produce a correct result even if some columns of passed data frame are identical (checked with <code>===</code>). Otherwise, if two columns share some part of memory but are not identical (e.g. are different views of the same parent vector) then <code>reverse!</code> result might be incorrect.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p>Metadata having other styles is dropped (from parent data frame when <code>df</code> is a <code>SubDataFrame</code>).</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=1:5, b=6:10, c=11:15)
 5×3 DataFrame
  Row │ a      b      c
      │ Int64  Int64  Int64
@@ -1422,7 +1422,7 @@
    2 │     3      8     13
    3 │     4      9     14
    4 │     2      7     12
-   5 │     1      6     11</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/abstractdataframe.jl#L2570-L2620">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.select" href="#DataFrames.select"><code>DataFrames.select</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">select(df::AbstractDataFrame, args...;
+   5 │     1      6     11</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/abstractdataframe.jl#L2570-L2620">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.select" href="#DataFrames.select"><code>DataFrames.select</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">select(df::AbstractDataFrame, args...;
        copycols::Bool=true, renamecols::Bool=true, threads::Bool=true)
 select(args::Callable, df::DataFrame;
        renamecols::Bool=true, threads::Bool=true)
@@ -1658,14 +1658,14 @@
    5 │     2      3    0.375             2          2
    6 │     1      5    0.625             1          4
    7 │     1      5    0.625             1          5
-   8 │     2      3    0.375             2          3</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/selection.jl#L1016-L1302">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.select!" href="#DataFrames.select!"><code>DataFrames.select!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">select!(df::AbstractDataFrame, args...;
+   8 │     2      3    0.375             2          3</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/selection.jl#L1016-L1302">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.select!" href="#DataFrames.select!"><code>DataFrames.select!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">select!(df::AbstractDataFrame, args...;
         renamecols::Bool=true, threads::Bool=true)
 select!(args::Base.Callable, df::DataFrame;
         renamecols::Bool=true, threads::Bool=true)
 select!(gd::GroupedDataFrame, args...; ungroup::Bool=true,
         renamecols::Bool=true, threads::Bool=true)
 select!(f::Base.Callable, gd::GroupedDataFrame; ungroup::Bool=true,
-        renamecols::Bool=true, threads::Bool=true)</code></pre><p>Mutate <code>df</code> or <code>gd</code> in place to retain only columns or transformations specified by <code>args...</code> and return it. The result is guaranteed to have the same number of rows as <code>df</code> or parent of <code>gd</code>, except when no columns are selected (in which case the result has zero rows).</p><p>If a <code>SubDataFrame</code> or <code>GroupedDataFrame{SubDataFrame}</code> is passed, the parent data frame is updated using columns generated by <code>args...</code>, following the same rules as indexing:</p><ul><li>for existing columns filtered-out rows are filled with values present in the old columns</li><li>for new columns (which is only allowed if <code>SubDataFrame</code> was created with <code>:</code> as column selector) filtered-out rows are filled with <code>missing</code></li><li>dropped columns (which are only allowed if <code>SubDataFrame</code> was created with <code>:</code> as column selector) are removed</li><li>if <code>SubDataFrame</code> was not created with <code>:</code> as column selector then <code>select!</code> is only allowed if the transformations keep exactly the same sequence of column names as is in the passed <code>df</code></li></ul><p>If a <code>GroupedDataFrame</code> is passed then it is updated to reflect the new rows of its updated parent. If there are independent <code>GroupedDataFrame</code> objects constructed using the same parent data frame they might get corrupt.</p><p>Below detailed common rules for all transformation functions supported by DataFrames.jl are explained and compared.</p><p>All these operations are supported both for <code>AbstractDataFrame</code> (when split and combine steps are skipped) and <code>GroupedDataFrame</code>. Technically, <code>AbstractDataFrame</code> is just considered as being grouped on no columns (meaning it has a single group, or zero groups if it is empty). 
The only difference is that in this case the <code>keepkeys</code> and <code>ungroup</code> keyword arguments (described below) are not supported and a data frame is always returned, as there are no split and combine steps in this case.</p><p>In order to perform operations by groups you first need to create a <code>GroupedDataFrame</code> object from your data frame using the <code>groupby</code> function that takes two arguments: (1) a data frame to be grouped, and (2) a set of columns to group by.</p><p>Operations can then be applied on each group using one of the following functions:</p><ul><li><code>combine</code>: does not put restrictions on number of rows returned per group; the returned values are vertically concatenated following order of groups in <code>GroupedDataFrame</code>; it is typically used to compute summary statistics by group; for <code>GroupedDataFrame</code> if grouping columns are kept they are put as first columns in the result;</li><li><code>select</code>: return a data frame with the number and order of rows exactly the same as the source data frame, including only new calculated columns; <code>select!</code> is an in-place version of <code>select</code>; for <code>GroupedDataFrame</code> if grouping columns are kept they are put as first columns in the result;</li><li><code>transform</code>: return a data frame with the number and order of rows exactly the same as the source data frame, including all columns from the source and new calculated columns; <code>transform!</code> is an in-place version of <code>transform</code>; existing columns in the source data frame are put as first columns in the result;</li></ul><p>As a special case, if a <code>GroupedDataFrame</code> that has zero groups is passed then the result of the operation is determined by performing a single call to the transformation function with a 0-row argument passed to it. 
The output of this operation is only used to identify the number and type of produced columns, but the result has zero rows.</p><p>All these functions take a specification of one or more functions to apply to each subset of the <code>DataFrame</code>. This specification can be of the following forms:</p><ol><li>standard column selectors (integers, <code>Symbol</code>s, strings, vectors of integers, vectors of <code>Symbol</code>s, vectors of strings, <code>All</code>, <code>Cols</code>, <code>:</code>, <code>Between</code>, <code>Not</code> and regular expressions)</li><li>a <code>cols =&gt; function</code> pair indicating that <code>function</code> should be called with positional arguments holding columns <code>cols</code>, which can be any valid column selector; in this case target column name is automatically generated and it is assumed that <code>function</code> returns a single value or a vector; the generated name is created by concatenating source column name and <code>function</code> name by default (see examples below).</li><li>a <code>cols =&gt; function =&gt; target_cols</code> form additionally explicitly specifying the target column or columns, which must be a single name (as a <code>Symbol</code> or a string), a vector of names or <code>AsTable</code>. 
Additionally it can be a <code>Function</code> which takes a string or a vector of strings as an argument containing names of columns selected by <code>cols</code>, and returns the target columns names (all accepted types except <code>AsTable</code> are allowed).</li><li>a <code>col =&gt; target_cols</code> pair, which renames the column <code>col</code> to <code>target_cols</code>, which must be single name (as a <code>Symbol</code> or a string), a vector of names or <code>AsTable</code>.</li><li>column-independent operations <code>function =&gt; target_cols</code> or just <code>function</code> for specific <code>function</code>s where the input columns are omitted; without <code>target_cols</code> the new column has the same name as <code>function</code>, otherwise it must be single name (as a <code>Symbol</code> or a string). Supported <code>function</code>s are:<ul><li><code>nrow</code> to efficiently compute the number of rows in each group.</li><li><code>proprow</code> to efficiently compute the proportion of rows in each group.</li><li><code>eachindex</code> to return a vector holding the number of each row within each group.</li><li><code>groupindices</code> to return the group number.</li></ul></li><li>vectors or matrices containing transformations specified by the <code>Pair</code> syntax described in points 2 to 5</li><li>a function which will be called with a <code>SubDataFrame</code> corresponding to each group if a <code>GroupedDataFrame</code> is processed, or with the data frame itself if an <code>AbstractDataFrame</code> is processed; this form should be avoided due to its poor performance unless the number of groups is small or a very large number of columns are processed (in which case <code>SubDataFrame</code> avoids excessive compilation)</li></ol><p>Note! 
If the expression of the form <code>x =&gt; y</code> is passed then except for the special convenience form <code>nrow =&gt; target_cols</code> it is always interpreted as <code>cols =&gt; function</code>. In particular the following expression <code>function =&gt; target_cols</code> is not a valid transformation specification.</p><p>Note! If <code>cols</code> or <code>target_cols</code> are one of <code>All</code>, <code>Cols</code>, <code>Between</code>, or <code>Not</code>, broadcasting using <code>.=&gt;</code> is supported and is equivalent to broadcasting the result of <code>names(df, cols)</code> or <code>names(df, target_cols)</code>. This behaves as if broadcasting happened after replacing the selector with selected column names within the data frame scope.</p><p>All functions have two types of signatures. One of them takes a <code>GroupedDataFrame</code> as the first argument and an arbitrary number of transformations described above as following arguments. The second type of signature is when a <code>Function</code> or a <code>Type</code> is passed as the first argument and a <code>GroupedDataFrame</code> as the second argument (similar to <code>map</code>).</p><p>As a special rule, with the <code>cols =&gt; function</code> and <code>cols =&gt; function =&gt; target_cols</code> syntaxes, if <code>cols</code> is wrapped in an <code>AsTable</code> object then a <code>NamedTuple</code> containing columns selected by <code>cols</code> is passed to <code>function</code>. 
The documentation of <a href="#DataFrames.table_transformation"><code>DataFrames.table_transformation</code></a> provides more information about this functionality, in particular covering performance considerations.</p><p>What is allowed for <code>function</code> to return is determined by the <code>target_cols</code> value:</p><ol><li>If both <code>cols</code> and <code>target_cols</code> are omitted (so only a <code>function</code> is passed), then returning a data frame, a matrix, a <code>NamedTuple</code>, a <code>Tables.AbstractRow</code> or a <code>DataFrameRow</code> will produce multiple columns in the result. Returning any other value produces a single column.</li><li>If <code>target_cols</code> is a <code>Symbol</code> or a string then the function is assumed to return a single column. In this case returning a data frame, a matrix, a <code>NamedTuple</code>, a <code>Tables.AbstractRow</code>, or a <code>DataFrameRow</code> raises an error.</li><li>If <code>target_cols</code> is a vector of <code>Symbol</code>s or strings or <code>AsTable</code> it is assumed that <code>function</code> returns multiple columns. If <code>function</code> returns one of <code>AbstractDataFrame</code>, <code>NamedTuple</code>, <code>DataFrameRow</code>, <code>Tables.AbstractRow</code>, <code>AbstractMatrix</code> then rules described in point 1 above apply. If <code>function</code> returns an <code>AbstractVector</code> then each element of this vector must support the <code>keys</code> function, which must return a collection of <code>Symbol</code>s, strings or integers; the return value of <code>keys</code> must be identical for all elements. Then as many columns are created as there are elements in the return value of the <code>keys</code> function. 
If <code>target_cols</code> is <code>AsTable</code> then their names are set to be equal to the key names except if <code>keys</code> returns integers, in which case they are prefixed by <code>x</code> (so the column names are e.g. <code>x1</code>, <code>x2</code>, ...). If <code>target_cols</code> is a vector of <code>Symbol</code>s or strings then column names produced using the rules above are ignored and replaced by <code>target_cols</code> (the number of columns must be the same as the length of <code>target_cols</code> in this case). If <code>fun</code> returns a value of any other type then it is assumed that it is a table conforming to the Tables.jl API and the <code>Tables.columntable</code> function is called on it to get the resulting columns and their names. The names are retained when <code>target_cols</code> is <code>AsTable</code> and are replaced if <code>target_cols</code> is a vector of <code>Symbol</code>s or strings.</li></ol><p>In all of these cases, <code>function</code> can return either a single row or multiple rows. As a particular rule, values wrapped in a <code>Ref</code> or a <code>0</code>-dimensional <code>AbstractArray</code> are unwrapped and then treated as a single row.</p><p><code>select</code>/<code>select!</code> and <code>transform</code>/<code>transform!</code> always return a data frame with the same number and order of rows as the source (even if <code>GroupedDataFrame</code> had its groups reordered), except when selection results in zero columns in the resulting data frame (in which case the result has zero rows).</p><p>For <code>combine</code>, rows in the returned object appear in the order of groups in the <code>GroupedDataFrame</code>. 
The functions can return an arbitrary number of rows for each group, but the kind of returned object and the number and names of columns must be the same for all groups, except when a <code>DataFrame()</code> or <code>NamedTuple()</code> is returned, in which case a given group is skipped.</p><p>It is allowed to mix single values and vectors if multiple transformations are requested. In this case single value will be repeated to match the length of columns specified by returned vectors.</p><p>To apply <code>function</code> to each row instead of whole columns, it can be wrapped in a <code>ByRow</code> struct. <code>cols</code> can be any column indexing syntax, in which case <code>function</code> will be passed one argument for each of the columns specified by <code>cols</code> or a <code>NamedTuple</code> of them if specified columns are wrapped in <code>AsTable</code>. If <code>ByRow</code> is used it is allowed for <code>cols</code> to select an empty set of columns, in which case <code>function</code> is called for each row without any arguments and an empty <code>NamedTuple</code> is passed if empty set of columns is wrapped in <code>AsTable</code>.</p><p>If a collection of column names is passed then requesting duplicate column names in target data frame are accepted (e.g. <code>select!(df, [:a], :, r&quot;a&quot;)</code> is allowed) and only the first occurrence is used. In particular a syntax to move column <code>:col</code> to the first position in the data frame is <code>select!(df, :col, :)</code>. On the contrary, output column names of renaming, transformation and single column selection operations must be unique, so e.g. <code>select!(df, :a, :a =&gt; :a)</code> or <code>select!(df, :a, :a =&gt; ByRow(sin) =&gt; :a)</code> are not allowed.</p><p>In general columns returned by transformations are stored in the target data frame without copying. An exception to this rule is when columns from the source data frame are reused in the target data frame. 
This can happen via expressions like: <code>:x1</code>, <code>[:x1, :x2]</code>, <code>:x1 =&gt; :x2</code>, <code>:x1 =&gt; identity =&gt; :x2</code>, or <code>:x1 =&gt; (x -&gt; @view x[inds])</code> (note that in the last case the source column is reused indirectly via a view). In such cases the behavior depends on the value of the <code>copycols</code> keyword argument:</p><ul><li>if <code>copycols=true</code> then results of such transformations always perform a copy of the source column or its view;</li><li>if <code>copycols=false</code> then copies are only performed to avoid storing the same column several times in the target data frame; more precisely, no copy is made the first time a column is used, but each subsequent reuse of a source column (when compared using <code>===</code>, which excludes views of source columns) performs a copy;</li></ul><p>Note that performing <code>transform!</code> or <code>select!</code> assumes that <code>copycols=false</code>.</p><p>If <code>df</code> is a <code>SubDataFrame</code> and <code>copycols=true</code> then a <code>DataFrame</code> is returned and the same copying rules apply as for a <code>DataFrame</code> input: this means in particular that selected columns will be copied. If <code>copycols=false</code>, a <code>SubDataFrame</code> is returned without copying columns and in this case transforming or renaming columns is not allowed.</p><p>If a <code>GroupedDataFrame</code> is passed and <code>threads=true</code> (the default), a separate task is spawned for each specified transformation; each transformation then spawns as many tasks as Julia threads, and splits processing of groups across them (however, currently transformations with optimized implementations like <code>sum</code> and transformations that return multiple rows use a single task for all groups). This allows for parallel operation when Julia was started with more than one thread. 
Passed transformation functions must therefore not modify global variables (i.e. they must be pure), use locks to control parallel accesses, or <code>threads=false</code> must be passed to disable multithreading. In the future, parallelism may be extended to other cases, so this requirement also holds for <code>DataFrame</code> inputs.</p><p>In order to improve the performance of the operations some transformations invoke optimized implementation, see <a href="#DataFrames.table_transformation"><code>DataFrames.table_transformation</code></a> for details.</p><p><strong>Keyword arguments</strong></p><ul><li><code>renamecols::Bool=true</code> : whether in the <code>cols =&gt; function</code> form automatically generated column names should include the name of transformation functions or not.</li><li><code>ungroup::Bool=true</code> : whether the return value of the operation on <code>gd</code> should be a data frame or a <code>GroupedDataFrame</code>.</li><li><code>threads::Bool=true</code> : whether transformations may be run in separate tasks which can execute in parallel (possibly being applied to multiple rows or groups at the same time). Whether or not tasks are actually spawned and their number are determined automatically. Set to <code>false</code> if some transformations require serial execution or are not thread-safe.</li></ul><p>Metadata: this function propagates table-level <code>:note</code>-style metadata. Column-level <code>:note</code>-style metadata is propagated if: a) a single column is transformed to a single column and the name of the column   does not change (this includes all column selection operations), or b) a single column is transformed with <code>identity</code> or <code>copy</code> to a single column    even if column name is changed (this includes column renaming).    
As a special case for <code>GroupedDataFrame</code> if the output has the same name    as a grouping column and <code>keepkeys=true</code>, metadata is taken from    original grouping column.</p><p>See <a href="#DataFrames.select"><code>select</code></a> for examples.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/selection.jl#L903-L949">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Random.shuffle" href="#Random.shuffle"><code>Random.shuffle</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">shuffle([rng=GLOBAL_RNG,] df::AbstractDataFrame)</code></pre><p>Return a copy of <code>df</code> with randomly permuted rows. The optional <code>rng</code> argument specifies a random number generator.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; using Random
+        renamecols::Bool=true, threads::Bool=true)</code></pre><p>Mutate <code>df</code> or <code>gd</code> in place to retain only columns or transformations specified by <code>args...</code> and return it. The result is guaranteed to have the same number of rows as <code>df</code> or parent of <code>gd</code>, except when no columns are selected (in which case the result has zero rows).</p><p>If a <code>SubDataFrame</code> or <code>GroupedDataFrame{SubDataFrame}</code> is passed, the parent data frame is updated using columns generated by <code>args...</code>, following the same rules as indexing:</p><ul><li>for existing columns filtered-out rows are filled with values present in the old columns</li><li>for new columns (which is only allowed if <code>SubDataFrame</code> was created with <code>:</code> as column selector) filtered-out rows are filled with <code>missing</code></li><li>dropped columns (which are only allowed if <code>SubDataFrame</code> was created with <code>:</code> as column selector) are removed</li><li>if <code>SubDataFrame</code> was not created with <code>:</code> as column selector then <code>select!</code> is only allowed if the transformations keep exactly the same sequence of column names as is in the passed <code>df</code></li></ul><p>If a <code>GroupedDataFrame</code> is passed then it is updated to reflect the new rows of its updated parent. If there are independent <code>GroupedDataFrame</code> objects constructed using the same parent data frame they might get corrupt.</p><p>Below detailed common rules for all transformation functions supported by DataFrames.jl are explained and compared.</p><p>All these operations are supported both for <code>AbstractDataFrame</code> (when split and combine steps are skipped) and <code>GroupedDataFrame</code>. Technically, <code>AbstractDataFrame</code> is just considered as being grouped on no columns (meaning it has a single group, or zero groups if it is empty). 
The only difference is that in this case the <code>keepkeys</code> and <code>ungroup</code> keyword arguments (described below) are not supported and a data frame is always returned, as there are no split and combine steps in this case.</p><p>In order to perform operations by groups you first need to create a <code>GroupedDataFrame</code> object from your data frame using the <code>groupby</code> function that takes two arguments: (1) a data frame to be grouped, and (2) a set of columns to group by.</p><p>Operations can then be applied on each group using one of the following functions:</p><ul><li><code>combine</code>: does not put restrictions on number of rows returned per group; the returned values are vertically concatenated following order of groups in <code>GroupedDataFrame</code>; it is typically used to compute summary statistics by group; for <code>GroupedDataFrame</code> if grouping columns are kept they are put as first columns in the result;</li><li><code>select</code>: return a data frame with the number and order of rows exactly the same as the source data frame, including only new calculated columns; <code>select!</code> is an in-place version of <code>select</code>; for <code>GroupedDataFrame</code> if grouping columns are kept they are put as first columns in the result;</li><li><code>transform</code>: return a data frame with the number and order of rows exactly the same as the source data frame, including all columns from the source and new calculated columns; <code>transform!</code> is an in-place version of <code>transform</code>; existing columns in the source data frame are put as first columns in the result;</li></ul><p>As a special case, if a <code>GroupedDataFrame</code> that has zero groups is passed then the result of the operation is determined by performing a single call to the transformation function with a 0-row argument passed to it. 
The output of this operation is only used to identify the number and type of produced columns, but the result has zero rows.</p><p>All these functions take a specification of one or more functions to apply to each subset of the <code>DataFrame</code>. This specification can be of the following forms:</p><ol><li>standard column selectors (integers, <code>Symbol</code>s, strings, vectors of integers, vectors of <code>Symbol</code>s, vectors of strings, <code>All</code>, <code>Cols</code>, <code>:</code>, <code>Between</code>, <code>Not</code> and regular expressions)</li><li>a <code>cols =&gt; function</code> pair indicating that <code>function</code> should be called with positional arguments holding columns <code>cols</code>, which can be any valid column selector; in this case target column name is automatically generated and it is assumed that <code>function</code> returns a single value or a vector; the generated name is created by concatenating source column name and <code>function</code> name by default (see examples below).</li><li>a <code>cols =&gt; function =&gt; target_cols</code> form additionally explicitly specifying the target column or columns, which must be a single name (as a <code>Symbol</code> or a string), a vector of names or <code>AsTable</code>. 
Additionally it can be a <code>Function</code> which takes a string or a vector of strings as an argument containing names of columns selected by <code>cols</code>, and returns the target columns names (all accepted types except <code>AsTable</code> are allowed).</li><li>a <code>col =&gt; target_cols</code> pair, which renames the column <code>col</code> to <code>target_cols</code>, which must be single name (as a <code>Symbol</code> or a string), a vector of names or <code>AsTable</code>.</li><li>column-independent operations <code>function =&gt; target_cols</code> or just <code>function</code> for specific <code>function</code>s where the input columns are omitted; without <code>target_cols</code> the new column has the same name as <code>function</code>, otherwise it must be single name (as a <code>Symbol</code> or a string). Supported <code>function</code>s are:<ul><li><code>nrow</code> to efficiently compute the number of rows in each group.</li><li><code>proprow</code> to efficiently compute the proportion of rows in each group.</li><li><code>eachindex</code> to return a vector holding the number of each row within each group.</li><li><code>groupindices</code> to return the group number.</li></ul></li><li>vectors or matrices containing transformations specified by the <code>Pair</code> syntax described in points 2 to 5</li><li>a function which will be called with a <code>SubDataFrame</code> corresponding to each group if a <code>GroupedDataFrame</code> is processed, or with the data frame itself if an <code>AbstractDataFrame</code> is processed; this form should be avoided due to its poor performance unless the number of groups is small or a very large number of columns are processed (in which case <code>SubDataFrame</code> avoids excessive compilation)</li></ol><p>Note! 
If the expression of the form <code>x =&gt; y</code> is passed then except for the special convenience form <code>nrow =&gt; target_cols</code> it is always interpreted as <code>cols =&gt; function</code>. In particular the following expression <code>function =&gt; target_cols</code> is not a valid transformation specification.</p><p>Note! If <code>cols</code> or <code>target_cols</code> are one of <code>All</code>, <code>Cols</code>, <code>Between</code>, or <code>Not</code>, broadcasting using <code>.=&gt;</code> is supported and is equivalent to broadcasting the result of <code>names(df, cols)</code> or <code>names(df, target_cols)</code>. This behaves as if broadcasting happened after replacing the selector with selected column names within the data frame scope.</p><p>All functions have two types of signatures. One of them takes a <code>GroupedDataFrame</code> as the first argument and an arbitrary number of transformations described above as following arguments. The second type of signature is when a <code>Function</code> or a <code>Type</code> is passed as the first argument and a <code>GroupedDataFrame</code> as the second argument (similar to <code>map</code>).</p><p>As a special rule, with the <code>cols =&gt; function</code> and <code>cols =&gt; function =&gt; target_cols</code> syntaxes, if <code>cols</code> is wrapped in an <code>AsTable</code> object then a <code>NamedTuple</code> containing columns selected by <code>cols</code> is passed to <code>function</code>. 
The documentation of <a href="#DataFrames.table_transformation"><code>DataFrames.table_transformation</code></a> provides more information about this functionality, in particular covering performance considerations.</p><p>What is allowed for <code>function</code> to return is determined by the <code>target_cols</code> value:</p><ol><li>If both <code>cols</code> and <code>target_cols</code> are omitted (so only a <code>function</code> is passed), then returning a data frame, a matrix, a <code>NamedTuple</code>, a <code>Tables.AbstractRow</code> or a <code>DataFrameRow</code> will produce multiple columns in the result. Returning any other value produces a single column.</li><li>If <code>target_cols</code> is a <code>Symbol</code> or a string then the function is assumed to return a single column. In this case returning a data frame, a matrix, a <code>NamedTuple</code>, a <code>Tables.AbstractRow</code>, or a <code>DataFrameRow</code> raises an error.</li><li>If <code>target_cols</code> is a vector of <code>Symbol</code>s or strings or <code>AsTable</code> it is assumed that <code>function</code> returns multiple columns. If <code>function</code> returns one of <code>AbstractDataFrame</code>, <code>NamedTuple</code>, <code>DataFrameRow</code>, <code>Tables.AbstractRow</code>, <code>AbstractMatrix</code> then rules described in point 1 above apply. If <code>function</code> returns an <code>AbstractVector</code> then each element of this vector must support the <code>keys</code> function, which must return a collection of <code>Symbol</code>s, strings or integers; the return value of <code>keys</code> must be identical for all elements. Then as many columns are created as there are elements in the return value of the <code>keys</code> function. 
If <code>target_cols</code> is <code>AsTable</code> then their names are set to be equal to the key names except if <code>keys</code> returns integers, in which case they are prefixed by <code>x</code> (so the column names are e.g. <code>x1</code>, <code>x2</code>, ...). If <code>target_cols</code> is a vector of <code>Symbol</code>s or strings then column names produced using the rules above are ignored and replaced by <code>target_cols</code> (the number of columns must be the same as the length of <code>target_cols</code> in this case). If <code>fun</code> returns a value of any other type then it is assumed that it is a table conforming to the Tables.jl API and the <code>Tables.columntable</code> function is called on it to get the resulting columns and their names. The names are retained when <code>target_cols</code> is <code>AsTable</code> and are replaced if <code>target_cols</code> is a vector of <code>Symbol</code>s or strings.</li></ol><p>In all of these cases, <code>function</code> can return either a single row or multiple rows. As a particular rule, values wrapped in a <code>Ref</code> or a <code>0</code>-dimensional <code>AbstractArray</code> are unwrapped and then treated as a single row.</p><p><code>select</code>/<code>select!</code> and <code>transform</code>/<code>transform!</code> always return a data frame with the same number and order of rows as the source (even if <code>GroupedDataFrame</code> had its groups reordered), except when selection results in zero columns in the resulting data frame (in which case the result has zero rows).</p><p>For <code>combine</code>, rows in the returned object appear in the order of groups in the <code>GroupedDataFrame</code>. 
The functions can return an arbitrary number of rows for each group, but the kind of returned object and the number and names of columns must be the same for all groups, except when a <code>DataFrame()</code> or <code>NamedTuple()</code> is returned, in which case a given group is skipped.</p><p>It is allowed to mix single values and vectors if multiple transformations are requested. In this case single value will be repeated to match the length of columns specified by returned vectors.</p><p>To apply <code>function</code> to each row instead of whole columns, it can be wrapped in a <code>ByRow</code> struct. <code>cols</code> can be any column indexing syntax, in which case <code>function</code> will be passed one argument for each of the columns specified by <code>cols</code> or a <code>NamedTuple</code> of them if specified columns are wrapped in <code>AsTable</code>. If <code>ByRow</code> is used it is allowed for <code>cols</code> to select an empty set of columns, in which case <code>function</code> is called for each row without any arguments and an empty <code>NamedTuple</code> is passed if empty set of columns is wrapped in <code>AsTable</code>.</p><p>If a collection of column names is passed then requesting duplicate column names in target data frame are accepted (e.g. <code>select!(df, [:a], :, r&quot;a&quot;)</code> is allowed) and only the first occurrence is used. In particular a syntax to move column <code>:col</code> to the first position in the data frame is <code>select!(df, :col, :)</code>. On the contrary, output column names of renaming, transformation and single column selection operations must be unique, so e.g. <code>select!(df, :a, :a =&gt; :a)</code> or <code>select!(df, :a, :a =&gt; ByRow(sin) =&gt; :a)</code> are not allowed.</p><p>In general columns returned by transformations are stored in the target data frame without copying. An exception to this rule is when columns from the source data frame are reused in the target data frame. 
This can happen via expressions like: <code>:x1</code>, <code>[:x1, :x2]</code>, <code>:x1 =&gt; :x2</code>, <code>:x1 =&gt; identity =&gt; :x2</code>, or <code>:x1 =&gt; (x -&gt; @view x[inds])</code> (note that in the last case the source column is reused indirectly via a view). In such cases the behavior depends on the value of the <code>copycols</code> keyword argument:</p><ul><li>if <code>copycols=true</code> then results of such transformations always perform a copy of the source column or its view;</li><li>if <code>copycols=false</code> then copies are only performed to avoid storing the same column several times in the target data frame; more precisely, no copy is made the first time a column is used, but each subsequent reuse of a source column (when compared using <code>===</code>, which excludes views of source columns) performs a copy;</li></ul><p>Note that performing <code>transform!</code> or <code>select!</code> assumes that <code>copycols=false</code>.</p><p>If <code>df</code> is a <code>SubDataFrame</code> and <code>copycols=true</code> then a <code>DataFrame</code> is returned and the same copying rules apply as for a <code>DataFrame</code> input: this means in particular that selected columns will be copied. If <code>copycols=false</code>, a <code>SubDataFrame</code> is returned without copying columns and in this case transforming or renaming columns is not allowed.</p><p>If a <code>GroupedDataFrame</code> is passed and <code>threads=true</code> (the default), a separate task is spawned for each specified transformation; each transformation then spawns as many tasks as Julia threads, and splits processing of groups across them (however, currently transformations with optimized implementations like <code>sum</code> and transformations that return multiple rows use a single task for all groups). This allows for parallel operation when Julia was started with more than one thread. 
Passed transformation functions must therefore not modify global variables (i.e. they must be pure), use locks to control parallel accesses, or <code>threads=false</code> must be passed to disable multithreading. In the future, parallelism may be extended to other cases, so this requirement also holds for <code>DataFrame</code> inputs.</p><p>In order to improve the performance of the operations some transformations invoke optimized implementation, see <a href="#DataFrames.table_transformation"><code>DataFrames.table_transformation</code></a> for details.</p><p><strong>Keyword arguments</strong></p><ul><li><code>renamecols::Bool=true</code> : whether in the <code>cols =&gt; function</code> form automatically generated column names should include the name of transformation functions or not.</li><li><code>ungroup::Bool=true</code> : whether the return value of the operation on <code>gd</code> should be a data frame or a <code>GroupedDataFrame</code>.</li><li><code>threads::Bool=true</code> : whether transformations may be run in separate tasks which can execute in parallel (possibly being applied to multiple rows or groups at the same time). Whether or not tasks are actually spawned and their number are determined automatically. Set to <code>false</code> if some transformations require serial execution or are not thread-safe.</li></ul><p>Metadata: this function propagates table-level <code>:note</code>-style metadata. Column-level <code>:note</code>-style metadata is propagated if: a) a single column is transformed to a single column and the name of the column   does not change (this includes all column selection operations), or b) a single column is transformed with <code>identity</code> or <code>copy</code> to a single column    even if column name is changed (this includes column renaming).    
As a special case for <code>GroupedDataFrame</code> if the output has the same name    as a grouping column and <code>keepkeys=true</code>, metadata is taken from    original grouping column.</p><p>See <a href="#DataFrames.select"><code>select</code></a> for examples.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/selection.jl#L903-L949">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Random.shuffle" href="#Random.shuffle"><code>Random.shuffle</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">shuffle([rng=GLOBAL_RNG,] df::AbstractDataFrame)</code></pre><p>Return a copy of <code>df</code> with randomly permuted rows. The optional <code>rng</code> argument specifies a random number generator.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; using Random
 
 julia&gt; rng = MersenneTwister(1234);
 
@@ -1678,7 +1678,7 @@
    2 │     1      1
    3 │     4      4
    4 │     3      3
-   5 │     5      5</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/abstractdataframe.jl#L2820-L2846">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Random.shuffle!" href="#Random.shuffle!"><code>Random.shuffle!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">shuffle!([rng=GLOBAL_RNG,] df::AbstractDataFrame)</code></pre><p>Randomly permute rows of <code>df</code> in-place. The optional <code>rng</code> argument specifies a random number generator.</p><p><code>shuffle!</code> will produce a correct result even if some columns of passed data frame are identical (checked with <code>===</code>). Otherwise, if two columns share some part of memory but are not identical (e.g. are different views of the same parent vector) then <code>shuffle!</code> result might be incorrect.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p>Metadata having other styles is dropped (from parent data frame when <code>df</code> is a <code>SubDataFrame</code>).</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; using Random
+   5 │     5      5</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/abstractdataframe.jl#L2820-L2846">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Random.shuffle!" href="#Random.shuffle!"><code>Random.shuffle!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">shuffle!([rng=GLOBAL_RNG,] df::AbstractDataFrame)</code></pre><p>Randomly permute rows of <code>df</code> in-place. The optional <code>rng</code> argument specifies a random number generator.</p><p><code>shuffle!</code> will produce a correct result even if some columns of passed data frame are identical (checked with <code>===</code>). Otherwise, if two columns share some part of memory but are not identical (e.g. are different views of the same parent vector) then <code>shuffle!</code> result might be incorrect.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p>Metadata having other styles is dropped (from parent data frame when <code>df</code> is a <code>SubDataFrame</code>).</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; using Random
 
 julia&gt; rng = MersenneTwister(1234);
 
@@ -1691,11 +1691,11 @@
    2 │     1      1
    3 │     4      4
    4 │     3      3
-   5 │     5      5</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/abstractdataframe.jl#L2852-L2884">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.table_transformation" href="#DataFrames.table_transformation"><code>DataFrames.table_transformation</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">table_transformation(df_sel::AbstractDataFrame, fun)</code></pre><p>This is the function called when <code>AsTable(...) =&gt; fun</code> is requested. The <code>df_sel</code> argument is a data frame storing columns selected by the <code>AsTable(...)</code> selector.</p><p>By default it calls <code>default_table_transformation</code>. 
However, it is allowed to add special methods for specific types of <code>fun</code>, as long as the result matches what would be produced by <code>default_table_transformation</code>, except that it is allowed to perform <code>eltype</code> conversion of the resulting vectors or value type promotions that are consistent with <code>promote_type</code>.</p><p>It is guaranteed that <code>df_sel</code> has at least one column.</p><p>The main use of special <code>table_transformation</code> methods is to provide more efficient than the default implementations of requested <code>fun</code> transformation.</p><p>This function might become a part of the public API of DataFrames.jl in the future, currently it should be considered experimental.</p><p>Fast paths are implemented within DataFrames.jl for the following functions <code>fun</code>:</p><ul><li><code>sum</code>, <code>ByRow(sum)</code>, <code>ByRow(sum∘skipmissing)</code></li><li><code>length</code>, <code>ByRow(length)</code>, <code>ByRow(length∘skipmissing)</code></li><li><code>mean</code>, <code>ByRow(mean)</code>, <code>ByRow(mean∘skipmissing)</code></li><li><code>ByRow(var)</code>, <code>ByRow(var∘skipmissing)</code></li><li><code>ByRow(std)</code>, <code>ByRow(std∘skipmissing)</code></li><li><code>ByRow(median)</code>, <code>ByRow(median∘skipmissing)</code></li><li><code>minimum</code>, <code>ByRow(minimum)</code>, <code>ByRow(minimum∘skipmissing)</code></li><li><code>maximum</code>, <code>ByRow(maximum)</code>, <code>ByRow(maximum∘skipmissing)</code></li><li><code>fun∘collect</code> and <code>ByRow(fun∘collect)</code> where <code>fun</code> is any function</li></ul><p>Note that in order to improve the performance <code>ByRow(sum)</code>, <code>ByRow(sum∘skipmissing)</code>, <code>ByRow(mean)</code>, and <code>ByRow(mean∘skipmissing)</code> perform all operations in the target element type. 
In some very rare cases (like mixing very large <code>Int64</code> values and <code>Float64</code> values) it can lead to a result different from the one that would be obtained by calling the function outside of DataFrames.jl. The way to avoid this precision loss is to use an anonymous function, e.g. instead of <code>ByRow(sum)</code> use <code>ByRow(x -&gt; sum(x))</code>. However, in general for such scenarios even standard aggregation functions should not be considered to provide reliable output, and users are recommended to switch to higher precision calculations. An example of a case when standard <code>sum</code> is affected by the situation discussed is:</p><pre><code class="nohighlight hljs">julia&gt; sum(Any[typemax(Int), typemax(Int), 1.0])
+   5 │     5      5</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/abstractdataframe.jl#L2852-L2884">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.table_transformation" href="#DataFrames.table_transformation"><code>DataFrames.table_transformation</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">table_transformation(df_sel::AbstractDataFrame, fun)</code></pre><p>This is the function called when <code>AsTable(...) =&gt; fun</code> is requested. The <code>df_sel</code> argument is a data frame storing columns selected by the <code>AsTable(...)</code> selector.</p><p>By default it calls <code>default_table_transformation</code>. 
However, it is allowed to add special methods for specific types of <code>fun</code>, as long as the result matches what would be produced by <code>default_table_transformation</code>, except that it is allowed to perform <code>eltype</code> conversion of the resulting vectors or value type promotions that are consistent with <code>promote_type</code>.</p><p>It is guaranteed that <code>df_sel</code> has at least one column.</p><p>The main use of special <code>table_transformation</code> methods is to provide more efficient than the default implementations of requested <code>fun</code> transformation.</p><p>This function might become a part of the public API of DataFrames.jl in the future, currently it should be considered experimental.</p><p>Fast paths are implemented within DataFrames.jl for the following functions <code>fun</code>:</p><ul><li><code>sum</code>, <code>ByRow(sum)</code>, <code>ByRow(sum∘skipmissing)</code></li><li><code>length</code>, <code>ByRow(length)</code>, <code>ByRow(length∘skipmissing)</code></li><li><code>mean</code>, <code>ByRow(mean)</code>, <code>ByRow(mean∘skipmissing)</code></li><li><code>ByRow(var)</code>, <code>ByRow(var∘skipmissing)</code></li><li><code>ByRow(std)</code>, <code>ByRow(std∘skipmissing)</code></li><li><code>ByRow(median)</code>, <code>ByRow(median∘skipmissing)</code></li><li><code>minimum</code>, <code>ByRow(minimum)</code>, <code>ByRow(minimum∘skipmissing)</code></li><li><code>maximum</code>, <code>ByRow(maximum)</code>, <code>ByRow(maximum∘skipmissing)</code></li><li><code>fun∘collect</code> and <code>ByRow(fun∘collect)</code> where <code>fun</code> is any function</li></ul><p>Note that in order to improve the performance <code>ByRow(sum)</code>, <code>ByRow(sum∘skipmissing)</code>, <code>ByRow(mean)</code>, and <code>ByRow(mean∘skipmissing)</code> perform all operations in the target element type. 
In some very rare cases (like mixing very large <code>Int64</code> values and <code>Float64</code> values) it can lead to a result different from the one that would be obtained by calling the function outside of DataFrames.jl. The way to avoid this precision loss is to use an anonymous function, e.g. instead of <code>ByRow(sum)</code> use <code>ByRow(x -&gt; sum(x))</code>. However, in general for such scenarios even standard aggregation functions should not be considered to provide reliable output, and users are recommended to switch to higher precision calculations. An example of a case when standard <code>sum</code> is affected by the situation discussed is:</p><pre><code class="nohighlight hljs">julia&gt; sum(Any[typemax(Int), typemax(Int), 1.0])
 -1.0
 
 julia&gt; sum(Any[1.0, typemax(Int), typemax(Int)])
-1.8446744073709552e19</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/selectionfast.jl#L1-L53">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.transform" href="#DataFrames.transform"><code>DataFrames.transform</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">transform(df::AbstractDataFrame, args...;
+1.8446744073709552e19</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/selectionfast.jl#L1-L53">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.transform" href="#DataFrames.transform"><code>DataFrames.transform</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">transform(df::AbstractDataFrame, args...;
           copycols::Bool=true, renamecols::Bool=true, threads::Bool=true)
 transform(f::Callable, df::DataFrame;
           renamecols::Bool=true, threads::Bool=true)
@@ -1727,14 +1727,14 @@
    2 │    10
 
 julia&gt; transform(gdf, x -&gt; (x=10,), keepkeys=true)
-ERROR: ArgumentError: column :x in returned data frame is not equal to grouping key :x</code></pre><p>See <a href="#DataFrames.select"><code>select</code></a> for more examples.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/selection.jl#L1316-L1382">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.transform!" href="#DataFrames.transform!"><code>DataFrames.transform!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">transform!(df::AbstractDataFrame, args...;
+ERROR: ArgumentError: column :x in returned data frame is not equal to grouping key :x</code></pre><p>See <a href="#DataFrames.select"><code>select</code></a> for more examples.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/selection.jl#L1316-L1382">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.transform!" href="#DataFrames.transform!"><code>DataFrames.transform!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">transform!(df::AbstractDataFrame, args...;
            renamecols::Bool=true, threads::Bool=true)
 transform!(args::Callable, df::AbstractDataFrame;
            renamecols::Bool=true, threads::Bool=true)
 transform!(gd::GroupedDataFrame, args...;
            ungroup::Bool=true, renamecols::Bool=true, threads::Bool=true)
 transform!(f::Base.Callable, gd::GroupedDataFrame;
-           ungroup::Bool=true, renamecols::Bool=true, threads::Bool=true)</code></pre><p>Mutate <code>df</code> or <code>gd</code> in place to add columns specified by <code>args...</code> and return it. The result is guaranteed to have the same number of rows as <code>df</code>. Equivalent to <code>select!(df, :, args...)</code> or <code>select!(gd, :, args...)</code>, except that column renaming performs a copy.</p><p>Below detailed common rules for all transformation functions supported by DataFrames.jl are explained and compared.</p><p>All these operations are supported both for <code>AbstractDataFrame</code> (when split and combine steps are skipped) and <code>GroupedDataFrame</code>. Technically, <code>AbstractDataFrame</code> is just considered as being grouped on no columns (meaning it has a single group, or zero groups if it is empty). The only difference is that in this case the <code>keepkeys</code> and <code>ungroup</code> keyword arguments (described below) are not supported and a data frame is always returned, as there are no split and combine steps in this case.</p><p>In order to perform operations by groups you first need to create a <code>GroupedDataFrame</code> object from your data frame using the <code>groupby</code> function that takes two arguments: (1) a data frame to be grouped, and (2) a set of columns to group by.</p><p>Operations can then be applied on each group using one of the following functions:</p><ul><li><code>combine</code>: does not put restrictions on number of rows returned per group; the returned values are vertically concatenated following order of groups in <code>GroupedDataFrame</code>; it is typically used to compute summary statistics by group; for <code>GroupedDataFrame</code> if grouping columns are kept they are put as first columns in the result;</li><li><code>select</code>: return a data frame with the number and order of rows exactly the same as the source data frame, including only new calculated columns; 
<code>select!</code> is an in-place version of <code>select</code>; for <code>GroupedDataFrame</code> if grouping columns are kept they are put as first columns in the result;</li><li><code>transform</code>: return a data frame with the number and order of rows exactly the same as the source data frame, including all columns from the source and new calculated columns; <code>transform!</code> is an in-place version of <code>transform</code>; existing columns in the source data frame are put as first columns in the result;</li></ul><p>As a special case, if a <code>GroupedDataFrame</code> that has zero groups is passed then the result of the operation is determined by performing a single call to the transformation function with a 0-row argument passed to it. The output of this operation is only used to identify the number and type of produced columns, but the result has zero rows.</p><p>All these functions take a specification of one or more functions to apply to each subset of the <code>DataFrame</code>. 
This specification can be of the following forms:</p><ol><li>standard column selectors (integers, <code>Symbol</code>s, strings, vectors of integers, vectors of <code>Symbol</code>s, vectors of strings, <code>All</code>, <code>Cols</code>, <code>:</code>, <code>Between</code>, <code>Not</code> and regular expressions)</li><li>a <code>cols =&gt; function</code> pair indicating that <code>function</code> should be called with positional arguments holding columns <code>cols</code>, which can be any valid column selector; in this case target column name is automatically generated and it is assumed that <code>function</code> returns a single value or a vector; the generated name is created by concatenating source column name and <code>function</code> name by default (see examples below).</li><li>a <code>cols =&gt; function =&gt; target_cols</code> form additionally explicitly specifying the target column or columns, which must be a single name (as a <code>Symbol</code> or a string), a vector of names or <code>AsTable</code>. Additionally it can be a <code>Function</code> which takes a string or a vector of strings as an argument containing names of columns selected by <code>cols</code>, and returns the target columns names (all accepted types except <code>AsTable</code> are allowed).</li><li>a <code>col =&gt; target_cols</code> pair, which renames the column <code>col</code> to <code>target_cols</code>, which must be single name (as a <code>Symbol</code> or a string), a vector of names or <code>AsTable</code>.</li><li>column-independent operations <code>function =&gt; target_cols</code> or just <code>function</code> for specific <code>function</code>s where the input columns are omitted; without <code>target_cols</code> the new column has the same name as <code>function</code>, otherwise it must be single name (as a <code>Symbol</code> or a string). 
Supported <code>function</code>s are:<ul><li><code>nrow</code> to efficiently compute the number of rows in each group.</li><li><code>proprow</code> to efficiently compute the proportion of rows in each group.</li><li><code>eachindex</code> to return a vector holding the number of each row within each group.</li><li><code>groupindices</code> to return the group number.</li></ul></li><li>vectors or matrices containing transformations specified by the <code>Pair</code> syntax described in points 2 to 5</li><li>a function which will be called with a <code>SubDataFrame</code> corresponding to each group if a <code>GroupedDataFrame</code> is processed, or with the data frame itself if an <code>AbstractDataFrame</code> is processed; this form should be avoided due to its poor performance unless the number of groups is small or a very large number of columns are processed (in which case <code>SubDataFrame</code> avoids excessive compilation)</li></ol><p>Note! If the expression of the form <code>x =&gt; y</code> is passed then except for the special convenience form <code>nrow =&gt; target_cols</code> it is always interpreted as <code>cols =&gt; function</code>. In particular the following expression <code>function =&gt; target_cols</code> is not a valid transformation specification.</p><p>Note! If <code>cols</code> or <code>target_cols</code> are one of <code>All</code>, <code>Cols</code>, <code>Between</code>, or <code>Not</code>, broadcasting using <code>.=&gt;</code> is supported and is equivalent to broadcasting the result of <code>names(df, cols)</code> or <code>names(df, target_cols)</code>. This behaves as if broadcasting happened after replacing the selector with selected column names within the data frame scope.</p><p>All functions have two types of signatures. One of them takes a <code>GroupedDataFrame</code> as the first argument and an arbitrary number of transformations described above as following arguments. 
The second type of signature is when a <code>Function</code> or a <code>Type</code> is passed as the first argument and a <code>GroupedDataFrame</code> as the second argument (similar to <code>map</code>).</p><p>As a special rule, with the <code>cols =&gt; function</code> and <code>cols =&gt; function =&gt; target_cols</code> syntaxes, if <code>cols</code> is wrapped in an <code>AsTable</code> object then a <code>NamedTuple</code> containing columns selected by <code>cols</code> is passed to <code>function</code>. The documentation of <a href="#DataFrames.table_transformation"><code>DataFrames.table_transformation</code></a> provides more information about this functionality, in particular covering performance considerations.</p><p>What is allowed for <code>function</code> to return is determined by the <code>target_cols</code> value:</p><ol><li>If both <code>cols</code> and <code>target_cols</code> are omitted (so only a <code>function</code> is passed), then returning a data frame, a matrix, a <code>NamedTuple</code>, a <code>Tables.AbstractRow</code> or a <code>DataFrameRow</code> will produce multiple columns in the result. Returning any other value produces a single column.</li><li>If <code>target_cols</code> is a <code>Symbol</code> or a string then the function is assumed to return a single column. In this case returning a data frame, a matrix, a <code>NamedTuple</code>, a <code>Tables.AbstractRow</code>, or a <code>DataFrameRow</code> raises an error.</li><li>If <code>target_cols</code> is a vector of <code>Symbol</code>s or strings or <code>AsTable</code> it is assumed that <code>function</code> returns multiple columns. If <code>function</code> returns one of <code>AbstractDataFrame</code>, <code>NamedTuple</code>, <code>DataFrameRow</code>, <code>Tables.AbstractRow</code>, <code>AbstractMatrix</code> then rules described in point 1 above apply. 
If <code>function</code> returns an <code>AbstractVector</code> then each element of this vector must support the <code>keys</code> function, which must return a collection of <code>Symbol</code>s, strings or integers; the return value of <code>keys</code> must be identical for all elements. Then as many columns are created as there are elements in the return value of the <code>keys</code> function. If <code>target_cols</code> is <code>AsTable</code> then their names are set to be equal to the key names except if <code>keys</code> returns integers, in which case they are prefixed by <code>x</code> (so the column names are e.g. <code>x1</code>, <code>x2</code>, ...). If <code>target_cols</code> is a vector of <code>Symbol</code>s or strings then column names produced using the rules above are ignored and replaced by <code>target_cols</code> (the number of columns must be the same as the length of <code>target_cols</code> in this case). If <code>fun</code> returns a value of any other type then it is assumed that it is a table conforming to the Tables.jl API and the <code>Tables.columntable</code> function is called on it to get the resulting columns and their names. The names are retained when <code>target_cols</code> is <code>AsTable</code> and are replaced if <code>target_cols</code> is a vector of <code>Symbol</code>s or strings.</li></ol><p>In all of these cases, <code>function</code> can return either a single row or multiple rows. 
As a particular rule, values wrapped in a <code>Ref</code> or a <code>0</code>-dimensional <code>AbstractArray</code> are unwrapped and then treated as a single row.</p><p><code>select</code>/<code>select!</code> and <code>transform</code>/<code>transform!</code> always return a data frame with the same number and order of rows as the source (even if <code>GroupedDataFrame</code> had its groups reordered), except when selection results in zero columns in the resulting data frame (in which case the result has zero rows).</p><p>For <code>combine</code>, rows in the returned object appear in the order of groups in the <code>GroupedDataFrame</code>. The functions can return an arbitrary number of rows for each group, but the kind of returned object and the number and names of columns must be the same for all groups, except when a <code>DataFrame()</code> or <code>NamedTuple()</code> is returned, in which case a given group is skipped.</p><p>It is allowed to mix single values and vectors if multiple transformations are requested. In this case single value will be repeated to match the length of columns specified by returned vectors.</p><p>To apply <code>function</code> to each row instead of whole columns, it can be wrapped in a <code>ByRow</code> struct. <code>cols</code> can be any column indexing syntax, in which case <code>function</code> will be passed one argument for each of the columns specified by <code>cols</code> or a <code>NamedTuple</code> of them if specified columns are wrapped in <code>AsTable</code>. If <code>ByRow</code> is used it is allowed for <code>cols</code> to select an empty set of columns, in which case <code>function</code> is called for each row without any arguments and an empty <code>NamedTuple</code> is passed if empty set of columns is wrapped in <code>AsTable</code>.</p><p>If a collection of column names is passed then requesting duplicate column names in target data frame are accepted (e.g. 
<code>select!(df, [:a], :, r&quot;a&quot;)</code> is allowed) and only the first occurrence is used. In particular a syntax to move column <code>:col</code> to the first position in the data frame is <code>select!(df, :col, :)</code>. On the contrary, output column names of renaming, transformation and single column selection operations must be unique, so e.g. <code>select!(df, :a, :a =&gt; :a)</code> or <code>select!(df, :a, :a =&gt; ByRow(sin) =&gt; :a)</code> are not allowed.</p><p>In general columns returned by transformations are stored in the target data frame without copying. An exception to this rule is when columns from the source data frame are reused in the target data frame. This can happen via expressions like: <code>:x1</code>, <code>[:x1, :x2]</code>, <code>:x1 =&gt; :x2</code>, <code>:x1 =&gt; identity =&gt; :x2</code>, or <code>:x1 =&gt; (x -&gt; @view x[inds])</code> (note that in the last case the source column is reused indirectly via a view). In such cases the behavior depends on the value of the <code>copycols</code> keyword argument:</p><ul><li>if <code>copycols=true</code> then results of such transformations always perform a copy of the source column or its view;</li><li>if <code>copycols=false</code> then copies are only performed to avoid storing the same column several times in the target data frame; more precisely, no copy is made the first time a column is used, but each subsequent reuse of a source column (when compared using <code>===</code>, which excludes views of source columns) performs a copy;</li></ul><p>Note that performing <code>transform!</code> or <code>select!</code> assumes that <code>copycols=false</code>.</p><p>If <code>df</code> is a <code>SubDataFrame</code> and <code>copycols=true</code> then a <code>DataFrame</code> is returned and the same copying rules apply as for a <code>DataFrame</code> input: this means in particular that selected columns will be copied. 
If <code>copycols=false</code>, a <code>SubDataFrame</code> is returned without copying columns and in this case transforming or renaming columns is not allowed.</p><p>If a <code>GroupedDataFrame</code> is passed and <code>threads=true</code> (the default), a separate task is spawned for each specified transformation; each transformation then spawns as many tasks as Julia threads, and splits processing of groups across them (however, currently transformations with optimized implementations like <code>sum</code> and transformations that return multiple rows use a single task for all groups). This allows for parallel operation when Julia was started with more than one thread. Passed transformation functions must therefore not modify global variables (i.e. they must be pure), use locks to control parallel accesses, or <code>threads=false</code> must be passed to disable multithreading. In the future, parallelism may be extended to other cases, so this requirement also holds for <code>DataFrame</code> inputs.</p><p>In order to improve the performance of the operations some transformations invoke optimized implementation, see <a href="#DataFrames.table_transformation"><code>DataFrames.table_transformation</code></a> for details.</p><p><strong>Keyword arguments</strong></p><ul><li><code>renamecols::Bool=true</code> : whether in the <code>cols =&gt; function</code> form automatically generated column names should include the name of transformation functions or not.</li><li><code>ungroup::Bool=true</code> : whether the return value of the operation on <code>gd</code> should be a data frame or a <code>GroupedDataFrame</code>.</li><li><code>threads::Bool=true</code> : whether transformations may be run in separate tasks which can execute in parallel (possibly being applied to multiple rows or groups at the same time). Whether or not tasks are actually spawned and their number are determined automatically. 
Set to <code>false</code> if some transformations require serial execution or are not thread-safe.</li></ul><p>Metadata: this function propagates table-level <code>:note</code>-style metadata. Column-level <code>:note</code>-style metadata is propagated if: a) a single column is transformed to a single column and the name of the column   does not change (this includes all column selection operations), or b) a single column is transformed with <code>identity</code> or <code>copy</code> to a single column    even if column name is changed (this includes column renaming).    As a special case for <code>GroupedDataFrame</code> if the output has the same name    as a grouping column and <code>keepkeys=true</code>, metadata is taken from    original grouping column.</p><p>See <a href="#DataFrames.select"><code>select</code></a> for examples.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/selection.jl#L969-L999">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.vcat" href="#Base.vcat"><code>Base.vcat</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">vcat(dfs::AbstractDataFrame...;
+           ungroup::Bool=true, renamecols::Bool=true, threads::Bool=true)</code></pre><p>Mutate <code>df</code> or <code>gd</code> in place to add columns specified by <code>args...</code> and return it. The result is guaranteed to have the same number of rows as <code>df</code>. Equivalent to <code>select!(df, :, args...)</code> or <code>select!(gd, :, args...)</code>, except that column renaming performs a copy.</p><p>Below detailed common rules for all transformation functions supported by DataFrames.jl are explained and compared.</p><p>All these operations are supported both for <code>AbstractDataFrame</code> (when split and combine steps are skipped) and <code>GroupedDataFrame</code>. Technically, <code>AbstractDataFrame</code> is just considered as being grouped on no columns (meaning it has a single group, or zero groups if it is empty). The only difference is that in this case the <code>keepkeys</code> and <code>ungroup</code> keyword arguments (described below) are not supported and a data frame is always returned, as there are no split and combine steps in this case.</p><p>In order to perform operations by groups you first need to create a <code>GroupedDataFrame</code> object from your data frame using the <code>groupby</code> function that takes two arguments: (1) a data frame to be grouped, and (2) a set of columns to group by.</p><p>Operations can then be applied on each group using one of the following functions:</p><ul><li><code>combine</code>: does not put restrictions on number of rows returned per group; the returned values are vertically concatenated following order of groups in <code>GroupedDataFrame</code>; it is typically used to compute summary statistics by group; for <code>GroupedDataFrame</code> if grouping columns are kept they are put as first columns in the result;</li><li><code>select</code>: return a data frame with the number and order of rows exactly the same as the source data frame, including only new calculated columns; 
<code>select!</code> is an in-place version of <code>select</code>; for <code>GroupedDataFrame</code> if grouping columns are kept they are put as first columns in the result;</li><li><code>transform</code>: return a data frame with the number and order of rows exactly the same as the source data frame, including all columns from the source and new calculated columns; <code>transform!</code> is an in-place version of <code>transform</code>; existing columns in the source data frame are put as first columns in the result;</li></ul><p>As a special case, if a <code>GroupedDataFrame</code> that has zero groups is passed then the result of the operation is determined by performing a single call to the transformation function with a 0-row argument passed to it. The output of this operation is only used to identify the number and type of produced columns, but the result has zero rows.</p><p>All these functions take a specification of one or more functions to apply to each subset of the <code>DataFrame</code>. 
This specification can be of the following forms:</p><ol><li>standard column selectors (integers, <code>Symbol</code>s, strings, vectors of integers, vectors of <code>Symbol</code>s, vectors of strings, <code>All</code>, <code>Cols</code>, <code>:</code>, <code>Between</code>, <code>Not</code> and regular expressions)</li><li>a <code>cols =&gt; function</code> pair indicating that <code>function</code> should be called with positional arguments holding columns <code>cols</code>, which can be any valid column selector; in this case target column name is automatically generated and it is assumed that <code>function</code> returns a single value or a vector; the generated name is created by concatenating source column name and <code>function</code> name by default (see examples below).</li><li>a <code>cols =&gt; function =&gt; target_cols</code> form additionally explicitly specifying the target column or columns, which must be a single name (as a <code>Symbol</code> or a string), a vector of names or <code>AsTable</code>. Additionally it can be a <code>Function</code> which takes a string or a vector of strings as an argument containing names of columns selected by <code>cols</code>, and returns the target columns names (all accepted types except <code>AsTable</code> are allowed).</li><li>a <code>col =&gt; target_cols</code> pair, which renames the column <code>col</code> to <code>target_cols</code>, which must be single name (as a <code>Symbol</code> or a string), a vector of names or <code>AsTable</code>.</li><li>column-independent operations <code>function =&gt; target_cols</code> or just <code>function</code> for specific <code>function</code>s where the input columns are omitted; without <code>target_cols</code> the new column has the same name as <code>function</code>, otherwise it must be single name (as a <code>Symbol</code> or a string). 
Supported <code>function</code>s are:<ul><li><code>nrow</code> to efficiently compute the number of rows in each group.</li><li><code>proprow</code> to efficiently compute the proportion of rows in each group.</li><li><code>eachindex</code> to return a vector holding the number of each row within each group.</li><li><code>groupindices</code> to return the group number.</li></ul></li><li>vectors or matrices containing transformations specified by the <code>Pair</code> syntax described in points 2 to 5</li><li>a function which will be called with a <code>SubDataFrame</code> corresponding to each group if a <code>GroupedDataFrame</code> is processed, or with the data frame itself if an <code>AbstractDataFrame</code> is processed; this form should be avoided due to its poor performance unless the number of groups is small or a very large number of columns are processed (in which case <code>SubDataFrame</code> avoids excessive compilation)</li></ol><p>Note! If the expression of the form <code>x =&gt; y</code> is passed then except for the special convenience form <code>nrow =&gt; target_cols</code> it is always interpreted as <code>cols =&gt; function</code>. In particular the following expression <code>function =&gt; target_cols</code> is not a valid transformation specification.</p><p>Note! If <code>cols</code> or <code>target_cols</code> are one of <code>All</code>, <code>Cols</code>, <code>Between</code>, or <code>Not</code>, broadcasting using <code>.=&gt;</code> is supported and is equivalent to broadcasting the result of <code>names(df, cols)</code> or <code>names(df, target_cols)</code>. This behaves as if broadcasting happened after replacing the selector with selected column names within the data frame scope.</p><p>All functions have two types of signatures. One of them takes a <code>GroupedDataFrame</code> as the first argument and an arbitrary number of transformations described above as following arguments. 
The second type of signature is when a <code>Function</code> or a <code>Type</code> is passed as the first argument and a <code>GroupedDataFrame</code> as the second argument (similar to <code>map</code>).</p><p>As a special rule, with the <code>cols =&gt; function</code> and <code>cols =&gt; function =&gt; target_cols</code> syntaxes, if <code>cols</code> is wrapped in an <code>AsTable</code> object then a <code>NamedTuple</code> containing columns selected by <code>cols</code> is passed to <code>function</code>. The documentation of <a href="#DataFrames.table_transformation"><code>DataFrames.table_transformation</code></a> provides more information about this functionality, in particular covering performance considerations.</p><p>What is allowed for <code>function</code> to return is determined by the <code>target_cols</code> value:</p><ol><li>If both <code>cols</code> and <code>target_cols</code> are omitted (so only a <code>function</code> is passed), then returning a data frame, a matrix, a <code>NamedTuple</code>, a <code>Tables.AbstractRow</code> or a <code>DataFrameRow</code> will produce multiple columns in the result. Returning any other value produces a single column.</li><li>If <code>target_cols</code> is a <code>Symbol</code> or a string then the function is assumed to return a single column. In this case returning a data frame, a matrix, a <code>NamedTuple</code>, a <code>Tables.AbstractRow</code>, or a <code>DataFrameRow</code> raises an error.</li><li>If <code>target_cols</code> is a vector of <code>Symbol</code>s or strings or <code>AsTable</code> it is assumed that <code>function</code> returns multiple columns. If <code>function</code> returns one of <code>AbstractDataFrame</code>, <code>NamedTuple</code>, <code>DataFrameRow</code>, <code>Tables.AbstractRow</code>, <code>AbstractMatrix</code> then rules described in point 1 above apply. 
If <code>function</code> returns an <code>AbstractVector</code> then each element of this vector must support the <code>keys</code> function, which must return a collection of <code>Symbol</code>s, strings or integers; the return value of <code>keys</code> must be identical for all elements. Then as many columns are created as there are elements in the return value of the <code>keys</code> function. If <code>target_cols</code> is <code>AsTable</code> then their names are set to be equal to the key names except if <code>keys</code> returns integers, in which case they are prefixed by <code>x</code> (so the column names are e.g. <code>x1</code>, <code>x2</code>, ...). If <code>target_cols</code> is a vector of <code>Symbol</code>s or strings then column names produced using the rules above are ignored and replaced by <code>target_cols</code> (the number of columns must be the same as the length of <code>target_cols</code> in this case). If <code>fun</code> returns a value of any other type then it is assumed that it is a table conforming to the Tables.jl API and the <code>Tables.columntable</code> function is called on it to get the resulting columns and their names. The names are retained when <code>target_cols</code> is <code>AsTable</code> and are replaced if <code>target_cols</code> is a vector of <code>Symbol</code>s or strings.</li></ol><p>In all of these cases, <code>function</code> can return either a single row or multiple rows. 
As a particular rule, values wrapped in a <code>Ref</code> or a <code>0</code>-dimensional <code>AbstractArray</code> are unwrapped and then treated as a single row.</p><p><code>select</code>/<code>select!</code> and <code>transform</code>/<code>transform!</code> always return a data frame with the same number and order of rows as the source (even if <code>GroupedDataFrame</code> had its groups reordered), except when selection results in zero columns in the resulting data frame (in which case the result has zero rows).</p><p>For <code>combine</code>, rows in the returned object appear in the order of groups in the <code>GroupedDataFrame</code>. The functions can return an arbitrary number of rows for each group, but the kind of returned object and the number and names of columns must be the same for all groups, except when a <code>DataFrame()</code> or <code>NamedTuple()</code> is returned, in which case a given group is skipped.</p><p>It is allowed to mix single values and vectors if multiple transformations are requested. In this case single value will be repeated to match the length of columns specified by returned vectors.</p><p>To apply <code>function</code> to each row instead of whole columns, it can be wrapped in a <code>ByRow</code> struct. <code>cols</code> can be any column indexing syntax, in which case <code>function</code> will be passed one argument for each of the columns specified by <code>cols</code> or a <code>NamedTuple</code> of them if specified columns are wrapped in <code>AsTable</code>. If <code>ByRow</code> is used it is allowed for <code>cols</code> to select an empty set of columns, in which case <code>function</code> is called for each row without any arguments and an empty <code>NamedTuple</code> is passed if empty set of columns is wrapped in <code>AsTable</code>.</p><p>If a collection of column names is passed then requesting duplicate column names in target data frame are accepted (e.g. 
<code>select!(df, [:a], :, r&quot;a&quot;)</code> is allowed) and only the first occurrence is used. In particular a syntax to move column <code>:col</code> to the first position in the data frame is <code>select!(df, :col, :)</code>. On the contrary, output column names of renaming, transformation and single column selection operations must be unique, so e.g. <code>select!(df, :a, :a =&gt; :a)</code> or <code>select!(df, :a, :a =&gt; ByRow(sin) =&gt; :a)</code> are not allowed.</p><p>In general columns returned by transformations are stored in the target data frame without copying. An exception to this rule is when columns from the source data frame are reused in the target data frame. This can happen via expressions like: <code>:x1</code>, <code>[:x1, :x2]</code>, <code>:x1 =&gt; :x2</code>, <code>:x1 =&gt; identity =&gt; :x2</code>, or <code>:x1 =&gt; (x -&gt; @view x[inds])</code> (note that in the last case the source column is reused indirectly via a view). In such cases the behavior depends on the value of the <code>copycols</code> keyword argument:</p><ul><li>if <code>copycols=true</code> then results of such transformations always perform a copy of the source column or its view;</li><li>if <code>copycols=false</code> then copies are only performed to avoid storing the same column several times in the target data frame; more precisely, no copy is made the first time a column is used, but each subsequent reuse of a source column (when compared using <code>===</code>, which excludes views of source columns) performs a copy;</li></ul><p>Note that performing <code>transform!</code> or <code>select!</code> assumes that <code>copycols=false</code>.</p><p>If <code>df</code> is a <code>SubDataFrame</code> and <code>copycols=true</code> then a <code>DataFrame</code> is returned and the same copying rules apply as for a <code>DataFrame</code> input: this means in particular that selected columns will be copied. 
If <code>copycols=false</code>, a <code>SubDataFrame</code> is returned without copying columns and in this case transforming or renaming columns is not allowed.</p><p>If a <code>GroupedDataFrame</code> is passed and <code>threads=true</code> (the default), a separate task is spawned for each specified transformation; each transformation then spawns as many tasks as Julia threads, and splits processing of groups across them (however, currently transformations with optimized implementations like <code>sum</code> and transformations that return multiple rows use a single task for all groups). This allows for parallel operation when Julia was started with more than one thread. Passed transformation functions must therefore not modify global variables (i.e. they must be pure), use locks to control parallel accesses, or <code>threads=false</code> must be passed to disable multithreading. In the future, parallelism may be extended to other cases, so this requirement also holds for <code>DataFrame</code> inputs.</p><p>In order to improve the performance of the operations some transformations invoke optimized implementation, see <a href="#DataFrames.table_transformation"><code>DataFrames.table_transformation</code></a> for details.</p><p><strong>Keyword arguments</strong></p><ul><li><code>renamecols::Bool=true</code> : whether in the <code>cols =&gt; function</code> form automatically generated column names should include the name of transformation functions or not.</li><li><code>ungroup::Bool=true</code> : whether the return value of the operation on <code>gd</code> should be a data frame or a <code>GroupedDataFrame</code>.</li><li><code>threads::Bool=true</code> : whether transformations may be run in separate tasks which can execute in parallel (possibly being applied to multiple rows or groups at the same time). Whether or not tasks are actually spawned and their number are determined automatically. 
Set to <code>false</code> if some transformations require serial execution or are not thread-safe.</li></ul><p>Metadata: this function propagates table-level <code>:note</code>-style metadata. Column-level <code>:note</code>-style metadata is propagated if: a) a single column is transformed to a single column and the name of the column   does not change (this includes all column selection operations), or b) a single column is transformed with <code>identity</code> or <code>copy</code> to a single column    even if column name is changed (this includes column renaming).    As a special case for <code>GroupedDataFrame</code> if the output has the same name    as a grouping column and <code>keepkeys=true</code>, metadata is taken from    original grouping column.</p><p>See <a href="#DataFrames.select"><code>select</code></a> for examples.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/selection.jl#L969-L999">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.vcat" href="#Base.vcat"><code>Base.vcat</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">vcat(dfs::AbstractDataFrame...;
      cols::Union{Symbol, AbstractVector{Symbol},
                  AbstractVector{&lt;:AbstractString}}=:setequal,
      source::Union{Nothing, Symbol, AbstractString,
@@ -1841,7 +1841,7 @@
    6 │     6        6  missing  b
    7 │     7  missing        7  d
    8 │     8  missing        8  d
-   9 │     9  missing        9  d</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/abstractdataframe.jl#L1653-L1809">source</a></section></article><h2 id="Reshaping-data-frames-between-tall-and-wide-formats"><a class="docs-heading-anchor" href="#Reshaping-data-frames-between-tall-and-wide-formats">Reshaping data frames between tall and wide formats</a><a id="Reshaping-data-frames-between-tall-and-wide-formats-1"></a><a class="docs-heading-anchor-permalink" href="#Reshaping-data-frames-between-tall-and-wide-formats" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.stack" href="#Base.stack"><code>Base.stack</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">stack(df::AbstractDataFrame[, measure_vars[, id_vars] ];
+   9 │     9  missing        9  d</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/abstractdataframe.jl#L1653-L1809">source</a></section></article><h2 id="Reshaping-data-frames-between-tall-and-wide-formats"><a class="docs-heading-anchor" href="#Reshaping-data-frames-between-tall-and-wide-formats">Reshaping data frames between tall and wide formats</a><a id="Reshaping-data-frames-between-tall-and-wide-formats-1"></a><a class="docs-heading-anchor-permalink" href="#Reshaping-data-frames-between-tall-and-wide-formats" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.stack" href="#Base.stack"><code>Base.stack</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">stack(df::AbstractDataFrame[, measure_vars[, id_vars] ];
       variable_name=:variable, value_name=:value,
       view::Bool=false, variable_eltype::Type=String)</code></pre><p>Stack a data frame <code>df</code>, i.e. convert it from wide to long format.</p><p>Return the long-format <code>DataFrame</code> with: columns for each of the <code>id_vars</code>, column <code>value_name</code> (<code>:value</code> by default) holding the values of the stacked columns (<code>measure_vars</code>), and column <code>variable_name</code> (<code>:variable</code> by default) a vector holding the name of the corresponding <code>measure_vars</code> variable.</p><p>If <code>view=true</code> then return a stacked view of a data frame (long format). The result is a view because the columns are special <code>AbstractVectors</code> that return views into the original data frame.</p><p><strong>Arguments</strong></p><ul><li><code>df</code> : the AbstractDataFrame to be stacked</li><li><code>measure_vars</code> : the columns to be stacked (the measurement variables), as a column selector (<code>Symbol</code>, string or integer; <code>:</code>, <code>Cols</code>, <code>All</code>, <code>Between</code>, <code>Not</code>, a regular expression, or a vector of <code>Symbol</code>s, strings or integers). If neither <code>measure_vars</code> nor <code>id_vars</code> is given, <code>measure_vars</code> defaults to all floating point columns.</li><li><code>id_vars</code> : the identifier columns that are repeated during stacking, as a column selector (<code>Symbol</code>, string or integer; <code>:</code>, <code>Cols</code>, <code>All</code>, <code>Between</code>, <code>Not</code>, a regular expression, or a vector of <code>Symbol</code>s, strings or integers). 
Defaults to all variables that are not <code>measure_vars</code></li><li><code>variable_name</code> : the name (<code>Symbol</code> or string) of the new stacked column that shall hold the names of each of <code>measure_vars</code></li><li><code>value_name</code> : the name (<code>Symbol</code> or string) of the new stacked column containing the values from each of <code>measure_vars</code></li><li><code>view</code> : whether the stacked data frame should be a view rather than contain freshly allocated vectors.</li><li><code>variable_eltype</code> : determines the element type of column <code>variable_name</code>. By default a <code>PooledArray{String}</code> is created. If <code>variable_eltype=Symbol</code> a <code>PooledVector{Symbol}</code> is created, and if <code>variable_eltype=CategoricalValue{String}</code> a <code>CategoricalArray{String}</code> is produced (call <code>using CategoricalArrays</code> first if needed). Passing any other type <code>T</code> will produce a <code>PooledVector{T}</code> column as long as it supports conversion from <code>String</code>. When <code>view=true</code>, a <code>RepeatedVector{T}</code> is produced.</li></ul><p>Metadata: table-level <code>:note</code>-style metadata and column-level <code>:note</code>-style metadata for identifier columns are preserved.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=repeat(1:3, inner=2),
                       b=repeat(1:2, inner=3),
@@ -1929,7 +1929,7 @@
    9 │     2      1  c       d                3
   10 │     2      2  d       d                4
   11 │     3      2  e       d                5
-  12 │     3      2  f       d                6</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/reshape.jl#L1-L135">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.unstack" href="#DataFrames.unstack"><code>DataFrames.unstack</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">unstack(df::AbstractDataFrame, rowkeys, colkey, value;
+  12 │     3      2  f       d                6</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/reshape.jl#L1-L135">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.unstack" href="#DataFrames.unstack"><code>DataFrames.unstack</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">unstack(df::AbstractDataFrame, rowkeys, colkey, value;
         renamecols::Function=identity, allowmissing::Bool=false,
         combine=only, fill=missing, threads::Bool=true)
 unstack(df::AbstractDataFrame, colkey, value;
@@ -2074,7 +2074,7 @@
  Row │ a       b
      │ Int64?  Int64?
 ─────┼────────────────
-   1 │      3       4</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/reshape.jl#L215-L419">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.permutedims" href="#Base.permutedims"><code>Base.permutedims</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">permutedims(df::AbstractDataFrame,
+   1 │      3       4</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/reshape.jl#L215-L419">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.permutedims" href="#Base.permutedims"><code>Base.permutedims</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">permutedims(df::AbstractDataFrame,
             [src_namescol::Union{Int, Symbol, AbstractString}],
             [dest_namescol::Union{Symbol, AbstractString}];
             makeunique::Bool=false, strict::Bool=true)</code></pre><p>Turn <code>df</code> on its side such that rows become columns and values in the column indexed by <code>src_namescol</code> become the names of new columns. In the resulting <code>DataFrame</code>, column names of <code>df</code> will become the first column with name specified by <code>dest_namescol</code>.</p><p><strong>Arguments</strong></p><ul><li><code>df</code> : the <code>AbstractDataFrame</code></li><li><code>src_namescol</code> : the column that will become the new header.  If omitted then column names <code>:x1</code>, <code>:x2</code>, ... are generated automatically.</li><li><code>dest_namescol</code> : the name of the first column in the returned <code>DataFrame</code>. Defaults to the same name as <code>src_namescol</code>. Not supported when <code>src_namescol</code> is a vector or is omitted.</li><li><code>makeunique</code> : if <code>false</code> (the default), an error will be raised if duplicate names are found; if <code>true</code>, duplicate names will be suffixed with <code>_i</code> (<code>i</code> starting at 1 for the first duplicate). Not supported when <code>src_namescol</code> is omitted.</li><li><code>strict</code> : if <code>true</code> (the default), an error will be raised if the values contained in the <code>src_namescol</code> are not all <code>Symbol</code> or all <code>AbstractString</code>, or can all be converted to <code>String</code> using <code>convert</code>. If <code>false</code> then any values are accepted and they will be converted to strings using the <code>string</code> function. 
Not supported when <code>src_namescol</code> is a vector or is omitted.</li></ul><p>Note: The element types of columns in resulting <code>DataFrame</code> (other than the first column if it is created from <code>df</code> column names, which always has element type <code>String</code>) will depend on the element types of <em>all</em> input columns based on the result of <code>promote_type</code>. That is, if the source data frame contains <code>Int</code> and <code>Float64</code> columns, resulting columns will have element type <code>Float64</code>. If the source has <code>Int</code> and <code>String</code> columns, resulting columns will have element type <code>Any</code>.</p><p>Metadata: table-level <code>:note</code>-style metadata is preserved and column-level metadata is dropped.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=1:2, b=3:4)
@@ -2133,7 +2133,7 @@
 ─────┼─────────────────────────────
    1 │ b               1     two
    2 │ c               3     4
-   3 │ d               true  false</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/reshape.jl#L722-L823">source</a></section></article><h2 id="Sorting"><a class="docs-heading-anchor" href="#Sorting">Sorting</a><a id="Sorting-1"></a><a class="docs-heading-anchor-permalink" href="#Sorting" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.issorted" href="#Base.issorted"><code>Base.issorted</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">issorted(df::AbstractDataFrame, cols=All();
+   3 │ d               true  false</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/reshape.jl#L722-L823">source</a></section></article><h2 id="Sorting"><a class="docs-heading-anchor" href="#Sorting">Sorting</a><a id="Sorting-1"></a><a class="docs-heading-anchor-permalink" href="#Sorting" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.issorted" href="#Base.issorted"><code>Base.issorted</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">issorted(df::AbstractDataFrame, cols=All();
          lt::Union{Function, AbstractVector{&lt;:Function}}=isless,
          by::Union{Function, AbstractVector{&lt;:Function}}=identity,
          rev::Union{Bool, AbstractVector{Bool}}=false,
@@ -2158,7 +2158,7 @@
 false
 
 julia&gt; issorted(df, :b, rev=true)
-true</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/sort.jl#L367-L408">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.order" href="#DataFrames.order"><code>DataFrames.order</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">order(col::ColumnIndex; kwargs...)</code></pre><p>Specify sorting order for a column <code>col</code> in a data frame. <code>kwargs</code> can be <code>lt</code>, <code>by</code>, <code>rev</code>, and <code>order</code> with values following the rules defined in <a href="#Base.sort!"><code>sort!</code></a>.</p><p>See also: <a href="#Base.sort!"><code>sort!</code></a>, <a href="#Base.sort"><code>sort</code></a></p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(x=[-3, -1, 0, 2, 4], y=1:5)
+true</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/sort.jl#L367-L408">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.order" href="#DataFrames.order"><code>DataFrames.order</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">order(col::ColumnIndex; kwargs...)</code></pre><p>Specify sorting order for a column <code>col</code> in a data frame. <code>kwargs</code> can be <code>lt</code>, <code>by</code>, <code>rev</code>, and <code>order</code> with values following the rules defined in <a href="#Base.sort!"><code>sort!</code></a>.</p><p>See also: <a href="#Base.sort!"><code>sort!</code></a>, <a href="#Base.sort"><code>sort</code></a></p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(x=[-3, -1, 0, 2, 4], y=1:5)
 5×2 DataFrame
  Row │ x      y
      │ Int64  Int64
@@ -2189,7 +2189,7 @@
    2 │    -1      2
    3 │     2      4
    4 │    -3      1
-   5 │     4      5</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/sort.jl#L25-L69">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.sort" href="#Base.sort"><code>Base.sort</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">sort(df::AbstractDataFrame, cols=All();
+   5 │     4      5</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/sort.jl#L25-L69">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.sort" href="#Base.sort"><code>Base.sort</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">sort(df::AbstractDataFrame, cols=All();
      alg::Union{Algorithm, Nothing}=nothing,
      lt::Union{Function, AbstractVector{&lt;:Function}}=isless,
      by::Union{Function, AbstractVector{&lt;:Function}}=identity,
@@ -2244,7 +2244,7 @@
    1 │     1  c
    2 │     1  b
    3 │     2  a
-   4 │     3  b</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/sort.jl#L438-L518">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.sort!" href="#Base.sort!"><code>Base.sort!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">sort!(df::AbstractDataFrame, cols=All();
+   4 │     3  b</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/sort.jl#L438-L518">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.sort!" href="#Base.sort!"><code>Base.sort!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">sort!(df::AbstractDataFrame, cols=All();
       alg::Union{Algorithm, Nothing}=nothing,
       lt::Union{Function, AbstractVector{&lt;:Function}}=isless,
       by::Union{Function, AbstractVector{&lt;:Function}}=identity,
@@ -2298,7 +2298,7 @@
    1 │     1  c
    2 │     1  b
    3 │     2  a
-   4 │     3  b</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/sort.jl#L619-L701">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.sortperm" href="#Base.sortperm"><code>Base.sortperm</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">sortperm(df::AbstractDataFrame, cols=All();
+   4 │     3  b</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/sort.jl#L619-L701">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.sortperm" href="#Base.sortperm"><code>Base.sortperm</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">sortperm(df::AbstractDataFrame, cols=All();
          alg::Union{Algorithm, Nothing}=nothing,
          lt::Union{Function, AbstractVector{&lt;:Function}}=isless,
          by::Union{Function, AbstractVector{&lt;:Function}}=identity,
@@ -2340,7 +2340,7 @@
  2
  4
  3
- 1</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/sort.jl#L532-L595">source</a></section></article><h2 id="Joining"><a class="docs-heading-anchor" href="#Joining">Joining</a><a id="Joining-1"></a><a class="docs-heading-anchor-permalink" href="#Joining" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataAPI.antijoin" href="#DataAPI.antijoin"><code>DataAPI.antijoin</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">antijoin(df1, df2; on, makeunique=false, validate=(false, false), matchmissing=:error)</code></pre><p>Perform an anti join of two data frame objects and return a <code>DataFrame</code> containing the result. An anti join returns the subset of rows of <code>df1</code> that do not match with the keys in <code>df2</code>.</p><p>The order of rows in the result is kept from <code>df1</code>.</p><p><strong>Arguments</strong></p><ul><li><code>df1</code>, <code>df2</code>: the <code>AbstractDataFrames</code> to be joined</li></ul><p><strong>Keyword Arguments</strong></p><ul><li><code>on</code> : The names of the key columns on which to join the data frames. This can be a single name, or a vector of names (for joining on multiple columns). A <code>left=&gt;right</code> pair of names can be used instead of a name, for the case where a key has different names in <code>df1</code> and <code>df2</code> (it is allowed to mix names and name pairs in a vector). Key values are compared using <code>isequal</code>. 
<code>on</code> is a required argument.</li><li><code>makeunique</code> : ignored as no columns are added to <code>df1</code> columns (it is provided for consistency with other functions).</li><li><code>validate</code> : whether to check that columns passed as the <code>on</code> argument  define unique keys in each input data frame (according to <code>isequal</code>).  Can be a tuple or a pair, with the first element indicating whether to  run check for <code>df1</code> and the second element for <code>df2</code>.  By default no check is performed.</li><li><code>matchmissing</code> : if equal to <code>:error</code> throw an error if <code>missing</code> is present in <code>on</code> columns; if equal to <code>:equal</code> then <code>missing</code> is allowed and missings are matched; if equal to <code>:notequal</code> then missings are dropped in <code>df2</code> <code>on</code> columns.</li></ul><p>It is not allowed to join on columns that contain <code>NaN</code> or <code>-0.0</code> in real or imaginary part of the number. 
If you need to perform a join on such values use CategoricalArrays.jl and transform a column containing such values into a <code>CategoricalVector</code>.</p><p>When merging <code>on</code> categorical columns that differ in the ordering of their levels, the ordering of the left data frame takes precedence over the ordering of the right data frame.</p><p>Metadata: table-level and column-level <code>:note</code>-style metadata are taken from <code>df1</code>.</p><p>See also: <a href="#DataAPI.innerjoin"><code>innerjoin</code></a>, <a href="#DataAPI.leftjoin"><code>leftjoin</code></a>, <a href="#DataAPI.rightjoin"><code>rightjoin</code></a>,           <a href="#DataAPI.outerjoin"><code>outerjoin</code></a>, <a href="#DataAPI.semijoin"><code>semijoin</code></a>, <a href="#DataAPI.crossjoin"><code>crossjoin</code></a>.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; name = DataFrame(ID=[1, 2, 3], Name=[&quot;John Doe&quot;, &quot;Jane Doe&quot;, &quot;Joe Blogs&quot;])
+ 1</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/sort.jl#L532-L595">source</a></section></article><h2 id="Joining"><a class="docs-heading-anchor" href="#Joining">Joining</a><a id="Joining-1"></a><a class="docs-heading-anchor-permalink" href="#Joining" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataAPI.antijoin" href="#DataAPI.antijoin"><code>DataAPI.antijoin</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">antijoin(df1, df2; on, makeunique=false, validate=(false, false), matchmissing=:error)</code></pre><p>Perform an anti join of two data frame objects and return a <code>DataFrame</code> containing the result. An anti join returns the subset of rows of <code>df1</code> that do not match with the keys in <code>df2</code>.</p><p>The order of rows in the result is kept from <code>df1</code>.</p><p><strong>Arguments</strong></p><ul><li><code>df1</code>, <code>df2</code>: the <code>AbstractDataFrames</code> to be joined</li></ul><p><strong>Keyword Arguments</strong></p><ul><li><code>on</code> : The names of the key columns on which to join the data frames. This can be a single name, or a vector of names (for joining on multiple columns). A <code>left=&gt;right</code> pair of names can be used instead of a name, for the case where a key has different names in <code>df1</code> and <code>df2</code> (it is allowed to mix names and name pairs in a vector). Key values are compared using <code>isequal</code>. 
<code>on</code> is a required argument.</li><li><code>makeunique</code> : ignored as no columns are added to <code>df1</code> columns (it is provided for consistency with other functions).</li><li><code>validate</code> : whether to check that columns passed as the <code>on</code> argument  define unique keys in each input data frame (according to <code>isequal</code>).  Can be a tuple or a pair, with the first element indicating whether to  run check for <code>df1</code> and the second element for <code>df2</code>.  By default no check is performed.</li><li><code>matchmissing</code> : if equal to <code>:error</code> throw an error if <code>missing</code> is present in <code>on</code> columns; if equal to <code>:equal</code> then <code>missing</code> is allowed and missings are matched; if equal to <code>:notequal</code> then missings are dropped in <code>df2</code> <code>on</code> columns.</li></ul><p>It is not allowed to join on columns that contain <code>NaN</code> or <code>-0.0</code> in real or imaginary part of the number. 
If you need to perform a join on such values use CategoricalArrays.jl and transform a column containing such values into a <code>CategoricalVector</code>.</p><p>When merging <code>on</code> categorical columns that differ in the ordering of their levels, the ordering of the left data frame takes precedence over the ordering of the right data frame.</p><p>Metadata: table-level and column-level <code>:note</code>-style metadata are taken from <code>df1</code>.</p><p>See also: <a href="#DataAPI.innerjoin"><code>innerjoin</code></a>, <a href="#DataAPI.leftjoin"><code>leftjoin</code></a>, <a href="#DataAPI.rightjoin"><code>rightjoin</code></a>,           <a href="#DataAPI.outerjoin"><code>outerjoin</code></a>, <a href="#DataAPI.semijoin"><code>semijoin</code></a>, <a href="#DataAPI.crossjoin"><code>crossjoin</code></a>.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; name = DataFrame(ID=[1, 2, 3], Name=[&quot;John Doe&quot;, &quot;Jane Doe&quot;, &quot;Joe Blogs&quot;])
 3×2 DataFrame
  Row │ ID     Name
      │ Int64  String
@@ -2386,7 +2386,7 @@
  Row │ ID     Name
      │ Int64  String
 ─────┼──────────────────
-   1 │     3  Joe Blogs</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/join/composer.jl#L1395-L1489">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataAPI.crossjoin" href="#DataAPI.crossjoin"><code>DataAPI.crossjoin</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">crossjoin(df1::AbstractDataFrame, df2::AbstractDataFrame;
+   1 │     3  Joe Blogs</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/join/composer.jl#L1395-L1489">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataAPI.crossjoin" href="#DataAPI.crossjoin"><code>DataAPI.crossjoin</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">crossjoin(df1::AbstractDataFrame, df2::AbstractDataFrame;
           makeunique::Bool=false, renamecols=identity =&gt; identity)
 crossjoin(df1, df2, dfs...; makeunique = false)</code></pre><p>Perform a cross join of two or more data frame objects and return a <code>DataFrame</code> containing the result. A cross join returns the cartesian product of rows from all passed data frames, where the first passed data frame is assigned to the dimension that changes the slowest and the last data frame is assigned to the dimension that changes the fastest.</p><p><strong>Arguments</strong></p><ul><li><code>df1</code>, <code>df2</code>, <code>dfs...</code> : the <code>AbstractDataFrames</code> to be joined</li></ul><p><strong>Keyword Arguments</strong></p><ul><li><code>makeunique</code> : if <code>false</code> (the default), an error will be raised if duplicate names are found in columns not joined on; if <code>true</code>, duplicate names will be suffixed with <code>_i</code> (<code>i</code> starting at 1 for the first duplicate).</li><li><code>renamecols</code> : a <code>Pair</code> specifying how columns of left and right data frames should be renamed in the resulting data frame. Each element of the pair can be a string or a <code>Symbol</code>, in which case it is appended to the original column name; alternatively a function can be passed, in which case it is applied to each column name, which is passed to it as a <code>String</code>.</li></ul><p>If more than two data frames are passed, the join is performed recursively with left associativity.</p><p>Metadata: table-level <code>:note</code>-style metadata is preserved only for keys which are defined in all passed tables and have the same value. 
Column-level <code>:note</code>-style metadata is preserved from both tables.</p><p>See also: <a href="#DataAPI.innerjoin"><code>innerjoin</code></a>, <a href="#DataAPI.leftjoin"><code>leftjoin</code></a>, <a href="#DataAPI.rightjoin"><code>rightjoin</code></a>,           <a href="#DataAPI.outerjoin"><code>outerjoin</code></a>, <a href="#DataAPI.semijoin"><code>semijoin</code></a>, <a href="#DataAPI.antijoin"><code>antijoin</code></a>.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df1 = DataFrame(X=1:3)
 3×1 DataFrame
@@ -2415,7 +2415,7 @@
    3 │     2  a
    4 │     2  b
    5 │     3  a
-   6 │     3  b</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/join/composer.jl#L1500-L1566">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataAPI.innerjoin" href="#DataAPI.innerjoin"><code>DataAPI.innerjoin</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">innerjoin(df1, df2; on, makeunique=false, validate=(false, false),
+   6 │     3  b</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/join/composer.jl#L1500-L1566">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataAPI.innerjoin" href="#DataAPI.innerjoin"><code>DataAPI.innerjoin</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">innerjoin(df1, df2; on, makeunique=false, validate=(false, false),
           renamecols=(identity =&gt; identity), matchmissing=:error,
           order=:undefined)
 innerjoin(df1, df2, dfs...; on, makeunique=false,
@@ -2469,7 +2469,7 @@
      │ Int64  String    String
 ─────┼─────────────────────────
    1 │     1  John Doe  Lawyer
-   2 │     2  Jane Doe  Doctor</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/join/composer.jl#L630-L755">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataAPI.leftjoin" href="#DataAPI.leftjoin"><code>DataAPI.leftjoin</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">leftjoin(df1, df2; on, makeunique=false, source=nothing, validate=(false, false),
+   2 │     2  Jane Doe  Doctor</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/join/composer.jl#L630-L755">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataAPI.leftjoin" href="#DataAPI.leftjoin"><code>DataAPI.leftjoin</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">leftjoin(df1, df2; on, makeunique=false, source=nothing, validate=(false, false),
          renamecols=(identity =&gt; identity), matchmissing=:error, order=:undefined)</code></pre><p>Perform a left join of two data frame objects and return a <code>DataFrame</code> containing the result. A left join includes all rows from <code>df1</code>.</p><p>In the returned data frame the type of the columns on which the data frames are joined is determined by the type of these columns in <code>df1</code>. This behavior may change in future releases.</p><p><strong>Arguments</strong></p><ul><li><code>df1</code>, <code>df2</code>: the <code>AbstractDataFrames</code> to be joined</li></ul><p><strong>Keyword Arguments</strong></p><ul><li><code>on</code> : The names of the key columns on which to join the data frames. This can be a single name, or a vector of names (for joining on multiple columns). A <code>left=&gt;right</code> pair of names can be used instead of a name, for the case where a key has different names in <code>df1</code> and <code>df2</code> (it is allowed to mix names and name pairs in a vector). Key values are compared using <code>isequal</code>. <code>on</code> is a required argument.</li><li><code>makeunique</code> : if <code>false</code> (the default), an error will be raised if duplicate names are found in columns not joined on; if <code>true</code>, duplicate names will be suffixed with <code>_i</code> (<code>i</code> starting at 1 for the first duplicate).</li><li><code>source</code> : Default: <code>nothing</code>. If a <code>Symbol</code> or string, adds indicator column with the given name, for whether a row appeared in only <code>df1</code> (<code>&quot;left_only&quot;</code>) or in both (<code>&quot;both&quot;</code>). If the name is already in use, the column name will be modified if <code>makeunique=true</code>.</li><li><code>validate</code> : whether to check that columns passed as the <code>on</code> argument define unique keys in each input data frame (according to <code>isequal</code>). 
Can be a tuple or a pair, with the first element indicating whether to run check for <code>df1</code> and the second element for <code>df2</code>. By default no check is performed.</li><li><code>renamecols</code> : a <code>Pair</code> specifying how columns of left and right data frames should be renamed in the resulting data frame. Each element of the pair can be a string or a <code>Symbol</code>, in which case it is appended to the original column name; alternatively a function can be passed, in which case it is applied to each column name, which is passed to it as a <code>String</code>. Note that <code>renamecols</code> does not affect <code>on</code> columns, whose names are always taken from the left data frame and left unchanged.</li><li><code>matchmissing</code> : if equal to <code>:error</code> throw an error if <code>missing</code> is present in <code>on</code> columns; if equal to <code>:equal</code> then <code>missing</code> is allowed and missings are matched; if equal to <code>:notequal</code> then missings are dropped in <code>df2</code> <code>on</code> columns.</li><li><code>order</code> : if <code>:undefined</code> (the default) the order of rows in the result is  undefined and may change in future releases. If <code>:left</code> then the order of  rows from the left data frame is retained. If <code>:right</code> then the order of rows  from the right data frame is retained (non-matching rows are put at the end).</li></ul><p>All columns of the returned data frame will support missing values.</p><p>It is not allowed to join on columns that contain <code>NaN</code> or <code>-0.0</code> in real or imaginary part of the number. 
If you need to perform a join on such values use CategoricalArrays.jl and transform a column containing such values into a <code>CategoricalVector</code>.</p><p>When merging <code>on</code> categorical columns that differ in the ordering of their levels, the ordering of the left data frame takes precedence over the ordering of the right data frame.</p><p>Metadata: table-level and column-level <code>:note</code>-style metadata is taken from <code>df1</code> (including key columns), except for columns added to it from <code>df2</code>, whose column-level <code>:note</code>-style metadata is taken from <code>df2</code>.</p><p>See also: <a href="#DataAPI.innerjoin"><code>innerjoin</code></a>, <a href="#DataAPI.rightjoin"><code>rightjoin</code></a>, <a href="#DataAPI.outerjoin"><code>outerjoin</code></a>,           <a href="#DataAPI.semijoin"><code>semijoin</code></a>, <a href="#DataAPI.antijoin"><code>antijoin</code></a>, <a href="#DataAPI.crossjoin"><code>crossjoin</code></a>.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; name = DataFrame(ID=[1, 2, 3], Name=[&quot;John Doe&quot;, &quot;Jane Doe&quot;, &quot;Joe Blogs&quot;])
 3×2 DataFrame
  Row │ ID     Name
@@ -2522,7 +2522,7 @@
 ─────┼───────────────────────────
    1 │     1  John Doe   Lawyer
    2 │     2  Jane Doe   Doctor
-   3 │     3  Joe Blogs  missing</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/join/composer.jl#L793-L916">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.leftjoin!" href="#DataFrames.leftjoin!"><code>DataFrames.leftjoin!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">leftjoin!(df1, df2; on, makeunique=false, source=nothing,
+   3 │     3  Joe Blogs  missing</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/join/composer.jl#L793-L916">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.leftjoin!" href="#DataFrames.leftjoin!"><code>DataFrames.leftjoin!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">leftjoin!(df1, df2; on, makeunique=false, source=nothing,
           matchmissing=:error)</code></pre><p>Perform a left join of two data frame objects by updating the <code>df1</code> with the joined columns from <code>df2</code>.</p><p>A left join includes all rows from <code>df1</code> and leaves all rows and columns from <code>df1</code> untouched. Note that each row in <code>df1</code> must have at most one match in <code>df2</code>. Otherwise, this function would not be able to execute the join in-place since new rows would need to be added to <code>df1</code>.</p><p><strong>Arguments</strong></p><ul><li><code>df1</code>, <code>df2</code>: the <code>AbstractDataFrames</code> to be joined</li></ul><p><strong>Keyword Arguments</strong></p><ul><li><code>on</code> : The names of the key columns on which to join the data frames. This can be a single name, or a vector of names (for joining on multiple columns). A <code>left=&gt;right</code> pair of names can be used instead of a name, for the case where a key has different names in <code>df1</code> and <code>df2</code> (it is allowed to mix names and name pairs in a vector). Key values are compared using <code>isequal</code>. <code>on</code> is a required argument.</li><li><code>makeunique</code> : if <code>false</code> (the default), an error will be raised if duplicate names are found in columns not joined on; if <code>true</code>, duplicate names will be suffixed with <code>_i</code> (<code>i</code> starting at 1 for the first duplicate).</li><li><code>source</code> : Default: <code>nothing</code>. If a <code>Symbol</code> or string, adds indicator column with the given name, for whether a row appeared in only <code>df1</code> (<code>&quot;left_only&quot;</code>) or in both (<code>&quot;both&quot;</code>). 
If the name is already in use, the column name will be modified if <code>makeunique=true</code>.</li><li><code>matchmissing</code> : if equal to <code>:error</code> throw an error if <code>missing</code> is present in <code>on</code> columns; if equal to <code>:equal</code> then <code>missing</code> is allowed and missings are matched; if equal to <code>:notequal</code> then missings are dropped in <code>df2</code> <code>on</code> columns.</li></ul><p>The columns added to <code>df1</code> from <code>df2</code> will support missing values.</p><p>It is not allowed to join on columns that contain <code>NaN</code> or <code>-0.0</code> in real or imaginary part of the number. If you need to perform a join on such values use CategoricalArrays.jl and transform a column containing such values into a <code>CategoricalVector</code>.</p><p>Metadata: table-level and column-level <code>:note</code>-style metadata are taken from <code>df1</code> (including key columns), except for columns added to it from <code>df2</code>, whose column-level <code>:note</code>-style metadata is taken from <code>df2</code>.</p><p>See also: <a href="#DataAPI.leftjoin"><code>leftjoin</code></a>.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; name = DataFrame(ID=[1, 2, 3], Name=[&quot;John Doe&quot;, &quot;Jane Doe&quot;, &quot;Joe Blogs&quot;])
 3×2 DataFrame
  Row │ ID     Name
@@ -2566,7 +2566,7 @@
 ─────┼───────────────────────────────────────────────
    1 │     1  John Doe   Lawyer   Lawyer   both
    2 │     2  Jane Doe   Doctor   Doctor   both
-   3 │     3  Joe Blogs  missing  missing  left_only</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/join/inplace.jl#L1-L96">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataAPI.outerjoin" href="#DataAPI.outerjoin"><code>DataAPI.outerjoin</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">outerjoin(df1, df2; on, makeunique=false, source=nothing, validate=(false, false),
+   3 │     3  Joe Blogs  missing  missing  left_only</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/join/inplace.jl#L1-L96">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataAPI.outerjoin" href="#DataAPI.outerjoin"><code>DataAPI.outerjoin</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">outerjoin(df1, df2; on, makeunique=false, source=nothing, validate=(false, false),
           renamecols=(identity =&gt; identity), matchmissing=:error, order=:undefined)
 outerjoin(df1, df2, dfs...; on, makeunique = false,
           validate = (false, false), matchmissing=:error, order=:undefined)</code></pre><p>Perform an outer join of two or more data frame objects and return a <code>DataFrame</code> containing the result. An outer join includes rows with keys that appear in any of the passed data frames.</p><p>The order of rows in the result is undefined and may change in future releases.</p><p>In the returned data frame the type of the columns on which the data frames are joined is determined by the element type of these columns in both <code>df1</code> and <code>df2</code>. This behavior may change in future releases.</p><p><strong>Arguments</strong></p><ul><li><code>df1</code>, <code>df2</code>, <code>dfs...</code> : the <code>AbstractDataFrames</code> to be joined</li></ul><p><strong>Keyword Arguments</strong></p><ul><li><code>on</code> : The names of the key columns on which to join the data frames. This can be a single name, or a vector of names (for joining on multiple columns). When joining only two data frames, a <code>left=&gt;right</code> pair of names can be used instead of a name, for the case where a key has different names in <code>df1</code> and <code>df2</code> (it is allowed to mix names and name pairs in a vector). Key values are compared using <code>isequal</code>. <code>on</code> is a required argument.</li><li><code>makeunique</code> : if <code>false</code> (the default), an error will be raised if duplicate names are found in columns not joined on; if <code>true</code>, duplicate names will be suffixed with <code>_i</code> (<code>i</code> starting at 1 for the first duplicate).</li><li><code>source</code> : Default: <code>nothing</code>. If a <code>Symbol</code> or string, adds indicator column with the given name for whether a row appeared in only <code>df1</code> (<code>&quot;left_only&quot;</code>), only <code>df2</code> (<code>&quot;right_only&quot;</code>) or in both (<code>&quot;both&quot;</code>). 
If the name is already in use, the column name will be modified if <code>makeunique=true</code>. This argument is only supported when joining exactly two data frames.</li><li><code>validate</code> : whether to check that columns passed as the <code>on</code> argument define unique keys in each input data frame (according to <code>isequal</code>). Can be a tuple or a pair, with the first element indicating whether to run check for <code>df1</code> and the second element for <code>df2</code>. By default no check is performed.</li><li><code>renamecols</code> : a <code>Pair</code> specifying how columns of left and right data frames should be renamed in the resulting data frame. Each element of the pair can be a string or a <code>Symbol</code>, in which case it is appended to the original column name; alternatively a function can be passed, in which case it is applied to each column name, which is passed to it as a <code>String</code>. Note that <code>renamecols</code> does not affect <code>on</code> columns, whose names are always taken from the left data frame and left unchanged.</li><li><code>matchmissing</code> : if equal to <code>:error</code> throw an error if <code>missing</code> is present in <code>on</code> columns; if equal to <code>:equal</code> then <code>missing</code> is allowed and missings are matched.</li><li><code>order</code> : if <code>:undefined</code> (the default) the order of rows in the result is  undefined and may change in future releases. If <code>:left</code> then the order of  rows from the left data frame is retained (non-matching rows are put at the end).  If <code>:right</code> then the order of rows from the right data frame is retained  (non-matching rows are put at the end).</li></ul><p>All columns of the returned data frame will support missing values.</p><p>It is not allowed to join on columns that contain <code>NaN</code> or <code>-0.0</code> in real or imaginary part of the number. 
If you need to perform a join on such values use CategoricalArrays.jl and transform a column containing such values into a <code>CategoricalVector</code>.</p><p>When merging <code>on</code> categorical columns that differ in the ordering of their levels, the ordering of the left data frame takes precedence over the ordering of the right data frame.</p><p>If more than two data frames are passed, the join is performed recursively with left associativity. In this case the <code>source</code> keyword argument is not supported and <code>validate</code> keyword argument is applied recursively with left associativity.</p><p>Metadata: table-level <code>:note</code>-style metadata and column-level <code>:note</code>-style metadata for key columns is preserved only for keys which are defined in all passed tables and have the same value. Column-level <code>:note</code>-style metadata is preserved for all other columns.</p><p>See also: <a href="#DataAPI.innerjoin"><code>innerjoin</code></a>, <a href="#DataAPI.leftjoin"><code>leftjoin</code></a>, <a href="#DataAPI.rightjoin"><code>rightjoin</code></a>,           <a href="#DataAPI.semijoin"><code>semijoin</code></a>, <a href="#DataAPI.antijoin"><code>antijoin</code></a>, <a href="#DataAPI.crossjoin"><code>crossjoin</code></a>.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; name = DataFrame(ID=[1, 2, 3], Name=[&quot;John Doe&quot;, &quot;Jane Doe&quot;, &quot;Joe Blogs&quot;])
@@ -2624,7 +2624,7 @@
    1 │     1  John Doe   Lawyer
    2 │     2  Jane Doe   Doctor
    3 │     3  Joe Blogs  missing
-   4 │     4  missing    Farmer</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/join/composer.jl#L1102-L1241">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataAPI.rightjoin" href="#DataAPI.rightjoin"><code>DataAPI.rightjoin</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">rightjoin(df1, df2; on, makeunique=false, source=nothing,
+   4 │     4  missing    Farmer</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/join/composer.jl#L1102-L1241">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataAPI.rightjoin" href="#DataAPI.rightjoin"><code>DataAPI.rightjoin</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">rightjoin(df1, df2; on, makeunique=false, source=nothing,
           validate=(false, false), renamecols=(identity =&gt; identity),
           matchmissing=:error, order=:undefined)</code></pre><p>Perform a right join on two data frame objects and return a <code>DataFrame</code> containing the result. A right join includes all rows from <code>df2</code>.</p><p>The order of rows in the result is undefined and may change in future releases.</p><p>In the returned data frame the type of the columns on which the data frames are joined is determined by the type of these columns in <code>df2</code>. This behavior may change in future releases.</p><p><strong>Arguments</strong></p><ul><li><code>df1</code>, <code>df2</code>: the <code>AbstractDataFrames</code> to be joined</li></ul><p><strong>Keyword Arguments</strong></p><ul><li><code>on</code> : The names of the key columns on which to join the data frames. This can be a single name, or a vector of names (for joining on multiple columns). A <code>left=&gt;right</code> pair of names can be used instead of a name, for the case where a key has different names in <code>df1</code> and <code>df2</code> (it is allowed to mix names and name pairs in a vector). Key values are compared using <code>isequal</code>. <code>on</code> is a required argument.</li><li><code>makeunique</code> : if <code>false</code> (the default), an error will be raised if duplicate names are found in columns not joined on; if <code>true</code>, duplicate names will be suffixed with <code>_i</code> (<code>i</code> starting at 1 for the first duplicate).</li><li><code>source</code> : Default: <code>nothing</code>. If a <code>Symbol</code> or string, adds indicator column with the given name for whether a row appeared in only <code>df2</code> (<code>&quot;right_only&quot;</code>) or in both (<code>&quot;both&quot;</code>). 
If the name is already in use, the column name will be modified if <code>makeunique=true</code>.</li><li><code>validate</code> : whether to check that columns passed as the <code>on</code> argument define unique keys in each input data frame (according to <code>isequal</code>). Can be a tuple or a pair, with the first element indicating whether to run check for <code>df1</code> and the second element for <code>df2</code>. By default no check is performed.</li><li><code>renamecols</code> : a <code>Pair</code> specifying how columns of left and right data frames should be renamed in the resulting data frame. Each element of the pair can be a string or a <code>Symbol</code>, in which case it is appended to the original column name; alternatively a function can be passed, in which case it is applied to each column name, which is passed to it as a <code>String</code>. Note that <code>renamecols</code> does not affect <code>on</code> columns, whose names are always taken from the left data frame and left unchanged.</li><li><code>matchmissing</code> : if equal to <code>:error</code> throw an error if <code>missing</code> is present in <code>on</code> columns; if equal to <code>:equal</code> then <code>missing</code> is allowed and missings are matched; if equal to <code>:notequal</code> then missings are dropped in <code>df1</code> <code>on</code> columns.</li><li><code>order</code> : if <code>:undefined</code> (the default) the order of rows in the result is  undefined and may change in future releases. If <code>:left</code> then the order of  rows from the left data frame is retained (non-matching rows are put at the end).  If <code>:right</code> then the order of rows from the right data frame is retained.</li></ul><p>All columns of the returned data frame will support missing values.</p><p>It is not allowed to join on columns that contain <code>NaN</code> or <code>-0.0</code> in real or imaginary part of the number. 
If you need to perform a join on such values use CategoricalArrays.jl and transform a column containing such values into a <code>CategoricalVector</code>.</p><p>When merging <code>on</code> categorical columns that differ in the ordering of their levels, the ordering of the left data frame takes precedence over the ordering of the right data frame.</p><p>Metadata: table-level and column-level <code>:note</code>-style metadata is taken from <code>df2</code> (including key columns), except for columns added to it from <code>df1</code>, whose column-level <code>:note</code>-style metadata is taken from <code>df1</code>.</p><p>See also: <a href="#DataAPI.innerjoin"><code>innerjoin</code></a>, <a href="#DataAPI.leftjoin"><code>leftjoin</code></a>, <a href="#DataAPI.outerjoin"><code>outerjoin</code></a>,           <a href="#DataAPI.semijoin"><code>semijoin</code></a>, <a href="#DataAPI.antijoin"><code>antijoin</code></a>, <a href="#DataAPI.crossjoin"><code>crossjoin</code></a>.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; name = DataFrame(ID=[1, 2, 3], Name=[&quot;John Doe&quot;, &quot;Jane Doe&quot;, &quot;Joe Blogs&quot;])
 3×2 DataFrame
@@ -2678,7 +2678,7 @@
 ─────┼─────────────────────────
    1 │     1  John Doe  Lawyer
    2 │     2  Jane Doe  Doctor
-   3 │     4  missing   Farmer</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/join/composer.jl#L946-L1072">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataAPI.semijoin" href="#DataAPI.semijoin"><code>DataAPI.semijoin</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">semijoin(df1, df2; on, makeunique=false, validate=(false, false), matchmissing=:error)</code></pre><p>Perform a semi join of two data frame objects and return a <code>DataFrame</code> containing the result. A semi join returns the subset of rows of <code>df1</code> that match with the keys in <code>df2</code>.</p><p>The order of rows in the result is kept from <code>df1</code>.</p><p><strong>Arguments</strong></p><ul><li><code>df1</code>, <code>df2</code>: the <code>AbstractDataFrames</code> to be joined</li></ul><p><strong>Keyword Arguments</strong></p><ul><li><code>on</code> : The names of the key columns on which to join the data frames. This can be a single name, or a vector of names (for joining on multiple columns). A <code>left=&gt;right</code> pair of names can be used instead of a name, for the case where a key has different names in <code>df1</code> and <code>df2</code> (it is allowed to mix names and name pairs in a vector). Key values are compared using <code>isequal</code>. <code>on</code> is a required argument.</li><li><code>makeunique</code> : ignored as no columns are added to <code>df1</code> columns (it is provided for consistency with other functions).</li><li><code>indicator</code> : Default: <code>nothing</code>. 
If a <code>Symbol</code> or string, adds categorical indicator  column with the given name for whether a row appeared in only <code>df1</code> (<code>&quot;left_only&quot;</code>),  only <code>df2</code> (<code>&quot;right_only&quot;</code>) or in both (<code>&quot;both&quot;</code>). If the name is already in use,  the column name will be modified if <code>makeunique=true</code>.</li><li><code>validate</code> : whether to check that columns passed as the <code>on</code> argument  define unique keys in each input data frame (according to <code>isequal</code>).  Can be a tuple or a pair, with the first element indicating whether to  run check for <code>df1</code> and the second element for <code>df2</code>.  By default no check is performed.</li><li><code>matchmissing</code> : if equal to <code>:error</code> throw an error if <code>missing</code> is present in <code>on</code> columns; if equal to <code>:equal</code> then <code>missing</code> is allowed and missings are matched; if equal to <code>:notequal</code> then missings are dropped in <code>df2</code> <code>on</code> columns.</li></ul><p>It is not allowed to join on columns that contain <code>NaN</code> or <code>-0.0</code> in real or imaginary part of the number. 
If you need to perform a join on such values use CategoricalArrays.jl and transform a column containing such values into a <code>CategoricalVector</code>.</p><p>When merging <code>on</code> categorical columns that differ in the ordering of their levels, the ordering of the left data frame takes precedence over the ordering of the right data frame.</p><p>Metadata: table-level and column-level <code>:note</code>-style metadata are taken from <code>df1</code>.</p><p>See also: <a href="#DataAPI.innerjoin"><code>innerjoin</code></a>, <a href="#DataAPI.leftjoin"><code>leftjoin</code></a>, <a href="#DataAPI.rightjoin"><code>rightjoin</code></a>,           <a href="#DataAPI.outerjoin"><code>outerjoin</code></a>, <a href="#DataAPI.antijoin"><code>antijoin</code></a>, <a href="#DataAPI.crossjoin"><code>crossjoin</code></a>.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; name = DataFrame(ID=[1, 2, 3], Name=[&quot;John Doe&quot;, &quot;Jane Doe&quot;, &quot;Joe Blogs&quot;])
+   3 │     4  missing   Farmer</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/join/composer.jl#L946-L1072">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataAPI.semijoin" href="#DataAPI.semijoin"><code>DataAPI.semijoin</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">semijoin(df1, df2; on, makeunique=false, validate=(false, false), matchmissing=:error)</code></pre><p>Perform a semi join of two data frame objects and return a <code>DataFrame</code> containing the result. A semi join returns the subset of rows of <code>df1</code> that match with the keys in <code>df2</code>.</p><p>The order of rows in the result is kept from <code>df1</code>.</p><p><strong>Arguments</strong></p><ul><li><code>df1</code>, <code>df2</code>: the <code>AbstractDataFrames</code> to be joined</li></ul><p><strong>Keyword Arguments</strong></p><ul><li><code>on</code> : The names of the key columns on which to join the data frames. This can be a single name, or a vector of names (for joining on multiple columns). A <code>left=&gt;right</code> pair of names can be used instead of a name, for the case where a key has different names in <code>df1</code> and <code>df2</code> (it is allowed to mix names and name pairs in a vector). Key values are compared using <code>isequal</code>. <code>on</code> is a required argument.</li><li><code>makeunique</code> : ignored as no columns are added to <code>df1</code> columns (it is provided for consistency with other functions).</li><li><code>indicator</code> : Default: <code>nothing</code>. 
If a <code>Symbol</code> or string, adds categorical indicator  column with the given name for whether a row appeared in only <code>df1</code> (<code>&quot;left_only&quot;</code>),  only <code>df2</code> (<code>&quot;right_only&quot;</code>) or in both (<code>&quot;both&quot;</code>). If the name is already in use,  the column name will be modified if <code>makeunique=true</code>.</li><li><code>validate</code> : whether to check that columns passed as the <code>on</code> argument  define unique keys in each input data frame (according to <code>isequal</code>).  Can be a tuple or a pair, with the first element indicating whether to  run check for <code>df1</code> and the second element for <code>df2</code>.  By default no check is performed.</li><li><code>matchmissing</code> : if equal to <code>:error</code> throw an error if <code>missing</code> is present in <code>on</code> columns; if equal to <code>:equal</code> then <code>missing</code> is allowed and missings are matched; if equal to <code>:notequal</code> then missings are dropped in <code>df2</code> <code>on</code> columns.</li></ul><p>It is not allowed to join on columns that contain <code>NaN</code> or <code>-0.0</code> in real or imaginary part of the number. 
If you need to perform a join on such values use CategoricalArrays.jl and transform a column containing such values into a <code>CategoricalVector</code>.</p><p>When merging <code>on</code> categorical columns that differ in the ordering of their levels, the ordering of the left data frame takes precedence over the ordering of the right data frame.</p><p>Metadata: table-level and column-level <code>:note</code>-style metadata are taken from <code>df1</code>.</p><p>See also: <a href="#DataAPI.innerjoin"><code>innerjoin</code></a>, <a href="#DataAPI.leftjoin"><code>leftjoin</code></a>, <a href="#DataAPI.rightjoin"><code>rightjoin</code></a>,           <a href="#DataAPI.outerjoin"><code>outerjoin</code></a>, <a href="#DataAPI.antijoin"><code>antijoin</code></a>, <a href="#DataAPI.crossjoin"><code>crossjoin</code></a>.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; name = DataFrame(ID=[1, 2, 3], Name=[&quot;John Doe&quot;, &quot;Jane Doe&quot;, &quot;Joe Blogs&quot;])
 3×2 DataFrame
  Row │ ID     Name
      │ Int64  String
@@ -2727,7 +2727,7 @@
      │ Int64  String
 ─────┼─────────────────
    1 │     1  John Doe
-   2 │     2  Jane Doe</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/join/composer.jl#L1284-L1385">source</a></section></article><h2 id="Grouping"><a class="docs-heading-anchor" href="#Grouping">Grouping</a><a id="Grouping-1"></a><a class="docs-heading-anchor-permalink" href="#Grouping" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.get" href="#Base.get"><code>Base.get</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">get(gd::GroupedDataFrame, key, default)</code></pre><p>Get a group based on the values of the grouping columns.</p><p><code>key</code> may be a <code>GroupKey</code>, <code>NamedTuple</code> or <code>Tuple</code> of grouping column values (in the same order as the <code>cols</code> argument to <code>groupby</code>). It may also be an <code>AbstractDict</code>, in which case the order of the arguments does not matter.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=repeat([:foo, :bar, :baz], outer=[2]),
+   2 │     2  Jane Doe</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/join/composer.jl#L1284-L1385">source</a></section></article><h2 id="Grouping"><a class="docs-heading-anchor" href="#Grouping">Grouping</a><a id="Grouping-1"></a><a class="docs-heading-anchor-permalink" href="#Grouping" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.get" href="#Base.get"><code>Base.get</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">get(gd::GroupedDataFrame, key, default)</code></pre><p>Get a group based on the values of the grouping columns.</p><p><code>key</code> may be a <code>GroupKey</code>, <code>NamedTuple</code> or <code>Tuple</code> of grouping column values (in the same order as the <code>cols</code> argument to <code>groupby</code>). It may also be an <code>AbstractDict</code>, in which case the order of the arguments does not matter.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=repeat([:foo, :bar, :baz], outer=[2]),
                       b=repeat([2, 1], outer=[3]),
                       c=1:6);
 
@@ -2763,7 +2763,7 @@
    1 │ baz         2      3
    2 │ baz         1      6
 
-julia&gt; get(gd, (:qux,), nothing)</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/groupeddataframe/groupeddataframe.jl#L1055-L1105">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataAPI.groupby" href="#DataAPI.groupby"><code>DataAPI.groupby</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">groupby(d::AbstractDataFrame, cols;
+julia&gt; get(gd, (:qux,), nothing)</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/groupeddataframe/groupeddataframe.jl#L1055-L1105">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataAPI.groupby" href="#DataAPI.groupby"><code>DataAPI.groupby</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">groupby(d::AbstractDataFrame, cols;
         sort::Union{Bool, Nothing, NamedTuple}=nothing,
         skipmissing::Bool=false)</code></pre><p>Return a <code>GroupedDataFrame</code> representing a view of an <code>AbstractDataFrame</code> split into row groups.</p><p><strong>Arguments</strong></p><ul><li><code>df</code> : an <code>AbstractDataFrame</code> to split</li><li><code>cols</code> : data frame columns to group by. Can be any column selector (<code>Symbol</code>, string or integer; <code>:</code>, <code>Cols</code>, <code>All</code>, <code>Between</code>, <code>Not</code>, a regular expression, or a vector of <code>Symbol</code>s, strings or integers). In particular if the selector picks no columns then a single-group <code>GroupedDataFrame</code> is created. As a special case, if <code>cols</code> is a single column or a vector of columns then it can contain columns wrapped in <a href="#DataFrames.order"><code>order</code></a> that will be used to determine the order of groups if <code>sort</code> is <code>true</code> or a <code>NamedTuple</code> (if <code>sort</code> is <code>false</code>, then passing <code>order</code> is an error; if <code>sort</code> is <code>nothing</code> then it is set to <code>true</code> when <code>order</code> is passed).</li><li><code>sort</code> : if <code>sort=true</code> sort groups according to the values of the grouping columns <code>cols</code>; if <code>sort=false</code> groups are created in their order of appearance in <code>df</code>; if <code>sort=nothing</code> (the default) then the fastest available grouping algorithm is picked and in consequence the order of groups in the result is undefined and may change in future releases; below a description of the current implementation is provided. Additionally <code>sort</code> can be a <code>NamedTuple</code> having some or all of <code>alg</code>, <code>lt</code>, <code>by</code>, <code>rev</code>, and <code>order</code> fields. 
In this case the groups are sorted and their order follows the <a href="#Base.sortperm"><code>sortperm</code></a> order.</li><li><code>skipmissing</code> : whether to skip groups with <code>missing</code> values in one of the grouping columns <code>cols</code></li></ul><p><strong>Details</strong></p><p>An iterator over a <code>GroupedDataFrame</code> returns a <code>SubDataFrame</code> view for each grouping into <code>df</code>. Within each group, the order of rows in <code>df</code> is preserved.</p><p>A <code>GroupedDataFrame</code> also supports indexing by groups, <code>select</code>, <code>transform</code>, and <code>combine</code> (which applies a function to each group and combines the result into a data frame).</p><p><code>GroupedDataFrame</code> also supports the dictionary interface. The keys are <a href="../types/#DataFrames.GroupKey"><code>GroupKey</code></a> objects returned by <a href="#Base.keys"><code>keys(::GroupedDataFrame)</code></a>, which can also be used to get the values of the grouping columns for each group. <code>Tuples</code> and <code>NamedTuple</code>s containing the values of the grouping columns (in the same order as the <code>cols</code> argument) are also accepted as indices. Finally, an <code>AbstractDict</code> can be used to index into a grouped data frame where the keys are column names of the data frame. The order of the keys does not matter in this case.</p><p>In the current implementation if <code>sort=nothing</code> groups are ordered following the order of appearance of values in the grouping columns, except when all grouping columns provide non-<code>nothing</code> <code>DataAPI.refpool</code>, in which case the order of groups follows the order of values returned by <code>DataAPI.refpool</code>. As a particular application of this rule if all <code>cols</code> are <code>CategoricalVector</code>s then groups are always sorted. 
Integer columns with a narrow range also use this optimization, so the order of groups when grouping on integer columns is undefined. A column is considered to be an integer column when deciding on the grouping algorithm choice if its <code>eltype</code> is a subtype of <code>Union{Missing, Real}</code>, all its elements are either <code>missing</code> or pass <code>isinteger</code> test, and none of them is equal to <code>-0.0</code>.</p><p><strong>See also</strong></p><p><a href="#DataFrames.combine"><code>combine</code></a>, <a href="#DataFrames.select"><code>select</code></a>, <a href="#DataFrames.select!"><code>select!</code></a>, <a href="#DataFrames.transform"><code>transform</code></a>, <a href="#DataFrames.transform!"><code>transform!</code></a></p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=repeat([1, 2, 3, 4], outer=[2]),
                       b=repeat([2, 1], outer=[4]),
@@ -2862,7 +2862,7 @@
      │ Int64  Int64  Int64
 ─────┼─────────────────────
    1 │     4      1      4
-   2 │     4      1      8</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/groupeddataframe/groupeddataframe.jl#L50-L217">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.groupcols" href="#DataFrames.groupcols"><code>DataFrames.groupcols</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">groupcols(gd::GroupedDataFrame)</code></pre><p>Return a vector of <code>Symbol</code> column names in <code>parent(gd)</code> used for grouping.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/groupeddataframe/groupeddataframe.jl#L493-L497">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.groupindices" href="#DataFrames.groupindices"><code>DataFrames.groupindices</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">groupindices(gd::GroupedDataFrame)</code></pre><p>Return a vector of group indices for each row of <code>parent(gd)</code>.</p><p>Rows appearing in group <code>gd[i]</code> are attributed index <code>i</code>. 
Rows not present in any group are attributed <code>missing</code> (this can happen if <code>skipmissing=true</code> was passed when creating <code>gd</code>, or if <code>gd</code> is a subset from a larger <a href="../types/#DataFrames.GroupedDataFrame"><code>GroupedDataFrame</code></a>).</p><p>The <code>groupindices =&gt; target_col_name</code> syntax (or just <code>groupindices</code> without specifying the target column name) is also supported in the transformation mini-language when passing a <code>GroupedDataFrame</code> to transformation functions (<a href="#DataFrames.combine"><code>combine</code></a>, <a href="#DataFrames.select"><code>select</code></a>, etc.).</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(id=[&quot;a&quot;, &quot;c&quot;, &quot;b&quot;, &quot;b&quot;, &quot;a&quot;])
+   2 │     4      1      8</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/groupeddataframe/groupeddataframe.jl#L50-L217">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.groupcols" href="#DataFrames.groupcols"><code>DataFrames.groupcols</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">groupcols(gd::GroupedDataFrame)</code></pre><p>Return a vector of <code>Symbol</code> column names in <code>parent(gd)</code> used for grouping.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/groupeddataframe/groupeddataframe.jl#L493-L497">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.groupindices" href="#DataFrames.groupindices"><code>DataFrames.groupindices</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">groupindices(gd::GroupedDataFrame)</code></pre><p>Return a vector of group indices for each row of <code>parent(gd)</code>.</p><p>Rows appearing in group <code>gd[i]</code> are attributed index <code>i</code>. 
Rows not present in any group are attributed <code>missing</code> (this can happen if <code>skipmissing=true</code> was passed when creating <code>gd</code>, or if <code>gd</code> is a subset from a larger <a href="../types/#DataFrames.GroupedDataFrame"><code>GroupedDataFrame</code></a>).</p><p>The <code>groupindices =&gt; target_col_name</code> syntax (or just <code>groupindices</code> without specifying the target column name) is also supported in the transformation mini-language when passing a <code>GroupedDataFrame</code> to transformation functions (<a href="#DataFrames.combine"><code>combine</code></a>, <a href="#DataFrames.select"><code>select</code></a>, etc.).</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(id=[&quot;a&quot;, &quot;c&quot;, &quot;b&quot;, &quot;b&quot;, &quot;a&quot;])
 5×1 DataFrame
  Row │ id
      │ String
@@ -2893,7 +2893,7 @@
    2 │ c           2
    3 │ b           3
    4 │ b           3
-   5 │ a           1</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/groupeddataframe/groupeddataframe.jl#L379-L430">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.keys" href="#Base.keys"><code>Base.keys</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">keys(gd::GroupedDataFrame)</code></pre><p>Get the set of keys for each group of the <code>GroupedDataFrame</code> <code>gd</code> as a <a href="../types/#DataFrames.GroupKeys"><code>GroupKeys</code></a> object. Each key is a <a href="../types/#DataFrames.GroupKey"><code>GroupKey</code></a>, which behaves like a <code>NamedTuple</code> holding the values of the grouping columns for a given group. Unlike the equivalent <code>Tuple</code>, <code>NamedTuple</code>, and <code>AbstractDict</code>, these keys can be used to index into <code>gd</code> efficiently. The ordering of the keys is identical to the ordering of the groups of <code>gd</code> under iteration and integer indexing.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=repeat([:foo, :bar, :baz], outer=[4]),
+   5 │ a           1</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/groupeddataframe/groupeddataframe.jl#L379-L430">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.keys" href="#Base.keys"><code>Base.keys</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">keys(gd::GroupedDataFrame)</code></pre><p>Get the set of keys for each group of the <code>GroupedDataFrame</code> <code>gd</code> as a <a href="../types/#DataFrames.GroupKeys"><code>GroupKeys</code></a> object. Each key is a <a href="../types/#DataFrames.GroupKey"><code>GroupKey</code></a>, which behaves like a <code>NamedTuple</code> holding the values of the grouping columns for a given group. Unlike the equivalent <code>Tuple</code>, <code>NamedTuple</code>, and <code>AbstractDict</code>, these keys can be used to index into <code>gd</code> efficiently. The ordering of the keys is identical to the ordering of the groups of <code>gd</code> under iteration and integer indexing.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=repeat([:foo, :bar, :baz], outer=[4]),
                       b=repeat([2, 1], outer=[6]),
                       c=1:12);
 
@@ -2952,7 +2952,7 @@
    2 │ foo         2      7
 
 julia&gt; gd[keys(gd)[1]] == gd[1]
-true</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/groupeddataframe/groupeddataframe.jl#L929-L1010">source</a></section><section><div><pre><code class="language-julia hljs">keys(dfc::DataFrameColumns)</code></pre><p>Get a vector of column names of <code>dfc</code> as <code>Symbol</code>s.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/iteration.jl#L290-L294">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.parent" href="#Base.parent"><code>Base.parent</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">parent(gd::GroupedDataFrame)</code></pre><p>Return the parent data frame of <code>gd</code>.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/groupeddataframe/groupeddataframe.jl#L329-L333">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.proprow" href="#DataFrames.proprow"><code>DataFrames.proprow</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">proprow</code></pre><p>Compute the proportion of rows which belong to each group, i.e. 
its number of rows divided by the total number of rows in a <code>GroupedDataFrame</code>.</p><p>This function can only be used in the transformation mini-language via the <code>proprow =&gt; target_col_name</code> syntax (or just <code>proprow</code> without specifying the target column name), when passing a <code>GroupedDataFrame</code> to transformation functions (<a href="#DataFrames.combine"><code>combine</code></a>, <a href="#DataFrames.select"><code>select</code></a>, etc.).</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(id=[&quot;a&quot;, &quot;c&quot;, &quot;b&quot;, &quot;b&quot;, &quot;a&quot;, &quot;b&quot;])
+true</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/groupeddataframe/groupeddataframe.jl#L929-L1010">source</a></section><section><div><pre><code class="language-julia hljs">keys(dfc::DataFrameColumns)</code></pre><p>Get a vector of column names of <code>dfc</code> as <code>Symbol</code>s.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/iteration.jl#L290-L294">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.parent" href="#Base.parent"><code>Base.parent</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">parent(gd::GroupedDataFrame)</code></pre><p>Return the parent data frame of <code>gd</code>.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/groupeddataframe/groupeddataframe.jl#L329-L333">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.proprow" href="#DataFrames.proprow"><code>DataFrames.proprow</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">proprow</code></pre><p>Compute the proportion of rows which belong to each group, i.e. 
its number of rows divided by the total number of rows in a <code>GroupedDataFrame</code>.</p><p>This function can only be used in the transformation mini-language via the <code>proprow =&gt; target_col_name</code> syntax (or just <code>proprow</code> without specifying the target column name), when passing a <code>GroupedDataFrame</code> to transformation functions (<a href="#DataFrames.combine"><code>combine</code></a>, <a href="#DataFrames.select"><code>select</code></a>, etc.).</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(id=[&quot;a&quot;, &quot;c&quot;, &quot;b&quot;, &quot;b&quot;, &quot;a&quot;, &quot;b&quot;])
 6×1 DataFrame
  Row │ id
      │ String
@@ -2985,7 +2985,7 @@
    3 │ b       0.5
    4 │ b       0.5
    5 │ a       0.333333
-   6 │ b       0.5</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/groupeddataframe/groupeddataframe.jl#L438-L487">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.valuecols" href="#DataFrames.valuecols"><code>DataFrames.valuecols</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">valuecols(gd::GroupedDataFrame)</code></pre><p>Return a vector of <code>Symbol</code> column names in <code>parent(gd)</code> not used for grouping.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/groupeddataframe/groupeddataframe.jl#L504-L508">source</a></section></article><h2 id="Filtering-rows"><a class="docs-heading-anchor" href="#Filtering-rows">Filtering rows</a><a id="Filtering-rows-1"></a><a class="docs-heading-anchor-permalink" href="#Filtering-rows" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.allunique" href="#Base.allunique"><code>Base.allunique</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">allunique(df::AbstractDataFrame, cols=:)</code></pre><p>Return <code>true</code> if none of the rows of <code>df</code> are duplicated. 
Two rows are duplicates if all their columns contain equal values (according to <code>isequal</code>) for all columns in <code>cols</code> (by default, all columns).</p><p><strong>Arguments</strong></p><ul><li><code>df</code> : <code>AbstractDataFrame</code></li><li><code>cols</code> : a selector specifying the column(s) or their transformations to compare. Can be any column selector or transformation accepted by <a href="#DataFrames.select"><code>select</code></a>.</li></ul><p>See also <a href="#Base.unique"><code>unique</code></a> and <a href="#DataFrames.nonunique"><code>nonunique</code></a>.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(i=1:4, x=[1, 2, 1, 2])
+   6 │ b       0.5</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/groupeddataframe/groupeddataframe.jl#L438-L487">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.valuecols" href="#DataFrames.valuecols"><code>DataFrames.valuecols</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">valuecols(gd::GroupedDataFrame)</code></pre><p>Return a vector of <code>Symbol</code> column names in <code>parent(gd)</code> not used for grouping.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/groupeddataframe/groupeddataframe.jl#L504-L508">source</a></section></article><h2 id="Filtering-rows"><a class="docs-heading-anchor" href="#Filtering-rows">Filtering rows</a><a id="Filtering-rows-1"></a><a class="docs-heading-anchor-permalink" href="#Filtering-rows" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.allunique" href="#Base.allunique"><code>Base.allunique</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">allunique(df::AbstractDataFrame, cols=:)</code></pre><p>Return <code>true</code> if none of the rows of <code>df</code> are duplicated. 
Two rows are duplicates if all their columns contain equal values (according to <code>isequal</code>) for all columns in <code>cols</code> (by default, all columns).</p><p><strong>Arguments</strong></p><ul><li><code>df</code> : <code>AbstractDataFrame</code></li><li><code>cols</code> : a selector specifying the column(s) or their transformations to compare. Can be any column selector or transformation accepted by <a href="#DataFrames.select"><code>select</code></a>.</li></ul><p>See also <a href="#Base.unique"><code>unique</code></a> and <a href="#DataFrames.nonunique"><code>nonunique</code></a>.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(i=1:4, x=[1, 2, 1, 2])
 4×2 DataFrame
  Row │ i      x
      │ Int64  Int64
@@ -3002,7 +3002,7 @@
 false
 
 julia&gt; allunique(df, :i =&gt; ByRow(isodd))
-false</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/unique.jl#L165-L202">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.deleteat!" href="#Base.deleteat!"><code>Base.deleteat!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">deleteat!(df::DataFrame, inds)</code></pre><p>Delete rows specified by <code>inds</code> from a <code>DataFrame</code> <code>df</code> in place and return it.</p><p>Internally <code>deleteat!</code> is called for all columns so <code>inds</code> must be: a vector of sorted and unique integers, a boolean vector, an integer, or <code>Not</code> wrapping any valid selector.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=1:3, b=4:6)
+false</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/unique.jl#L165-L202">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.deleteat!" href="#Base.deleteat!"><code>Base.deleteat!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">deleteat!(df::DataFrame, inds)</code></pre><p>Delete rows specified by <code>inds</code> from a <code>DataFrame</code> <code>df</code> in place and return it.</p><p>Internally <code>deleteat!</code> is called for all columns so <code>inds</code> must be: a vector of sorted and unique integers, a boolean vector, an integer, or <code>Not</code> wrapping any valid selector.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=1:3, b=4:6)
 3×2 DataFrame
  Row │ a      b
      │ Int64  Int64
@@ -3017,7 +3017,7 @@
      │ Int64  Int64
 ─────┼──────────────
    1 │     1      4
-   2 │     3      6</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/dataframe/dataframe.jl#L823-L853">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.empty" href="#Base.empty"><code>Base.empty</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">empty(df::AbstractDataFrame)</code></pre><p>Create a new <code>DataFrame</code> with the same column names and column element types as <code>df</code> but with zero rows.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/abstractdataframe.jl#L481-L488">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.empty!" href="#Base.empty!"><code>Base.empty!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">empty!(df::DataFrame)</code></pre><p>Remove all rows from <code>df</code>, making each of its columns empty.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=1:3, b=4:6)
+   2 │     3      6</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/dataframe/dataframe.jl#L823-L853">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.empty" href="#Base.empty"><code>Base.empty</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">empty(df::AbstractDataFrame)</code></pre><p>Create a new <code>DataFrame</code> with the same column names and column element types as <code>df</code> but with zero rows.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/abstractdataframe.jl#L481-L488">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.empty!" href="#Base.empty!"><code>Base.empty!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">empty!(df::DataFrame)</code></pre><p>Remove all rows from <code>df</code>, making each of its columns empty.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=1:3, b=4:6)
 3×2 DataFrame
  Row │ a      b
      │ Int64  Int64
@@ -3033,7 +3033,7 @@
 ─────┴──────────────
 
 julia&gt; df.a, df.b
-(Int64[], Int64[])</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/dataframe/dataframe.jl#L1011-L1039">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.filter" href="#Base.filter"><code>Base.filter</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">filter(fun, df::AbstractDataFrame; view::Bool=false)
+(Int64[], Int64[])</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/dataframe/dataframe.jl#L1011-L1039">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.filter" href="#Base.filter"><code>Base.filter</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">filter(fun, df::AbstractDataFrame; view::Bool=false)
 filter(cols =&gt; fun, df::AbstractDataFrame; view::Bool=false)</code></pre><p>Return a data frame containing only rows from <code>df</code> for which <code>fun</code> returns <code>true</code>.</p><p>If <code>cols</code> is not specified then the predicate <code>fun</code> is passed <code>DataFrameRow</code>s. Elements of a <code>DataFrameRow</code> may be accessed with dot syntax or column indexing inside <code>fun</code>.</p><p>If <code>cols</code> is specified then the predicate <code>fun</code> is passed elements of the corresponding columns as separate positional arguments, unless <code>cols</code> is an <code>AsTable</code> selector, in which case a <code>NamedTuple</code> of these arguments is passed. <code>cols</code> can be any column selector (<code>Symbol</code>, string or integer; <code>:</code>, <code>Cols</code>, <code>All</code>, <code>Between</code>, <code>Not</code>, a regular expression, or a vector of <code>Symbol</code>s, strings or integers), and column duplicates are allowed if a vector of <code>Symbol</code>s, strings, or integers is passed.</p><p>If <code>view=false</code> a freshly allocated <code>DataFrame</code> is returned. 
If <code>view=true</code> then a <code>SubDataFrame</code> view into <code>df</code> is returned.</p><p>Passing <code>cols</code> leads to a more efficient execution of the operation for large data frames.</p><div class="admonition is-info"><header class="admonition-header">Note</header><div class="admonition-body"><p>This method is defined so that DataFrames.jl implements the Julia API for collections, but it is generally recommended to use the <a href="#DataFrames.subset"><code>subset</code></a> function instead as it is consistent with other DataFrames.jl functions (as opposed to <code>filter</code>).</p></div></div><div class="admonition is-info"><header class="admonition-header">Note</header><div class="admonition-body"><p>Due to type stability the <code>filter(cols =&gt; fun, df::AbstractDataFrame; view::Bool=false)</code> call is preferred in performance critical applications.</p></div></div><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p>See also: <a href="#Base.filter!"><code>filter!</code></a></p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(x=[3, 1, 2, 1], y=[&quot;b&quot;, &quot;c&quot;, &quot;a&quot;, &quot;b&quot;])
 4×2 DataFrame
  Row │ x      y
@@ -3084,7 +3084,7 @@
 ─────┼───────────────
    1 │     3  b
    2 │     1  c
-   3 │     1  b</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/abstractdataframe.jl#L1124-L1218">source</a></section><section><div><pre><code class="language-julia hljs">filter(fun, gdf::GroupedDataFrame; ungroup::Bool=false)
+   3 │     1  b</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/abstractdataframe.jl#L1124-L1218">source</a></section><section><div><pre><code class="language-julia hljs">filter(fun, gdf::GroupedDataFrame; ungroup::Bool=false)
 filter(cols =&gt; fun, gdf::GroupedDataFrame; ungroup::Bool=false)</code></pre><p>Return only groups in <code>gd</code> for which <code>fun</code> returns <code>true</code> as a <code>GroupedDataFrame</code> if <code>ungroup=false</code> (the default), or as a data frame if <code>ungroup=true</code>.</p><p>If <code>cols</code> is not specified then the predicate <code>fun</code> is called with a <code>SubDataFrame</code> for each group.</p><p>If <code>cols</code> is specified then the predicate <code>fun</code> is called for each group with views of the corresponding columns as separate positional arguments, unless <code>cols</code> is an <code>AsTable</code> selector, in which case a <code>NamedTuple</code> of these arguments is passed. <code>cols</code> can be any column selector (<code>Symbol</code>, string or integer; <code>:</code>, <code>Cols</code>, <code>All</code>, <code>Between</code>, <code>Not</code>, a regular expression, or a vector of <code>Symbol</code>s, strings or integers), and column duplicates are allowed if a vector of <code>Symbol</code>s, strings, or integers is passed.</p><div class="admonition is-info"><header class="admonition-header">Note</header><div class="admonition-body"><p>This method is defined so that DataFrames.jl implements the Julia API for collections, but it is generally recommended to use the <a href="#DataFrames.subset"><code>subset</code></a> function instead as it is consistent with other DataFrames.jl functions (as opposed to <code>filter</code>).</p></div></div><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(g=[1, 2], x=[&#39;a&#39;, &#39;b&#39;]);
 
 julia&gt; gd = groupby(df, :g)
@@ -3122,7 +3122,7 @@
  Row │ g      x
      │ Int64  Char
 ─────┼─────────────
-   1 │     1  a</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/groupeddataframe/groupeddataframe.jl#L1114-L1180">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.filter!" href="#Base.filter!"><code>Base.filter!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">filter!(fun, df::AbstractDataFrame)
+   1 │     1  a</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/groupeddataframe/groupeddataframe.jl#L1114-L1180">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.filter!" href="#Base.filter!"><code>Base.filter!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">filter!(fun, df::AbstractDataFrame)
 filter!(cols =&gt; fun, df::AbstractDataFrame)</code></pre><p>Remove rows from data frame <code>df</code> for which <code>fun</code> returns <code>false</code>.</p><p>If <code>cols</code> is not specified then the predicate <code>fun</code> is passed <code>DataFrameRow</code>s. Elements of a <code>DataFrameRow</code> may be accessed with dot syntax or column indexing inside <code>fun</code>.</p><p>If <code>cols</code> is specified then the predicate <code>fun</code> is passed elements of the corresponding columns as separate positional arguments, unless <code>cols</code> is an <code>AsTable</code> selector, in which case a <code>NamedTuple</code> of these arguments is passed. <code>cols</code> can be any column selector (<code>Symbol</code>, string or integer; <code>:</code>, <code>Cols</code>, <code>All</code>, <code>Between</code>, <code>Not</code>, a regular expression, or a vector of <code>Symbol</code>s, strings or integers), and column duplicates are allowed if a vector of <code>Symbol</code>s, strings, or integers is passed.</p><p>Passing <code>cols</code> leads to a more efficient execution of the operation for large data frames.</p><div class="admonition is-info"><header class="admonition-header">Note</header><div class="admonition-body"><p>This method is defined so that DataFrames.jl implements the Julia API for collections, but it is generally recommended to use the <a href="#DataFrames.subset!"><code>subset!</code></a> function instead as it is consistent with other DataFrames.jl functions (as opposed to <code>filter!</code>).</p></div></div><div class="admonition is-info"><header class="admonition-header">Note</header><div class="admonition-body"><p>Due to type stability the <code>filter!(cols =&gt; fun, df::AbstractDataFrame)</code> call is preferred in performance critical applications.</p></div></div><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p>See also: <a 
href="#Base.filter"><code>filter</code></a></p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(x=[3, 1, 2, 1], y=[&quot;b&quot;, &quot;c&quot;, &quot;a&quot;, &quot;b&quot;])
 4×2 DataFrame
  Row │ x      y
@@ -3176,7 +3176,7 @@
 ─────┼───────────────
    1 │     3  b
    2 │     1  c
-   3 │     1  b</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/abstractdataframe.jl#L1263-L1356">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.keepat!" href="#Base.keepat!"><code>Base.keepat!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">keepat!(df::DataFrame, inds)</code></pre><p>Delete rows at all indices not specified by <code>inds</code> from a <code>DataFrame</code> <code>df</code> in place and return it.</p><p>Internally <code>deleteat!</code> is called for all columns so <code>inds</code> must be: a vector of sorted and unique integers, a boolean vector, an integer, or <code>Not</code> wrapping any valid selector.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=1:3, b=4:6)
+   3 │     1  b</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/abstractdataframe.jl#L1263-L1356">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.keepat!" href="#Base.keepat!"><code>Base.keepat!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">keepat!(df::DataFrame, inds)</code></pre><p>Delete rows at all indices not specified by <code>inds</code> from a <code>DataFrame</code> <code>df</code> in place and return it.</p><p>Internally <code>deleteat!</code> is called for all columns so <code>inds</code> must be: a vector of sorted and unique integers, a boolean vector, an integer, or <code>Not</code> wrapping any valid selector.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=1:3, b=4:6)
 3×2 DataFrame
  Row │ a      b
      │ Int64  Int64
@@ -3191,7 +3191,7 @@
      │ Int64  Int64
 ─────┼──────────────
    1 │     1      4
-   2 │     3      6</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/dataframe/dataframe.jl#L945-L976">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.first" href="#Base.first"><code>Base.first</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">first(df::AbstractDataFrame)</code></pre><p>Get the first row of <code>df</code> as a <code>DataFrameRow</code>.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/abstractdataframe.jl#L548-L554">source</a></section><section><div><pre><code class="language-julia hljs">first(df::AbstractDataFrame, n::Integer; view::Bool=false)</code></pre><p>Get a data frame with the <code>n</code> first rows of <code>df</code>. Get all rows if <code>n</code> is greater than the number of rows in <code>df</code>. Error if <code>n</code> is negative.</p><p>If <code>view=false</code> a freshly allocated <code>DataFrame</code> is returned. 
If <code>view=true</code> then a <code>SubDataFrame</code> view into <code>df</code> is returned.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/abstractdataframe.jl#L557-L568">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.last" href="#Base.last"><code>Base.last</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">last(df::AbstractDataFrame)</code></pre><p>Get the last row of <code>df</code> as a <code>DataFrameRow</code>.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/abstractdataframe.jl#L575-L581">source</a></section><section><div><pre><code class="language-julia hljs">last(df::AbstractDataFrame, n::Integer; view::Bool=false)</code></pre><p>Get a data frame with the <code>n</code> last rows of <code>df</code>. Get all rows if <code>n</code> is greater than the number of rows in <code>df</code>. Error if <code>n</code> is negative.</p><p>If <code>view=false</code> a freshly allocated <code>DataFrame</code> is returned. 
If <code>view=true</code> then a <code>SubDataFrame</code> view into <code>df</code> is returned.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/abstractdataframe.jl#L584-L595">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.nonunique" href="#DataFrames.nonunique"><code>DataFrames.nonunique</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">nonunique(df::AbstractDataFrame; keep::Symbol=:first)
+   2 │     3      6</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/dataframe/dataframe.jl#L945-L976">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.first" href="#Base.first"><code>Base.first</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">first(df::AbstractDataFrame)</code></pre><p>Get the first row of <code>df</code> as a <code>DataFrameRow</code>.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/abstractdataframe.jl#L548-L554">source</a></section><section><div><pre><code class="language-julia hljs">first(df::AbstractDataFrame, n::Integer; view::Bool=false)</code></pre><p>Get a data frame with the <code>n</code> first rows of <code>df</code>. Get all rows if <code>n</code> is greater than the number of rows in <code>df</code>. Error if <code>n</code> is negative.</p><p>If <code>view=false</code> a freshly allocated <code>DataFrame</code> is returned. 
If <code>view=true</code> then a <code>SubDataFrame</code> view into <code>df</code> is returned.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/abstractdataframe.jl#L557-L568">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.last" href="#Base.last"><code>Base.last</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">last(df::AbstractDataFrame)</code></pre><p>Get the last row of <code>df</code> as a <code>DataFrameRow</code>.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/abstractdataframe.jl#L575-L581">source</a></section><section><div><pre><code class="language-julia hljs">last(df::AbstractDataFrame, n::Integer; view::Bool=false)</code></pre><p>Get a data frame with the <code>n</code> last rows of <code>df</code>. Get all rows if <code>n</code> is greater than the number of rows in <code>df</code>. Error if <code>n</code> is negative.</p><p>If <code>view=false</code> a freshly allocated <code>DataFrame</code> is returned. 
If <code>view=true</code> then a <code>SubDataFrame</code> view into <code>df</code> is returned.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/abstractdataframe.jl#L584-L595">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.nonunique" href="#DataFrames.nonunique"><code>DataFrames.nonunique</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">nonunique(df::AbstractDataFrame; keep::Symbol=:first)
 nonunique(df::AbstractDataFrame, cols; keep::Symbol=:first)</code></pre><p>Return a <code>Vector{Bool}</code> in which <code>true</code> entries indicate duplicate rows.</p><p>Duplicate rows are those for which at least another row contains equal values (according to <code>isequal</code>) for all columns in <code>cols</code> (by default, all columns). If <code>keep=:first</code> (the default), only the first occurrence of a set of duplicate rows is indicated with a <code>false</code> entry. If <code>keep=:last</code>, only the last occurrence of a set of duplicate rows is indicated with a <code>false</code> entry. If <code>keep=:noduplicates</code>, only rows without any duplicates are indicated with a <code>false</code> entry.</p><p><strong>Arguments</strong></p><ul><li><code>df</code> : <code>AbstractDataFrame</code></li><li><code>cols</code> : a selector specifying the column(s) or their transformations to compare. Can be any column selector or transformation accepted by <a href="#DataFrames.select"><code>select</code></a> that returns at least one column if <code>df</code> has at least one column.</li></ul><p>See also <a href="#Base.unique"><code>unique</code></a> and <a href="#Base.unique!"><code>unique!</code></a>.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(i=1:4, x=[1, 2, 1, 2])
 4×2 DataFrame
  Row │ i      x
@@ -3247,7 +3247,7 @@
  1
  1
  1
- 1</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/unique.jl#L1-L85">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.Iterators.only" href="#Base.Iterators.only"><code>Base.Iterators.only</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">only(df::AbstractDataFrame)</code></pre><p>If <code>df</code> has a single row return it as a <code>DataFrameRow</code>; otherwise throw <code>ArgumentError</code>.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/abstractdataframe.jl#L535-L541">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.pop!" 
href="#Base.pop!"><code>Base.pop!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">pop!(df::DataFrame)</code></pre><p>Remove the last row from <code>df</code> and return a <code>NamedTuple</code> created from this row.</p><div class="admonition is-info"><header class="admonition-header">Note</header><div class="admonition-body"><p>Using this method for very wide data frames may lead to expensive compilation.</p></div></div><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=1:3, b=4:6)
+ 1</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/unique.jl#L1-L85">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.Iterators.only" href="#Base.Iterators.only"><code>Base.Iterators.only</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">only(df::AbstractDataFrame)</code></pre><p>If <code>df</code> has a single row return it as a <code>DataFrameRow</code>; otherwise throw <code>ArgumentError</code>.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/abstractdataframe.jl#L535-L541">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.pop!" 
href="#Base.pop!"><code>Base.pop!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">pop!(df::DataFrame)</code></pre><p>Remove the last row from <code>df</code> and return a <code>NamedTuple</code> created from this row.</p><div class="admonition is-info"><header class="admonition-header">Note</header><div class="admonition-body"><p>Using this method for very wide data frames may lead to expensive compilation.</p></div></div><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=1:3, b=4:6)
 3×2 DataFrame
  Row │ a      b
      │ Int64  Int64
@@ -3265,7 +3265,7 @@
      │ Int64  Int64
 ─────┼──────────────
    1 │     1      4
-   2 │     2      5</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/dataframe/dataframe.jl#L1083-L1117">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.popat!" href="#Base.popat!"><code>Base.popat!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">popat!(df::DataFrame, i::Integer)</code></pre><p>Remove the <code>i</code>-th row from <code>df</code> and return a <code>NamedTuple</code> created from this row.</p><div class="admonition is-info"><header class="admonition-header">Note</header><div class="admonition-body"><p>Using this method for very wide data frames may lead to expensive compilation.</p></div></div><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=1:3, b=4:6)
+   2 │     2      5</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/dataframe/dataframe.jl#L1083-L1117">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.popat!" href="#Base.popat!"><code>Base.popat!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">popat!(df::DataFrame, i::Integer)</code></pre><p>Remove the <code>i</code>-th row from <code>df</code> and return a <code>NamedTuple</code> created from this row.</p><div class="admonition is-info"><header class="admonition-header">Note</header><div class="admonition-body"><p>Using this method for very wide data frames may lead to expensive compilation.</p></div></div><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=1:3, b=4:6)
 3×2 DataFrame
  Row │ a      b
      │ Int64  Int64
@@ -3283,7 +3283,7 @@
      │ Int64  Int64
 ─────┼──────────────
    1 │     1      4
-   2 │     3      6</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/dataframe/dataframe.jl#L1156-L1189">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.popfirst!" href="#Base.popfirst!"><code>Base.popfirst!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">popfirst!(df::DataFrame)</code></pre><p>Remove the first row from <code>df</code> and return a <code>NamedTuple</code> created from this row.</p><div class="admonition is-info"><header class="admonition-header">Note</header><div class="admonition-body"><p>Using this method for very wide data frames may lead to expensive compilation.</p></div></div><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=1:3, b=4:6)
+   2 │     3      6</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/dataframe/dataframe.jl#L1156-L1189">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.popfirst!" href="#Base.popfirst!"><code>Base.popfirst!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">popfirst!(df::DataFrame)</code></pre><p>Remove the first row from <code>df</code> and return a <code>NamedTuple</code> created from this row.</p><div class="admonition is-info"><header class="admonition-header">Note</header><div class="admonition-body"><p>Using this method for very wide data frames may lead to expensive compilation.</p></div></div><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=1:3, b=4:6)
 3×2 DataFrame
  Row │ a      b
      │ Int64  Int64
@@ -3301,7 +3301,7 @@
      │ Int64  Int64
 ─────┼──────────────
    1 │     2      5
-   2 │     3      6</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/dataframe/dataframe.jl#L1120-L1153">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.resize!" href="#Base.resize!"><code>Base.resize!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">resize!(df::DataFrame, n::Integer)</code></pre><p>Resize <code>df</code> to have <code>n</code> rows by calling <code>resize!</code> on all columns of <code>df</code>.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=1:3, b=4:6)
+   2 │     3      6</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/dataframe/dataframe.jl#L1120-L1153">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.resize!" href="#Base.resize!"><code>Base.resize!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">resize!(df::DataFrame, n::Integer)</code></pre><p>Resize <code>df</code> to have <code>n</code> rows by calling <code>resize!</code> on all columns of <code>df</code>.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=1:3, b=4:6)
 3×2 DataFrame
  Row │ a      b
      │ Int64  Int64
@@ -3316,7 +3316,7 @@
      │ Int64  Int64
 ─────┼──────────────
    1 │     1      4
-   2 │     2      5</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/dataframe/dataframe.jl#L1046-L1072">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.subset" href="#DataFrames.subset"><code>DataFrames.subset</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">subset(df::AbstractDataFrame, args...;
+   2 │     2      5</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/dataframe/dataframe.jl#L1046-L1072">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.subset" href="#DataFrames.subset"><code>DataFrames.subset</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">subset(df::AbstractDataFrame, args...;
        skipmissing::Bool=false, view::Bool=false, threads::Bool=true)
 subset(gdf::GroupedDataFrame, args...;
        skipmissing::Bool=false, view::Bool=false,
@@ -3379,7 +3379,7 @@
      │ Int64  Bool   Bool   Bool?    Int64
 ─────┼─────────────────────────────────────
    1 │     3   true  false  missing     11
-   2 │     4  false  false  missing     12</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/subset.jl#L159-L277">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.subset!" href="#DataFrames.subset!"><code>DataFrames.subset!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">subset!(df::AbstractDataFrame, args...;
+   2 │     4  false  false  missing     12</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/subset.jl#L159-L277">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.subset!" href="#DataFrames.subset!"><code>DataFrames.subset!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">subset!(df::AbstractDataFrame, args...;
         skipmissing::Bool=false, threads::Bool=true)
 subset!(gdf::GroupedDataFrame{DataFrame}, args...;
         skipmissing::Bool=false, ungroup::Bool=true, threads::Bool=true)</code></pre><p>Update data frame <code>df</code> or the parent of <code>gdf</code> in place to contain only rows for which all values produced by transformation(s) <code>args</code> for a given row is <code>true</code>. All transformations must produce vectors containing <code>true</code> or <code>false</code>. When the first argument is a <code>GroupedDataFrame</code>, transformations are also allowed to return a single <code>true</code> or <code>false</code> value, which results in including or excluding a whole group.</p><p>If <code>skipmissing=false</code> (the default) <code>args</code> are required to produce results containing only <code>Bool</code> values. If <code>skipmissing=true</code>, additionally <code>missing</code> is allowed and it is treated as <code>false</code> (i.e. rows for which one of the conditions returns <code>missing</code> are skipped).</p><p>Each argument passed in <code>args</code> can be any specifier following the rules described for <a href="#DataFrames.select"><code>select</code></a> with the restriction that:</p><ul><li>specifying target column name is not allowed as <code>subset!</code> does not create new columns;</li><li>every passed transformation must return a scalar or a vector (returning <code>AbstractDataFrame</code>, <code>NamedTuple</code>, <code>DataFrameRow</code> or <code>AbstractMatrix</code> is not supported).</li></ul><p>If <code>ungroup=false</code> the passed <code>GroupedDataFrame</code> <code>gdf</code> is updated (preserving the order of its groups) and returned.</p><p>If <code>threads=true</code> (the default) transformations may be run in separate tasks which can execute in parallel (possibly being applied to multiple rows or groups at the same time). Whether or not tasks are actually spawned and their number are determined automatically. 
Set to <code>false</code> if some transformations require serial execution or are not thread-safe.</p><p>If <code>GroupedDataFrame</code> is subsetted then it must include all groups present in the <code>parent</code> data frame, like in <a href="#DataFrames.select!"><code>select!</code></a>. In this case the passed <code>GroupedDataFrame</code> is updated to have correct groups after its parent is updated.</p><div class="admonition is-info"><header class="admonition-header">Note</header><div class="admonition-body"><p>Note that as the <code>subset!</code> function works in exactly the same way as other transformation functions defined in DataFrames.jl this is the preferred way to subset rows of a data frame or grouped data frame. In particular it uses a different set of rules for specifying transformations than <a href="#Base.filter!"><code>filter!</code></a> which is implemented in DataFrames.jl to ensure support for the standard Julia API for collections.</p></div></div><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p>See also: <a href="#DataFrames.subset"><code>subset</code></a>, <a href="#Base.filter!"><code>filter!</code></a>, <a href="#DataFrames.select!"><code>select!</code></a></p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(id=1:4, x=[true, false, true, false], y=[true, true, false, false])
@@ -3460,7 +3460,7 @@
      │ Int64  Bool   Bool   Bool?    Int64
 ─────┼─────────────────────────────────────
    1 │     3   true  false  missing     11
-   2 │     4  false  false  missing     12</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/subset.jl#L336-L471">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.unique" href="#Base.unique"><code>Base.unique</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">unique(df::AbstractDataFrame; view::Bool=false, keep::Symbol=:first)
+   2 │     4  false  false  missing     12</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/subset.jl#L336-L471">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.unique" href="#Base.unique"><code>Base.unique</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">unique(df::AbstractDataFrame; view::Bool=false, keep::Symbol=:first)
 unique(df::AbstractDataFrame, cols; view::Bool=false, keep::Symbol=:first)</code></pre><p>Return a data frame containing only unique rows in <code>df</code>.</p><p>Non-unique (duplicate) rows are those for which at least another row contains equal values (according to <code>isequal</code>) for all columns in <code>cols</code> (by default, all columns). If <code>keep=:first</code> (the default), only the first occurrence of a set of duplicate rows is kept. If <code>keep=:last</code>, only the last occurrence of a set of duplicate rows is kept. If <code>keep=:noduplicates</code>, only rows without any duplicates are kept.</p><p>If <code>view=false</code> a freshly allocated <code>DataFrame</code> is returned, and if <code>view=true</code> then a <code>SubDataFrame</code> view into <code>df</code> is returned.</p><p><strong>Arguments</strong></p><ul><li><code>df</code> : the AbstractDataFrame</li><li><code>cols</code> : a selector specifying the column(s) or their transformations to compare. Can be any column selector or transformation accepted by <a href="#DataFrames.select"><code>select</code></a> that returns at least one column if <code>df</code> has at least one column.</li></ul><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p>See also: <a href="#Base.unique!"><code>unique!</code></a>, <a href="#DataFrames.nonunique"><code>nonunique</code></a>.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(i=1:4, x=[1, 2, 1, 2])
 4×2 DataFrame
  Row │ i      x
@@ -3507,7 +3507,7 @@
 0×2 DataFrame
  Row │ i      x
      │ Int64  Int64
-─────┴──────────────</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/unique.jl#L215-L294">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.unique!" href="#Base.unique!"><code>Base.unique!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">unique!(df::AbstractDataFrame; keep::Symbol=:first)
+─────┴──────────────</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/unique.jl#L215-L294">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.unique!" href="#Base.unique!"><code>Base.unique!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">unique!(df::AbstractDataFrame; keep::Symbol=:first)
 unique!(df::AbstractDataFrame, cols; keep::Symbol=:first)</code></pre><p>Update <code>df</code> in-place to contain only unique rows.</p><p>Non-unique (duplicate) rows are those for which at least another row contains equal values (according to <code>isequal</code>) for all columns in <code>cols</code> (by default, all columns). If <code>keep=:first</code> (the default), only the first occurrence of a set of duplicate rows is kept. If <code>keep=:last</code>, only the last occurrence of a set of duplicate rows is kept. If <code>keep=:noduplicates</code>, only rows without any duplicates are kept.</p><p><strong>Arguments</strong></p><ul><li><code>df</code> : the AbstractDataFrame</li><li><code>cols</code> :  column indicator (<code>Symbol</code>, <code>Int</code>, <code>Vector{Symbol}</code>, <code>Regex</code>, etc.) specifying the column(s) to compare. Can be any column selector or transformation accepted by <a href="#DataFrames.select"><code>select</code></a> that returns at least one column if <code>df</code> has at least one column.</li></ul><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p>See also: <a href="#Base.unique!"><code>unique!</code></a>, <a href="#DataFrames.nonunique"><code>nonunique</code></a>.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(i=1:4, x=[1, 2, 1, 2])
 4×2 DataFrame
  Row │ i      x
@@ -3546,7 +3546,7 @@
 0×2 DataFrame
  Row │ i      x
      │ Int64  Int64
-─────┴──────────────</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/unique.jl#L307-L375">source</a></section></article><h2 id="Working-with-missing-values"><a class="docs-heading-anchor" href="#Working-with-missing-values">Working with missing values</a><a id="Working-with-missing-values-1"></a><a class="docs-heading-anchor-permalink" href="#Working-with-missing-values" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Missings.allowmissing" href="#Missings.allowmissing"><code>Missings.allowmissing</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">allowmissing(df::AbstractDataFrame, cols=:)</code></pre><p>Return a copy of data frame <code>df</code> with columns <code>cols</code> converted to element type <code>Union{T, Missing}</code> from <code>T</code> to allow support for missing values.</p><p><code>cols</code> can be any column selector (<code>Symbol</code>, string or integer; <code>:</code>, <code>Cols</code>, <code>All</code>, <code>Between</code>, <code>Not</code>, a regular expression, or a vector of <code>Symbol</code>s, strings or integers).</p><p>If <code>cols</code> is omitted all columns in the data frame are converted.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=[1, 2])
+─────┴──────────────</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/unique.jl#L307-L375">source</a></section></article><h2 id="Working-with-missing-values"><a class="docs-heading-anchor" href="#Working-with-missing-values">Working with missing values</a><a id="Working-with-missing-values-1"></a><a class="docs-heading-anchor-permalink" href="#Working-with-missing-values" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Missings.allowmissing" href="#Missings.allowmissing"><code>Missings.allowmissing</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">allowmissing(df::AbstractDataFrame, cols=:)</code></pre><p>Return a copy of data frame <code>df</code> with columns <code>cols</code> converted to element type <code>Union{T, Missing}</code> from <code>T</code> to allow support for missing values.</p><p><code>cols</code> can be any column selector (<code>Symbol</code>, string or integer; <code>:</code>, <code>Cols</code>, <code>All</code>, <code>Between</code>, <code>Not</code>, a regular expression, or a vector of <code>Symbol</code>s, strings or integers).</p><p>If <code>cols</code> is omitted all columns in the data frame are converted.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=[1, 2])
 2×1 DataFrame
  Row │ a
      │ Int64
@@ -3560,7 +3560,7 @@
      │ Int64?
 ─────┼────────
    1 │      1
-   2 │      2</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/abstractdataframe.jl#L2284-L2315">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.allowmissing!" href="#DataFrames.allowmissing!"><code>DataFrames.allowmissing!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">allowmissing!(df::DataFrame, cols=:)</code></pre><p>Convert columns <code>cols</code> of data frame <code>df</code> from element type <code>T</code> to <code>Union{T, Missing}</code> to support missing values.</p><p><code>cols</code> can be any column selector (<code>Symbol</code>, string or integer; <code>:</code>, <code>Cols</code>, <code>All</code>, <code>Between</code>, <code>Not</code>, a regular expression, or a vector of <code>Symbol</code>s, strings or integers).</p><p>If <code>cols</code> is omitted all columns in the data frame are converted.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/dataframe/dataframe.jl#L1251-L1262">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.completecases" href="#DataFrames.completecases"><code>DataFrames.completecases</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 
docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">completecases(df::AbstractDataFrame, cols=:)</code></pre><p>Return a Boolean vector with <code>true</code> entries indicating rows without missing values (complete cases) in data frame <code>df</code>.</p><p>If <code>cols</code> is provided, only missing values in the corresponding columns are considered. <code>cols</code> can be any column selector (<code>Symbol</code>, string or integer; <code>:</code>, <code>Cols</code>, <code>All</code>, <code>Between</code>, <code>Not</code>, a regular expression, or a vector of <code>Symbol</code>s, strings or integers) that returns at least one column if <code>df</code> has at least one column.</p><p>See also: <a href="#DataFrames.dropmissing"><code>dropmissing</code></a> and <a href="#DataFrames.dropmissing!"><code>dropmissing!</code></a>. Use <code>findall(completecases(df))</code> to get the indices of the rows.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(i=1:5,
+   2 │      2</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/abstractdataframe.jl#L2284-L2315">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.allowmissing!" href="#DataFrames.allowmissing!"><code>DataFrames.allowmissing!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">allowmissing!(df::DataFrame, cols=:)</code></pre><p>Convert columns <code>cols</code> of data frame <code>df</code> from element type <code>T</code> to <code>Union{T, Missing}</code> to support missing values.</p><p><code>cols</code> can be any column selector (<code>Symbol</code>, string or integer; <code>:</code>, <code>Cols</code>, <code>All</code>, <code>Between</code>, <code>Not</code>, a regular expression, or a vector of <code>Symbol</code>s, strings or integers).</p><p>If <code>cols</code> is omitted all columns in the data frame are converted.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/dataframe/dataframe.jl#L1251-L1262">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.completecases" href="#DataFrames.completecases"><code>DataFrames.completecases</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 
docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">completecases(df::AbstractDataFrame, cols=:)</code></pre><p>Return a Boolean vector with <code>true</code> entries indicating rows without missing values (complete cases) in data frame <code>df</code>.</p><p>If <code>cols</code> is provided, only missing values in the corresponding columns are considered. <code>cols</code> can be any column selector (<code>Symbol</code>, string or integer; <code>:</code>, <code>Cols</code>, <code>All</code>, <code>Between</code>, <code>Not</code>, a regular expression, or a vector of <code>Symbol</code>s, strings or integers) that returns at least one column if <code>df</code> has at least one column.</p><p>See also: <a href="#DataFrames.dropmissing"><code>dropmissing</code></a> and <a href="#DataFrames.dropmissing!"><code>dropmissing!</code></a>. Use <code>findall(completecases(df))</code> to get the indices of the rows.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(i=1:5,
                       x=[missing, 4, missing, 2, 1],
                       y=[missing, missing, &quot;c&quot;, &quot;d&quot;, &quot;e&quot;])
 5×3 DataFrame
@@ -3595,7 +3595,7 @@
  0
  0
  1
- 1</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/abstractdataframe.jl#L850-L903">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Missings.disallowmissing" href="#Missings.disallowmissing"><code>Missings.disallowmissing</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">disallowmissing(df::AbstractDataFrame, cols=:; error::Bool=true)</code></pre><p>Return a copy of data frame <code>df</code> with columns <code>cols</code> converted from element type <code>Union{T, Missing}</code> to <code>T</code> to drop support for missing values.</p><p><code>cols</code> can be any column selector (<code>Symbol</code>, string or integer; <code>:</code>, <code>Cols</code>, <code>All</code>, <code>Between</code>, <code>Not</code>, a regular expression, or a vector of <code>Symbol</code>s, strings or integers).</p><p>If <code>cols</code> is omitted all columns in the data frame are converted.</p><p>If <code>error=false</code> then columns containing a <code>missing</code> value will be skipped instead of throwing an error.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=Union{Int, Missing}[1, 2])
+ 1</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/abstractdataframe.jl#L850-L903">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Missings.disallowmissing" href="#Missings.disallowmissing"><code>Missings.disallowmissing</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">disallowmissing(df::AbstractDataFrame, cols=:; error::Bool=true)</code></pre><p>Return a copy of data frame <code>df</code> with columns <code>cols</code> converted from element type <code>Union{T, Missing}</code> to <code>T</code> to drop support for missing values.</p><p><code>cols</code> can be any column selector (<code>Symbol</code>, string or integer; <code>:</code>, <code>Cols</code>, <code>All</code>, <code>Between</code>, <code>Not</code>, a regular expression, or a vector of <code>Symbol</code>s, strings or integers).</p><p>If <code>cols</code> is omitted all columns in the data frame are converted.</p><p>If <code>error=false</code> then columns containing a <code>missing</code> value will be skipped instead of throwing an error.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=Union{Int, Missing}[1, 2])
 2×1 DataFrame
  Row │ a
      │ Int64?
@@ -3625,7 +3625,7 @@
      │ Int64?
 ─────┼─────────
    1 │       1
-   2 │ missing</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/abstractdataframe.jl#L2197-L2247">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.disallowmissing!" href="#DataFrames.disallowmissing!"><code>DataFrames.disallowmissing!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">disallowmissing!(df::DataFrame, cols=:; error::Bool=true)</code></pre><p>Convert columns <code>cols</code> of data frame <code>df</code> from element type <code>Union{T, Missing}</code> to <code>T</code> to drop support for missing values.</p><p><code>cols</code> can be any column selector (<code>Symbol</code>, string or integer; <code>:</code>, <code>Cols</code>, <code>All</code>, <code>Between</code>, <code>Not</code>, a regular expression, or a vector of <code>Symbol</code>s, strings or integers).</p><p>If <code>cols</code> is omitted all columns in the data frame are converted.</p><p>If <code>error=false</code> then columns containing a <code>missing</code> value will be skipped instead of throwing an error.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/dataframe/dataframe.jl#L1293-L1307">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" 
id="DataFrames.dropmissing" href="#DataFrames.dropmissing"><code>DataFrames.dropmissing</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">dropmissing(df::AbstractDataFrame, cols=:; view::Bool=false, disallowmissing::Bool=!view)</code></pre><p>Return a data frame excluding rows with missing values in <code>df</code>.</p><p>If <code>cols</code> is provided, only missing values in the corresponding columns are considered. <code>cols</code> can be any column selector (<code>Symbol</code>, string or integer; <code>:</code>, <code>Cols</code>, <code>All</code>, <code>Between</code>, <code>Not</code>, a regular expression, or a vector of <code>Symbol</code>s, strings or integers).</p><p>If <code>view=false</code> a freshly allocated <code>DataFrame</code> is returned. If <code>view=true</code> then a <code>SubDataFrame</code> view into <code>df</code> is returned. In this case <code>disallowmissing</code> must be <code>false</code>.</p><p>If <code>disallowmissing</code> is <code>true</code> (the default when <code>view</code> is <code>false</code>) then columns specified in <code>cols</code> will be converted so as not to allow for missing values using <a href="#DataFrames.disallowmissing!"><code>disallowmissing!</code></a>.</p><p>See also: <a href="#DataFrames.completecases"><code>completecases</code></a> and <a href="#DataFrames.dropmissing!"><code>dropmissing!</code></a>.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(i=1:5,
+   2 │ missing</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/abstractdataframe.jl#L2197-L2247">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.disallowmissing!" href="#DataFrames.disallowmissing!"><code>DataFrames.disallowmissing!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">disallowmissing!(df::DataFrame, cols=:; error::Bool=true)</code></pre><p>Convert columns <code>cols</code> of data frame <code>df</code> from element type <code>Union{T, Missing}</code> to <code>T</code> to drop support for missing values.</p><p><code>cols</code> can be any column selector (<code>Symbol</code>, string or integer; <code>:</code>, <code>Cols</code>, <code>All</code>, <code>Between</code>, <code>Not</code>, a regular expression, or a vector of <code>Symbol</code>s, strings or integers).</p><p>If <code>cols</code> is omitted all columns in the data frame are converted.</p><p>If <code>error=false</code> then columns containing a <code>missing</code> value will be skipped instead of throwing an error.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/dataframe/dataframe.jl#L1293-L1307">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" 
id="DataFrames.dropmissing" href="#DataFrames.dropmissing"><code>DataFrames.dropmissing</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">dropmissing(df::AbstractDataFrame, cols=:; view::Bool=false, disallowmissing::Bool=!view)</code></pre><p>Return a data frame excluding rows with missing values in <code>df</code>.</p><p>If <code>cols</code> is provided, only missing values in the corresponding columns are considered. <code>cols</code> can be any column selector (<code>Symbol</code>, string or integer; <code>:</code>, <code>Cols</code>, <code>All</code>, <code>Between</code>, <code>Not</code>, a regular expression, or a vector of <code>Symbol</code>s, strings or integers).</p><p>If <code>view=false</code> a freshly allocated <code>DataFrame</code> is returned. If <code>view=true</code> then a <code>SubDataFrame</code> view into <code>df</code> is returned. In this case <code>disallowmissing</code> must be <code>false</code>.</p><p>If <code>disallowmissing</code> is <code>true</code> (the default when <code>view</code> is <code>false</code>) then columns specified in <code>cols</code> will be converted so as not to allow for missing values using <a href="#DataFrames.disallowmissing!"><code>disallowmissing!</code></a>.</p><p>See also: <a href="#DataFrames.completecases"><code>completecases</code></a> and <a href="#DataFrames.dropmissing!"><code>dropmissing!</code></a>.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(i=1:5,
                       x=[missing, 4, missing, 2, 1],
                       y=[missing, missing, &quot;c&quot;, &quot;d&quot;, &quot;e&quot;])
 5×3 DataFrame
@@ -3669,7 +3669,7 @@
      │ Int64  Int64  String
 ─────┼──────────────────────
    1 │     4      2  d
-   2 │     5      1  e</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/abstractdataframe.jl#L938-L1007">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.dropmissing!" href="#DataFrames.dropmissing!"><code>DataFrames.dropmissing!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">dropmissing!(df::AbstractDataFrame, cols=:; disallowmissing::Bool=true)</code></pre><p>Remove rows with missing values from data frame <code>df</code> and return it.</p><p>If <code>cols</code> is provided, only missing values in the corresponding columns are considered. <code>cols</code> can be any column selector (<code>Symbol</code>, string or integer; <code>:</code>, <code>Cols</code>, <code>All</code>, <code>Between</code>, <code>Not</code>, a regular expression, or a vector of <code>Symbol</code>s, strings or integers).</p><p>If <code>disallowmissing</code> is <code>true</code> (the default) then the <code>cols</code> columns will get converted using <a href="#DataFrames.disallowmissing!"><code>disallowmissing!</code></a>.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p>See also: <a href="#DataFrames.dropmissing"><code>dropmissing</code></a> and <a href="#DataFrames.completecases"><code>completecases</code></a>.</p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(i=1:5,
+   2 │     5      1  e</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/abstractdataframe.jl#L938-L1007">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.dropmissing!" href="#DataFrames.dropmissing!"><code>DataFrames.dropmissing!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">dropmissing!(df::AbstractDataFrame, cols=:; disallowmissing::Bool=true)</code></pre><p>Remove rows with missing values from data frame <code>df</code> and return it.</p><p>If <code>cols</code> is provided, only missing values in the corresponding columns are considered. <code>cols</code> can be any column selector (<code>Symbol</code>, string or integer; <code>:</code>, <code>Cols</code>, <code>All</code>, <code>Between</code>, <code>Not</code>, a regular expression, or a vector of <code>Symbol</code>s, strings or integers).</p><p>If <code>disallowmissing</code> is <code>true</code> (the default) then the <code>cols</code> columns will get converted using <a href="#DataFrames.disallowmissing!"><code>disallowmissing!</code></a>.</p><p>Metadata: this function preserves table-level and column-level <code>:note</code>-style metadata.</p><p>See also: <a href="#DataFrames.dropmissing"><code>dropmissing</code></a> and <a href="#DataFrames.completecases"><code>completecases</code></a>.</p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(i=1:5,
                       x=[missing, 4, missing, 2, 1],
                       y=[missing, missing, &quot;c&quot;, &quot;d&quot;, &quot;e&quot;])
 5×3 DataFrame
@@ -3713,7 +3713,7 @@
      │ Int64  Int64  String
 ─────┼──────────────────────
    1 │     4      2  d
-   2 │     5      1  e</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/abstractdataframe.jl#L1051-L1113">source</a></section></article><h2 id="Iteration"><a class="docs-heading-anchor" href="#Iteration">Iteration</a><a id="Iteration-1"></a><a class="docs-heading-anchor-permalink" href="#Iteration" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.eachcol" href="#Base.eachcol"><code>Base.eachcol</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">eachcol(df::AbstractDataFrame)</code></pre><p>Return a <code>DataFrameColumns</code> object that is a vector-like that allows iterating an <code>AbstractDataFrame</code> column by column.</p><p>Indexing into <code>DataFrameColumns</code> objects using integer, <code>Symbol</code> or string returns the corresponding column (without copying). Indexing into <code>DataFrameColumns</code> objects using a multiple column selector returns a subsetted <code>DataFrameColumns</code> object with a new parent containing only the selected columns (without copying).</p><p><code>DataFrameColumns</code> supports most of the <code>AbstractVector</code> API. 
The key differences are that it is read-only and that the <code>keys</code> function returns a vector of <code>Symbol</code>s (and not integers as for normal vectors).</p><p>In particular <code>findnext</code>, <code>findprev</code>, <code>findfirst</code>, <code>findlast</code>, and <code>findall</code> functions are supported, and in <code>findnext</code> and <code>findprev</code> functions it is allowed to pass an integer, string, or <code>Symbol</code> as a reference index.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(x=1:4, y=11:14)
+   2 │     5      1  e</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/abstractdataframe.jl#L1051-L1113">source</a></section></article><h2 id="Iteration"><a class="docs-heading-anchor" href="#Iteration">Iteration</a><a id="Iteration-1"></a><a class="docs-heading-anchor-permalink" href="#Iteration" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.eachcol" href="#Base.eachcol"><code>Base.eachcol</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">eachcol(df::AbstractDataFrame)</code></pre><p>Return a <code>DataFrameColumns</code> object that is a vector-like that allows iterating an <code>AbstractDataFrame</code> column by column.</p><p>Indexing into <code>DataFrameColumns</code> objects using integer, <code>Symbol</code> or string returns the corresponding column (without copying). Indexing into <code>DataFrameColumns</code> objects using a multiple column selector returns a subsetted <code>DataFrameColumns</code> object with a new parent containing only the selected columns (without copying).</p><p><code>DataFrameColumns</code> supports most of the <code>AbstractVector</code> API. 
The key differences are that it is read-only and that the <code>keys</code> function returns a vector of <code>Symbol</code>s (and not integers as for normal vectors).</p><p>In particular <code>findnext</code>, <code>findprev</code>, <code>findfirst</code>, <code>findlast</code>, and <code>findall</code> functions are supported, and in <code>findnext</code> and <code>findprev</code> functions it is allowed to pass an integer, string, or <code>Symbol</code> as a reference index.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(x=1:4, y=11:14)
 4×2 DataFrame
  Row │ x      y
      │ Int64  Int64
@@ -3748,7 +3748,7 @@
 julia&gt; sum.(eachcol(df))
 2-element Vector{Int64}:
  10
- 50</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/iteration.jl#L191-L238">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.eachrow" href="#Base.eachrow"><code>Base.eachrow</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">eachrow(df::AbstractDataFrame)</code></pre><p>Return a <code>DataFrameRows</code> that iterates a data frame row by row, with each row represented as a <code>DataFrameRow</code>.</p><p>Because <code>DataFrameRow</code>s have an <code>eltype</code> of <code>Any</code>, use <code>copy(dfr::DataFrameRow)</code> to obtain a named tuple, which supports iteration and property access like a <code>DataFrameRow</code>, but also passes information on the <code>eltypes</code> of the columns of <code>df</code>.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(x=1:4, y=11:14)
+ 50</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/iteration.jl#L191-L238">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.eachrow" href="#Base.eachrow"><code>Base.eachrow</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">eachrow(df::AbstractDataFrame)</code></pre><p>Return a <code>DataFrameRows</code> that iterates a data frame row by row, with each row represented as a <code>DataFrameRow</code>.</p><p>Because <code>DataFrameRow</code>s have an <code>eltype</code> of <code>Any</code>, use <code>copy(dfr::DataFrameRow)</code> to obtain a named tuple, which supports iteration and property access like a <code>DataFrameRow</code>, but also passes information on the <code>eltypes</code> of the columns of <code>df</code>.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(x=1:4, y=11:14)
 4×2 DataFrame
  Row │ x      y
      │ Int64  Int64
@@ -3781,7 +3781,7 @@
      │ Int64  Int64
 ─────┼──────────────
    1 │    14      4
-   2 │    13      3</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/iteration.jl#L27-L74">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.values" href="#Base.values"><code>Base.values</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">values(dfc::DataFrameColumns)</code></pre><p>Get a vector of columns from <code>dfc</code>.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/iteration.jl#L297-L301">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.pairs" href="#Base.pairs"><code>Base.pairs</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">pairs(dfc::DataFrameColumns)</code></pre><p>Return an iterator of pairs associating the name of each column of <code>dfc</code> with the corresponding column vector, i.e. 
<code>name =&gt; col</code> where <code>name</code> is the column name of the column <code>col</code>.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/iteration.jl#L304-L310">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.Iterators.partition" href="#Base.Iterators.partition"><code>Base.Iterators.partition</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">Iterators.partition(df::AbstractDataFrame, n::Integer)</code></pre><p>Iterate over <code>df</code> data frame <code>n</code> rows at a time, returning each block as a <code>SubDataFrame</code>.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; collect(Iterators.partition(DataFrame(x=1:5), 2))
+   2 │    13      3</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/iteration.jl#L27-L74">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.values" href="#Base.values"><code>Base.values</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">values(dfc::DataFrameColumns)</code></pre><p>Get a vector of columns from <code>dfc</code>.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/iteration.jl#L297-L301">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.pairs" href="#Base.pairs"><code>Base.pairs</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">pairs(dfc::DataFrameColumns)</code></pre><p>Return an iterator of pairs associating the name of each column of <code>dfc</code> with the corresponding column vector, i.e. 
<code>name =&gt; col</code> where <code>name</code> is the column name of the column <code>col</code>.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/iteration.jl#L304-L310">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.Iterators.partition" href="#Base.Iterators.partition"><code>Base.Iterators.partition</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">Iterators.partition(df::AbstractDataFrame, n::Integer)</code></pre><p>Iterate over <code>df</code> data frame <code>n</code> rows at a time, returning each block as a <code>SubDataFrame</code>.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; collect(Iterators.partition(DataFrame(x=1:5), 2))
 3-element Vector{SubDataFrame{DataFrame, DataFrames.Index, UnitRange{Int64}}}:
  2×1 SubDataFrame
  Row │ x
@@ -3799,7 +3799,7 @@
  Row │ x
      │ Int64
 ─────┼───────
-   1 │     5</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/abstractdataframe.jl#L3217-L3246">source</a></section><section><div><pre><code class="language-julia hljs">Iterators.partition(dfr::DataFrameRows, n::Integer)</code></pre><p>Iterate over <code>DataFrameRows</code> <code>dfr</code> <code>n</code> rows at a time, returning each block as a <code>DataFrameRows</code> over a view of rows of parent of <code>dfr</code>.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; collect(Iterators.partition(eachrow(DataFrame(x=1:5)), 2))
+   1 │     5</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/abstractdataframe.jl#L3217-L3246">source</a></section><section><div><pre><code class="language-julia hljs">Iterators.partition(dfr::DataFrameRows, n::Integer)</code></pre><p>Iterate over <code>DataFrameRows</code> <code>dfr</code> <code>n</code> rows at a time, returning each block as a <code>DataFrameRows</code> over a view of rows of parent of <code>dfr</code>.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; collect(Iterators.partition(eachrow(DataFrame(x=1:5)), 2))
 3-element Vector{DataFrames.DataFrameRows{SubDataFrame{DataFrame, DataFrames.Index, UnitRange{Int64}}}}:
  2×1 DataFrameRows
  Row │ x
@@ -3817,9 +3817,9 @@
  Row │ x
      │ Int64
 ─────┼───────
-   1 │     5</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/iteration.jl#L99-L128">source</a></section></article><h2 id="Equality"><a class="docs-heading-anchor" href="#Equality">Equality</a><a id="Equality-1"></a><a class="docs-heading-anchor-permalink" href="#Equality" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.isapprox" href="#Base.isapprox"><code>Base.isapprox</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">isapprox(df1::AbstractDataFrame, df2::AbstractDataFrame;
+   1 │     5</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/iteration.jl#L99-L128">source</a></section></article><h2 id="Equality"><a class="docs-heading-anchor" href="#Equality">Equality</a><a id="Equality-1"></a><a class="docs-heading-anchor-permalink" href="#Equality" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="Base.isapprox" href="#Base.isapprox"><code>Base.isapprox</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">isapprox(df1::AbstractDataFrame, df2::AbstractDataFrame;
          rtol::Real=atol&gt;0 ? 0 : √eps, atol::Real=0,
-         nans::Bool=false, norm::Function=norm)</code></pre><p>Inexact equality comparison. <code>df1</code> and <code>df2</code> must have the same size and column names. Return  <code>true</code> if <code>isapprox</code> with given keyword arguments applied to all pairs of columns stored in <code>df1</code> and <code>df2</code> returns <code>true</code>.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/abstractdataframe.jl#L513-L521">source</a></section></article><h2 id="Metadata"><a class="docs-heading-anchor" href="#Metadata">Metadata</a><a id="Metadata-1"></a><a class="docs-heading-anchor-permalink" href="#Metadata" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataAPI.metadata" href="#DataAPI.metadata"><code>DataAPI.metadata</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">metadata(df::AbstractDataFrame, key::AbstractString, [default]; style::Bool=false)
+         nans::Bool=false, norm::Function=norm)</code></pre><p>Inexact equality comparison. <code>df1</code> and <code>df2</code> must have the same size and column names. Return  <code>true</code> if <code>isapprox</code> with given keyword arguments applied to all pairs of columns stored in <code>df1</code> and <code>df2</code> returns <code>true</code>.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/abstractdataframe.jl#L513-L521">source</a></section></article><h2 id="Metadata"><a class="docs-heading-anchor" href="#Metadata">Metadata</a><a id="Metadata-1"></a><a class="docs-heading-anchor-permalink" href="#Metadata" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataAPI.metadata" href="#DataAPI.metadata"><code>DataAPI.metadata</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">metadata(df::AbstractDataFrame, key::AbstractString, [default]; style::Bool=false)
 metadata(dfr::DataFrameRow, key::AbstractString, [default]; style::Bool=false)
 metadata(dfc::DataFrameColumns, key::AbstractString, [default]; style::Bool=false)
 metadata(dfr::DataFrameRows, key::AbstractString, [default]; style::Bool=false)</code></pre><p>Return table-level metadata value associated with <code>df</code> for key <code>key</code>. If <code>style=true</code> return a tuple of metadata value and metadata style.</p><p><code>SubDataFrame</code> and <code>DataFrameRow</code> expose only <code>:note</code>-style metadata of their parent.</p><p>If <code>default</code> is passed then return it if <code>key</code> does not exist; if <code>style=true</code> return <code>(default, :default)</code>.</p><p>See also: <a href="#DataAPI.metadatakeys"><code>metadatakeys</code></a>, <a href="#DataAPI.metadata!"><code>metadata!</code></a>, <a href="#DataAPI.deletemetadata!"><code>deletemetadata!</code></a>, <a href="#DataAPI.emptymetadata!"><code>emptymetadata!</code></a>, <a href="#DataAPI.colmetadata"><code>colmetadata</code></a>, <a href="#DataAPI.colmetadatakeys"><code>colmetadatakeys</code></a>, <a href="#DataAPI.colmetadata!"><code>colmetadata!</code></a>, <a href="#DataAPI.deletecolmetadata!"><code>deletecolmetadata!</code></a>, <a href="#DataAPI.emptycolmetadata!"><code>emptycolmetadata!</code></a>.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=1, b=2);
@@ -3842,7 +3842,7 @@
 julia&gt; deletemetadata!(df, &quot;name&quot;);
 
 julia&gt; metadatakeys(df)
-()</code></pre><p>```</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/other/metadata.jl#L79-L101">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataAPI.metadatakeys" href="#DataAPI.metadatakeys"><code>DataAPI.metadatakeys</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">metadatakeys(df::AbstractDataFrame)
+()</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/other/metadata.jl#L79-L101">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataAPI.metadatakeys" href="#DataAPI.metadatakeys"><code>DataAPI.metadatakeys</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">metadatakeys(df::AbstractDataFrame)
 metadatakeys(dfr::DataFrameRow)
 metadatakeys(dfc::DataFrameColumns)
 metadatakeys(dfr::DataFrameRows)</code></pre><p>Return an iterator of table-level metadata keys which are set in the object.</p><p>Values can be accessed using <a href="#DataAPI.metadata"><code>metadata(df, key)</code></a>.</p><p><code>SubDataFrame</code> and <code>DataFrameRow</code> expose only <code>:note</code>-style metadata keys of their parent.</p><p>See also: <a href="#DataAPI.metadata"><code>metadata</code></a>, <a href="#DataAPI.metadata!"><code>metadata!</code></a>, <a href="#DataAPI.deletemetadata!"><code>deletemetadata!</code></a>, <a href="#DataAPI.emptymetadata!"><code>emptymetadata!</code></a>, <a href="#DataAPI.colmetadata"><code>colmetadata</code></a>, <a href="#DataAPI.colmetadatakeys"><code>colmetadatakeys</code></a>, <a href="#DataAPI.colmetadata!"><code>colmetadata!</code></a>, <a href="#DataAPI.deletecolmetadata!"><code>deletecolmetadata!</code></a>, <a href="#DataAPI.emptycolmetadata!"><code>emptycolmetadata!</code></a>.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=1, b=2);
@@ -3865,7 +3865,7 @@
 julia&gt; deletemetadata!(df, &quot;name&quot;);
 
 julia&gt; metadatakeys(df)
-()</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/other/metadata.jl#L131-L150">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataAPI.metadata!" href="#DataAPI.metadata!"><code>DataAPI.metadata!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">metadata!(df::AbstractDataFrame, key::AbstractString, value; style::Symbol=:default)
+()</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/other/metadata.jl#L131-L150">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataAPI.metadata!" href="#DataAPI.metadata!"><code>DataAPI.metadata!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">metadata!(df::AbstractDataFrame, key::AbstractString, value; style::Symbol=:default)
 metadata!(dfr::DataFrameRow, key::AbstractString, value; style::Symbol=:default)
 metadata!(dfc::DataFrameColumns, key::AbstractString, value; style::Symbol=:default)
 metadata!(dfr::DataFrameRows, key::AbstractString, value; style::Symbol=:default)</code></pre><p>Set table-level metadata for object <code>df</code> for key <code>key</code> to have value <code>value</code> and style <code>style</code> (<code>:default</code> by default) and return <code>df</code>.</p><p>For <code>SubDataFrame</code> and <code>DataFrameRow</code> only <code>:note</code>-style is allowed. Trying to set a key-value pair for which the key already exists in the parent data frame with another style throws an error.</p><p>See also: <a href="#DataAPI.metadata"><code>metadata</code></a>, <a href="#DataAPI.metadatakeys"><code>metadatakeys</code></a>, <a href="#DataAPI.deletemetadata!"><code>deletemetadata!</code></a>, <a href="#DataAPI.emptymetadata!"><code>emptymetadata!</code></a>, <a href="#DataAPI.colmetadata"><code>colmetadata</code></a>, <a href="#DataAPI.colmetadatakeys"><code>colmetadatakeys</code></a>, <a href="#DataAPI.colmetadata!"><code>colmetadata!</code></a>, <a href="#DataAPI.deletecolmetadata!"><code>deletecolmetadata!</code></a>, <a href="#DataAPI.emptycolmetadata!"><code>emptycolmetadata!</code></a>.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=1, b=2);
@@ -3888,7 +3888,7 @@
 julia&gt; deletemetadata!(df, &quot;name&quot;);
 
 julia&gt; metadatakeys(df)
-()</code></pre><p>```</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/other/metadata.jl#L170-L190">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataAPI.deletemetadata!" href="#DataAPI.deletemetadata!"><code>DataAPI.deletemetadata!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">deletemetadata!(df::AbstractDataFrame, key::AbstractString)
+()</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/other/metadata.jl#L170-L190">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataAPI.deletemetadata!" href="#DataAPI.deletemetadata!"><code>DataAPI.deletemetadata!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">deletemetadata!(df::AbstractDataFrame, key::AbstractString)
 deletemetadata!(dfr::DataFrameRow, key::AbstractString)
 deletemetadata!(dfc::DataFrameColumns, key::AbstractString)
 deletemetadata!(dfr::DataFrameRows, key::AbstractString)</code></pre><p>Delete table-level metadata from object <code>df</code> for key <code>key</code> and return <code>df</code>. If key does not exist, return <code>df</code> without modification.</p><p>For <code>SubDataFrame</code> and <code>DataFrameRow</code> only <code>:note</code>-style metadata from their parent can be deleted (as other styles are not propagated to views).</p><p>See also: <a href="#DataAPI.metadata"><code>metadata</code></a>, <a href="#DataAPI.metadatakeys"><code>metadatakeys</code></a>, <a href="#DataAPI.metadata!"><code>metadata!</code></a>, <a href="#DataAPI.emptymetadata!"><code>emptymetadata!</code></a>, <a href="#DataAPI.colmetadata"><code>colmetadata</code></a>, <a href="#DataAPI.colmetadatakeys"><code>colmetadatakeys</code></a>, <a href="#DataAPI.colmetadata!"><code>colmetadata!</code></a>, <a href="#DataAPI.deletecolmetadata!"><code>deletecolmetadata!</code></a>, <a href="#DataAPI.emptycolmetadata!"><code>emptycolmetadata!</code></a>.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=1, b=2);
@@ -3911,7 +3911,7 @@
 julia&gt; deletemetadata!(df, &quot;name&quot;);
 
 julia&gt; metadatakeys(df)
-()</code></pre><p>```</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/other/metadata.jl#L230-L249">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataAPI.emptymetadata!" href="#DataAPI.emptymetadata!"><code>DataAPI.emptymetadata!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">emptymetadata!(df::AbstractDataFrame)
+()</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/other/metadata.jl#L230-L249">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataAPI.emptymetadata!" href="#DataAPI.emptymetadata!"><code>DataAPI.emptymetadata!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">emptymetadata!(df::AbstractDataFrame)
 emptymetadata!(dfr::DataFrameRow)
 emptymetadata!(dfc::DataFrameColumns)
 emptymetadata!(dfr::DataFrameRows)</code></pre><p>Delete all table-level metadata from object <code>df</code>.</p><p>For <code>SubDataFrame</code> and <code>DataFrameRow</code> only <code>:note</code>-style metadata from their parent can be deleted (as other styles are not propagated to views).</p><p>See also: <a href="#DataAPI.metadata"><code>metadata</code></a>, <a href="#DataAPI.metadatakeys"><code>metadatakeys</code></a>, <a href="#DataAPI.metadata!"><code>metadata!</code></a>, <a href="#DataAPI.deletemetadata!"><code>deletemetadata!</code></a>, <a href="#DataAPI.colmetadata"><code>colmetadata</code></a>, <a href="#DataAPI.colmetadatakeys"><code>colmetadatakeys</code></a>, <a href="#DataAPI.colmetadata!"><code>colmetadata!</code></a>, <a href="#DataAPI.deletecolmetadata!"><code>deletecolmetadata!</code></a>, <a href="#DataAPI.emptycolmetadata!"><code>emptycolmetadata!</code></a>.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=1, b=2);
@@ -3934,7 +3934,7 @@
 julia&gt; emptymetadata!(df);
 
 julia&gt; metadatakeys(df)
-()</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/other/metadata.jl#L277-L318">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataAPI.colmetadata" href="#DataAPI.colmetadata"><code>DataAPI.colmetadata</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">colmetadata(df::AbstractDataFrame, col::ColumnIndex, key::AbstractString, [default]; style::Bool=false)
+()</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/other/metadata.jl#L277-L318">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataAPI.colmetadata" href="#DataAPI.colmetadata"><code>DataAPI.colmetadata</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">colmetadata(df::AbstractDataFrame, col::ColumnIndex, key::AbstractString, [default]; style::Bool=false)
 colmetadata(dfr::DataFrameRow, col::ColumnIndex, key::AbstractString, [default]; style::Bool=false)
 colmetadata(dfc::DataFrameColumns, col::ColumnIndex, key::AbstractString, [default]; style::Bool=false)
 colmetadata(dfr::DataFrameRows, col::ColumnIndex, key::AbstractString, [default]; style::Bool=false)</code></pre><p>Return column-level metadata value associated with <code>df</code> for column <code>col</code> and key <code>key</code>.</p><p><code>SubDataFrame</code> and <code>DataFrameRow</code> expose only <code>:note</code>-style metadata of their parent.</p><p>If <code>default</code> is passed then return it if <code>key</code> does not exist for column <code>col</code>; if <code>style=true</code> return <code>(default, :default)</code>. If <code>col</code> does not exist in <code>df</code> always throw an error.</p><p>See also: <a href="#DataAPI.metadata"><code>metadata</code></a>, <a href="#DataAPI.metadatakeys"><code>metadatakeys</code></a>, <a href="#DataAPI.metadata!"><code>metadata!</code></a>, <a href="#DataAPI.deletemetadata!"><code>deletemetadata!</code></a>, <a href="#DataAPI.emptymetadata!"><code>emptymetadata!</code></a>, <a href="#DataAPI.colmetadatakeys"><code>colmetadatakeys</code></a>, <a href="#DataAPI.colmetadata!"><code>colmetadata!</code></a>, <a href="#DataAPI.deletecolmetadata!"><code>deletecolmetadata!</code></a>, <a href="#DataAPI.emptycolmetadata!"><code>emptycolmetadata!</code></a>.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=1, b=2);
@@ -3961,7 +3961,7 @@
 julia&gt; deletecolmetadata!(df, :a, &quot;name&quot;);
 
 julia&gt; colmetadatakeys(df)
-()</code></pre><p>```</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/other/metadata.jl#L338-L359">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataAPI.colmetadatakeys" href="#DataAPI.colmetadatakeys"><code>DataAPI.colmetadatakeys</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">colmetadatakeys(df::AbstractDataFrame, [col::ColumnIndex])
+()</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/other/metadata.jl#L338-L359">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataAPI.colmetadatakeys" href="#DataAPI.colmetadatakeys"><code>DataAPI.colmetadatakeys</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">colmetadatakeys(df::AbstractDataFrame, [col::ColumnIndex])
 colmetadatakeys(dfr::DataFrameRow, [col::ColumnIndex])
 colmetadatakeys(dfc::DataFrameColumns, [col::ColumnIndex])
 colmetadatakeys(dfr::DataFrameRows, [col::ColumnIndex])</code></pre><p>If <code>col</code> is passed return an iterator of column-level metadata keys which are set for column <code>col</code>. If <code>col</code> is not passed return an iterator of <code>col =&gt; colmetadatakeys(x, col)</code> pairs for all columns that have metadata, where <code>col</code> are <code>Symbol</code>.</p><p>Values can be accessed using <a href="#DataAPI.colmetadata"><code>colmetadata(df, col, key)</code></a>.</p><p><code>SubDataFrame</code> and <code>DataFrameRow</code> expose only <code>:note</code>-style metadata of their parent.</p><p>See also: <a href="#DataAPI.metadata"><code>metadata</code></a>, <a href="#DataAPI.metadatakeys"><code>metadatakeys</code></a>, <a href="#DataAPI.metadata!"><code>metadata!</code></a>, <a href="#DataAPI.deletemetadata!"><code>deletemetadata!</code></a>, <a href="#DataAPI.emptymetadata!"><code>emptymetadata!</code></a>, <a href="#DataAPI.colmetadata"><code>colmetadata</code></a>, <a href="#DataAPI.colmetadata!"><code>colmetadata!</code></a>, <a href="#DataAPI.deletecolmetadata!"><code>deletecolmetadata!</code></a>, <a href="#DataAPI.emptycolmetadata!"><code>emptycolmetadata!</code></a>.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=1, b=2);
@@ -3988,7 +3988,7 @@
 julia&gt; deletecolmetadata!(df, :a, &quot;name&quot;);
 
 julia&gt; colmetadatakeys(df)
-()</code></pre><p>```</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/other/metadata.jl#L403-L425">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataAPI.colmetadata!" href="#DataAPI.colmetadata!"><code>DataAPI.colmetadata!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">colmetadata!(df::AbstractDataFrame, col::ColumnIndex, key::AbstractString, value; style::Symbol=:default)
+()</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/other/metadata.jl#L403-L425">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataAPI.colmetadata!" href="#DataAPI.colmetadata!"><code>DataAPI.colmetadata!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">colmetadata!(df::AbstractDataFrame, col::ColumnIndex, key::AbstractString, value; style::Symbol=:default)
 colmetadata!(dfr::DataFrameRow, col::ColumnIndex, key::AbstractString, value; style::Symbol=:default)
 colmetadata!(dfc::DataFrameColumns, col::ColumnIndex, key::AbstractString, value; style::Symbol=:default)
 colmetadata!(dfr::DataFrameRows, col::ColumnIndex, key::AbstractString, value; style::Symbol=:default)</code></pre><p>Set column-level metadata in <code>df</code> for column <code>col</code> and key <code>key</code> to have value <code>value</code> and style <code>style</code> (<code>:default</code> by default) and return <code>df</code>.</p><p>For <code>SubDataFrame</code> and <code>DataFrameRow</code> only <code>:note</code> style is allowed. Trying to set a key-value pair for which the key already exists in the parent data frame with another style throws an error.</p><p>See also: <a href="#DataAPI.metadata"><code>metadata</code></a>, <a href="#DataAPI.metadatakeys"><code>metadatakeys</code></a>, <a href="#DataAPI.metadata!"><code>metadata!</code></a>, <a href="#DataAPI.deletemetadata!"><code>deletemetadata!</code></a>, <a href="#DataAPI.emptymetadata!"><code>emptymetadata!</code></a>, <a href="#DataAPI.colmetadata"><code>colmetadata</code></a>, <a href="#DataAPI.colmetadatakeys"><code>colmetadatakeys</code></a>, <a href="#DataAPI.deletecolmetadata!"><code>deletecolmetadata!</code></a>, <a href="#DataAPI.emptycolmetadata!"><code>emptycolmetadata!</code></a>.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=1, b=2);
@@ -4015,7 +4015,7 @@
 julia&gt; deletecolmetadata!(df, :a, &quot;name&quot;);
 
 julia&gt; colmetadatakeys(df)
-()</code></pre><p>```</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/other/metadata.jl#L467-L487">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataAPI.deletecolmetadata!" href="#DataAPI.deletecolmetadata!"><code>DataAPI.deletecolmetadata!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">deletecolmetadata!(df::AbstractDataFrame, col::ColumnIndex, key::AbstractString)
+()</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/other/metadata.jl#L467-L487">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataAPI.deletecolmetadata!" href="#DataAPI.deletecolmetadata!"><code>DataAPI.deletecolmetadata!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">deletecolmetadata!(df::AbstractDataFrame, col::ColumnIndex, key::AbstractString)
 deletecolmetadata!(dfr::DataFrameRow, col::ColumnIndex, key::AbstractString)
 deletecolmetadata!(dfc::DataFrameColumns, col::ColumnIndex, key::AbstractString)
 deletecolmetadata!(dfr::DataFrameRows, col::ColumnIndex, key::AbstractString)</code></pre><p>Delete column-level metadata set in <code>df</code> for column <code>col</code> and key <code>key</code> and return <code>df</code>.</p><p>For <code>SubDataFrame</code> and <code>DataFrameRow</code> only <code>:note</code>-style metadata from their parent can be deleted (as other styles are not propagated to views).</p><p>See also: <a href="#DataAPI.metadata"><code>metadata</code></a>, <a href="#DataAPI.metadatakeys"><code>metadatakeys</code></a>, <a href="#DataAPI.metadata!"><code>metadata!</code></a>, <a href="#DataAPI.deletemetadata!"><code>deletemetadata!</code></a>, <a href="#DataAPI.emptymetadata!"><code>emptymetadata!</code></a>, <a href="#DataAPI.colmetadata"><code>colmetadata</code></a>, <a href="#DataAPI.colmetadatakeys"><code>colmetadatakeys</code></a>, <a href="#DataAPI.colmetadata!"><code>colmetadata!</code></a>, <a href="#DataAPI.emptycolmetadata!"><code>emptycolmetadata!</code></a>.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=1, b=2);
@@ -4042,7 +4042,7 @@
 julia&gt; deletecolmetadata!(df, :a, &quot;name&quot;);
 
 julia&gt; colmetadatakeys(df)
-()</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/other/metadata.jl#L534-L551">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataAPI.emptycolmetadata!" href="#DataAPI.emptycolmetadata!"><code>DataAPI.emptycolmetadata!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">emptycolmetadata!(df::AbstractDataFrame, [col::ColumnIndex])
+()</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/other/metadata.jl#L534-L551">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataAPI.emptycolmetadata!" href="#DataAPI.emptycolmetadata!"><code>DataAPI.emptycolmetadata!</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">emptycolmetadata!(df::AbstractDataFrame, [col::ColumnIndex])
 emptycolmetadata!(dfr::DataFrameRow, [col::ColumnIndex])
 emptycolmetadata!(dfc::DataFrameColumns, [col::ColumnIndex])
 emptycolmetadata!(dfr::DataFrameRows, [col::ColumnIndex])</code></pre><p>Delete column-level metadata set in <code>df</code> for column <code>col</code> and key <code>key</code> and return <code>df</code>.</p><p>For <code>SubDataFrame</code> and <code>DataFrameRow</code> only <code>:note</code>-style metadata from their parent can be deleted (as other styles are not propagated to views).</p><p>See also: <a href="#DataAPI.metadata"><code>metadata</code></a>, <a href="#DataAPI.metadatakeys"><code>metadatakeys</code></a>, <a href="#DataAPI.metadata!"><code>metadata!</code></a>, <a href="#DataAPI.deletemetadata!"><code>deletemetadata!</code></a>, <a href="#DataAPI.emptymetadata!"><code>emptymetadata!</code></a>, <a href="#DataAPI.colmetadata"><code>colmetadata</code></a>, <a href="#DataAPI.colmetadatakeys"><code>colmetadatakeys</code></a>, <a href="#DataAPI.colmetadata!"><code>colmetadata!</code></a>, <a href="#DataAPI.deletecolmetadata!"><code>deletecolmetadata!</code></a>.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=1, b=2);
@@ -4066,4 +4066,4 @@
 julia&gt; emptycolmetadata!(df, :a);
 
 julia&gt; colmetadatakeys(df)
-()</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/other/metadata.jl#L586-L628">source</a></section></article></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../types/">« Types</a><a class="docs-footer-nextpage" href="../indexing/">Indexing »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.7.0 on <span class="colophon-date" title="Saturday 7 September 2024 11:00">Saturday 7 September 2024</span>. Using Julia version 1.10.5.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
+()</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/other/metadata.jl#L586-L628">source</a></section></article></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../types/">« Types</a><a class="docs-footer-nextpage" href="../indexing/">Indexing »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.7.0 on <span class="colophon-date" title="Sunday 8 September 2024 08:54">Sunday 8 September 2024</span>. Using Julia version 1.10.5.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
diff --git a/dev/lib/indexing/index.html b/dev/lib/indexing/index.html
index a4829a0b7..0b71c4e5f 100644
--- a/dev/lib/indexing/index.html
+++ b/dev/lib/indexing/index.html
@@ -1,2 +1,2 @@
 <!DOCTYPE html>
-<html lang="en"><head><meta charset="UTF-8"/><meta name="viewport" content="width=device-width, initial-scale=1.0"/><title>Indexing · DataFrames.jl</title><meta name="title" content="Indexing · DataFrames.jl"/><meta property="og:title" content="Indexing · DataFrames.jl"/><meta property="twitter:title" content="Indexing · DataFrames.jl"/><meta name="description" content="Documentation for DataFrames.jl."/><meta property="og:description" content="Documentation for DataFrames.jl."/><meta property="twitter:description" content="Documentation for DataFrames.jl."/><meta property="og:url" content="https://juliadata.github.io/DataFrames.jl/stable/lib/indexing/"/><meta property="twitter:url" content="https://juliadata.github.io/DataFrames.jl/stable/lib/indexing/"/><link rel="canonical" href="https://juliadata.github.io/DataFrames.jl/stable/lib/indexing/"/><script data-outdated-warner src="../../assets/warner.js"></script><link href="https://cdnjs.cloudflare.com/ajax/libs/lato-font/3.0.0/css/lato-font.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/juliamono/0.050/juliamono.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/fontawesome.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/solid.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/brands.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/KaTeX/0.16.8/katex.min.css" rel="stylesheet" type="text/css"/><script>documenterBaseURL="../.."</script><script src="https://cdnjs.cloudflare.com/ajax/libs/require.js/2.3.6/require.min.js" data-main="../../assets/documenter.js"></script><script src="../../search_index.js"></script><script src="../../siteinfo.js"></script><script src="../../../versions.js"></script><link class="docs-theme-link" 
rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-mocha.css" data-theme-name="catppuccin-mocha"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-macchiato.css" data-theme-name="catppuccin-macchiato"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-frappe.css" data-theme-name="catppuccin-frappe"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-latte.css" data-theme-name="catppuccin-latte"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/documenter-dark.css" data-theme-name="documenter-dark" data-theme-primary-dark/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/documenter-light.css" data-theme-name="documenter-light" data-theme-primary/><script src="../../assets/themeswap.js"></script><link href="../../assets/favicon.ico" rel="icon" type="image/x-icon"/></head><body><div id="documenter"><nav class="docs-sidebar"><a class="docs-logo" href="../../"><img src="../../assets/logo.png" alt="DataFrames.jl logo"/></a><div class="docs-package-name"><span class="docs-autofit"><a href="../../">DataFrames.jl</a></span></div><button class="docs-search-query input is-rounded is-small is-clickable my-2 mx-auto py-1 px-2" id="documenter-search-query">Search docs (Ctrl + /)</button><ul class="docs-menu"><li><a class="tocitem" href="../../">Introduction</a></li><li><a class="tocitem" href="../../man/basics/">First Steps with DataFrames.jl</a></li><li><span class="tocitem">User Guide</span><ul><li><a class="tocitem" href="../../man/getting_started/">Getting Started</a></li><li><a class="tocitem" href="../../man/working_with_dataframes/">Working with DataFrames</a></li><li><a class="tocitem" href="../../man/importing_and_exporting/">Importing and Exporting Data (I/O)</a></li><li><a class="tocitem" 
href="../../man/joins/">Joins</a></li><li><a class="tocitem" href="../../man/split_apply_combine/">Split-apply-combine</a></li><li><a class="tocitem" href="../../man/reshaping_and_pivoting/">Reshaping</a></li><li><a class="tocitem" href="../../man/sorting/">Sorting</a></li><li><a class="tocitem" href="../../man/categorical/">Categorical Data</a></li><li><a class="tocitem" href="../../man/missing/">Missing Data</a></li><li><a class="tocitem" href="../../man/querying_frameworks/">Data manipulation frameworks</a></li><li><a class="tocitem" href="../../man/comparisons/">Comparison with Python/R/Stata</a></li></ul></li><li><span class="tocitem">API</span><ul><li><a class="tocitem" href="../types/">Types</a></li><li><a class="tocitem" href="../functions/">Functions</a></li><li class="is-active"><a class="tocitem" href>Indexing</a><ul class="internal"><li><a class="tocitem" href="#General-rules"><span>General rules</span></a></li><li><a class="tocitem" href="#getindex-and-view"><span><code>getindex</code> and <code>view</code></span></a></li><li><a class="tocitem" href="#setindex!"><span><code>setindex!</code></span></a></li><li><a class="tocitem" href="#Broadcasting"><span>Broadcasting</span></a></li><li><a class="tocitem" href="#Indexing-GroupedDataFrames"><span>Indexing <code>GroupedDataFrame</code>s</span></a></li><li class="toplevel"><a class="tocitem" href="#Common-API-for-types-defined-in-DataFrames.jl"><span>Common API for types defined in DataFrames.jl</span></a></li></ul></li><li><a class="tocitem" href="../metadata/">Metadata</a></li></ul></li></ul><div class="docs-version-selector field has-addons"><div class="control"><span class="docs-label button is-static is-size-7">Version</span></div><div class="docs-selector control is-expanded"><div class="select is-fullwidth is-size-7"><select id="documenter-version-selector"></select></div></div></div></nav><div class="docs-main"><header class="docs-navbar"><a class="docs-sidebar-button docs-navbar-link fa-solid 
fa-bars is-hidden-desktop" id="documenter-sidebar-button" href="#"></a><nav class="breadcrumb"><ul class="is-hidden-mobile"><li><a class="is-disabled">API</a></li><li class="is-active"><a href>Indexing</a></li></ul><ul class="is-hidden-tablet"><li class="is-active"><a href>Indexing</a></li></ul></nav><div class="docs-right"><a class="docs-navbar-link" href="https://github.com/JuliaData/DataFrames.jl" title="View the repository on GitHub"><span class="docs-icon fa-brands"></span><span class="docs-label is-hidden-touch">GitHub</span></a><a class="docs-navbar-link" href="https://github.com/JuliaData/DataFrames.jl/blob/main/docs/src/lib/indexing.md" title="Edit source on GitHub"><span class="docs-icon fa-solid"></span></a><a class="docs-settings-button docs-navbar-link fa-solid fa-gear" id="documenter-settings-button" href="#" title="Settings"></a><a class="docs-article-toggle-button fa-solid fa-chevron-up" id="documenter-article-toggle-button" href="javascript:;" title="Collapse all docstrings"></a></div></header><article class="content" id="documenter-page"><h1 id="Indexing"><a class="docs-heading-anchor" href="#Indexing">Indexing</a><a id="Indexing-1"></a><a class="docs-heading-anchor-permalink" href="#Indexing" title="Permalink"></a></h1><ul></ul><h2 id="General-rules"><a class="docs-heading-anchor" href="#General-rules">General rules</a><a id="General-rules-1"></a><a class="docs-heading-anchor-permalink" href="#General-rules" title="Permalink"></a></h2><p>The following rules explain target functionality of how <code>getindex</code>, <code>setindex!</code>, <code>view</code>, and broadcasting are intended to work with <code>DataFrame</code>, <code>SubDataFrame</code> and <code>DataFrameRow</code> objects.</p><p>The following values are a valid column index:</p><ul><li>a scalar, later denoted as <code>col</code>:<ul><li>a <code>Symbol</code>;</li><li>an <code>AbstractString</code>;</li><li>an <code>Integer</code> that is not <code>Bool</code>;</li></ul></li><li>a 
vector, later denoted as <code>cols</code>:<ul><li>a vector of <code>Symbol</code> (does not have to be a subtype of <code>AbstractVector{Symbol}</code>);</li><li>a vector of <code>AbstractString</code> (does not have to be a subtype of <code>AbstractVector{&lt;:AbstractString}</code>);</li><li>a vector of <code>Integer</code> that are not <code>Bool</code> (does not have to be a subtype of <code>AbstractVector{&lt;:Integer}</code>);</li><li>a vector of <code>Bool</code> (must be a subtype of <code>AbstractVector{Bool}</code>);</li><li>a <a href="https://docs.julialang.org/en/v1/manual/strings/#Regular-Expressions">regular expression</a> (will be expanded to a vector of matching column names);</li><li>a <code>Not</code> expression (see <a href="https://github.com/JuliaData/InvertedIndices.jl">InvertedIndices.jl</a>); <code>Not(idx)</code> selects all indices not in the passed <code>idx</code>; when passed as column selector <code>Not(idx...)</code> is equivalent to <code>Not(Cols(idx...))</code>.</li><li>a <code>Cols</code> expression (see <a href="https://github.com/JuliaData/DataAPI.jl">DataAPI.jl</a>); <code>Cols(idxs...)</code> selects the union of the selections in <code>idxs</code>; in particular <code>Cols()</code> selects no columns and <code>Cols(:)</code> selects all columns; a special rule is <code>Cols(predicate)</code>, where <code>predicate</code> is a predicate function; in this case the columns whose names passed to <code>predicate</code> as strings return <code>true</code> are selected.</li><li>a <code>Between</code> expression (see <a href="https://github.com/JuliaData/DataAPI.jl">DataAPI.jl</a>); <code>Between(first, last)</code> selects the columns between <code>first</code> and <code>last</code> inclusively;</li><li>an <code>All</code> expression (see <a href="https://github.com/JuliaData/DataAPI.jl">DataAPI.jl</a>); <code>All()</code> selects all columns, equivalent to <code>:</code>;</li><li>a literal colon <code>:</code> (selects all 
columns).</li></ul></li></ul><p>The following values are a valid row index:</p><ul><li>a scalar, later denoted as <code>row</code>:<ul><li>an <code>Integer</code> that is not <code>Bool</code>;</li></ul></li><li>a vector, later denoted as <code>rows</code>:<ul><li>a vector of <code>Integer</code> that are not <code>Bool</code> (does not have to be a subtype of <code>AbstractVector{&lt;:Integer}</code>);</li><li>a vector of <code>Bool</code> (must be a subtype of <code>AbstractVector{Bool}</code>);</li><li>a <code>Not</code> expression (see <a href="https://github.com/JuliaData/InvertedIndices.jl">InvertedIndices.jl</a>);</li><li>a literal colon <code>:</code> (selects all rows with copying);</li><li>a literal exclamation mark <code>!</code> (selects all rows without copying).</li></ul></li></ul><p>Additionally it is allowed to index into an <code>AbstractDataFrame</code> using a two-dimensional <code>CartesianIndex</code>.</p><p>In the descriptions below <code>df</code> represents a <code>DataFrame</code>, <code>sdf</code> is a <code>SubDataFrame</code> and <code>dfr</code> is a <code>DataFrameRow</code>.</p><p><code>:</code> always expands to <code>axes(df, 1)</code> or <code>axes(sdf, 1)</code>.</p><p><code>df.col</code> works like <code>df[!, col]</code> and <code>sdf.col</code> works like <code>sdf[!, col]</code> in all cases. 
An exception is that under Julia 1.6 or earlier <code>df.col .= v</code> and <code>sdf.col .= v</code> performs in-place broadcasting if <code>col</code> is present in <code>df</code>/<code>sdf</code> and is a valid identifier (this inconsistency is not present under Julia 1.7 and later).</p><h2 id="getindex-and-view"><a class="docs-heading-anchor" href="#getindex-and-view"><code>getindex</code> and <code>view</code></a><a id="getindex-and-view-1"></a><a class="docs-heading-anchor-permalink" href="#getindex-and-view" title="Permalink"></a></h2><p>The following list specifies the behavior of <code>getindex</code> and <code>view</code> operations depending on argument types.</p><p>In particular a description explicitly mentions that the data is <em>copied</em> or <em>reused without copying</em>.</p><p>For performance reasons, accessing, via <code>getindex</code> or <code>view</code>, a single <code>row</code> and multiple <code>cols</code> of a <code>DataFrame</code>, a <code>SubDataFrame</code> or a <code>DataFrameRow</code> always returns a <code>DataFrameRow</code> (which is a view type).</p><p><code>getindex</code> on <code>DataFrame</code>:</p><ul><li><code>df[row, col]</code> -&gt; the value contained in row <code>row</code> of column <code>col</code>, the same as <code>df[!, col][row]</code>;</li><li><code>df[CartesianIndex(row, col)]</code> -&gt; the same as <code>df[row, col]</code>;</li><li><code>df[row, cols]</code> -&gt; a <code>DataFrameRow</code> with parent <code>df</code>;</li><li><code>df[rows, col]</code> -&gt; a copy of the vector <code>df[!, col]</code> with only the entries                    corresponding to <code>rows</code> selected, the same as <code>df[!, col][rows]</code>;</li><li><code>df[rows, cols]</code> -&gt; a <code>DataFrame</code> containing copies of columns <code>cols</code> with                     only the entries corresponding to <code>rows</code> selected;</li><li><code>df[!, col]</code> -&gt; the vector contained in column 
<code>col</code> returned without copying;                 the same as <code>df.col</code> if <code>col</code> is a valid identifier.</li><li><code>df[!, cols]</code> -&gt; create a new <code>DataFrame</code> with columns <code>cols</code> without copying                  of columns; the same as <code>select(df, cols, copycols=false)</code>.</li></ul><p><code>view</code> on <code>DataFrame</code>:</p><ul><li><code>@view df[row, col]</code> -&gt; a <code>0</code>-dimensional view into <code>df[!, col]</code> in row <code>row</code>,                         the same as <code>view(df[!, col], row)</code>;</li><li><code>@view df[CartesianIndex(row, col)]</code> -&gt; the same as <code>@view df[row, col]</code>;</li><li><code>@view df[row, cols]</code> -&gt; the same as <code>df[row, cols]</code>;</li><li><code>@view df[rows, col]</code> -&gt; a view into <code>df[!, col]</code> with <code>rows</code> selected, the                          same as <code>view(df[!, col], rows)</code>;</li><li><code>@view df[rows, cols]</code> -&gt; a <code>SubDataFrame</code> with <code>rows</code> selected with parent <code>df</code>;</li><li><code>@view df[!, col]</code> -&gt; a view into <code>df[!, col]</code>  with all rows.</li><li><code>@view df[!, cols]</code> -&gt; the same as <code>@view df[:, cols]</code>.</li></ul><p><code>getindex</code> on <code>SubDataFrame</code>:</p><ul><li><code>sdf[row, col]</code> -&gt; a value contained in row <code>row</code> of column <code>col</code>;</li><li><code>sdf[CartesianIndex(row, col)]</code> -&gt; the same as <code>sdf[row, col]</code>;</li><li><code>sdf[row, cols]</code> -&gt; a <code>DataFrameRow</code> with parent <code>parent(sdf)</code>;</li><li><code>sdf[rows, col]</code> -&gt; a copy of <code>sdf[!, col]</code> with only rows <code>rows</code> selected,                     the same as <code>sdf[!, col][rows]</code>;</li><li><code>sdf[rows, cols]</code> -&gt; a <code>DataFrame</code> containing columns <code>cols</code> and 
<code>sdf[rows, col]</code> as a vector for each <code>col</code> in <code>cols</code>;</li><li><code>sdf[!, col]</code> -&gt; a view of entries corresponding to <code>sdf</code> in the vector                  <code>parent(sdf)[!, col]</code>; the same as <code>sdf.col</code> if <code>col</code> is a                  valid identifier.</li><li><code>sdf[!, cols]</code> -&gt; create a new <code>SubDataFrame</code> with columns <code>cols</code>, the same                   parent as <code>sdf</code>, and the same rows selected; the same as                   <code>select(sdf, cols, copycols=false)</code>.</li></ul><p><code>view</code> on <code>SubDataFrame</code>:</p><ul><li><code>@view sdf[row, col]</code> -&gt; a <code>0</code>-dimensional view into <code>df[!, col]</code> at row                          <code>row</code>, the same as <code>view(sdf[!, col], row)</code>;</li><li><code>@view sdf[CartesianIndex(row, col)]</code> -&gt; the same as <code>@view sdf[row, col]</code>;</li><li><code>@view sdf[row, cols]</code> -&gt; a <code>DataFrameRow</code> with parent <code>parent(sdf)</code>;</li><li><code>@view sdf[rows, col]</code> -&gt; a view into <code>sdf[!, col]</code> vector with <code>rows</code>                           selected, the same as <code>view(sdf[!, col], rows)</code>;</li><li><code>@view sdf[rows, cols]</code> -&gt; a <code>SubDataFrame</code> with parent <code>parent(sdf)</code>;</li><li><code>@view sdf[!, col]</code> -&gt; a view into <code>sdf[!, col]</code> vector with all rows.</li><li><code>@view sdf[!, cols]</code> -&gt; the same as <code>@view sdf[:, cols]</code>.</li></ul><p><code>getindex</code> on <code>DataFrameRow</code>:</p><ul><li><code>dfr[col]</code> -&gt; the value contained in column <code>col</code> of <code>dfr</code>; the same as               <code>dfr.col</code> if <code>col</code> is a valid identifier;</li><li><code>dfr[cols]</code> -&gt; a <code>DataFrameRow</code> with parent 
<code>parent(dfr)</code>;</li></ul><p><code>view</code> on <code>DataFrameRow</code>:</p><ul><li><code>@view dfr[col]</code> -&gt; a <code>0</code>-dimensional view into                     <code>parent(dfr)[DataFrames.row(dfr), col]</code>;</li><li><code>@view dfr[cols]</code> -&gt; a <code>DataFrameRow</code> with parent <code>parent(dfr)</code>;</li></ul><p>Note that views created with columns selector set to <code>:</code> change their columns&#39; count if columns are added/removed/renamed in the parent; if column selector is other than <code>:</code> then view points to selected columns by their number at the moment of creation of the view.</p><h2 id="setindex!"><a class="docs-heading-anchor" href="#setindex!"><code>setindex!</code></a><a id="setindex!-1"></a><a class="docs-heading-anchor-permalink" href="#setindex!" title="Permalink"></a></h2><p>The following list specifies the behavior of <code>setindex!</code> operations depending on argument types.</p><p>In particular a description explicitly mentions if the assignment is <em>in-place</em>.</p><p>Note that if a <code>setindex!</code> operation throws an error the target data frame may be partially changed so it is unsafe to use it afterwards (the column length correctness will be preserved).</p><p><code>setindex!</code> on <code>DataFrame</code>:</p><ul><li><code>df[row, col] = v</code> -&gt; set value of <code>col</code> in row <code>row</code> to <code>v</code> in-place;</li><li><code>df[CartesianIndex(row, col)] = v</code> -&gt; the same as <code>df[row, col] = v</code>;</li><li><code>df[row, cols] = v</code> -&gt; set row <code>row</code> of columns <code>cols</code> in-place; the same as                        <code>dfr = df[row, cols]; dfr[:] = v</code>;</li><li><code>df[rows, col] = v</code> -&gt; set rows <code>rows</code> of column <code>col</code> in-place; <code>v</code> must be                        an <code>AbstractVector</code>; if <code>rows</code> is <code>:</code> and <code>col</code> is 
a                        <code>Symbol</code> or <code>AbstractString</code> that is not present in                        <code>df</code> then a new column in <code>df</code> is created and holds a                        <code>copy</code> of <code>v</code>; equivalent to <code>df.col = copy(v)</code> if                        <code>col</code> is a valid identifier;</li><li><code>df[rows, cols] = v</code> -&gt; set rows <code>rows</code> of columns <code>cols</code> in-place; <code>v</code> must                         be an <code>AbstractMatrix</code> or an <code>AbstractDataFrame</code> (in                         this case column names must match);</li><li><code>df[!, col] = v</code> -&gt; replaces <code>col</code> with <code>v</code> without copying (with the                     exception that if <code>v</code> is an <code>AbstractRange</code> it gets                     converted to a <code>Vector</code>); also if <code>col</code> is a <code>Symbol</code> or                     <code>AbstractString</code> that is not present in <code>df</code> then a new                     column in <code>df</code> is created and holds <code>v</code>; equivalent to                     <code>df.col = v</code> if <code>col</code> is a valid identifier; this is                     allowed if <code>ncol(df) == 0 || length(v) == nrow(df)</code>;</li><li><code>df[!, cols] = v</code> -&gt; replaces existing columns <code>cols</code> in data frame <code>df</code> with                      copying; <code>v</code> must be an <code>AbstractMatrix</code> or an                      <code>AbstractDataFrame</code> (in the latter case column names must                      match);</li></ul><p><code>setindex!</code> on <code>SubDataFrame</code>:</p><ul><li><code>sdf[row, col] = v</code> -&gt; set value of <code>col</code> in row <code>row</code> to <code>v</code> in-place;</li><li><code>sdf[CartesianIndex(row, col)] = v</code> -&gt; the same as <code>sdf[row, col] = 
v</code>;</li><li><code>sdf[row, cols] = v</code> -&gt; the same as <code>dfr = df[row, cols]; dfr[:] = v</code> in-place;</li><li><code>sdf[rows, col] = v</code> -&gt; set rows <code>rows</code> of column <code>col</code>, in-place; <code>v</code> must be                         an abstract vector;</li><li><code>sdf[rows, cols] = v</code> -&gt; set rows <code>rows</code> of columns <code>cols</code> in-place; <code>v</code> can                          be an <code>AbstractMatrix</code> or <code>v</code> can be                          <code>AbstractDataFrame</code> in which case column names must                          match;</li><li><code>sdf[!, col] = v</code> -&gt; replaces <code>col</code> with <code>v</code> with copying; if <code>col</code> is present                      in <code>sdf</code> then filtered-out rows in newly created vector                      are filled with values already present in that column and                      <code>promote_type</code> is used to determine the <code>eltype</code> of the                      new column; if <code>col</code> is not present in <code>sdf</code> then the                      operation is only allowed if <code>sdf</code> was created with <code>:</code>                      as column selector, in which case filtered-out rows are                      filled with <code>missing</code>; equivalent to <code>sdf.col = v</code> if                      <code>col</code> is a valid identifier; operation is allowed if                      <code>length(v) == nrow(sdf)</code>;</li><li><code>sdf[!, cols] = v</code> -&gt; replaces existing columns <code>cols</code> in data frame <code>sdf</code>                       with copying; <code>v</code> must be an <code>AbstractMatrix</code> or an                       <code>AbstractDataFrame</code> (in the latter case column names                       must match); filtered-out rows in newly created vectors                       are filled with values already present in 
respective                       columns and <code>promote_type</code> is used to determine the                       <code>eltype</code> of the new columns;</li></ul><div class="admonition is-info"><header class="admonition-header">Note</header><div class="admonition-body"><p>The rules above mean that <code>sdf[:, col] = v</code> is an in-place operation if <code>col</code> is present in <code>sdf</code>, therefore it will be fast in general. On the other hand using <code>sdf[!, col] = v</code> or <code>sdf.col = v</code> will always allocate a new vector, which is more expensive computationally.</p></div></div><p><code>setindex!</code> on <code>DataFrameRow</code>:</p><ul><li><code>dfr[col] = v</code> -&gt; set value of <code>col</code> in row <code>row</code> to <code>v</code> in-place;                   equivalent to <code>dfr.col = v</code> if <code>col</code> is a valid identifier;</li><li><code>dfr[cols] = v</code> -&gt; set values of entries in columns <code>cols</code> in <code>dfr</code> by                    elements of <code>v</code> in place; <code>v</code> can be: 1) a <code>Tuple</code> or an                    <code>AbstractArray</code>, in which cases it must have a number of                    elements equal to <code>length(dfr)</code>, 2) an <code>AbstractDict</code>, in                    which case column names must match, 3) a <code>NamedTuple</code> or                    <code>DataFrameRow</code>, in which case column names and order must                    match;</li></ul><h2 id="Broadcasting"><a class="docs-heading-anchor" href="#Broadcasting">Broadcasting</a><a id="Broadcasting-1"></a><a class="docs-heading-anchor-permalink" href="#Broadcasting" title="Permalink"></a></h2><p>The following broadcasting rules apply to <code>AbstractDataFrame</code> objects:</p><ul><li><code>AbstractDataFrame</code> behaves in broadcasting like a two-dimensional collection compatible with matrices.</li><li>If an <code>AbstractDataFrame</code> takes part in 
broadcasting then a <code>DataFrame</code> is always produced as a result. In this case the requested broadcasting operation produces an object with exactly two dimensions. An exception is when an <code>AbstractDataFrame</code> is used only as a source of broadcast assignment into an object of dimensionality higher than two.</li><li>If multiple <code>AbstractDataFrame</code> objects take part in broadcasting then they have to have identical column names.</li></ul><p>Note that if broadcasting assignment operation throws an error the target data frame may be partially changed so it is unsafe to use it afterwards (the column length correctness will be preserved).</p><p>Broadcasting <code>DataFrameRow</code> is currently not allowed (which is consistent with <code>NamedTuple</code>).</p><p>It is possible to assign a value to <code>AbstractDataFrame</code> and <code>DataFrameRow</code> objects using the <code>.=</code> operator. In such an operation <code>AbstractDataFrame</code> is considered as two-dimensional and <code>DataFrameRow</code> as single-dimensional.</p><div class="admonition is-info"><header class="admonition-header">Note</header><div class="admonition-body"><p>The rule above means that, similar to single-dimensional objects in Base (e.g. 
vectors), <code>DataFrameRow</code> is considered to be column-oriented.</p></div></div><p>Additional rules:</p><ul><li>in the <code>df[CartesianIndex(row, col)] .= v</code>, <code>df[row, col] .= v</code> syntaxes <code>v</code> is broadcasted into the contents of <code>df[row, col]</code> (this is consistent with Julia Base);</li><li>in the <code>df[row, cols] .= v</code> syntaxes the assignment to <code>df</code> is performed in-place;</li><li>in the <code>df[rows, col] .= v</code> and <code>df[rows, cols] .= v</code> syntaxes the assignment to <code>df</code> is performed in-place; if <code>rows</code> is <code>:</code> and <code>col</code> is <code>Symbol</code> or <code>AbstractString</code> and it is missing from <code>df</code> then a new column is allocated and added; the length of the column is always the value of <code>nrow(df)</code> before the assignment takes place;</li><li>in the <code>df[!, col] .= v</code> syntax column <code>col</code> is replaced by a freshly allocated vector; if <code>col</code> is <code>Symbol</code> or <code>AbstractString</code> and it is missing from <code>df</code> then a new column is allocated added; the length of the column is always the value of <code>nrow(df)</code> before the assignment takes place;</li><li>the <code>df[!, cols] .= v</code> syntax replaces existing columns <code>cols</code> in data frame <code>df</code> with freshly allocated vectors;</li><li><code>df.col .= v</code> syntax currently performs in-place assignment to an existing vector <code>df.col</code>; this behavior is deprecated and a new column will be allocated in the future. 
Starting from Julia 1.7 if <code>:col</code> is not present in <code>df</code> then a new column will be created in <code>df</code>.</li><li>in the <code>sdf[CartesianIndex(row, col)] .= v</code>, <code>sdf[row, col] .= v</code> and <code>sdf[row, cols] .= v</code> syntaxes the assignment to <code>sdf</code> is performed in-place;</li><li>in the <code>sdf[rows, col] .= v</code> and <code>sdf[rows, cols] .= v</code> syntaxes the assignment to <code>sdf</code> is performed in-place; if <code>rows</code> is <code>:</code> and <code>col</code> is a <code>Symbol</code> or <code>AbstractString</code> referring to a column missing from <code>sdf</code> and <code>sdf</code> was created with <code>:</code> as column selector then a new column is allocated and added; the filtered-out rows are filled with <code>missing</code>;</li><li>in the <code>sdf[!, col] .= v</code> syntax column <code>col</code> is replaced by a freshly allocated vector; the filtered-out rows are filled with values already present in <code>col</code>; if <code>col</code> is a <code>Symbol</code> or <code>AbstractString</code> referring to a column missing from <code>sdf</code> and was <code>sdf</code> created with <code>:</code> as column selector then a new column is allocated and added; in this case the filtered-out rows are filled with <code>missing</code>;</li><li>the <code>sdf[!, cols] .= v</code> syntax replaces existing columns <code>cols</code> in data frame <code>sdf</code> with freshly allocated vectors; the filtered-out rows are filled with values already present in <code>cols</code>;</li><li><code>sdf.col .= v</code> syntax currently performs in-place assignment to an existing vector <code>sdf.col</code>; this behavior is deprecated and a new column will be allocated in the future. 
Starting from Julia 1.7 if <code>:col</code> is not present in <code>sdf</code> then a new column will be created in <code>sdf</code> if <code>sdf</code> was created with <code>:</code> as a column selector.</li><li><code>dfr.col .= v</code> syntax is allowed and performs in-place assignment to a value extracted by <code>dfr.col</code>.</li></ul><p>Note that <code>sdf[!, col] .= v</code> and <code>sdf[!, cols] .= v</code> syntaxes are not allowed as <code>sdf</code> can be only modified in-place.</p><p>If column indexing using <code>Symbol</code> or <code>AbstractString</code> names in <code>cols</code> is performed, the order of columns in the operation is specified by the order of names.</p><h2 id="Indexing-GroupedDataFrames"><a class="docs-heading-anchor" href="#Indexing-GroupedDataFrames">Indexing <code>GroupedDataFrame</code>s</a><a id="Indexing-GroupedDataFrames-1"></a><a class="docs-heading-anchor-permalink" href="#Indexing-GroupedDataFrames" title="Permalink"></a></h2><p>A <a href="../types/#DataFrames.GroupedDataFrame"><code>GroupedDataFrame</code></a> can behave as either an <code>AbstractVector</code> or <code>AbstractDict</code> depending on the type of index used. Integers (or arrays of them) trigger vector-like indexing while <code>Tuples</code>s and <code>NamedTuple</code>s trigger dictionary-like indexing. An intermediate between the two is the <a href="../types/#DataFrames.GroupKey"><code>GroupKey</code></a> type returned by <a href="../functions/#Base.keys"><code>keys(::GroupedDataFrame)</code></a>, which behaves similarly to a <code>NamedTuple</code> but has performance on par with integer indexing.</p><p>The elements of a <code>GroupedDataFrame</code> are <a href="../types/#DataFrames.SubDataFrame"><code>SubDataFrame</code></a>s of its parent.</p><ul><li><code>gd[i::Integer]</code> -&gt; Get the <code>i</code>th group.</li><li><code>gd[key::NamedTuple]</code> -&gt; Get the group corresponding to the given values of the grouping columns. 
The fields of the <code>NamedTuple</code> must match the grouping columns columns passed to <a href="../functions/#DataAPI.groupby"><code>groupby</code></a> (including order).</li><li><code>gd[key::Tuple]</code> -&gt; Same as previous, but omitting the names on <code>key</code>.</li><li><code>get(gd, key::Union{Tuple, NamedTuple}, default)</code> -&gt; Get group for key <code>key</code>, returning <code>default</code> if it does not exist.</li><li><code>gd[key::GroupKey]</code> -&gt; Get the group corresponding to the <a href="../types/#DataFrames.GroupKey"><code>GroupKey</code></a> <code>key</code> (one of the elements of the vector returned by <a href="../functions/#Base.keys"><code>keys(::GroupedDataFrame)</code></a>). This should be nearly as fast as integer indexing.</li><li><code>gd[a::AbstractVector]</code> -&gt; Select multiple groups and return them in a new <code>GroupedDataFrame</code> object. Groups may be selected by integer position using an array of <code>Integer</code>s or <code>Bool</code>s, similar to a standard array. Alternatively the array may contain keys of any of the types supported for dictionary-like indexing (<code>GroupKey</code>, <code>Tuple</code>, or <code>NamedTuple</code>). Selected groups must be unique, and different types of indices cannot be mixed.</li><li><code>gd[n::Not]</code> -&gt; Any of the above types wrapped in <code>Not</code>. 
The result will be a  new <code>GroupedDataFrame</code> containing all groups in <code>gd</code> <em>not</em> selected by the  wrapped index.</li></ul><h1 id="Common-API-for-types-defined-in-DataFrames.jl"><a class="docs-heading-anchor" href="#Common-API-for-types-defined-in-DataFrames.jl">Common API for types defined in DataFrames.jl</a><a id="Common-API-for-types-defined-in-DataFrames.jl-1"></a><a class="docs-heading-anchor-permalink" href="#Common-API-for-types-defined-in-DataFrames.jl" title="Permalink"></a></h1><p>This table presents return value types of calling <code>names</code>, <code>propertynames</code>, <code>keys</code>, <code>length</code> and <code>ndims</code> on types exposed to the user by DataFrames.jl:</p><table><tr><th style="text-align: right">Type</th><th style="text-align: right"><code>names</code></th><th style="text-align: right"><code>propertynames</code></th><th style="text-align: right"><code>keys</code></th><th style="text-align: right"><code>length</code></th><th style="text-align: right"><code>ndims</code></th></tr><tr><td style="text-align: right"><code>AbstractDataFrame</code></td><td style="text-align: right"><code>Vector{String}</code></td><td style="text-align: right"><code>Vector{Symbol}</code></td><td style="text-align: right">undefined</td><td style="text-align: right">undefined</td><td style="text-align: right"><code>2</code></td></tr><tr><td style="text-align: right"><code>DataFrameRow</code></td><td style="text-align: right"><code>Vector{String}</code></td><td style="text-align: right"><code>Vector{Symbol}</code></td><td style="text-align: right"><code>Vector{Symbol}</code></td><td style="text-align: right"><code>Int</code></td><td style="text-align: right"><code>1</code></td></tr><tr><td style="text-align: right"><code>DataFrameRows</code></td><td style="text-align: right"><code>Vector{String}</code></td><td style="text-align: right"><code>Vector{Symbol}</code></td><td style="text-align: right">vector of 
<code>Int</code></td><td style="text-align: right"><code>Int</code></td><td style="text-align: right"><code>1</code></td></tr><tr><td style="text-align: right"><code>DataFrameColumns</code></td><td style="text-align: right"><code>Vector{String}</code></td><td style="text-align: right"><code>Vector{Symbol}</code></td><td style="text-align: right"><code>Vector{Symbol}</code></td><td style="text-align: right"><code>Int</code></td><td style="text-align: right"><code>1</code></td></tr><tr><td style="text-align: right"><code>GroupedDataFrame</code></td><td style="text-align: right"><code>Vector{String}</code></td><td style="text-align: right">tuple of fields</td><td style="text-align: right"><code>GroupKeys</code></td><td style="text-align: right"><code>Int</code></td><td style="text-align: right"><code>1</code></td></tr><tr><td style="text-align: right"><code>GroupKeys</code></td><td style="text-align: right">undefined</td><td style="text-align: right">tuple of fields</td><td style="text-align: right">vector of <code>Int</code></td><td style="text-align: right"><code>Int</code></td><td style="text-align: right"><code>1</code></td></tr><tr><td style="text-align: right"><code>GroupKey</code></td><td style="text-align: right"><code>Vector{String}</code></td><td style="text-align: right"><code>Vector{Symbol}</code></td><td style="text-align: right"><code>Vector{Symbol}</code></td><td style="text-align: right"><code>Int</code></td><td style="text-align: right"><code>1</code></td></tr></table><p>Additionally the above types <code>T</code> (i.e. 
<code>AbstractDataFrame</code>, <code>DataFrameRow</code>, <code>DataFrameRows</code>, <code>DataFrameColumns</code>, <code>GroupedDataFrame</code>, <code>GroupKeys</code>, <code>GroupKey</code>) the following methods are defined:</p><ul><li><code>size(::T)</code> returning a <code>Tuple</code> of <code>Int</code>.</li><li><code>size(::T, ::Integer)</code> returning an <code>Int</code>.</li><li><code>axes(::T)</code> returning a <code>Tuple</code> of <code>Int</code> vectors.</li><li><code>axes(::T, ::Integer)</code> returning an <code>Int</code> vector for a valid dimension (except  <code>DataFrameRows</code> and <code>GroupKeys</code> for which <code>Base.OneTo(1)</code> is also returned  for a dimension higher than a valid one because they are <code>AbstractVector</code>).</li><li><code>firstindex(::T)</code> returning <code>1</code> (except <code>AbstractDataFrame</code> for which it is undefined).</li><li><code>firstindex(::T, ::Integer)</code> returning <code>1</code> for a valid dimension (except  <code>DataFrameRows</code> and <code>GroupKeys</code> for which <code>1</code> is also returned for a  dimension higher than a valid one because they are <code>AbstractVector</code>).</li><li><code>lastindex(::T)</code> returning <code>Int</code> (except <code>AbstractDataFrame</code> for which it is undefined).</li><li><code>lastindex(::T, ::Integer)</code> returning <code>Int</code> for a valid dimension  (except  <code>DataFrameRows</code> and <code>GroupKeys</code> for which <code>1</code> is also returned for a  dimension higher than a valid one because they are <code>AbstractVector</code>).</li></ul></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../functions/">« Functions</a><a class="docs-footer-nextpage" href="../metadata/">Metadata »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia 
Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.7.0 on <span class="colophon-date" title="Saturday 7 September 2024 11:00">Saturday 7 September 2024</span>. Using Julia version 1.10.5.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
+<html lang="en"><head><meta charset="UTF-8"/><meta name="viewport" content="width=device-width, initial-scale=1.0"/><title>Indexing · DataFrames.jl</title><meta name="title" content="Indexing · DataFrames.jl"/><meta property="og:title" content="Indexing · DataFrames.jl"/><meta property="twitter:title" content="Indexing · DataFrames.jl"/><meta name="description" content="Documentation for DataFrames.jl."/><meta property="og:description" content="Documentation for DataFrames.jl."/><meta property="twitter:description" content="Documentation for DataFrames.jl."/><meta property="og:url" content="https://juliadata.github.io/DataFrames.jl/stable/lib/indexing/"/><meta property="twitter:url" content="https://juliadata.github.io/DataFrames.jl/stable/lib/indexing/"/><link rel="canonical" href="https://juliadata.github.io/DataFrames.jl/stable/lib/indexing/"/><script data-outdated-warner src="../../assets/warner.js"></script><link href="https://cdnjs.cloudflare.com/ajax/libs/lato-font/3.0.0/css/lato-font.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/juliamono/0.050/juliamono.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/fontawesome.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/solid.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/brands.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/KaTeX/0.16.8/katex.min.css" rel="stylesheet" type="text/css"/><script>documenterBaseURL="../.."</script><script src="https://cdnjs.cloudflare.com/ajax/libs/require.js/2.3.6/require.min.js" data-main="../../assets/documenter.js"></script><script src="../../search_index.js"></script><script src="../../siteinfo.js"></script><script src="../../../versions.js"></script><link class="docs-theme-link" 
rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-mocha.css" data-theme-name="catppuccin-mocha"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-macchiato.css" data-theme-name="catppuccin-macchiato"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-frappe.css" data-theme-name="catppuccin-frappe"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-latte.css" data-theme-name="catppuccin-latte"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/documenter-dark.css" data-theme-name="documenter-dark" data-theme-primary-dark/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/documenter-light.css" data-theme-name="documenter-light" data-theme-primary/><script src="../../assets/themeswap.js"></script><link href="../../assets/favicon.ico" rel="icon" type="image/x-icon"/></head><body><div id="documenter"><nav class="docs-sidebar"><a class="docs-logo" href="../../"><img src="../../assets/logo.png" alt="DataFrames.jl logo"/></a><div class="docs-package-name"><span class="docs-autofit"><a href="../../">DataFrames.jl</a></span></div><button class="docs-search-query input is-rounded is-small is-clickable my-2 mx-auto py-1 px-2" id="documenter-search-query">Search docs (Ctrl + /)</button><ul class="docs-menu"><li><a class="tocitem" href="../../">Introduction</a></li><li><a class="tocitem" href="../../man/basics/">First Steps with DataFrames.jl</a></li><li><span class="tocitem">User Guide</span><ul><li><a class="tocitem" href="../../man/getting_started/">Getting Started</a></li><li><a class="tocitem" href="../../man/working_with_dataframes/">Working with DataFrames</a></li><li><a class="tocitem" href="../../man/importing_and_exporting/">Importing and Exporting Data (I/O)</a></li><li><a class="tocitem" 
href="../../man/joins/">Joins</a></li><li><a class="tocitem" href="../../man/split_apply_combine/">Split-apply-combine</a></li><li><a class="tocitem" href="../../man/reshaping_and_pivoting/">Reshaping</a></li><li><a class="tocitem" href="../../man/sorting/">Sorting</a></li><li><a class="tocitem" href="../../man/categorical/">Categorical Data</a></li><li><a class="tocitem" href="../../man/missing/">Missing Data</a></li><li><a class="tocitem" href="../../man/querying_frameworks/">Data manipulation frameworks</a></li><li><a class="tocitem" href="../../man/comparisons/">Comparison with Python/R/Stata</a></li></ul></li><li><span class="tocitem">API</span><ul><li><a class="tocitem" href="../types/">Types</a></li><li><a class="tocitem" href="../functions/">Functions</a></li><li class="is-active"><a class="tocitem" href>Indexing</a><ul class="internal"><li><a class="tocitem" href="#General-rules"><span>General rules</span></a></li><li><a class="tocitem" href="#getindex-and-view"><span><code>getindex</code> and <code>view</code></span></a></li><li><a class="tocitem" href="#setindex!"><span><code>setindex!</code></span></a></li><li><a class="tocitem" href="#Broadcasting"><span>Broadcasting</span></a></li><li><a class="tocitem" href="#Indexing-GroupedDataFrames"><span>Indexing <code>GroupedDataFrame</code>s</span></a></li><li class="toplevel"><a class="tocitem" href="#Common-API-for-types-defined-in-DataFrames.jl"><span>Common API for types defined in DataFrames.jl</span></a></li></ul></li><li><a class="tocitem" href="../metadata/">Metadata</a></li></ul></li></ul><div class="docs-version-selector field has-addons"><div class="control"><span class="docs-label button is-static is-size-7">Version</span></div><div class="docs-selector control is-expanded"><div class="select is-fullwidth is-size-7"><select id="documenter-version-selector"></select></div></div></div></nav><div class="docs-main"><header class="docs-navbar"><a class="docs-sidebar-button docs-navbar-link fa-solid 
fa-bars is-hidden-desktop" id="documenter-sidebar-button" href="#"></a><nav class="breadcrumb"><ul class="is-hidden-mobile"><li><a class="is-disabled">API</a></li><li class="is-active"><a href>Indexing</a></li></ul><ul class="is-hidden-tablet"><li class="is-active"><a href>Indexing</a></li></ul></nav><div class="docs-right"><a class="docs-navbar-link" href="https://github.com/JuliaData/DataFrames.jl" title="View the repository on GitHub"><span class="docs-icon fa-brands"></span><span class="docs-label is-hidden-touch">GitHub</span></a><a class="docs-navbar-link" href="https://github.com/JuliaData/DataFrames.jl/blob/main/docs/src/lib/indexing.md" title="Edit source on GitHub"><span class="docs-icon fa-solid"></span></a><a class="docs-settings-button docs-navbar-link fa-solid fa-gear" id="documenter-settings-button" href="#" title="Settings"></a><a class="docs-article-toggle-button fa-solid fa-chevron-up" id="documenter-article-toggle-button" href="javascript:;" title="Collapse all docstrings"></a></div></header><article class="content" id="documenter-page"><h1 id="Indexing"><a class="docs-heading-anchor" href="#Indexing">Indexing</a><a id="Indexing-1"></a><a class="docs-heading-anchor-permalink" href="#Indexing" title="Permalink"></a></h1><ul></ul><h2 id="General-rules"><a class="docs-heading-anchor" href="#General-rules">General rules</a><a id="General-rules-1"></a><a class="docs-heading-anchor-permalink" href="#General-rules" title="Permalink"></a></h2><p>The following rules explain target functionality of how <code>getindex</code>, <code>setindex!</code>, <code>view</code>, and broadcasting are intended to work with <code>DataFrame</code>, <code>SubDataFrame</code> and <code>DataFrameRow</code> objects.</p><p>The following values are a valid column index:</p><ul><li>a scalar, later denoted as <code>col</code>:<ul><li>a <code>Symbol</code>;</li><li>an <code>AbstractString</code>;</li><li>an <code>Integer</code> that is not <code>Bool</code>;</li></ul></li><li>a 
vector, later denoted as <code>cols</code>:<ul><li>a vector of <code>Symbol</code> (does not have to be a subtype of <code>AbstractVector{Symbol}</code>);</li><li>a vector of <code>AbstractString</code> (does not have to be a subtype of <code>AbstractVector{&lt;:AbstractString}</code>);</li><li>a vector of <code>Integer</code> that are not <code>Bool</code> (does not have to be a subtype of <code>AbstractVector{&lt;:Integer}</code>);</li><li>a vector of <code>Bool</code> (must be a subtype of <code>AbstractVector{Bool}</code>);</li><li>a <a href="https://docs.julialang.org/en/v1/manual/strings/#Regular-Expressions">regular expression</a> (will be expanded to a vector of matching column names);</li><li>a <code>Not</code> expression (see <a href="https://github.com/JuliaData/InvertedIndices.jl">InvertedIndices.jl</a>); <code>Not(idx)</code> selects all indices not in the passed <code>idx</code>; when passed as column selector <code>Not(idx...)</code> is equivalent to <code>Not(Cols(idx...))</code>.</li><li>a <code>Cols</code> expression (see <a href="https://github.com/JuliaData/DataAPI.jl">DataAPI.jl</a>); <code>Cols(idxs...)</code> selects the union of the selections in <code>idxs</code>; in particular <code>Cols()</code> selects no columns and <code>Cols(:)</code> selects all columns; a special rule is <code>Cols(predicate)</code>, where <code>predicate</code> is a predicate function; in this case the columns whose names passed to <code>predicate</code> as strings return <code>true</code> are selected.</li><li>a <code>Between</code> expression (see <a href="https://github.com/JuliaData/DataAPI.jl">DataAPI.jl</a>); <code>Between(first, last)</code> selects the columns between <code>first</code> and <code>last</code> inclusively;</li><li>an <code>All</code> expression (see <a href="https://github.com/JuliaData/DataAPI.jl">DataAPI.jl</a>); <code>All()</code> selects all columns, equivalent to <code>:</code>;</li><li>a literal colon <code>:</code> (selects all 
columns).</li></ul></li></ul><p>The following values are a valid row index:</p><ul><li>a scalar, later denoted as <code>row</code>:<ul><li>an <code>Integer</code> that is not <code>Bool</code>;</li></ul></li><li>a vector, later denoted as <code>rows</code>:<ul><li>a vector of <code>Integer</code> that are not <code>Bool</code> (does not have to be a subtype of <code>AbstractVector{&lt;:Integer}</code>);</li><li>a vector of <code>Bool</code> (must be a subtype of <code>AbstractVector{Bool}</code>);</li><li>a <code>Not</code> expression (see <a href="https://github.com/JuliaData/InvertedIndices.jl">InvertedIndices.jl</a>);</li><li>a literal colon <code>:</code> (selects all rows with copying);</li><li>a literal exclamation mark <code>!</code> (selects all rows without copying).</li></ul></li></ul><p>Additionally it is allowed to index into an <code>AbstractDataFrame</code> using a two-dimensional <code>CartesianIndex</code>.</p><p>In the descriptions below <code>df</code> represents a <code>DataFrame</code>, <code>sdf</code> is a <code>SubDataFrame</code> and <code>dfr</code> is a <code>DataFrameRow</code>.</p><p><code>:</code> always expands to <code>axes(df, 1)</code> or <code>axes(sdf, 1)</code>.</p><p><code>df.col</code> works like <code>df[!, col]</code> and <code>sdf.col</code> works like <code>sdf[!, col]</code> in all cases. 
An exception is that under Julia 1.6 or earlier <code>df.col .= v</code> and <code>sdf.col .= v</code> perform in-place broadcasting if <code>col</code> is present in <code>df</code>/<code>sdf</code> and is a valid identifier (this inconsistency is not present under Julia 1.7 and later).</p><h2 id="getindex-and-view"><a class="docs-heading-anchor" href="#getindex-and-view"><code>getindex</code> and <code>view</code></a><a id="getindex-and-view-1"></a><a class="docs-heading-anchor-permalink" href="#getindex-and-view" title="Permalink"></a></h2><p>The following list specifies the behavior of <code>getindex</code> and <code>view</code> operations depending on argument types.</p><p>In particular a description explicitly mentions that the data is <em>copied</em> or <em>reused without copying</em>.</p><p>For performance reasons, accessing, via <code>getindex</code> or <code>view</code>, a single <code>row</code> and multiple <code>cols</code> of a <code>DataFrame</code>, a <code>SubDataFrame</code> or a <code>DataFrameRow</code> always returns a <code>DataFrameRow</code> (which is a view type).</p><p><code>getindex</code> on <code>DataFrame</code>:</p><ul><li><code>df[row, col]</code> -&gt; the value contained in row <code>row</code> of column <code>col</code>, the same as <code>df[!, col][row]</code>;</li><li><code>df[CartesianIndex(row, col)]</code> -&gt; the same as <code>df[row, col]</code>;</li><li><code>df[row, cols]</code> -&gt; a <code>DataFrameRow</code> with parent <code>df</code>;</li><li><code>df[rows, col]</code> -&gt; a copy of the vector <code>df[!, col]</code> with only the entries                    corresponding to <code>rows</code> selected, the same as <code>df[!, col][rows]</code>;</li><li><code>df[rows, cols]</code> -&gt; a <code>DataFrame</code> containing copies of columns <code>cols</code> with                     only the entries corresponding to <code>rows</code> selected;</li><li><code>df[!, col]</code> -&gt; the vector contained in column 
<code>col</code> returned without copying;                 the same as <code>df.col</code> if <code>col</code> is a valid identifier.</li><li><code>df[!, cols]</code> -&gt; create a new <code>DataFrame</code> with columns <code>cols</code> without copying                  of columns; the same as <code>select(df, cols, copycols=false)</code>.</li></ul><p><code>view</code> on <code>DataFrame</code>:</p><ul><li><code>@view df[row, col]</code> -&gt; a <code>0</code>-dimensional view into <code>df[!, col]</code> in row <code>row</code>,                         the same as <code>view(df[!, col], row)</code>;</li><li><code>@view df[CartesianIndex(row, col)]</code> -&gt; the same as <code>@view df[row, col]</code>;</li><li><code>@view df[row, cols]</code> -&gt; the same as <code>df[row, cols]</code>;</li><li><code>@view df[rows, col]</code> -&gt; a view into <code>df[!, col]</code> with <code>rows</code> selected, the                          same as <code>view(df[!, col], rows)</code>;</li><li><code>@view df[rows, cols]</code> -&gt; a <code>SubDataFrame</code> with <code>rows</code> selected with parent <code>df</code>;</li><li><code>@view df[!, col]</code> -&gt; a view into <code>df[!, col]</code>  with all rows.</li><li><code>@view df[!, cols]</code> -&gt; the same as <code>@view df[:, cols]</code>.</li></ul><p><code>getindex</code> on <code>SubDataFrame</code>:</p><ul><li><code>sdf[row, col]</code> -&gt; a value contained in row <code>row</code> of column <code>col</code>;</li><li><code>sdf[CartesianIndex(row, col)]</code> -&gt; the same as <code>sdf[row, col]</code>;</li><li><code>sdf[row, cols]</code> -&gt; a <code>DataFrameRow</code> with parent <code>parent(sdf)</code>;</li><li><code>sdf[rows, col]</code> -&gt; a copy of <code>sdf[!, col]</code> with only rows <code>rows</code> selected,                     the same as <code>sdf[!, col][rows]</code>;</li><li><code>sdf[rows, cols]</code> -&gt; a <code>DataFrame</code> containing columns <code>cols</code> and 
<code>sdf[rows, col]</code> as a vector for each <code>col</code> in <code>cols</code>;</li><li><code>sdf[!, col]</code> -&gt; a view of entries corresponding to <code>sdf</code> in the vector                  <code>parent(sdf)[!, col]</code>; the same as <code>sdf.col</code> if <code>col</code> is a                  valid identifier.</li><li><code>sdf[!, cols]</code> -&gt; create a new <code>SubDataFrame</code> with columns <code>cols</code>, the same                   parent as <code>sdf</code>, and the same rows selected; the same as                   <code>select(sdf, cols, copycols=false)</code>.</li></ul><p><code>view</code> on <code>SubDataFrame</code>:</p><ul><li><code>@view sdf[row, col]</code> -&gt; a <code>0</code>-dimensional view into <code>df[!, col]</code> at row                          <code>row</code>, the same as <code>view(sdf[!, col], row)</code>;</li><li><code>@view sdf[CartesianIndex(row, col)]</code> -&gt; the same as <code>@view sdf[row, col]</code>;</li><li><code>@view sdf[row, cols]</code> -&gt; a <code>DataFrameRow</code> with parent <code>parent(sdf)</code>;</li><li><code>@view sdf[rows, col]</code> -&gt; a view into <code>sdf[!, col]</code> vector with <code>rows</code>                           selected, the same as <code>view(sdf[!, col], rows)</code>;</li><li><code>@view sdf[rows, cols]</code> -&gt; a <code>SubDataFrame</code> with parent <code>parent(sdf)</code>;</li><li><code>@view sdf[!, col]</code> -&gt; a view into <code>sdf[!, col]</code> vector with all rows.</li><li><code>@view sdf[!, cols]</code> -&gt; the same as <code>@view sdf[:, cols]</code>.</li></ul><p><code>getindex</code> on <code>DataFrameRow</code>:</p><ul><li><code>dfr[col]</code> -&gt; the value contained in column <code>col</code> of <code>dfr</code>; the same as               <code>dfr.col</code> if <code>col</code> is a valid identifier;</li><li><code>dfr[cols]</code> -&gt; a <code>DataFrameRow</code> with parent 
<code>parent(dfr)</code>;</li></ul><p><code>view</code> on <code>DataFrameRow</code>:</p><ul><li><code>@view dfr[col]</code> -&gt; a <code>0</code>-dimensional view into                     <code>parent(dfr)[DataFrames.row(dfr), col]</code>;</li><li><code>@view dfr[cols]</code> -&gt; a <code>DataFrameRow</code> with parent <code>parent(dfr)</code>;</li></ul><p>Note that views created with columns selector set to <code>:</code> change their columns&#39; count if columns are added/removed/renamed in the parent; if column selector is other than <code>:</code> then view points to selected columns by their number at the moment of creation of the view.</p><h2 id="setindex!"><a class="docs-heading-anchor" href="#setindex!"><code>setindex!</code></a><a id="setindex!-1"></a><a class="docs-heading-anchor-permalink" href="#setindex!" title="Permalink"></a></h2><p>The following list specifies the behavior of <code>setindex!</code> operations depending on argument types.</p><p>In particular a description explicitly mentions if the assignment is <em>in-place</em>.</p><p>Note that if a <code>setindex!</code> operation throws an error the target data frame may be partially changed so it is unsafe to use it afterwards (the column length correctness will be preserved).</p><p><code>setindex!</code> on <code>DataFrame</code>:</p><ul><li><code>df[row, col] = v</code> -&gt; set value of <code>col</code> in row <code>row</code> to <code>v</code> in-place;</li><li><code>df[CartesianIndex(row, col)] = v</code> -&gt; the same as <code>df[row, col] = v</code>;</li><li><code>df[row, cols] = v</code> -&gt; set row <code>row</code> of columns <code>cols</code> in-place; the same as                        <code>dfr = df[row, cols]; dfr[:] = v</code>;</li><li><code>df[rows, col] = v</code> -&gt; set rows <code>rows</code> of column <code>col</code> in-place; <code>v</code> must be                        an <code>AbstractVector</code>; if <code>rows</code> is <code>:</code> and <code>col</code> is 
a                        <code>Symbol</code> or <code>AbstractString</code> that is not present in                        <code>df</code> then a new column in <code>df</code> is created and holds a                        <code>copy</code> of <code>v</code>; equivalent to <code>df.col = copy(v)</code> if                        <code>col</code> is a valid identifier;</li><li><code>df[rows, cols] = v</code> -&gt; set rows <code>rows</code> of columns <code>cols</code> in-place; <code>v</code> must                         be an <code>AbstractMatrix</code> or an <code>AbstractDataFrame</code> (in                         this case column names must match);</li><li><code>df[!, col] = v</code> -&gt; replaces <code>col</code> with <code>v</code> without copying (with the                     exception that if <code>v</code> is an <code>AbstractRange</code> it gets                     converted to a <code>Vector</code>); also if <code>col</code> is a <code>Symbol</code> or                     <code>AbstractString</code> that is not present in <code>df</code> then a new                     column in <code>df</code> is created and holds <code>v</code>; equivalent to                     <code>df.col = v</code> if <code>col</code> is a valid identifier; this is                     allowed if <code>ncol(df) == 0 || length(v) == nrow(df)</code>;</li><li><code>df[!, cols] = v</code> -&gt; replaces existing columns <code>cols</code> in data frame <code>df</code> with                      copying; <code>v</code> must be an <code>AbstractMatrix</code> or an                      <code>AbstractDataFrame</code> (in the latter case column names must                      match);</li></ul><p><code>setindex!</code> on <code>SubDataFrame</code>:</p><ul><li><code>sdf[row, col] = v</code> -&gt; set value of <code>col</code> in row <code>row</code> to <code>v</code> in-place;</li><li><code>sdf[CartesianIndex(row, col)] = v</code> -&gt; the same as <code>sdf[row, col] = 
v</code>;</li><li><code>sdf[row, cols] = v</code> -&gt; the same as <code>dfr = sdf[row, cols]; dfr[:] = v</code> in-place;</li><li><code>sdf[rows, col] = v</code> -&gt; set rows <code>rows</code> of column <code>col</code>, in-place; <code>v</code> must be                         an abstract vector;</li><li><code>sdf[rows, cols] = v</code> -&gt; set rows <code>rows</code> of columns <code>cols</code> in-place; <code>v</code> can                          be an <code>AbstractMatrix</code> or <code>v</code> can be                          <code>AbstractDataFrame</code> in which case column names must                          match;</li><li><code>sdf[!, col] = v</code> -&gt; replaces <code>col</code> with <code>v</code> with copying; if <code>col</code> is present                      in <code>sdf</code> then filtered-out rows in newly created vector                      are filled with values already present in that column and                      <code>promote_type</code> is used to determine the <code>eltype</code> of the                      new column; if <code>col</code> is not present in <code>sdf</code> then the                      operation is only allowed if <code>sdf</code> was created with <code>:</code>                      as column selector, in which case filtered-out rows are                      filled with <code>missing</code>; equivalent to <code>sdf.col = v</code> if                      <code>col</code> is a valid identifier; operation is allowed if                      <code>length(v) == nrow(sdf)</code>;</li><li><code>sdf[!, cols] = v</code> -&gt; replaces existing columns <code>cols</code> in data frame <code>sdf</code>                       with copying; <code>v</code> must be an <code>AbstractMatrix</code> or an                       <code>AbstractDataFrame</code> (in the latter case column names                       must match); filtered-out rows in newly created vectors                       are filled with values already present in 
respective                       columns and <code>promote_type</code> is used to determine the                       <code>eltype</code> of the new columns;</li></ul><div class="admonition is-info"><header class="admonition-header">Note</header><div class="admonition-body"><p>The rules above mean that <code>sdf[:, col] = v</code> is an in-place operation if <code>col</code> is present in <code>sdf</code>, therefore it will be fast in general. On the other hand using <code>sdf[!, col] = v</code> or <code>sdf.col = v</code> will always allocate a new vector, which is more expensive computationally.</p></div></div><p><code>setindex!</code> on <code>DataFrameRow</code>:</p><ul><li><code>dfr[col] = v</code> -&gt; set value of <code>col</code> in row <code>row</code> to <code>v</code> in-place;                   equivalent to <code>dfr.col = v</code> if <code>col</code> is a valid identifier;</li><li><code>dfr[cols] = v</code> -&gt; set values of entries in columns <code>cols</code> in <code>dfr</code> by                    elements of <code>v</code> in place; <code>v</code> can be: 1) a <code>Tuple</code> or an                    <code>AbstractArray</code>, in which cases it must have a number of                    elements equal to <code>length(dfr)</code>, 2) an <code>AbstractDict</code>, in                    which case column names must match, 3) a <code>NamedTuple</code> or                    <code>DataFrameRow</code>, in which case column names and order must                    match;</li></ul><h2 id="Broadcasting"><a class="docs-heading-anchor" href="#Broadcasting">Broadcasting</a><a id="Broadcasting-1"></a><a class="docs-heading-anchor-permalink" href="#Broadcasting" title="Permalink"></a></h2><p>The following broadcasting rules apply to <code>AbstractDataFrame</code> objects:</p><ul><li><code>AbstractDataFrame</code> behaves in broadcasting like a two-dimensional collection compatible with matrices.</li><li>If an <code>AbstractDataFrame</code> takes part in 
broadcasting then a <code>DataFrame</code> is always produced as a result. In this case the requested broadcasting operation produces an object with exactly two dimensions. An exception is when an <code>AbstractDataFrame</code> is used only as a source of broadcast assignment into an object of dimensionality higher than two.</li><li>If multiple <code>AbstractDataFrame</code> objects take part in broadcasting then they have to have identical column names.</li></ul><p>Note that if broadcasting assignment operation throws an error the target data frame may be partially changed so it is unsafe to use it afterwards (the column length correctness will be preserved).</p><p>Broadcasting <code>DataFrameRow</code> is currently not allowed (which is consistent with <code>NamedTuple</code>).</p><p>It is possible to assign a value to <code>AbstractDataFrame</code> and <code>DataFrameRow</code> objects using the <code>.=</code> operator. In such an operation <code>AbstractDataFrame</code> is considered as two-dimensional and <code>DataFrameRow</code> as single-dimensional.</p><div class="admonition is-info"><header class="admonition-header">Note</header><div class="admonition-body"><p>The rule above means that, similar to single-dimensional objects in Base (e.g. 
vectors), <code>DataFrameRow</code> is considered to be column-oriented.</p></div></div><p>Additional rules:</p><ul><li>in the <code>df[CartesianIndex(row, col)] .= v</code>, <code>df[row, col] .= v</code> syntaxes <code>v</code> is broadcasted into the contents of <code>df[row, col]</code> (this is consistent with Julia Base);</li><li>in the <code>df[row, cols] .= v</code> syntaxes the assignment to <code>df</code> is performed in-place;</li><li>in the <code>df[rows, col] .= v</code> and <code>df[rows, cols] .= v</code> syntaxes the assignment to <code>df</code> is performed in-place; if <code>rows</code> is <code>:</code> and <code>col</code> is <code>Symbol</code> or <code>AbstractString</code> and it is missing from <code>df</code> then a new column is allocated and added; the length of the column is always the value of <code>nrow(df)</code> before the assignment takes place;</li><li>in the <code>df[!, col] .= v</code> syntax column <code>col</code> is replaced by a freshly allocated vector; if <code>col</code> is <code>Symbol</code> or <code>AbstractString</code> and it is missing from <code>df</code> then a new column is allocated and added; the length of the column is always the value of <code>nrow(df)</code> before the assignment takes place;</li><li>the <code>df[!, cols] .= v</code> syntax replaces existing columns <code>cols</code> in data frame <code>df</code> with freshly allocated vectors;</li><li><code>df.col .= v</code> syntax currently performs in-place assignment to an existing vector <code>df.col</code>; this behavior is deprecated and a new column will be allocated in the future. 
Starting from Julia 1.7 if <code>:col</code> is not present in <code>df</code> then a new column will be created in <code>df</code>.</li><li>in the <code>sdf[CartesianIndex(row, col)] .= v</code>, <code>sdf[row, col] .= v</code> and <code>sdf[row, cols] .= v</code> syntaxes the assignment to <code>sdf</code> is performed in-place;</li><li>in the <code>sdf[rows, col] .= v</code> and <code>sdf[rows, cols] .= v</code> syntaxes the assignment to <code>sdf</code> is performed in-place; if <code>rows</code> is <code>:</code> and <code>col</code> is a <code>Symbol</code> or <code>AbstractString</code> referring to a column missing from <code>sdf</code> and <code>sdf</code> was created with <code>:</code> as column selector then a new column is allocated and added; the filtered-out rows are filled with <code>missing</code>;</li><li>in the <code>sdf[!, col] .= v</code> syntax column <code>col</code> is replaced by a freshly allocated vector; the filtered-out rows are filled with values already present in <code>col</code>; if <code>col</code> is a <code>Symbol</code> or <code>AbstractString</code> referring to a column missing from <code>sdf</code> and <code>sdf</code> was created with <code>:</code> as column selector then a new column is allocated and added; in this case the filtered-out rows are filled with <code>missing</code>;</li><li>the <code>sdf[!, cols] .= v</code> syntax replaces existing columns <code>cols</code> in data frame <code>sdf</code> with freshly allocated vectors; the filtered-out rows are filled with values already present in <code>cols</code>;</li><li><code>sdf.col .= v</code> syntax currently performs in-place assignment to an existing vector <code>sdf.col</code>; this behavior is deprecated and a new column will be allocated in the future. 
Starting from Julia 1.7 if <code>:col</code> is not present in <code>sdf</code> then a new column will be created in <code>sdf</code> if <code>sdf</code> was created with <code>:</code> as a column selector.</li><li><code>dfr.col .= v</code> syntax is allowed and performs in-place assignment to a value extracted by <code>dfr.col</code>.</li></ul><p>Note that <code>sdf[!, col] .= v</code> and <code>sdf[!, cols] .= v</code> syntaxes are not allowed as <code>sdf</code> can be only modified in-place.</p><p>If column indexing using <code>Symbol</code> or <code>AbstractString</code> names in <code>cols</code> is performed, the order of columns in the operation is specified by the order of names.</p><h2 id="Indexing-GroupedDataFrames"><a class="docs-heading-anchor" href="#Indexing-GroupedDataFrames">Indexing <code>GroupedDataFrame</code>s</a><a id="Indexing-GroupedDataFrames-1"></a><a class="docs-heading-anchor-permalink" href="#Indexing-GroupedDataFrames" title="Permalink"></a></h2><p>A <a href="../types/#DataFrames.GroupedDataFrame"><code>GroupedDataFrame</code></a> can behave as either an <code>AbstractVector</code> or <code>AbstractDict</code> depending on the type of index used. Integers (or arrays of them) trigger vector-like indexing while <code>Tuple</code>s and <code>NamedTuple</code>s trigger dictionary-like indexing. An intermediate between the two is the <a href="../types/#DataFrames.GroupKey"><code>GroupKey</code></a> type returned by <a href="../functions/#Base.keys"><code>keys(::GroupedDataFrame)</code></a>, which behaves similarly to a <code>NamedTuple</code> but has performance on par with integer indexing.</p><p>The elements of a <code>GroupedDataFrame</code> are <a href="../types/#DataFrames.SubDataFrame"><code>SubDataFrame</code></a>s of its parent.</p><ul><li><code>gd[i::Integer]</code> -&gt; Get the <code>i</code>th group.</li><li><code>gd[key::NamedTuple]</code> -&gt; Get the group corresponding to the given values of the grouping columns. 
The fields of the <code>NamedTuple</code> must match the grouping columns passed to <a href="../functions/#DataAPI.groupby"><code>groupby</code></a> (including order).</li><li><code>gd[key::Tuple]</code> -&gt; Same as previous, but omitting the names on <code>key</code>.</li><li><code>get(gd, key::Union{Tuple, NamedTuple}, default)</code> -&gt; Get group for key <code>key</code>, returning <code>default</code> if it does not exist.</li><li><code>gd[key::GroupKey]</code> -&gt; Get the group corresponding to the <a href="../types/#DataFrames.GroupKey"><code>GroupKey</code></a> <code>key</code> (one of the elements of the vector returned by <a href="../functions/#Base.keys"><code>keys(::GroupedDataFrame)</code></a>). This should be nearly as fast as integer indexing.</li><li><code>gd[a::AbstractVector]</code> -&gt; Select multiple groups and return them in a new <code>GroupedDataFrame</code> object. Groups may be selected by integer position using an array of <code>Integer</code>s or <code>Bool</code>s, similar to a standard array. Alternatively the array may contain keys of any of the types supported for dictionary-like indexing (<code>GroupKey</code>, <code>Tuple</code>, or <code>NamedTuple</code>). Selected groups must be unique, and different types of indices cannot be mixed.</li><li><code>gd[n::Not]</code> -&gt; Any of the above types wrapped in <code>Not</code>. 
The result will be a  new <code>GroupedDataFrame</code> containing all groups in <code>gd</code> <em>not</em> selected by the  wrapped index.</li></ul><h1 id="Common-API-for-types-defined-in-DataFrames.jl"><a class="docs-heading-anchor" href="#Common-API-for-types-defined-in-DataFrames.jl">Common API for types defined in DataFrames.jl</a><a id="Common-API-for-types-defined-in-DataFrames.jl-1"></a><a class="docs-heading-anchor-permalink" href="#Common-API-for-types-defined-in-DataFrames.jl" title="Permalink"></a></h1><p>This table presents return value types of calling <code>names</code>, <code>propertynames</code>, <code>keys</code>, <code>length</code> and <code>ndims</code> on types exposed to the user by DataFrames.jl:</p><table><tr><th style="text-align: right">Type</th><th style="text-align: right"><code>names</code></th><th style="text-align: right"><code>propertynames</code></th><th style="text-align: right"><code>keys</code></th><th style="text-align: right"><code>length</code></th><th style="text-align: right"><code>ndims</code></th></tr><tr><td style="text-align: right"><code>AbstractDataFrame</code></td><td style="text-align: right"><code>Vector{String}</code></td><td style="text-align: right"><code>Vector{Symbol}</code></td><td style="text-align: right">undefined</td><td style="text-align: right">undefined</td><td style="text-align: right"><code>2</code></td></tr><tr><td style="text-align: right"><code>DataFrameRow</code></td><td style="text-align: right"><code>Vector{String}</code></td><td style="text-align: right"><code>Vector{Symbol}</code></td><td style="text-align: right"><code>Vector{Symbol}</code></td><td style="text-align: right"><code>Int</code></td><td style="text-align: right"><code>1</code></td></tr><tr><td style="text-align: right"><code>DataFrameRows</code></td><td style="text-align: right"><code>Vector{String}</code></td><td style="text-align: right"><code>Vector{Symbol}</code></td><td style="text-align: right">vector of 
<code>Int</code></td><td style="text-align: right"><code>Int</code></td><td style="text-align: right"><code>1</code></td></tr><tr><td style="text-align: right"><code>DataFrameColumns</code></td><td style="text-align: right"><code>Vector{String}</code></td><td style="text-align: right"><code>Vector{Symbol}</code></td><td style="text-align: right"><code>Vector{Symbol}</code></td><td style="text-align: right"><code>Int</code></td><td style="text-align: right"><code>1</code></td></tr><tr><td style="text-align: right"><code>GroupedDataFrame</code></td><td style="text-align: right"><code>Vector{String}</code></td><td style="text-align: right">tuple of fields</td><td style="text-align: right"><code>GroupKeys</code></td><td style="text-align: right"><code>Int</code></td><td style="text-align: right"><code>1</code></td></tr><tr><td style="text-align: right"><code>GroupKeys</code></td><td style="text-align: right">undefined</td><td style="text-align: right">tuple of fields</td><td style="text-align: right">vector of <code>Int</code></td><td style="text-align: right"><code>Int</code></td><td style="text-align: right"><code>1</code></td></tr><tr><td style="text-align: right"><code>GroupKey</code></td><td style="text-align: right"><code>Vector{String}</code></td><td style="text-align: right"><code>Vector{Symbol}</code></td><td style="text-align: right"><code>Vector{Symbol}</code></td><td style="text-align: right"><code>Int</code></td><td style="text-align: right"><code>1</code></td></tr></table><p>Additionally the above types <code>T</code> (i.e. 
<code>AbstractDataFrame</code>, <code>DataFrameRow</code>, <code>DataFrameRows</code>, <code>DataFrameColumns</code>, <code>GroupedDataFrame</code>, <code>GroupKeys</code>, <code>GroupKey</code>) have the following methods defined:</p><ul><li><code>size(::T)</code> returning a <code>Tuple</code> of <code>Int</code>.</li><li><code>size(::T, ::Integer)</code> returning an <code>Int</code>.</li><li><code>axes(::T)</code> returning a <code>Tuple</code> of <code>Int</code> vectors.</li><li><code>axes(::T, ::Integer)</code> returning an <code>Int</code> vector for a valid dimension (except  <code>DataFrameRows</code> and <code>GroupKeys</code> for which <code>Base.OneTo(1)</code> is also returned  for a dimension higher than a valid one because they are <code>AbstractVector</code>).</li><li><code>firstindex(::T)</code> returning <code>1</code> (except <code>AbstractDataFrame</code> for which it is undefined).</li><li><code>firstindex(::T, ::Integer)</code> returning <code>1</code> for a valid dimension (except  <code>DataFrameRows</code> and <code>GroupKeys</code> for which <code>1</code> is also returned for a  dimension higher than a valid one because they are <code>AbstractVector</code>).</li><li><code>lastindex(::T)</code> returning <code>Int</code> (except <code>AbstractDataFrame</code> for which it is undefined).</li><li><code>lastindex(::T, ::Integer)</code> returning <code>Int</code> for a valid dimension  (except  <code>DataFrameRows</code> and <code>GroupKeys</code> for which <code>1</code> is also returned for a  dimension higher than a valid one because they are <code>AbstractVector</code>).</li></ul></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../functions/">« Functions</a><a class="docs-footer-nextpage" href="../metadata/">Metadata »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia 
Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.7.0 on <span class="colophon-date" title="Sunday 8 September 2024 08:54">Sunday 8 September 2024</span>. Using Julia version 1.10.5.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
diff --git a/dev/lib/internals/index.html b/dev/lib/internals/index.html
index a84e3378e..0be9fa815 100644
--- a/dev/lib/internals/index.html
+++ b/dev/lib/internals/index.html
@@ -1,9 +1,9 @@
 <!DOCTYPE html>
-<html lang="en"><head><meta charset="UTF-8"/><meta name="viewport" content="width=device-width, initial-scale=1.0"/><title>Internals · DataFrames.jl</title><meta name="title" content="Internals · DataFrames.jl"/><meta property="og:title" content="Internals · DataFrames.jl"/><meta property="twitter:title" content="Internals · DataFrames.jl"/><meta name="description" content="Documentation for DataFrames.jl."/><meta property="og:description" content="Documentation for DataFrames.jl."/><meta property="twitter:description" content="Documentation for DataFrames.jl."/><meta property="og:url" content="https://juliadata.github.io/DataFrames.jl/stable/lib/internals/"/><meta property="twitter:url" content="https://juliadata.github.io/DataFrames.jl/stable/lib/internals/"/><link rel="canonical" href="https://juliadata.github.io/DataFrames.jl/stable/lib/internals/"/><script data-outdated-warner src="../../assets/warner.js"></script><link href="https://cdnjs.cloudflare.com/ajax/libs/lato-font/3.0.0/css/lato-font.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/juliamono/0.050/juliamono.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/fontawesome.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/solid.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/brands.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/KaTeX/0.16.8/katex.min.css" rel="stylesheet" type="text/css"/><script>documenterBaseURL="../.."</script><script src="https://cdnjs.cloudflare.com/ajax/libs/require.js/2.3.6/require.min.js" data-main="../../assets/documenter.js"></script><script src="../../search_index.js"></script><script src="../../siteinfo.js"></script><script src="../../../versions.js"></script><link 
class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-mocha.css" data-theme-name="catppuccin-mocha"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-macchiato.css" data-theme-name="catppuccin-macchiato"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-frappe.css" data-theme-name="catppuccin-frappe"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-latte.css" data-theme-name="catppuccin-latte"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/documenter-dark.css" data-theme-name="documenter-dark" data-theme-primary-dark/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/documenter-light.css" data-theme-name="documenter-light" data-theme-primary/><script src="../../assets/themeswap.js"></script><link href="../../assets/favicon.ico" rel="icon" type="image/x-icon"/></head><body><div id="documenter"><nav class="docs-sidebar"><a class="docs-logo" href="../../"><img src="../../assets/logo.png" alt="DataFrames.jl logo"/></a><div class="docs-package-name"><span class="docs-autofit"><a href="../../">DataFrames.jl</a></span></div><button class="docs-search-query input is-rounded is-small is-clickable my-2 mx-auto py-1 px-2" id="documenter-search-query">Search docs (Ctrl + /)</button><ul class="docs-menu"><li><a class="tocitem" href="../../">Introduction</a></li><li><a class="tocitem" href="../../man/basics/">First Steps with DataFrames.jl</a></li><li><span class="tocitem">User Guide</span><ul><li><a class="tocitem" href="../../man/getting_started/">Getting Started</a></li><li><a class="tocitem" href="../../man/working_with_dataframes/">Working with DataFrames</a></li><li><a class="tocitem" href="../../man/importing_and_exporting/">Importing and Exporting Data (I/O)</a></li><li><a class="tocitem" 
href="../../man/joins/">Joins</a></li><li><a class="tocitem" href="../../man/split_apply_combine/">Split-apply-combine</a></li><li><a class="tocitem" href="../../man/reshaping_and_pivoting/">Reshaping</a></li><li><a class="tocitem" href="../../man/sorting/">Sorting</a></li><li><a class="tocitem" href="../../man/categorical/">Categorical Data</a></li><li><a class="tocitem" href="../../man/missing/">Missing Data</a></li><li><a class="tocitem" href="../../man/querying_frameworks/">Data manipulation frameworks</a></li><li><a class="tocitem" href="../../man/comparisons/">Comparison with Python/R/Stata</a></li></ul></li><li><span class="tocitem">API</span><ul><li><a class="tocitem" href="../types/">Types</a></li><li><a class="tocitem" href="../functions/">Functions</a></li><li><a class="tocitem" href="../indexing/">Indexing</a></li><li><a class="tocitem" href="../metadata/">Metadata</a></li><li class="is-active"><a class="tocitem" href>Internals</a></li></ul></li></ul><div class="docs-version-selector field has-addons"><div class="control"><span class="docs-label button is-static is-size-7">Version</span></div><div class="docs-selector control is-expanded"><div class="select is-fullwidth is-size-7"><select id="documenter-version-selector"></select></div></div></div></nav><div class="docs-main"><header class="docs-navbar"><a class="docs-sidebar-button docs-navbar-link fa-solid fa-bars is-hidden-desktop" id="documenter-sidebar-button" href="#"></a><nav class="breadcrumb"><ul class="is-hidden-mobile"><li><a class="is-disabled">API</a></li><li class="is-active"><a href>Internals</a></li></ul><ul class="is-hidden-tablet"><li class="is-active"><a href>Internals</a></li></ul></nav><div class="docs-right"><a class="docs-navbar-link" href="https://github.com/JuliaData/DataFrames.jl" title="View the repository on GitHub"><span class="docs-icon fa-brands"></span><span class="docs-label is-hidden-touch">GitHub</span></a><a class="docs-navbar-link" 
href="https://github.com/JuliaData/DataFrames.jl/blob/main/docs/src/lib/internals.md" title="Edit source on GitHub"><span class="docs-icon fa-solid"></span></a><a class="docs-settings-button docs-navbar-link fa-solid fa-gear" id="documenter-settings-button" href="#" title="Settings"></a><a class="docs-article-toggle-button fa-solid fa-chevron-up" id="documenter-article-toggle-button" href="javascript:;" title="Collapse all docstrings"></a></div></header><article class="content" id="documenter-page"><h1 id="Internals"><a class="docs-heading-anchor" href="#Internals">Internals</a><a id="Internals-1"></a><a class="docs-heading-anchor-permalink" href="#Internals" title="Permalink"></a></h1><div class="admonition is-warning"><header class="admonition-header">Internal API</header><div class="admonition-body"><p>The functions, methods and types listed on this page are internal to DataFrames and are <strong>not considered to be part of the public API</strong>.</p></div></div><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.compacttype" href="#DataFrames.compacttype"><code>DataFrames.compacttype</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">compacttype(T::Type, maxwidth::Int=8, initial::Bool=true)</code></pre><p>Return compact string representation of type <code>T</code>.</p><p>For displaying data frame we do not want string representation of type to be longer than <code>maxwidth</code>. 
This function implements rules how type names are cropped if they are longer than <code>maxwidth</code>.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/show.jl#L85-L93">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.gennames" href="#DataFrames.gennames"><code>DataFrames.gennames</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">gennames(n::Integer)</code></pre><p>Generate standardized names for columns of a DataFrame. The first name will be <code>:x1</code>, the second <code>:x2</code>, etc.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/other/utils.jl#L124-L129">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.getmaxwidths" href="#DataFrames.getmaxwidths"><code>DataFrames.getmaxwidths</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">DataFrames.getmaxwidths(df::AbstractDataFrame,
+<html lang="en"><head><meta charset="UTF-8"/><meta name="viewport" content="width=device-width, initial-scale=1.0"/><title>Internals · DataFrames.jl</title><meta name="title" content="Internals · DataFrames.jl"/><meta property="og:title" content="Internals · DataFrames.jl"/><meta property="twitter:title" content="Internals · DataFrames.jl"/><meta name="description" content="Documentation for DataFrames.jl."/><meta property="og:description" content="Documentation for DataFrames.jl."/><meta property="twitter:description" content="Documentation for DataFrames.jl."/><meta property="og:url" content="https://juliadata.github.io/DataFrames.jl/stable/lib/internals/"/><meta property="twitter:url" content="https://juliadata.github.io/DataFrames.jl/stable/lib/internals/"/><link rel="canonical" href="https://juliadata.github.io/DataFrames.jl/stable/lib/internals/"/><script data-outdated-warner src="../../assets/warner.js"></script><link href="https://cdnjs.cloudflare.com/ajax/libs/lato-font/3.0.0/css/lato-font.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/juliamono/0.050/juliamono.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/fontawesome.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/solid.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/brands.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/KaTeX/0.16.8/katex.min.css" rel="stylesheet" type="text/css"/><script>documenterBaseURL="../.."</script><script src="https://cdnjs.cloudflare.com/ajax/libs/require.js/2.3.6/require.min.js" data-main="../../assets/documenter.js"></script><script src="../../search_index.js"></script><script src="../../siteinfo.js"></script><script src="../../../versions.js"></script><link 
class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-mocha.css" data-theme-name="catppuccin-mocha"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-macchiato.css" data-theme-name="catppuccin-macchiato"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-frappe.css" data-theme-name="catppuccin-frappe"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-latte.css" data-theme-name="catppuccin-latte"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/documenter-dark.css" data-theme-name="documenter-dark" data-theme-primary-dark/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/documenter-light.css" data-theme-name="documenter-light" data-theme-primary/><script src="../../assets/themeswap.js"></script><link href="../../assets/favicon.ico" rel="icon" type="image/x-icon"/></head><body><div id="documenter"><nav class="docs-sidebar"><a class="docs-logo" href="../../"><img src="../../assets/logo.png" alt="DataFrames.jl logo"/></a><div class="docs-package-name"><span class="docs-autofit"><a href="../../">DataFrames.jl</a></span></div><button class="docs-search-query input is-rounded is-small is-clickable my-2 mx-auto py-1 px-2" id="documenter-search-query">Search docs (Ctrl + /)</button><ul class="docs-menu"><li><a class="tocitem" href="../../">Introduction</a></li><li><a class="tocitem" href="../../man/basics/">First Steps with DataFrames.jl</a></li><li><span class="tocitem">User Guide</span><ul><li><a class="tocitem" href="../../man/getting_started/">Getting Started</a></li><li><a class="tocitem" href="../../man/working_with_dataframes/">Working with DataFrames</a></li><li><a class="tocitem" href="../../man/importing_and_exporting/">Importing and Exporting Data (I/O)</a></li><li><a class="tocitem" 
href="../../man/joins/">Joins</a></li><li><a class="tocitem" href="../../man/split_apply_combine/">Split-apply-combine</a></li><li><a class="tocitem" href="../../man/reshaping_and_pivoting/">Reshaping</a></li><li><a class="tocitem" href="../../man/sorting/">Sorting</a></li><li><a class="tocitem" href="../../man/categorical/">Categorical Data</a></li><li><a class="tocitem" href="../../man/missing/">Missing Data</a></li><li><a class="tocitem" href="../../man/querying_frameworks/">Data manipulation frameworks</a></li><li><a class="tocitem" href="../../man/comparisons/">Comparison with Python/R/Stata</a></li></ul></li><li><span class="tocitem">API</span><ul><li><a class="tocitem" href="../types/">Types</a></li><li><a class="tocitem" href="../functions/">Functions</a></li><li><a class="tocitem" href="../indexing/">Indexing</a></li><li><a class="tocitem" href="../metadata/">Metadata</a></li><li class="is-active"><a class="tocitem" href>Internals</a></li></ul></li></ul><div class="docs-version-selector field has-addons"><div class="control"><span class="docs-label button is-static is-size-7">Version</span></div><div class="docs-selector control is-expanded"><div class="select is-fullwidth is-size-7"><select id="documenter-version-selector"></select></div></div></div></nav><div class="docs-main"><header class="docs-navbar"><a class="docs-sidebar-button docs-navbar-link fa-solid fa-bars is-hidden-desktop" id="documenter-sidebar-button" href="#"></a><nav class="breadcrumb"><ul class="is-hidden-mobile"><li><a class="is-disabled">API</a></li><li class="is-active"><a href>Internals</a></li></ul><ul class="is-hidden-tablet"><li class="is-active"><a href>Internals</a></li></ul></nav><div class="docs-right"><a class="docs-navbar-link" href="https://github.com/JuliaData/DataFrames.jl" title="View the repository on GitHub"><span class="docs-icon fa-brands"></span><span class="docs-label is-hidden-touch">GitHub</span></a><a class="docs-navbar-link" 
href="https://github.com/JuliaData/DataFrames.jl/blob/main/docs/src/lib/internals.md" title="Edit source on GitHub"><span class="docs-icon fa-solid"></span></a><a class="docs-settings-button docs-navbar-link fa-solid fa-gear" id="documenter-settings-button" href="#" title="Settings"></a><a class="docs-article-toggle-button fa-solid fa-chevron-up" id="documenter-article-toggle-button" href="javascript:;" title="Collapse all docstrings"></a></div></header><article class="content" id="documenter-page"><h1 id="Internals"><a class="docs-heading-anchor" href="#Internals">Internals</a><a id="Internals-1"></a><a class="docs-heading-anchor-permalink" href="#Internals" title="Permalink"></a></h1><div class="admonition is-warning"><header class="admonition-header">Internal API</header><div class="admonition-body"><p>The functions, methods and types listed on this page are internal to DataFrames and are <strong>not considered to be part of the public API</strong>.</p></div></div><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.compacttype" href="#DataFrames.compacttype"><code>DataFrames.compacttype</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">compacttype(T::Type, maxwidth::Int=8, initial::Bool=true)</code></pre><p>Return compact string representation of type <code>T</code>.</p><p>For displaying data frame we do not want string representation of type to be longer than <code>maxwidth</code>. 
This function implements rules how type names are cropped if they are longer than <code>maxwidth</code>.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/show.jl#L85-L93">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.gennames" href="#DataFrames.gennames"><code>DataFrames.gennames</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">gennames(n::Integer)</code></pre><p>Generate standardized names for columns of a DataFrame. The first name will be <code>:x1</code>, the second <code>:x2</code>, etc.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/other/utils.jl#L124-L129">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.getmaxwidths" href="#DataFrames.getmaxwidths"><code>DataFrames.getmaxwidths</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">DataFrames.getmaxwidths(df::AbstractDataFrame,
                         io::IO,
                         rowindices1::AbstractVector{Int},
                         rowindices2::AbstractVector{Int},
                         rowlabel::Symbol,
                         rowid::Union{Integer, Nothing},
                         show_eltype::Bool,
-                        buffer::IOBuffer)</code></pre><p>Calculate, for each column of an AbstractDataFrame, the maximum string width used to render the name of that column, its type, and the longest entry in that column – among the rows of the data frame will be rendered to IO. The widths for all columns are returned as a vector.</p><p>Return a <code>Vector{Int}</code> giving the maximum string widths required to render each column, including that column&#39;s name and type.</p><p>NOTE: The last entry of the result vector is the string width of the implicit row ID column contained in every <code>AbstractDataFrame</code>.</p><p><strong>Arguments</strong></p><ul><li><code>df::AbstractDataFrame</code>: The data frame whose columns will be printed.</li><li><code>io::IO</code>: The <code>IO</code> to which <code>df</code> is to be printed</li><li>`rowindices1::AbstractVector{Int}: A set of indices of the first chunk of the AbstractDataFrame that would be rendered to IO.</li><li>`rowindices2::AbstractVector{Int}: A set of indices of the second chunk of the AbstractDataFrame that would be rendered to IO. Can be empty if the AbstractDataFrame would be printed without any ellipses.</li><li><code>rowlabel::AbstractString</code>: The label that will be used when rendered the numeric ID&#39;s of each row. 
Typically, this will be set to &quot;Row&quot;.</li><li><code>rowid</code>: Used to handle showing <code>DataFrameRow</code>.</li><li><code>show_eltype</code>: Whether to print the column type  under the column name in the heading.</li><li><code>buffer</code>: buffer passed around to avoid reallocations in <code>ourstrwidth</code></li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/io.jl#L1-L38">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.ourshow" href="#DataFrames.ourshow"><code>DataFrames.ourshow</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">DataFrames.ourshow(io::IO, x::Any, truncstring::Int)</code></pre><p>Render a value to an <code>IO</code> object compactly using print. 
<code>truncstring</code> indicates the approximate number of text characters width to truncate the output (if it is a non-positive value then no truncation is applied).</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/show.jl#L28-L34">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.ourstrwidth" href="#DataFrames.ourstrwidth"><code>DataFrames.ourstrwidth</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">DataFrames.ourstrwidth(io::IO, x::Any, buffer::IOBuffer, truncstring::Int)</code></pre><p>Determine the number of characters that would be used to print a value.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/show.jl#L5-L9">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.@spawn_for_chunks" href="#DataFrames.@spawn_for_chunks"><code>DataFrames.@spawn_for_chunks</code></a> — <span class="docstring-category">Macro</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">@spawn_for_chunks basesize for i in range ... 
end</code></pre><p>Parallelize a <code>for</code> loop by spawning separate tasks iterating each over a chunk of at least <code>basesize</code> elements in <code>range</code>.</p><p>A number of tasks higher than <code>Threads.nthreads()</code> may be spawned, since that can allow for a more efficient load balancing in case some threads are busy (nested parallelism).</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/other/utils.jl#L197-L207">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.@spawn_or_run_task" href="#DataFrames.@spawn_or_run_task"><code>DataFrames.@spawn_or_run_task</code></a> — <span class="docstring-category">Macro</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">@spawn_or_run_task threads expr</code></pre><p>Equivalent to <code>Threads.@spawn</code> if <code>threads === true</code>, otherwise run <code>expr</code> and return a <code>Task</code> that returns its value.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/other/utils.jl#L218-L223">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.@spawn_or_run" href="#DataFrames.@spawn_or_run"><code>DataFrames.@spawn_or_run</code></a> — <span class="docstring-category">Macro</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia 
hljs">@spawn_or_run threads expr</code></pre><p>Equivalent to <code>Threads.@spawn</code> if <code>threads === true</code>, otherwise run <code>expr</code>.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/other/utils.jl#L257-L262">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.default_table_transformation" href="#DataFrames.default_table_transformation"><code>DataFrames.default_table_transformation</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">default_table_transformation(df_sel::AbstractDataFrame, fun)</code></pre><p>This is a default implementation called when <code>AsTable(...) =&gt; fun</code> is requested. 
The <code>df_sel</code> argument is a data frame storing columns selected by <code>AsTable(...)</code> selector.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/selectionfast.jl#L91-L97">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.isreadonly" href="#DataFrames.isreadonly"><code>DataFrames.isreadonly</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">isreadonly(fun)</code></pre><p>Trait returning a <code>Bool</code> indicator if function <code>fun</code> is only reading the passed argument. Such a function guarantees not to modify nor return in any form the passed argument. By default <code>false</code> is returned.</p><p>This function might become a part of the public API of DataFrames.jl in the future, currently it should be considered experimental. Adding a method to <code>isreadonly</code> for a specific function <code>fun</code> will improve performance of <code>AsTable(...) 
=&gt; ByRow(fun∘collect)</code> operation.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/selectionfast.jl#L57-L68">source</a></section></article></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../metadata/">« Metadata</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.7.0 on <span class="colophon-date" title="Saturday 7 September 2024 11:00">Saturday 7 September 2024</span>. Using Julia version 1.10.5.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
+                        buffer::IOBuffer)</code></pre><p>Calculate, for each column of an AbstractDataFrame, the maximum string width used to render the name of that column, its type, and the longest entry in that column – among the rows of the data frame will be rendered to IO. The widths for all columns are returned as a vector.</p><p>Return a <code>Vector{Int}</code> giving the maximum string widths required to render each column, including that column&#39;s name and type.</p><p>NOTE: The last entry of the result vector is the string width of the implicit row ID column contained in every <code>AbstractDataFrame</code>.</p><p><strong>Arguments</strong></p><ul><li><code>df::AbstractDataFrame</code>: The data frame whose columns will be printed.</li><li><code>io::IO</code>: The <code>IO</code> to which <code>df</code> is to be printed</li><li>`rowindices1::AbstractVector{Int}: A set of indices of the first chunk of the AbstractDataFrame that would be rendered to IO.</li><li>`rowindices2::AbstractVector{Int}: A set of indices of the second chunk of the AbstractDataFrame that would be rendered to IO. Can be empty if the AbstractDataFrame would be printed without any ellipses.</li><li><code>rowlabel::AbstractString</code>: The label that will be used when rendered the numeric ID&#39;s of each row. 
Typically, this will be set to &quot;Row&quot;.</li><li><code>rowid</code>: Used to handle showing <code>DataFrameRow</code>.</li><li><code>show_eltype</code>: Whether to print the column type  under the column name in the heading.</li><li><code>buffer</code>: buffer passed around to avoid reallocations in <code>ourstrwidth</code></li></ul></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/io.jl#L1-L38">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.ourshow" href="#DataFrames.ourshow"><code>DataFrames.ourshow</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">DataFrames.ourshow(io::IO, x::Any, truncstring::Int)</code></pre><p>Render a value to an <code>IO</code> object compactly using print. 
<code>truncstring</code> indicates the approximate number of text characters width to truncate the output (if it is a non-positive value then no truncation is applied).</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/show.jl#L28-L34">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.ourstrwidth" href="#DataFrames.ourstrwidth"><code>DataFrames.ourstrwidth</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">DataFrames.ourstrwidth(io::IO, x::Any, buffer::IOBuffer, truncstring::Int)</code></pre><p>Determine the number of characters that would be used to print a value.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/show.jl#L5-L9">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.@spawn_for_chunks" href="#DataFrames.@spawn_for_chunks"><code>DataFrames.@spawn_for_chunks</code></a> — <span class="docstring-category">Macro</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">@spawn_for_chunks basesize for i in range ... 
end</code></pre><p>Parallelize a <code>for</code> loop by spawning separate tasks iterating each over a chunk of at least <code>basesize</code> elements in <code>range</code>.</p><p>A number of tasks higher than <code>Threads.nthreads()</code> may be spawned, since that can allow for a more efficient load balancing in case some threads are busy (nested parallelism).</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/other/utils.jl#L197-L207">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.@spawn_or_run_task" href="#DataFrames.@spawn_or_run_task"><code>DataFrames.@spawn_or_run_task</code></a> — <span class="docstring-category">Macro</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">@spawn_or_run_task threads expr</code></pre><p>Equivalent to <code>Threads.@spawn</code> if <code>threads === true</code>, otherwise run <code>expr</code> and return a <code>Task</code> that returns its value.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/other/utils.jl#L218-L223">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.@spawn_or_run" href="#DataFrames.@spawn_or_run"><code>DataFrames.@spawn_or_run</code></a> — <span class="docstring-category">Macro</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia 
hljs">@spawn_or_run threads expr</code></pre><p>Equivalent to <code>Threads.@spawn</code> if <code>threads === true</code>, otherwise run <code>expr</code>.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/other/utils.jl#L257-L262">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.default_table_transformation" href="#DataFrames.default_table_transformation"><code>DataFrames.default_table_transformation</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">default_table_transformation(df_sel::AbstractDataFrame, fun)</code></pre><p>This is a default implementation called when <code>AsTable(...) =&gt; fun</code> is requested. 
The <code>df_sel</code> argument is a data frame storing columns selected by <code>AsTable(...)</code> selector.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/selectionfast.jl#L91-L97">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.isreadonly" href="#DataFrames.isreadonly"><code>DataFrames.isreadonly</code></a> — <span class="docstring-category">Function</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">isreadonly(fun)</code></pre><p>Trait returning a <code>Bool</code> indicator if function <code>fun</code> is only reading the passed argument. Such a function guarantees not to modify nor return in any form the passed argument. By default <code>false</code> is returned.</p><p>This function might become a part of the public API of DataFrames.jl in the future, currently it should be considered experimental. Adding a method to <code>isreadonly</code> for a specific function <code>fun</code> will improve performance of <code>AsTable(...) 
=&gt; ByRow(fun∘collect)</code> operation.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/selectionfast.jl#L57-L68">source</a></section></article></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../metadata/">« Metadata</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.7.0 on <span class="colophon-date" title="Sunday 8 September 2024 08:54">Sunday 8 September 2024</span>. Using Julia version 1.10.5.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
diff --git a/dev/lib/metadata/index.html b/dev/lib/metadata/index.html
index 8b18caf56..21fc2c443 100644
--- a/dev/lib/metadata/index.html
+++ b/dev/lib/metadata/index.html
@@ -72,4 +72,4 @@
 julia&gt; emptycolmetadata!(df);
 
 julia&gt; colmetadatakeys(df)
-()</code></pre><h2 id="Propagation-of-:note-style-metadata"><a class="docs-heading-anchor" href="#Propagation-of-:note-style-metadata">Propagation of <code>:note</code>-style metadata</a><a id="Propagation-of-:note-style-metadata-1"></a><a class="docs-heading-anchor-permalink" href="#Propagation-of-:note-style-metadata" title="Permalink"></a></h2><p>An important design feature of <code>:note</code>-style metadata is how it is handled when data frames are transformed.</p><div class="admonition is-info"><header class="admonition-header">Note</header><div class="admonition-body"><p>The provided rules might slightly change in the future. Any change to <code>:note</code>-style metadata propagation rules will not be considered as breaking and can be done in any minor release of DataFrames.jl. Such changes might be made based on users&#39; feedback about what metadata propagation rules are most convenient in practice.</p></div></div><p>The general design rules for propagation of <code>:note</code>-style metadata are as follows.</p><p>For operations that take a single data frame as an input:</p><ul><li>Table level metadata is propagated to the returned data frame object.</li><li>For column-level metadata:<ul><li>in all cases when a single column is transformed to a single column and the name of the column does not change (or is automatically changed e.g. 
to de-duplicate column names or via column renaming in joins) column-level metadata is preserved (example operations of this kind are <code>getindex</code>, <code>subset</code>, joins, <code>mapcols</code>).</li><li>in all cases when a single column is transformed with <code>identity</code> or <code>copy</code> to a single column, column-level metadata is preserved even if column name is changed (example operations of this kind are <code>rename</code>, or the <code>:x =&gt; :y</code> or <code>:x =&gt; copy =&gt; :y</code> operation specification in <code>select</code>).</li></ul></li></ul><p>For operations that take multiple data frames as their input two cases are distinguished:</p><ul><li>When there is a natural main table in the operation (<code>append!</code>, <code>prepend!</code>, <code>leftjoin</code>, <code>leftjoin!</code>, <code>rightjoin</code>, <code>semijoin</code>, <code>antijoin</code>, <code>setindex!</code>):<ul><li>table-level metadata is taken from the main table;</li><li>column-level metadata for columns from the main table is taken from main table;</li><li>column-level metadata for columns from the non-main table is taken only for columns not present in the main table.</li></ul></li><li>When all tables are equivalent (<code>hcat</code>, <code>vcat</code>, <code>innerjoin</code>, <code>outerjoin</code>):<ul><li>table-level metadata is preserved only for keys which are defined in all passed tables and have the same value;</li><li>column-level metadata is preserved only for keys which are defined in all passed tables that contain this column and have the same value.</li></ul></li></ul><p>In all these operations when metadata is preserved the values in the key-value pairs are not copied (this is relevant in case of mutable values).</p><div class="admonition is-info"><header class="admonition-header">Note</header><div class="admonition-body"><p>The rules for column-level <code>:note</code>-style metadata propagation are designed to make the right 
decision in common cases. In particular, they assume that if source and target column name is the same then the metadata for the column is not changed. While this is valid for many operations, it is not always true in general. For example the <code>:x =&gt; ByRow(log) =&gt; :x</code> transformation might invalidate metadata if it contained unit of measure of the variable. In such cases user must either use a different name for the output column, set metadata style to <code>:default</code> before the operation, or manually drop or update such metadata from the <code>:x</code> column after the transformation.</p></div></div><h3 id="Operations-that-preserve-:note-style-metadata"><a class="docs-heading-anchor" href="#Operations-that-preserve-:note-style-metadata">Operations that preserve <code>:note</code>-style metadata</a><a id="Operations-that-preserve-:note-style-metadata-1"></a><a class="docs-heading-anchor-permalink" href="#Operations-that-preserve-:note-style-metadata" title="Permalink"></a></h3><p>Most of the functions in DataFrames.jl only preserve table and column metadata whose style is <code>:note</code>. Some functions use a more complex logic, even if they follow the general rules described above (in particular under any transformation all non-<code>:note</code>-style metadata is always dropped). 
These are:</p><ul><li><a href="../functions/#DataAPI.describe"><code>describe</code></a> drops all metadata.</li><li><a href="../functions/#Base.hcat"><code>hcat</code></a>: propagates table-level metadata only for keys which are defined in all passed tables and have the same value; column-level metadata is preserved.</li><li><a href="../functions/#Base.vcat"><code>vcat</code></a>: propagates table-level metadata only for keys which are defined in all passed tables and have the same value; column-level metadata is preserved only for keys which are defined in all passed tables that contain this column and have the same value;</li><li><a href="../functions/#Base.stack"><code>stack</code></a>: propagates table-level metadata and column-level metadata for identifier columns.</li><li><a href="../functions/#DataFrames.unstack"><code>unstack</code></a>: propagates table-level metadata and column-level metadata for row keys columns.</li><li><a href="../functions/#Base.permutedims"><code>permutedims</code></a>: propagates table-level metadata and drops column-level  metadata.</li><li>broadcasted assignment does not change target metadata; under Julia earlier than 1.7 operation of kind <code>df.a .= s</code> does not drop non-<code>:note</code>-style metadata; under Julia 1.7 or later this operation preserves only <code>:note</code>-style metadata</li><li>broadcasting propagates table-level metadata if some key is present in all passed data frames and value associated with it is identical in all passed data frames; column-level metadata is propagated for columns if some key for a given column is present in all passed data frames and value associated with it is identical in all passed data frames.</li><li><code>getindex</code> preserves table-level metadata and column-level metadata for selected columns</li><li><code>setindex!</code> does not affect table-level and column-level metadata</li><li><a href="../functions/#Base.push!"><code>push!</code></a>, <a 
href="../functions/#Base.pushfirst!"><code>pushfirst!</code></a>, <a href="../functions/#Base.insert!"><code>insert!</code></a> do not affect table-level nor column-level metadata (even if they add new columns and pushed row is a <code>DataFrameRow</code> or other value supporting metadata interface)</li><li><a href="../functions/#Base.append!"><code>append!</code></a> and <a href="../functions/#Base.prepend!"><code>prepend!</code></a> do not change table and column-level metadata of the destination data frame, except that if new columns are added and these columns have metadata in the appended/prepended table then this metadata is preserved.</li><li><a href="../functions/#DataFrames.leftjoin!"><code>leftjoin!</code></a>, <a href="../functions/#DataAPI.leftjoin"><code>leftjoin</code></a>: table and column-level metadata is taken from the left table except for non-key columns from right table for which metadata is taken from right table;</li><li><a href="../functions/#DataAPI.rightjoin"><code>rightjoin</code></a>: table and column-level metadata is taken from the right table except for non-key columns from left table for which metadata is taken from left table;</li><li><a href="../functions/#DataAPI.innerjoin"><code>innerjoin</code></a>, <a href="../functions/#DataAPI.outerjoin"><code>outerjoin</code></a>: propagates table-level metadata only for keys that are defined in all passed data frames and have the same value; column-level metadata is propagated for all columns except for key columns, for which it is propagated only for keys that are defined in all passed data frames and have the same value.</li><li><a href="../functions/#DataAPI.semijoin"><code>semijoin</code></a>, <a href="../functions/#DataAPI.antijoin"><code>antijoin</code></a>: table and column-level metadata is taken from the left table.</li><li><a href="../functions/#DataAPI.crossjoin"><code>crossjoin</code></a>: propagates table-level metadata only for keys that are defined in both passed data frames 
and have the same value; propagates column-level metadata from both passed data frames.</li><li><a href="../functions/#DataFrames.select"><code>select</code></a>, <a href="../functions/#DataFrames.select!"><code>select!</code></a>, <a href="../functions/#DataFrames.transform"><code>transform</code></a>, <a href="../functions/#DataFrames.transform!"><code>transform!</code></a>, <a href="../functions/#DataFrames.combine"><code>combine</code></a>: propagate table-level metadata; column-level metadata is propagated if: a) a single column is transformed to a single column and the name of the column does not change    (this includes all column selection operations), or b) a single column is transformed with <code>identity</code> or <code>copy</code> to a single column    even if column name is changed (this includes column renaming).</li></ul></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../indexing/">« Indexing</a><a class="docs-footer-nextpage" href="../internals/">Internals »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option 
value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.7.0 on <span class="colophon-date" title="Saturday 7 September 2024 11:00">Saturday 7 September 2024</span>. Using Julia version 1.10.5.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
+()</code></pre><h2 id="Propagation-of-:note-style-metadata"><a class="docs-heading-anchor" href="#Propagation-of-:note-style-metadata">Propagation of <code>:note</code>-style metadata</a><a id="Propagation-of-:note-style-metadata-1"></a><a class="docs-heading-anchor-permalink" href="#Propagation-of-:note-style-metadata" title="Permalink"></a></h2><p>An important design feature of <code>:note</code>-style metadata is how it is handled when data frames are transformed.</p><div class="admonition is-info"><header class="admonition-header">Note</header><div class="admonition-body"><p>The provided rules might slightly change in the future. Any change to <code>:note</code>-style metadata propagation rules will not be considered as breaking and can be done in any minor release of DataFrames.jl. Such changes might be made based on users&#39; feedback about what metadata propagation rules are most convenient in practice.</p></div></div><p>The general design rules for propagation of <code>:note</code>-style metadata are as follows.</p><p>For operations that take a single data frame as an input:</p><ul><li>Table level metadata is propagated to the returned data frame object.</li><li>For column-level metadata:<ul><li>in all cases when a single column is transformed to a single column and the name of the column does not change (or is automatically changed e.g. 
to de-duplicate column names or via column renaming in joins) column-level metadata is preserved (example operations of this kind are <code>getindex</code>, <code>subset</code>, joins, <code>mapcols</code>).</li><li>in all cases when a single column is transformed with <code>identity</code> or <code>copy</code> to a single column, column-level metadata is preserved even if column name is changed (example operations of this kind are <code>rename</code>, or the <code>:x =&gt; :y</code> or <code>:x =&gt; copy =&gt; :y</code> operation specification in <code>select</code>).</li></ul></li></ul><p>For operations that take multiple data frames as their input two cases are distinguished:</p><ul><li>When there is a natural main table in the operation (<code>append!</code>, <code>prepend!</code>, <code>leftjoin</code>, <code>leftjoin!</code>, <code>rightjoin</code>, <code>semijoin</code>, <code>antijoin</code>, <code>setindex!</code>):<ul><li>table-level metadata is taken from the main table;</li><li>column-level metadata for columns from the main table is taken from main table;</li><li>column-level metadata for columns from the non-main table is taken only for columns not present in the main table.</li></ul></li><li>When all tables are equivalent (<code>hcat</code>, <code>vcat</code>, <code>innerjoin</code>, <code>outerjoin</code>):<ul><li>table-level metadata is preserved only for keys which are defined in all passed tables and have the same value;</li><li>column-level metadata is preserved only for keys which are defined in all passed tables that contain this column and have the same value.</li></ul></li></ul><p>In all these operations when metadata is preserved the values in the key-value pairs are not copied (this is relevant in case of mutable values).</p><div class="admonition is-info"><header class="admonition-header">Note</header><div class="admonition-body"><p>The rules for column-level <code>:note</code>-style metadata propagation are designed to make the right 
decision in common cases. In particular, they assume that if source and target column name is the same then the metadata for the column is not changed. While this is valid for many operations, it is not always true in general. For example the <code>:x =&gt; ByRow(log) =&gt; :x</code> transformation might invalidate metadata if it contained unit of measure of the variable. In such cases user must either use a different name for the output column, set metadata style to <code>:default</code> before the operation, or manually drop or update such metadata from the <code>:x</code> column after the transformation.</p></div></div><h3 id="Operations-that-preserve-:note-style-metadata"><a class="docs-heading-anchor" href="#Operations-that-preserve-:note-style-metadata">Operations that preserve <code>:note</code>-style metadata</a><a id="Operations-that-preserve-:note-style-metadata-1"></a><a class="docs-heading-anchor-permalink" href="#Operations-that-preserve-:note-style-metadata" title="Permalink"></a></h3><p>Most of the functions in DataFrames.jl only preserve table and column metadata whose style is <code>:note</code>. Some functions use a more complex logic, even if they follow the general rules described above (in particular under any transformation all non-<code>:note</code>-style metadata is always dropped). 
These are:</p><ul><li><a href="../functions/#DataAPI.describe"><code>describe</code></a> drops all metadata.</li><li><a href="../functions/#Base.hcat"><code>hcat</code></a>: propagates table-level metadata only for keys which are defined in all passed tables and have the same value; column-level metadata is preserved.</li><li><a href="../functions/#Base.vcat"><code>vcat</code></a>: propagates table-level metadata only for keys which are defined in all passed tables and have the same value; column-level metadata is preserved only for keys which are defined in all passed tables that contain this column and have the same value;</li><li><a href="../functions/#Base.stack"><code>stack</code></a>: propagates table-level metadata and column-level metadata for identifier columns.</li><li><a href="../functions/#DataFrames.unstack"><code>unstack</code></a>: propagates table-level metadata and column-level metadata for row keys columns.</li><li><a href="../functions/#Base.permutedims"><code>permutedims</code></a>: propagates table-level metadata and drops column-level  metadata.</li><li>broadcasted assignment does not change target metadata; under Julia earlier than 1.7 operation of kind <code>df.a .= s</code> does not drop non-<code>:note</code>-style metadata; under Julia 1.7 or later this operation preserves only <code>:note</code>-style metadata</li><li>broadcasting propagates table-level metadata if some key is present in all passed data frames and value associated with it is identical in all passed data frames; column-level metadata is propagated for columns if some key for a given column is present in all passed data frames and value associated with it is identical in all passed data frames.</li><li><code>getindex</code> preserves table-level metadata and column-level metadata for selected columns</li><li><code>setindex!</code> does not affect table-level and column-level metadata</li><li><a href="../functions/#Base.push!"><code>push!</code></a>, <a 
href="../functions/#Base.pushfirst!"><code>pushfirst!</code></a>, <a href="../functions/#Base.insert!"><code>insert!</code></a> do not affect table-level nor column-level metadata (even if they add new columns and pushed row is a <code>DataFrameRow</code> or other value supporting metadata interface)</li><li><a href="../functions/#Base.append!"><code>append!</code></a> and <a href="../functions/#Base.prepend!"><code>prepend!</code></a> do not change table and column-level metadata of the destination data frame, except that if new columns are added and these columns have metadata in the appended/prepended table then this metadata is preserved.</li><li><a href="../functions/#DataFrames.leftjoin!"><code>leftjoin!</code></a>, <a href="../functions/#DataAPI.leftjoin"><code>leftjoin</code></a>: table and column-level metadata is taken from the left table except for non-key columns from right table for which metadata is taken from right table;</li><li><a href="../functions/#DataAPI.rightjoin"><code>rightjoin</code></a>: table and column-level metadata is taken from the right table except for non-key columns from left table for which metadata is taken from left table;</li><li><a href="../functions/#DataAPI.innerjoin"><code>innerjoin</code></a>, <a href="../functions/#DataAPI.outerjoin"><code>outerjoin</code></a>: propagates table-level metadata only for keys that are defined in all passed data frames and have the same value; column-level metadata is propagated for all columns except for key columns, for which it is propagated only for keys that are defined in all passed data frames and have the same value.</li><li><a href="../functions/#DataAPI.semijoin"><code>semijoin</code></a>, <a href="../functions/#DataAPI.antijoin"><code>antijoin</code></a>: table and column-level metadata is taken from the left table.</li><li><a href="../functions/#DataAPI.crossjoin"><code>crossjoin</code></a>: propagates table-level metadata only for keys that are defined in both passed data frames 
and have the same value; propagates column-level metadata from both passed data frames.</li><li><a href="../functions/#DataFrames.select"><code>select</code></a>, <a href="../functions/#DataFrames.select!"><code>select!</code></a>, <a href="../functions/#DataFrames.transform"><code>transform</code></a>, <a href="../functions/#DataFrames.transform!"><code>transform!</code></a>, <a href="../functions/#DataFrames.combine"><code>combine</code></a>: propagate table-level metadata; column-level metadata is propagated if: a) a single column is transformed to a single column and the name of the column does not change    (this includes all column selection operations), or b) a single column is transformed with <code>identity</code> or <code>copy</code> to a single column    even if column name is changed (this includes column renaming).</li></ul></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../indexing/">« Indexing</a><a class="docs-footer-nextpage" href="../internals/">Internals »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option 
value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.7.0 on <span class="colophon-date" title="Sunday 8 September 2024 08:54">Sunday 8 September 2024</span>. Using Julia version 1.10.5.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
diff --git a/dev/lib/types/index.html b/dev/lib/types/index.html
index abd1f62b0..db4203948 100644
--- a/dev/lib/types/index.html
+++ b/dev/lib/types/index.html
@@ -1,5 +1,5 @@
 <!DOCTYPE html>
-<html lang="en"><head><meta charset="UTF-8"/><meta name="viewport" content="width=device-width, initial-scale=1.0"/><title>Types · DataFrames.jl</title><meta name="title" content="Types · DataFrames.jl"/><meta property="og:title" content="Types · DataFrames.jl"/><meta property="twitter:title" content="Types · DataFrames.jl"/><meta name="description" content="Documentation for DataFrames.jl."/><meta property="og:description" content="Documentation for DataFrames.jl."/><meta property="twitter:description" content="Documentation for DataFrames.jl."/><meta property="og:url" content="https://juliadata.github.io/DataFrames.jl/stable/lib/types/"/><meta property="twitter:url" content="https://juliadata.github.io/DataFrames.jl/stable/lib/types/"/><link rel="canonical" href="https://juliadata.github.io/DataFrames.jl/stable/lib/types/"/><script data-outdated-warner src="../../assets/warner.js"></script><link href="https://cdnjs.cloudflare.com/ajax/libs/lato-font/3.0.0/css/lato-font.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/juliamono/0.050/juliamono.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/fontawesome.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/solid.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/brands.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/KaTeX/0.16.8/katex.min.css" rel="stylesheet" type="text/css"/><script>documenterBaseURL="../.."</script><script src="https://cdnjs.cloudflare.com/ajax/libs/require.js/2.3.6/require.min.js" data-main="../../assets/documenter.js"></script><script src="../../search_index.js"></script><script src="../../siteinfo.js"></script><script src="../../../versions.js"></script><link class="docs-theme-link" rel="stylesheet" 
type="text/css" href="../../assets/themes/catppuccin-mocha.css" data-theme-name="catppuccin-mocha"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-macchiato.css" data-theme-name="catppuccin-macchiato"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-frappe.css" data-theme-name="catppuccin-frappe"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-latte.css" data-theme-name="catppuccin-latte"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/documenter-dark.css" data-theme-name="documenter-dark" data-theme-primary-dark/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/documenter-light.css" data-theme-name="documenter-light" data-theme-primary/><script src="../../assets/themeswap.js"></script><link href="../../assets/favicon.ico" rel="icon" type="image/x-icon"/></head><body><div id="documenter"><nav class="docs-sidebar"><a class="docs-logo" href="../../"><img src="../../assets/logo.png" alt="DataFrames.jl logo"/></a><div class="docs-package-name"><span class="docs-autofit"><a href="../../">DataFrames.jl</a></span></div><button class="docs-search-query input is-rounded is-small is-clickable my-2 mx-auto py-1 px-2" id="documenter-search-query">Search docs (Ctrl + /)</button><ul class="docs-menu"><li><a class="tocitem" href="../../">Introduction</a></li><li><a class="tocitem" href="../../man/basics/">First Steps with DataFrames.jl</a></li><li><span class="tocitem">User Guide</span><ul><li><a class="tocitem" href="../../man/getting_started/">Getting Started</a></li><li><a class="tocitem" href="../../man/working_with_dataframes/">Working with DataFrames</a></li><li><a class="tocitem" href="../../man/importing_and_exporting/">Importing and Exporting Data (I/O)</a></li><li><a class="tocitem" href="../../man/joins/">Joins</a></li><li><a 
class="tocitem" href="../../man/split_apply_combine/">Split-apply-combine</a></li><li><a class="tocitem" href="../../man/reshaping_and_pivoting/">Reshaping</a></li><li><a class="tocitem" href="../../man/sorting/">Sorting</a></li><li><a class="tocitem" href="../../man/categorical/">Categorical Data</a></li><li><a class="tocitem" href="../../man/missing/">Missing Data</a></li><li><a class="tocitem" href="../../man/querying_frameworks/">Data manipulation frameworks</a></li><li><a class="tocitem" href="../../man/comparisons/">Comparison with Python/R/Stata</a></li></ul></li><li><span class="tocitem">API</span><ul><li class="is-active"><a class="tocitem" href>Types</a><ul class="internal"><li><a class="tocitem" href="#Type-hierarchy-design"><span>Type hierarchy design</span></a></li><li><a class="tocitem" href="#man-columnhandling"><span>The design of handling of columns of a <code>DataFrame</code></span></a></li><li><a class="tocitem" href="#Types-specification"><span>Types specification</span></a></li></ul></li><li><a class="tocitem" href="../functions/">Functions</a></li><li><a class="tocitem" href="../indexing/">Indexing</a></li><li><a class="tocitem" href="../metadata/">Metadata</a></li></ul></li></ul><div class="docs-version-selector field has-addons"><div class="control"><span class="docs-label button is-static is-size-7">Version</span></div><div class="docs-selector control is-expanded"><div class="select is-fullwidth is-size-7"><select id="documenter-version-selector"></select></div></div></div></nav><div class="docs-main"><header class="docs-navbar"><a class="docs-sidebar-button docs-navbar-link fa-solid fa-bars is-hidden-desktop" id="documenter-sidebar-button" href="#"></a><nav class="breadcrumb"><ul class="is-hidden-mobile"><li><a class="is-disabled">API</a></li><li class="is-active"><a href>Types</a></li></ul><ul class="is-hidden-tablet"><li class="is-active"><a href>Types</a></li></ul></nav><div class="docs-right"><a class="docs-navbar-link" 
href="https://github.com/JuliaData/DataFrames.jl" title="View the repository on GitHub"><span class="docs-icon fa-brands"></span><span class="docs-label is-hidden-touch">GitHub</span></a><a class="docs-navbar-link" href="https://github.com/JuliaData/DataFrames.jl/blob/main/docs/src/lib/types.md" title="Edit source on GitHub"><span class="docs-icon fa-solid"></span></a><a class="docs-settings-button docs-navbar-link fa-solid fa-gear" id="documenter-settings-button" href="#" title="Settings"></a><a class="docs-article-toggle-button fa-solid fa-chevron-up" id="documenter-article-toggle-button" href="javascript:;" title="Collapse all docstrings"></a></div></header><article class="content" id="documenter-page"><h1 id="Types"><a class="docs-heading-anchor" href="#Types">Types</a><a id="Types-1"></a><a class="docs-heading-anchor-permalink" href="#Types" title="Permalink"></a></h1><ul><li><a href="#DataFrames.AbstractDataFrame"><code>DataFrames.AbstractDataFrame</code></a></li><li><a href="#DataFrames.AsTable"><code>DataFrames.AsTable</code></a></li><li><a href="#DataFrames.DataFrame"><code>DataFrames.DataFrame</code></a></li><li><a href="#DataFrames.DataFrameColumns"><code>DataFrames.DataFrameColumns</code></a></li><li><a href="#DataFrames.DataFrameRow"><code>DataFrames.DataFrameRow</code></a></li><li><a href="#DataFrames.DataFrameRows"><code>DataFrames.DataFrameRows</code></a></li><li><a href="#DataFrames.GroupKey"><code>DataFrames.GroupKey</code></a></li><li><a href="#DataFrames.GroupKeys"><code>DataFrames.GroupKeys</code></a></li><li><a href="#DataFrames.GroupedDataFrame"><code>DataFrames.GroupedDataFrame</code></a></li><li><a href="#DataFrames.RepeatedVector"><code>DataFrames.RepeatedVector</code></a></li><li><a href="#DataFrames.StackedVector"><code>DataFrames.StackedVector</code></a></li><li><a href="#DataFrames.SubDataFrame"><code>DataFrames.SubDataFrame</code></a></li></ul><h2 id="Type-hierarchy-design"><a class="docs-heading-anchor" 
href="#Type-hierarchy-design">Type hierarchy design</a><a id="Type-hierarchy-design-1"></a><a class="docs-heading-anchor-permalink" href="#Type-hierarchy-design" title="Permalink"></a></h2><p><code>AbstractDataFrame</code> is an abstract type that provides an interface for data frame types. It is not intended as a fully generic interface for working with tabular data, which is the role of interfaces defined by <a href="https://github.com/JuliaData/Tables.jl/">Tables.jl</a> instead.</p><p><code>DataFrame</code> is the most fundamental subtype of <code>AbstractDataFrame</code>, which stores a set of columns as <code>AbstractVector</code> objects. Indexing of all stored columns must be 1-based. Also, all functions exposed by DataFrames.jl API make sure to <code>collect</code> passed <code>AbstractRange</code> source columns before storing them in a <code>DataFrame</code>.</p><p><code>SubDataFrame</code> is an <code>AbstractDataFrame</code> subtype representing a view into a <code>DataFrame</code>. It stores only a reference to the parent <code>DataFrame</code> and information about which rows and columns from the parent are selected (both as integer indices referring to the parent). Typically it is created using the <code>view</code> function or is returned by indexing into a <code>GroupedDataFrame</code> object.</p><p><code>GroupedDataFrame</code> is a type that stores the result of a  grouping operation performed on an <code>AbstractDataFrame</code>. It is intended to be created as a result of a call to the <code>groupby</code> function.</p><p><code>DataFrameRow</code> is a view into a single row of an <code>AbstractDataFrame</code>. It stores only a reference to a parent <code>DataFrame</code> and information about which row and columns from the parent are selected (both as integer indices referring to the parent). 
The <code>DataFrameRow</code> type supports iteration over columns of the row and is similar in functionality to the <code>NamedTuple</code> type, but allows for modification of data stored in the parent <code>DataFrame</code> and reflects changes done to the parent after the creation of the view. Typically objects of the <code>DataFrameRow</code> type are encountered when returned by the <code>eachrow</code> function, or when accessing a single row of a <code>DataFrame</code> or <code>SubDataFrame</code> via <code>getindex</code> or <code>view</code>.</p><p>The <code>eachrow</code> function returns a value of the <code>DataFrameRows</code> type, which serves as an iterator over rows of an <code>AbstractDataFrame</code>, returning <code>DataFrameRow</code> objects. The <code>DataFrameRows</code> is a subtype of <code>AbstractVector</code> and supports its interface with the exception that it is read-only.</p><p>Similarly, the <code>eachcol</code> function returns a value of the <code>DataFrameColumns</code> type, which is not an <code>AbstractVector</code>, but supports most of its API. The key differences are that it is read-only and that the <code>keys</code> function returns a vector of <code>Symbol</code>s (and not integers as for normal vectors).</p><p>Note that <code>DataFrameRows</code> and <code>DataFrameColumns</code> are not exported and should not be constructed directly, but using the <code>eachrow</code> and <code>eachcol</code> functions.</p><p>The <code>RepeatedVector</code> and <code>StackedVector</code> types are subtypes of <code>AbstractVector</code> and support its interface with the exception that they are read only. 
Note that they are not exported and should not be constructed directly, but they are columns of a <code>DataFrame</code> returned by <code>stack</code> with <code>view=true</code>.</p><p>The <code>ByRow</code> type is a special type used for selection operations to signal that the wrapped function should be applied to each element (row) of the selection.</p><p>The <code>AsTable</code> type is a special type used for selection operations to signal that the columns selected by a wrapped selector should be passed as a <code>NamedTuple</code> to the function or to signal that it is requested to expand the return value of a transformation into multiple columns.</p><h2 id="man-columnhandling"><a class="docs-heading-anchor" href="#man-columnhandling">The design of handling of columns of a <code>DataFrame</code></a><a id="man-columnhandling-1"></a><a class="docs-heading-anchor-permalink" href="#man-columnhandling" title="Permalink"></a></h2><p>When a <code>DataFrame</code> is constructed columns are copied by default. You can disable this behavior by setting <code>copycols</code> keyword argument to <code>false</code>. The exception is if an <code>AbstractRange</code> is passed as a column, then it is always collected to a <code>Vector</code>.</p><p>Also functions that transform a <code>DataFrame</code> to produce a new <code>DataFrame</code> perform a copy of the columns, unless they are passed <code>copycols=false</code> (available only for functions that could perform a transformation without copying the columns). 
Examples of such functions are <a href="../functions/#Base.vcat"><code>vcat</code></a>, <a href="../functions/#Base.hcat"><code>hcat</code></a>, <a href="../functions/#Base.filter"><code>filter</code></a>, <a href="../functions/#DataFrames.dropmissing"><code>dropmissing</code></a>, <code>getindex</code>, <a href="../functions/#Base.copy"><code>copy</code></a> or the <a href="#DataFrames.DataFrame"><code>DataFrame</code></a> constructor mentioned above.</p><p>The generic single-argument constructor <code>DataFrame(table)</code> has <code>copycols=nothing</code> by default, meaning that columns are copied unless <code>table</code> signals that a copy of columns doesn&#39;t need to be made (this is done by wrapping the source table in <code>Tables.CopiedColumns</code>). <a href="https://csv.juliadata.org/stable">CSV.jl</a> does this when <code>CSV.read(file, DataFrame)</code> is called, since columns are built only for the purpose of use in a <code>DataFrame</code> constructor. Another example is <a href="https://arrow.juliadata.org/dev/manual/#Arrow.Table"><code>Arrow.Table</code></a>, where arrow data is inherently immutable so columns can&#39;t be accidentally mutated anyway. To be able to mutate arrow data, columns must be materialized, which can be accomplished via <code>DataFrame(arrow_table, copycols=true)</code>.</p><p>On the contrary, functions that create a view of a <code>DataFrame</code> <em>do not</em> by definition make copies of the columns, and therefore require particular caution. 
This includes <code>view</code>, which returns a <code>SubDataFrame</code> or a <code>DataFrameRow</code>, and <code>groupby</code>, which returns a <code>GroupedDataFrame</code>.</p><p>A partial exception to this rule is the <a href="../functions/#Base.stack"><code>stack</code></a> function with <code>view=true</code> which creates a <code>DataFrame</code> that contains views of the columns from the source <code>DataFrame</code>.</p><p>In-place functions whose names end with <code>!</code> (like <code>sort!</code> or <a href="../functions/#DataFrames.dropmissing!"><code>dropmissing!</code></a>, <code>setindex!</code>, <code>push!</code>, <code>append!</code>) may mutate the column vectors of the <code>DataFrame</code> they take as an argument. These functions are safe to call due to the rules described above, <em>except</em> when a view of the <code>DataFrame</code> is in use (via a <code>SubDataFrame</code>, a <code>DataFrameRow</code> or a <code>GroupedDataFrame</code>). In the latter case, calling such a function on the parent might corrupt the view, which make trigger errors, silently return invalid data or even cause Julia to crash. The same caution applies when <code>DataFrame</code> was created using columns of another <code>DataFrame</code> without copying (for instance when <code>copycols=false</code> in functions such as <code>DataFrame</code> or <code>hcat</code>).</p><p>It is possible to have a direct access to a column <code>col</code> of a <code>DataFrame</code> <code>df</code> (e.g. 
this can be useful in performance critical code to avoid copying), using one of the following methods:</p><ul><li>via the <code>getproperty</code> function using the syntax <code>df.col</code>;</li><li>via the <code>getindex</code> function using the syntax <code>df[!, :col]</code> (note this is in contrast to <code>df[:, :col]</code> which copies);</li><li>by creating a <code>DataFrameColumns</code> object using the <a href="../functions/#Base.eachcol"><code>eachcol</code></a> function;</li><li>by calling the <code>parent</code> function on a view of a column of the <code>DataFrame</code>, e.g. <code>parent(@view df[:, :col])</code>;</li><li>by storing the reference to the column before creating a <code>DataFrame</code> with <code>copycols=false</code>;</li></ul><p>A column obtained from a <code>DataFrame</code> using one of the above methods should not be mutated without caution because:</p><ul><li>resizing a column vector will corrupt its parent <code>DataFrame</code> and any associated views as methods only check the length of the column when it is added to the <code>DataFrame</code> and later assume that all columns have the same length;</li><li>reordering values in a column vector (e.g. 
using <code>sort!</code>) will break the consistency of rows with other columns, which will also affect views (if any);</li><li>changing values contained in a column vector is acceptable as long as it is not used as a grouping column in a <code>GroupedDataFrame</code> created based on the <code>DataFrame</code>.</li></ul><h2 id="Types-specification"><a class="docs-heading-anchor" href="#Types-specification">Types specification</a><a id="Types-specification-1"></a><a class="docs-heading-anchor-permalink" href="#Types-specification" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.AbstractDataFrame" href="#DataFrames.AbstractDataFrame"><code>DataFrames.AbstractDataFrame</code></a> — <span class="docstring-category">Type</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">AbstractDataFrame</code></pre><p>An abstract type for which all concrete types expose an interface for working with tabular data.</p><p>An <code>AbstractDataFrame</code> is a two-dimensional table with <code>Symbol</code>s or strings for column names.</p><p>DataFrames.jl defines two types that are subtypes of <code>AbstractDataFrame</code>: <a href="#DataFrames.DataFrame"><code>DataFrame</code></a> and <a href="#DataFrames.SubDataFrame"><code>SubDataFrame</code></a>.</p><p><strong>Indexing and broadcasting</strong></p><p><code>AbstractDataFrame</code> can be indexed by passing two indices specifying row and column selectors. The allowed indices are a superset of indices that can be used for standard arrays. You can also access a single column of an <code>AbstractDataFrame</code> using <code>getproperty</code> and <code>setproperty!</code> functions. 
Columns can be selected using integers, <code>Symbol</code>s, or strings. In broadcasting <code>AbstractDataFrame</code> behavior is similar to a <code>Matrix</code>.</p><p>A detailed description of <code>getindex</code>, <code>setindex!</code>, <code>getproperty</code>, <code>setproperty!</code>, broadcasting and broadcasting assignment for data frames is given in the <a href="https://juliadata.github.io/DataFrames.jl/stable/lib/indexing/">&quot;Indexing&quot; section</a> of the manual.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/abstractdataframe.jl#L1-L26">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.AsTable" href="#DataFrames.AsTable"><code>DataFrames.AsTable</code></a> — <span class="docstring-category">Type</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">AsTable(cols)</code></pre><p>A type having a special meaning in <code>source =&gt; transformation =&gt; destination</code> selection operations supported by <a href="../functions/#DataFrames.combine"><code>combine</code></a>, <a href="../functions/#DataFrames.select"><code>select</code></a>, <a href="../functions/#DataFrames.select!"><code>select!</code></a>, <a href="../functions/#DataFrames.transform"><code>transform</code></a>, <a href="../functions/#DataFrames.transform!"><code>transform!</code></a>, <a href="../functions/#DataFrames.subset"><code>subset</code></a>, and <a href="../functions/#DataFrames.subset!"><code>subset!</code></a>.</p><p>If <code>AsTable(cols)</code> is used in <code>source</code> position it signals that the columns selected by the wrapped selector <code>cols</code> 
should be passed as a <code>NamedTuple</code> to the function.</p><p>If <code>AsTable</code> is used in <code>destination</code> position it means that the result of the <code>transformation</code> operation is a vector of containers (or a single container if <code>ByRow(transformation)</code> is used) that should be expanded  into multiple columns using <code>keys</code> to get column names.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df1 = DataFrame(a=1:3, b=11:13)
+<html lang="en"><head><meta charset="UTF-8"/><meta name="viewport" content="width=device-width, initial-scale=1.0"/><title>Types · DataFrames.jl</title><meta name="title" content="Types · DataFrames.jl"/><meta property="og:title" content="Types · DataFrames.jl"/><meta property="twitter:title" content="Types · DataFrames.jl"/><meta name="description" content="Documentation for DataFrames.jl."/><meta property="og:description" content="Documentation for DataFrames.jl."/><meta property="twitter:description" content="Documentation for DataFrames.jl."/><meta property="og:url" content="https://juliadata.github.io/DataFrames.jl/stable/lib/types/"/><meta property="twitter:url" content="https://juliadata.github.io/DataFrames.jl/stable/lib/types/"/><link rel="canonical" href="https://juliadata.github.io/DataFrames.jl/stable/lib/types/"/><script data-outdated-warner src="../../assets/warner.js"></script><link href="https://cdnjs.cloudflare.com/ajax/libs/lato-font/3.0.0/css/lato-font.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/juliamono/0.050/juliamono.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/fontawesome.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/solid.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/brands.min.css" rel="stylesheet" type="text/css"/><link href="https://cdnjs.cloudflare.com/ajax/libs/KaTeX/0.16.8/katex.min.css" rel="stylesheet" type="text/css"/><script>documenterBaseURL="../.."</script><script src="https://cdnjs.cloudflare.com/ajax/libs/require.js/2.3.6/require.min.js" data-main="../../assets/documenter.js"></script><script src="../../search_index.js"></script><script src="../../siteinfo.js"></script><script src="../../../versions.js"></script><link class="docs-theme-link" rel="stylesheet" 
type="text/css" href="../../assets/themes/catppuccin-mocha.css" data-theme-name="catppuccin-mocha"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-macchiato.css" data-theme-name="catppuccin-macchiato"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-frappe.css" data-theme-name="catppuccin-frappe"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/catppuccin-latte.css" data-theme-name="catppuccin-latte"/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/documenter-dark.css" data-theme-name="documenter-dark" data-theme-primary-dark/><link class="docs-theme-link" rel="stylesheet" type="text/css" href="../../assets/themes/documenter-light.css" data-theme-name="documenter-light" data-theme-primary/><script src="../../assets/themeswap.js"></script><link href="../../assets/favicon.ico" rel="icon" type="image/x-icon"/></head><body><div id="documenter"><nav class="docs-sidebar"><a class="docs-logo" href="../../"><img src="../../assets/logo.png" alt="DataFrames.jl logo"/></a><div class="docs-package-name"><span class="docs-autofit"><a href="../../">DataFrames.jl</a></span></div><button class="docs-search-query input is-rounded is-small is-clickable my-2 mx-auto py-1 px-2" id="documenter-search-query">Search docs (Ctrl + /)</button><ul class="docs-menu"><li><a class="tocitem" href="../../">Introduction</a></li><li><a class="tocitem" href="../../man/basics/">First Steps with DataFrames.jl</a></li><li><span class="tocitem">User Guide</span><ul><li><a class="tocitem" href="../../man/getting_started/">Getting Started</a></li><li><a class="tocitem" href="../../man/working_with_dataframes/">Working with DataFrames</a></li><li><a class="tocitem" href="../../man/importing_and_exporting/">Importing and Exporting Data (I/O)</a></li><li><a class="tocitem" href="../../man/joins/">Joins</a></li><li><a 
class="tocitem" href="../../man/split_apply_combine/">Split-apply-combine</a></li><li><a class="tocitem" href="../../man/reshaping_and_pivoting/">Reshaping</a></li><li><a class="tocitem" href="../../man/sorting/">Sorting</a></li><li><a class="tocitem" href="../../man/categorical/">Categorical Data</a></li><li><a class="tocitem" href="../../man/missing/">Missing Data</a></li><li><a class="tocitem" href="../../man/querying_frameworks/">Data manipulation frameworks</a></li><li><a class="tocitem" href="../../man/comparisons/">Comparison with Python/R/Stata</a></li></ul></li><li><span class="tocitem">API</span><ul><li class="is-active"><a class="tocitem" href>Types</a><ul class="internal"><li><a class="tocitem" href="#Type-hierarchy-design"><span>Type hierarchy design</span></a></li><li><a class="tocitem" href="#man-columnhandling"><span>The design of handling of columns of a <code>DataFrame</code></span></a></li><li><a class="tocitem" href="#Types-specification"><span>Types specification</span></a></li></ul></li><li><a class="tocitem" href="../functions/">Functions</a></li><li><a class="tocitem" href="../indexing/">Indexing</a></li><li><a class="tocitem" href="../metadata/">Metadata</a></li></ul></li></ul><div class="docs-version-selector field has-addons"><div class="control"><span class="docs-label button is-static is-size-7">Version</span></div><div class="docs-selector control is-expanded"><div class="select is-fullwidth is-size-7"><select id="documenter-version-selector"></select></div></div></div></nav><div class="docs-main"><header class="docs-navbar"><a class="docs-sidebar-button docs-navbar-link fa-solid fa-bars is-hidden-desktop" id="documenter-sidebar-button" href="#"></a><nav class="breadcrumb"><ul class="is-hidden-mobile"><li><a class="is-disabled">API</a></li><li class="is-active"><a href>Types</a></li></ul><ul class="is-hidden-tablet"><li class="is-active"><a href>Types</a></li></ul></nav><div class="docs-right"><a class="docs-navbar-link" 
href="https://github.com/JuliaData/DataFrames.jl" title="View the repository on GitHub"><span class="docs-icon fa-brands"></span><span class="docs-label is-hidden-touch">GitHub</span></a><a class="docs-navbar-link" href="https://github.com/JuliaData/DataFrames.jl/blob/main/docs/src/lib/types.md" title="Edit source on GitHub"><span class="docs-icon fa-solid"></span></a><a class="docs-settings-button docs-navbar-link fa-solid fa-gear" id="documenter-settings-button" href="#" title="Settings"></a><a class="docs-article-toggle-button fa-solid fa-chevron-up" id="documenter-article-toggle-button" href="javascript:;" title="Collapse all docstrings"></a></div></header><article class="content" id="documenter-page"><h1 id="Types"><a class="docs-heading-anchor" href="#Types">Types</a><a id="Types-1"></a><a class="docs-heading-anchor-permalink" href="#Types" title="Permalink"></a></h1><ul><li><a href="#DataFrames.AbstractDataFrame"><code>DataFrames.AbstractDataFrame</code></a></li><li><a href="#DataFrames.AsTable"><code>DataFrames.AsTable</code></a></li><li><a href="#DataFrames.DataFrame"><code>DataFrames.DataFrame</code></a></li><li><a href="#DataFrames.DataFrameColumns"><code>DataFrames.DataFrameColumns</code></a></li><li><a href="#DataFrames.DataFrameRow"><code>DataFrames.DataFrameRow</code></a></li><li><a href="#DataFrames.DataFrameRows"><code>DataFrames.DataFrameRows</code></a></li><li><a href="#DataFrames.GroupKey"><code>DataFrames.GroupKey</code></a></li><li><a href="#DataFrames.GroupKeys"><code>DataFrames.GroupKeys</code></a></li><li><a href="#DataFrames.GroupedDataFrame"><code>DataFrames.GroupedDataFrame</code></a></li><li><a href="#DataFrames.RepeatedVector"><code>DataFrames.RepeatedVector</code></a></li><li><a href="#DataFrames.StackedVector"><code>DataFrames.StackedVector</code></a></li><li><a href="#DataFrames.SubDataFrame"><code>DataFrames.SubDataFrame</code></a></li></ul><h2 id="Type-hierarchy-design"><a class="docs-heading-anchor" 
href="#Type-hierarchy-design">Type hierarchy design</a><a id="Type-hierarchy-design-1"></a><a class="docs-heading-anchor-permalink" href="#Type-hierarchy-design" title="Permalink"></a></h2><p><code>AbstractDataFrame</code> is an abstract type that provides an interface for data frame types. It is not intended as a fully generic interface for working with tabular data, which is the role of interfaces defined by <a href="https://github.com/JuliaData/Tables.jl/">Tables.jl</a> instead.</p><p><code>DataFrame</code> is the most fundamental subtype of <code>AbstractDataFrame</code>, which stores a set of columns as <code>AbstractVector</code> objects. Indexing of all stored columns must be 1-based. Also, all functions exposed by DataFrames.jl API make sure to <code>collect</code> passed <code>AbstractRange</code> source columns before storing them in a <code>DataFrame</code>.</p><p><code>SubDataFrame</code> is an <code>AbstractDataFrame</code> subtype representing a view into a <code>DataFrame</code>. It stores only a reference to the parent <code>DataFrame</code> and information about which rows and columns from the parent are selected (both as integer indices referring to the parent). Typically it is created using the <code>view</code> function or is returned by indexing into a <code>GroupedDataFrame</code> object.</p><p><code>GroupedDataFrame</code> is a type that stores the result of a  grouping operation performed on an <code>AbstractDataFrame</code>. It is intended to be created as a result of a call to the <code>groupby</code> function.</p><p><code>DataFrameRow</code> is a view into a single row of an <code>AbstractDataFrame</code>. It stores only a reference to a parent <code>DataFrame</code> and information about which row and columns from the parent are selected (both as integer indices referring to the parent). 
The <code>DataFrameRow</code> type supports iteration over columns of the row and is similar in functionality to the <code>NamedTuple</code> type, but allows for modification of data stored in the parent <code>DataFrame</code> and reflects changes done to the parent after the creation of the view. Typically objects of the <code>DataFrameRow</code> type are encountered when returned by the <code>eachrow</code> function, or when accessing a single row of a <code>DataFrame</code> or <code>SubDataFrame</code> via <code>getindex</code> or <code>view</code>.</p><p>The <code>eachrow</code> function returns a value of the <code>DataFrameRows</code> type, which serves as an iterator over rows of an <code>AbstractDataFrame</code>, returning <code>DataFrameRow</code> objects. The <code>DataFrameRows</code> is a subtype of <code>AbstractVector</code> and supports its interface with the exception that it is read-only.</p><p>Similarly, the <code>eachcol</code> function returns a value of the <code>DataFrameColumns</code> type, which is not an <code>AbstractVector</code>, but supports most of its API. The key differences are that it is read-only and that the <code>keys</code> function returns a vector of <code>Symbol</code>s (and not integers as for normal vectors).</p><p>Note that <code>DataFrameRows</code> and <code>DataFrameColumns</code> are not exported and should not be constructed directly, but using the <code>eachrow</code> and <code>eachcol</code> functions.</p><p>The <code>RepeatedVector</code> and <code>StackedVector</code> types are subtypes of <code>AbstractVector</code> and support its interface with the exception that they are read-only. 
Note that they are not exported and should not be constructed directly, but they are columns of a <code>DataFrame</code> returned by <code>stack</code> with <code>view=true</code>.</p><p>The <code>ByRow</code> type is a special type used for selection operations to signal that the wrapped function should be applied to each element (row) of the selection.</p><p>The <code>AsTable</code> type is a special type used for selection operations to signal that the columns selected by a wrapped selector should be passed as a <code>NamedTuple</code> to the function or to signal that it is requested to expand the return value of a transformation into multiple columns.</p><h2 id="man-columnhandling"><a class="docs-heading-anchor" href="#man-columnhandling">The design of handling of columns of a <code>DataFrame</code></a><a id="man-columnhandling-1"></a><a class="docs-heading-anchor-permalink" href="#man-columnhandling" title="Permalink"></a></h2><p>When a <code>DataFrame</code> is constructed columns are copied by default. You can disable this behavior by setting <code>copycols</code> keyword argument to <code>false</code>. The exception is if an <code>AbstractRange</code> is passed as a column, then it is always collected to a <code>Vector</code>.</p><p>Also functions that transform a <code>DataFrame</code> to produce a new <code>DataFrame</code> perform a copy of the columns, unless they are passed <code>copycols=false</code> (available only for functions that could perform a transformation without copying the columns). 
Examples of such functions are <a href="../functions/#Base.vcat"><code>vcat</code></a>, <a href="../functions/#Base.hcat"><code>hcat</code></a>, <a href="../functions/#Base.filter"><code>filter</code></a>, <a href="../functions/#DataFrames.dropmissing"><code>dropmissing</code></a>, <code>getindex</code>, <a href="../functions/#Base.copy"><code>copy</code></a> or the <a href="#DataFrames.DataFrame"><code>DataFrame</code></a> constructor mentioned above.</p><p>The generic single-argument constructor <code>DataFrame(table)</code> has <code>copycols=nothing</code> by default, meaning that columns are copied unless <code>table</code> signals that a copy of columns doesn&#39;t need to be made (this is done by wrapping the source table in <code>Tables.CopiedColumns</code>). <a href="https://csv.juliadata.org/stable">CSV.jl</a> does this when <code>CSV.read(file, DataFrame)</code> is called, since columns are built only for the purpose of use in a <code>DataFrame</code> constructor. Another example is <a href="https://arrow.juliadata.org/dev/manual/#Arrow.Table"><code>Arrow.Table</code></a>, where arrow data is inherently immutable so columns can&#39;t be accidentally mutated anyway. To be able to mutate arrow data, columns must be materialized, which can be accomplished via <code>DataFrame(arrow_table, copycols=true)</code>.</p><p>On the contrary, functions that create a view of a <code>DataFrame</code> <em>do not</em> by definition make copies of the columns, and therefore require particular caution. 
This includes <code>view</code>, which returns a <code>SubDataFrame</code> or a <code>DataFrameRow</code>, and <code>groupby</code>, which returns a <code>GroupedDataFrame</code>.</p><p>A partial exception to this rule is the <a href="../functions/#Base.stack"><code>stack</code></a> function with <code>view=true</code> which creates a <code>DataFrame</code> that contains views of the columns from the source <code>DataFrame</code>.</p><p>In-place functions whose names end with <code>!</code> (like <code>sort!</code> or <a href="../functions/#DataFrames.dropmissing!"><code>dropmissing!</code></a>, <code>setindex!</code>, <code>push!</code>, <code>append!</code>) may mutate the column vectors of the <code>DataFrame</code> they take as an argument. These functions are safe to call due to the rules described above, <em>except</em> when a view of the <code>DataFrame</code> is in use (via a <code>SubDataFrame</code>, a <code>DataFrameRow</code> or a <code>GroupedDataFrame</code>). In the latter case, calling such a function on the parent might corrupt the view, which may trigger errors, silently return invalid data or even cause Julia to crash. The same caution applies when a <code>DataFrame</code> was created using columns of another <code>DataFrame</code> without copying (for instance when <code>copycols=false</code> in functions such as <code>DataFrame</code> or <code>hcat</code>).</p><p>It is possible to have direct access to a column <code>col</code> of a <code>DataFrame</code> <code>df</code> (e.g. 
this can be useful in performance critical code to avoid copying), using one of the following methods:</p><ul><li>via the <code>getproperty</code> function using the syntax <code>df.col</code>;</li><li>via the <code>getindex</code> function using the syntax <code>df[!, :col]</code> (note this is in contrast to <code>df[:, :col]</code> which copies);</li><li>by creating a <code>DataFrameColumns</code> object using the <a href="../functions/#Base.eachcol"><code>eachcol</code></a> function;</li><li>by calling the <code>parent</code> function on a view of a column of the <code>DataFrame</code>, e.g. <code>parent(@view df[:, :col])</code>;</li><li>by storing the reference to the column before creating a <code>DataFrame</code> with <code>copycols=false</code>;</li></ul><p>A column obtained from a <code>DataFrame</code> using one of the above methods should not be mutated without caution because:</p><ul><li>resizing a column vector will corrupt its parent <code>DataFrame</code> and any associated views as methods only check the length of the column when it is added to the <code>DataFrame</code> and later assume that all columns have the same length;</li><li>reordering values in a column vector (e.g. 
using <code>sort!</code>) will break the consistency of rows with other columns, which will also affect views (if any);</li><li>changing values contained in a column vector is acceptable as long as it is not used as a grouping column in a <code>GroupedDataFrame</code> created based on the <code>DataFrame</code>.</li></ul><h2 id="Types-specification"><a class="docs-heading-anchor" href="#Types-specification">Types specification</a><a id="Types-specification-1"></a><a class="docs-heading-anchor-permalink" href="#Types-specification" title="Permalink"></a></h2><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.AbstractDataFrame" href="#DataFrames.AbstractDataFrame"><code>DataFrames.AbstractDataFrame</code></a> — <span class="docstring-category">Type</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">AbstractDataFrame</code></pre><p>An abstract type for which all concrete types expose an interface for working with tabular data.</p><p>An <code>AbstractDataFrame</code> is a two-dimensional table with <code>Symbol</code>s or strings for column names.</p><p>DataFrames.jl defines two types that are subtypes of <code>AbstractDataFrame</code>: <a href="#DataFrames.DataFrame"><code>DataFrame</code></a> and <a href="#DataFrames.SubDataFrame"><code>SubDataFrame</code></a>.</p><p><strong>Indexing and broadcasting</strong></p><p><code>AbstractDataFrame</code> can be indexed by passing two indices specifying row and column selectors. The allowed indices are a superset of indices that can be used for standard arrays. You can also access a single column of an <code>AbstractDataFrame</code> using <code>getproperty</code> and <code>setproperty!</code> functions. 
Columns can be selected using integers, <code>Symbol</code>s, or strings. In broadcasting <code>AbstractDataFrame</code> behavior is similar to a <code>Matrix</code>.</p><p>A detailed description of <code>getindex</code>, <code>setindex!</code>, <code>getproperty</code>, <code>setproperty!</code>, broadcasting and broadcasting assignment for data frames is given in the <a href="https://juliadata.github.io/DataFrames.jl/stable/lib/indexing/">&quot;Indexing&quot; section</a> of the manual.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/abstractdataframe.jl#L1-L26">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.AsTable" href="#DataFrames.AsTable"><code>DataFrames.AsTable</code></a> — <span class="docstring-category">Type</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">AsTable(cols)</code></pre><p>A type having a special meaning in <code>source =&gt; transformation =&gt; destination</code> selection operations supported by <a href="../functions/#DataFrames.combine"><code>combine</code></a>, <a href="../functions/#DataFrames.select"><code>select</code></a>, <a href="../functions/#DataFrames.select!"><code>select!</code></a>, <a href="../functions/#DataFrames.transform"><code>transform</code></a>, <a href="../functions/#DataFrames.transform!"><code>transform!</code></a>, <a href="../functions/#DataFrames.subset"><code>subset</code></a>, and <a href="../functions/#DataFrames.subset!"><code>subset!</code></a>.</p><p>If <code>AsTable(cols)</code> is used in <code>source</code> position it signals that the columns selected by the wrapped selector <code>cols</code> 
should be passed as a <code>NamedTuple</code> to the function.</p><p>If <code>AsTable</code> is used in <code>destination</code> position it means that the result of the <code>transformation</code> operation is a vector of containers (or a single container if <code>ByRow(transformation)</code> is used) that should be expanded  into multiple columns using <code>keys</code> to get column names.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df1 = DataFrame(a=1:3, b=11:13)
 3×2 DataFrame
  Row │ a      b
      │ Int64  Int64
@@ -33,7 +33,7 @@
 ─────┼──────────────
    1 │     1    121
    2 │     4    144
-   3 │     9    169</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/other/utils.jl#L1-L54">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.DataFrame" href="#DataFrames.DataFrame"><code>DataFrames.DataFrame</code></a> — <span class="docstring-category">Type</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">DataFrame &lt;: AbstractDataFrame</code></pre><p>An <code>AbstractDataFrame</code> that stores a set of named columns.</p><p>The columns are normally <code>AbstractVector</code>s stored in memory, particularly a <code>Vector</code>, <code>PooledVector</code> or <code>CategoricalVector</code>.</p><p><strong>Constructors</strong></p><pre><code class="language-julia hljs">DataFrame(pairs::Pair...; makeunique::Bool=false, copycols::Bool=true)
+   3 │     9    169</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/other/utils.jl#L1-L54">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.DataFrame" href="#DataFrames.DataFrame"><code>DataFrames.DataFrame</code></a> — <span class="docstring-category">Type</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">DataFrame &lt;: AbstractDataFrame</code></pre><p>An <code>AbstractDataFrame</code> that stores a set of named columns.</p><p>The columns are normally <code>AbstractVector</code>s stored in memory, particularly a <code>Vector</code>, <code>PooledVector</code> or <code>CategoricalVector</code>.</p><p><strong>Constructors</strong></p><pre><code class="language-julia hljs">DataFrame(pairs::Pair...; makeunique::Bool=false, copycols::Bool=true)
 DataFrame(pairs::AbstractVector{&lt;:Pair}; makeunique::Bool=false, copycols::Bool=true)
 DataFrame(ds::AbstractDict; copycols::Bool=true)
 DataFrame(; kwargs..., copycols::Bool=true)
@@ -107,7 +107,7 @@
      │ Int64  Int64
 ─────┼──────────────
    1 │     1      0
-   2 │     2      0</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/dataframe/dataframe.jl#L1-L177">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.DataFrameRow" href="#DataFrames.DataFrameRow"><code>DataFrames.DataFrameRow</code></a> — <span class="docstring-category">Type</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">DataFrameRow{&lt;:AbstractDataFrame, &lt;:AbstractIndex}</code></pre><p>A view of one row of an <code>AbstractDataFrame</code>.</p><p>A <code>DataFrameRow</code> is returned by <code>getindex</code> or <code>view</code> functions when one row and a selection of columns are requested, or when iterating the result of the call to the <a href="../functions/#Base.eachrow"><code>eachrow</code></a> function.</p><p>The <code>DataFrameRow</code> constructor can also be called directly:</p><pre><code class="nohighlight hljs">DataFrameRow(parent::AbstractDataFrame, row::Integer, cols=:)</code></pre><p>A <code>DataFrameRow</code> supports the iteration interface and can therefore be passed to functions that expect a collection as an argument. Its element type is always <code>Any</code>.</p><p>Indexing is one-dimensional like specifying a column of a <code>DataFrame</code>. 
You can also access the data in a <code>DataFrameRow</code> using the <code>getproperty</code> and <code>setproperty!</code> functions and convert it to a <code>Tuple</code>, <code>NamedTuple</code>, or <code>Vector</code> using the corresponding functions.</p><p>If the selection of columns in a parent data frame is passed as <code>:</code> (a colon) then <code>DataFrameRow</code> will always have all columns from the parent, even if they are added or removed after its creation.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=repeat([1, 2], outer=[2]),
+   2 │     2      0</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/dataframe/dataframe.jl#L1-L177">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.DataFrameRow" href="#DataFrames.DataFrameRow"><code>DataFrames.DataFrameRow</code></a> — <span class="docstring-category">Type</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">DataFrameRow{&lt;:AbstractDataFrame, &lt;:AbstractIndex}</code></pre><p>A view of one row of an <code>AbstractDataFrame</code>.</p><p>A <code>DataFrameRow</code> is returned by <code>getindex</code> or <code>view</code> functions when one row and a selection of columns are requested, or when iterating the result of the call to the <a href="../functions/#Base.eachrow"><code>eachrow</code></a> function.</p><p>The <code>DataFrameRow</code> constructor can also be called directly:</p><pre><code class="nohighlight hljs">DataFrameRow(parent::AbstractDataFrame, row::Integer, cols=:)</code></pre><p>A <code>DataFrameRow</code> supports the iteration interface and can therefore be passed to functions that expect a collection as an argument. Its element type is always <code>Any</code>.</p><p>Indexing is one-dimensional like specifying a column of a <code>DataFrame</code>. 
You can also access the data in a <code>DataFrameRow</code> using the <code>getproperty</code> and <code>setproperty!</code> functions and convert it to a <code>Tuple</code>, <code>NamedTuple</code>, or <code>Vector</code> using the corresponding functions.</p><p>If the selection of columns in a parent data frame is passed as <code>:</code> (a colon) then <code>DataFrameRow</code> will always have all columns from the parent, even if they are added or removed after its creation.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=repeat([1, 2], outer=[2]),
                       b=repeat([&quot;a&quot;, &quot;b&quot;], inner=[2]),
                       c=1:4)
 4×3 DataFrame
@@ -150,7 +150,7 @@
 3-element Vector{Any}:
  1
   &quot;a&quot;
- 1</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/dataframerow/dataframerow.jl#L1-L75">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.GroupedDataFrame" href="#DataFrames.GroupedDataFrame"><code>DataFrames.GroupedDataFrame</code></a> — <span class="docstring-category">Type</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">GroupedDataFrame</code></pre><p>The result of a <a href="../functions/#DataAPI.groupby"><code>groupby</code></a> operation on an <code>AbstractDataFrame</code>; a view into the <code>AbstractDataFrame</code> grouped by rows.</p><p>Not meant to be constructed directly, see <a href="../functions/#DataAPI.groupby"><code>groupby</code></a>.</p><p>One can get the names of columns used to create <code>GroupedDataFrame</code> using the <a href="../functions/#DataFrames.groupcols"><code>groupcols</code></a> function. Similarly the <a href="../functions/#DataFrames.groupindices"><code>groupindices</code></a> function returns a vector of group indices for each row of the parent data frame.</p><p>After its creation, a <code>GroupedDataFrame</code> reflects the grouping of rows that was valid at its creation time. Therefore grouping columns of its parent data frame must not be mutated, and rows must not be added nor removed from it. To safeguard the user against such cases, if the number of rows in the parent data frame changes then trying to use <code>GroupedDataFrame</code> will throw an error. 
However, one can add or remove columns to the parent data frame without invalidating the <code>GroupedDataFrame</code> provided that columns used for grouping are not changed.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/groupeddataframe/groupeddataframe.jl#L15-L36">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.GroupKey" href="#DataFrames.GroupKey"><code>DataFrames.GroupKey</code></a> — <span class="docstring-category">Type</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">GroupKey{T&lt;:GroupedDataFrame}</code></pre><p>Key for one of the groups of a <a href="#DataFrames.GroupedDataFrame"><code>GroupedDataFrame</code></a>. Contains the values of the corresponding grouping columns and behaves similarly to a <code>NamedTuple</code>, but using it to index its <code>GroupedDataFrame</code> is more efficient than using the equivalent <code>Tuple</code> and <code>NamedTuple</code>, and much more efficient than using the equivalent <code>AbstractDict</code>.</p><p>Instances of this type are returned by <code>keys(::GroupedDataFrame)</code> and are not meant to be constructed directly.</p><p>Indexing fields of <code>GroupKey</code> is allowed using an integer, a <code>Symbol</code>, or a string. It is also possible to access the data in a <code>GroupKey</code> using the <code>getproperty</code> function. A <code>GroupKey</code> can be converted to a <code>Tuple</code>, <code>NamedTuple</code>, a <code>Vector</code>, or a <code>Dict</code>. 
When converted to a <code>Dict</code>, the keys of the <code>Dict</code> are <code>Symbol</code>s.</p><p>See <a href="../functions/#Base.keys"><code>keys(::GroupedDataFrame)</code></a> for more information.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/groupeddataframe/groupeddataframe.jl#L612-L630">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.GroupKeys" href="#DataFrames.GroupKeys"><code>DataFrames.GroupKeys</code></a> — <span class="docstring-category">Type</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">GroupKeys{T&lt;:GroupedDataFrame} &lt;: AbstractVector{GroupKey{T}}</code></pre><p>A vector containing all <a href="#DataFrames.GroupKey"><code>GroupKey</code></a> objects for a given <a href="#DataFrames.GroupedDataFrame"><code>GroupedDataFrame</code></a>.</p><p>See <a href="../functions/#Base.keys"><code>keys(::GroupedDataFrame)</code></a> for more information.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/groupeddataframe/groupeddataframe.jl#L760-L767">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.SubDataFrame" href="#DataFrames.SubDataFrame"><code>DataFrames.SubDataFrame</code></a> — <span class="docstring-category">Type</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia 
hljs">SubDataFrame{&lt;:AbstractDataFrame, &lt;:AbstractIndex, &lt;:AbstractVector{Int}} &lt;: AbstractDataFrame</code></pre><p>A view of an <code>AbstractDataFrame</code>. It is returned by a call to the <code>view</code> function on an <code>AbstractDataFrame</code> if a collections of rows and columns are specified.</p><p>A <code>SubDataFrame</code> is an <code>AbstractDataFrame</code>, so expect that most DataFrame functions should work. Such methods include <code>describe</code>, <code>summary</code>, <code>nrow</code>, <code>size</code>, <code>by</code>, <code>stack</code>, and <code>join</code>.</p><p>If the selection of columns in a parent data frame is passed as <code>:</code> (a colon) then <code>SubDataFrame</code> will always have all columns from the parent, even if they are added or removed after its creation.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=repeat([1, 2, 3, 4], outer=[2]),
+ 1</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/dataframerow/dataframerow.jl#L1-L75">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.GroupedDataFrame" href="#DataFrames.GroupedDataFrame"><code>DataFrames.GroupedDataFrame</code></a> — <span class="docstring-category">Type</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">GroupedDataFrame</code></pre><p>The result of a <a href="../functions/#DataAPI.groupby"><code>groupby</code></a> operation on an <code>AbstractDataFrame</code>; a view into the <code>AbstractDataFrame</code> grouped by rows.</p><p>Not meant to be constructed directly, see <a href="../functions/#DataAPI.groupby"><code>groupby</code></a>.</p><p>One can get the names of columns used to create <code>GroupedDataFrame</code> using the <a href="../functions/#DataFrames.groupcols"><code>groupcols</code></a> function. Similarly the <a href="../functions/#DataFrames.groupindices"><code>groupindices</code></a> function returns a vector of group indices for each row of the parent data frame.</p><p>After its creation, a <code>GroupedDataFrame</code> reflects the grouping of rows that was valid at its creation time. Therefore grouping columns of its parent data frame must not be mutated, and rows must not be added nor removed from it. To safeguard the user against such cases, if the number of rows in the parent data frame changes then trying to use <code>GroupedDataFrame</code> will throw an error. 
However, one can add or remove columns to the parent data frame without invalidating the <code>GroupedDataFrame</code> provided that columns used for grouping are not changed.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/groupeddataframe/groupeddataframe.jl#L15-L36">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.GroupKey" href="#DataFrames.GroupKey"><code>DataFrames.GroupKey</code></a> — <span class="docstring-category">Type</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">GroupKey{T&lt;:GroupedDataFrame}</code></pre><p>Key for one of the groups of a <a href="#DataFrames.GroupedDataFrame"><code>GroupedDataFrame</code></a>. Contains the values of the corresponding grouping columns and behaves similarly to a <code>NamedTuple</code>, but using it to index its <code>GroupedDataFrame</code> is more efficient than using the equivalent <code>Tuple</code> and <code>NamedTuple</code>, and much more efficient than using the equivalent <code>AbstractDict</code>.</p><p>Instances of this type are returned by <code>keys(::GroupedDataFrame)</code> and are not meant to be constructed directly.</p><p>Indexing fields of <code>GroupKey</code> is allowed using an integer, a <code>Symbol</code>, or a string. It is also possible to access the data in a <code>GroupKey</code> using the <code>getproperty</code> function. A <code>GroupKey</code> can be converted to a <code>Tuple</code>, <code>NamedTuple</code>, a <code>Vector</code>, or a <code>Dict</code>. 
When converted to a <code>Dict</code>, the keys of the <code>Dict</code> are <code>Symbol</code>s.</p><p>See <a href="../functions/#Base.keys"><code>keys(::GroupedDataFrame)</code></a> for more information.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/groupeddataframe/groupeddataframe.jl#L612-L630">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.GroupKeys" href="#DataFrames.GroupKeys"><code>DataFrames.GroupKeys</code></a> — <span class="docstring-category">Type</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">GroupKeys{T&lt;:GroupedDataFrame} &lt;: AbstractVector{GroupKey{T}}</code></pre><p>A vector containing all <a href="#DataFrames.GroupKey"><code>GroupKey</code></a> objects for a given <a href="#DataFrames.GroupedDataFrame"><code>GroupedDataFrame</code></a>.</p><p>See <a href="../functions/#Base.keys"><code>keys(::GroupedDataFrame)</code></a> for more information.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/groupeddataframe/groupeddataframe.jl#L760-L767">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.SubDataFrame" href="#DataFrames.SubDataFrame"><code>DataFrames.SubDataFrame</code></a> — <span class="docstring-category">Type</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia 
hljs">SubDataFrame{&lt;:AbstractDataFrame, &lt;:AbstractIndex, &lt;:AbstractVector{Int}} &lt;: AbstractDataFrame</code></pre><p>A view of an <code>AbstractDataFrame</code>. It is returned by a call to the <code>view</code> function on an <code>AbstractDataFrame</code> if collections of rows and columns are specified.</p><p>A <code>SubDataFrame</code> is an <code>AbstractDataFrame</code>, so expect that most DataFrame functions should work. Such methods include <code>describe</code>, <code>summary</code>, <code>nrow</code>, <code>size</code>, <code>by</code>, <code>stack</code>, and <code>join</code>.</p><p>If the selection of columns in a parent data frame is passed as <code>:</code> (a colon) then <code>SubDataFrame</code> will always have all columns from the parent, even if they are added or removed after its creation.</p><p><strong>Examples</strong></p><pre><code class="language-julia-repl hljs">julia&gt; df = DataFrame(a=repeat([1, 2, 3, 4], outer=[2]),
                       b=repeat([2, 1], outer=[4]),
                       c=1:8)
 8×3 DataFrame
@@ -200,6 +200,6 @@
      │ Int64  Int64  Int64
 ─────┼─────────────────────
    1 │     1      2      1
-   2 │     1      2      5</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/subdataframe/subdataframe.jl#L1-L69">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.DataFrameRows" href="#DataFrames.DataFrameRows"><code>DataFrames.DataFrameRows</code></a> — <span class="docstring-category">Type</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">DataFrameRows{D&lt;:AbstractDataFrame} &lt;: AbstractVector{DataFrameRow}</code></pre><p>Iterator over rows of an <code>AbstractDataFrame</code>, with each row represented as a <code>DataFrameRow</code>.</p><p>A value of this type is returned by the <a href="../functions/#Base.eachrow"><code>eachrow</code></a> function.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/iteration.jl#L8-L15">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.DataFrameColumns" href="#DataFrames.DataFrameColumns"><code>DataFrames.DataFrameColumns</code></a> — <span class="docstring-category">Type</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">DataFrameColumns{&lt;:AbstractDataFrame}</code></pre><p>A vector-like object that allows iteration over columns of an <code>AbstractDataFrame</code>.</p><p>Indexing into <code>DataFrameColumns</code> objects 
using integer, <code>Symbol</code> or string returns the corresponding column (without copying). Indexing into <code>DataFrameColumns</code> objects using a multiple column selector returns a subsetted <code>DataFrameColumns</code> object with a new parent containing only the selected columns (without copying).</p><p><code>DataFrameColumns</code> supports most of the <code>AbstractVector</code> API. The key differences are that it is read-only and that the <code>keys</code> function returns a vector of <code>Symbol</code>s (and not integers as for normal vectors).</p><p>In particular <code>findnext</code>, <code>findprev</code>, <code>findfirst</code>, <code>findlast</code>, and <code>findall</code> functions are supported, and in <code>findnext</code> and <code>findprev</code> functions it is allowed to pass an integer, string, or <code>Symbol</code> as a reference index.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/iteration.jl#L177-L183">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.RepeatedVector" href="#DataFrames.RepeatedVector"><code>DataFrames.RepeatedVector</code></a> — <span class="docstring-category">Type</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">RepeatedVector{T} &lt;: AbstractVector{T}</code></pre><p>An AbstractVector that is a view into another AbstractVector with repeated elements</p><p>NOTE: Not exported.</p><p><strong>Constructor</strong></p><pre><code class="language-julia hljs">RepeatedVector(parent::AbstractVector, inner::Int, outer::Int)</code></pre><p><strong>Arguments</strong></p><ul><li><code>parent</code> : the 
AbstractVector that&#39;s repeated</li><li><code>inner</code> : the number of times each element is repeated</li><li><code>outer</code> : the number of times the whole vector is repeated after expanded by <code>inner</code></li></ul><p><code>inner</code> and <code>outer</code> have the same meaning as similarly named arguments to <code>repeat</code>.</p><p><strong>Examples</strong></p><pre><code class="language-julia hljs">RepeatedVector([1, 2], 3, 1)   # [1, 1, 1, 2, 2, 2]
+   2 │     1      2      5</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/subdataframe/subdataframe.jl#L1-L69">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.DataFrameRows" href="#DataFrames.DataFrameRows"><code>DataFrames.DataFrameRows</code></a> — <span class="docstring-category">Type</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">DataFrameRows{D&lt;:AbstractDataFrame} &lt;: AbstractVector{DataFrameRow}</code></pre><p>Iterator over rows of an <code>AbstractDataFrame</code>, with each row represented as a <code>DataFrameRow</code>.</p><p>A value of this type is returned by the <a href="../functions/#Base.eachrow"><code>eachrow</code></a> function.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/iteration.jl#L8-L15">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.DataFrameColumns" href="#DataFrames.DataFrameColumns"><code>DataFrames.DataFrameColumns</code></a> — <span class="docstring-category">Type</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">DataFrameColumns{&lt;:AbstractDataFrame}</code></pre><p>A vector-like object that allows iteration over columns of an <code>AbstractDataFrame</code>.</p><p>Indexing into <code>DataFrameColumns</code> objects 
using integer, <code>Symbol</code> or string returns the corresponding column (without copying). Indexing into <code>DataFrameColumns</code> objects using a multiple column selector returns a subsetted <code>DataFrameColumns</code> object with a new parent containing only the selected columns (without copying).</p><p><code>DataFrameColumns</code> supports most of the <code>AbstractVector</code> API. The key differences are that it is read-only and that the <code>keys</code> function returns a vector of <code>Symbol</code>s (and not integers as for normal vectors).</p><p>In particular <code>findnext</code>, <code>findprev</code>, <code>findfirst</code>, <code>findlast</code>, and <code>findall</code> functions are supported, and in <code>findnext</code> and <code>findprev</code> functions it is allowed to pass an integer, string, or <code>Symbol</code> as a reference index.</p></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/iteration.jl#L177-L183">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.RepeatedVector" href="#DataFrames.RepeatedVector"><code>DataFrames.RepeatedVector</code></a> — <span class="docstring-category">Type</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">RepeatedVector{T} &lt;: AbstractVector{T}</code></pre><p>An AbstractVector that is a view into another AbstractVector with repeated elements</p><p>NOTE: Not exported.</p><p><strong>Constructor</strong></p><pre><code class="language-julia hljs">RepeatedVector(parent::AbstractVector, inner::Int, outer::Int)</code></pre><p><strong>Arguments</strong></p><ul><li><code>parent</code> : the 
AbstractVector that&#39;s repeated</li><li><code>inner</code> : the number of times each element is repeated</li><li><code>outer</code> : the number of times the whole vector is repeated after expanded by <code>inner</code></li></ul><p><code>inner</code> and <code>outer</code> have the same meaning as similarly named arguments to <code>repeat</code>.</p><p><strong>Examples</strong></p><pre><code class="language-julia hljs">RepeatedVector([1, 2], 3, 1)   # [1, 1, 1, 2, 2, 2]
 RepeatedVector([1, 2], 1, 3)   # [1, 2, 1, 2, 1, 2]
-RepeatedVector([1, 2], 2, 2)   # [1, 1, 2, 2, 1, 1, 2, 2]</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/reshape.jl#L668-L696">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.StackedVector" href="#DataFrames.StackedVector"><code>DataFrames.StackedVector</code></a> — <span class="docstring-category">Type</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">StackedVector &lt;: AbstractVector</code></pre><p>An <code>AbstractVector</code> that is a linear, concatenated view into another set of AbstractVectors</p><p>NOTE: Not exported.</p><p><strong>Constructor</strong></p><pre><code class="language-julia hljs">StackedVector(d::AbstractVector)</code></pre><p><strong>Arguments</strong></p><ul><li><code>d...</code> : one or more AbstractVectors</li></ul><p><strong>Examples</strong></p><pre><code class="language-julia hljs">StackedVector(Any[[1, 2], [9, 10], [11, 12]])  # [1, 2, 9, 10, 11, 12]</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/1761261e432ec923f8750e929d986d398bb60d31/src/abstractdataframe/reshape.jl#L619-L639">source</a></section></article></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../../man/comparisons/">« Comparison with Python/R/Stata</a><a class="docs-footer-nextpage" href="../functions/">Functions »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" 
id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.7.0 on <span class="colophon-date" title="Saturday 7 September 2024 11:00">Saturday 7 September 2024</span>. Using Julia version 1.10.5.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
+RepeatedVector([1, 2], 2, 2)   # [1, 1, 2, 2, 1, 1, 2, 2]</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/reshape.jl#L668-L696">source</a></section></article><article class="docstring"><header><a class="docstring-article-toggle-button fa-solid fa-chevron-down" href="javascript:;" title="Collapse docstring"></a><a class="docstring-binding" id="DataFrames.StackedVector" href="#DataFrames.StackedVector"><code>DataFrames.StackedVector</code></a> — <span class="docstring-category">Type</span><span class="is-flex-grow-1 docstring-article-toggle-button" title="Collapse docstring"></span></header><section><div><pre><code class="language-julia hljs">StackedVector &lt;: AbstractVector</code></pre><p>An <code>AbstractVector</code> that is a linear, concatenated view into another set of AbstractVectors</p><p>NOTE: Not exported.</p><p><strong>Constructor</strong></p><pre><code class="language-julia hljs">StackedVector(d::AbstractVector)</code></pre><p><strong>Arguments</strong></p><ul><li><code>d...</code> : one or more AbstractVectors</li></ul><p><strong>Examples</strong></p><pre><code class="language-julia hljs">StackedVector(Any[[1, 2], [9, 10], [11, 12]])  # [1, 2, 9, 10, 11, 12]</code></pre></div><a class="docs-sourcelink" target="_blank" href="https://github.com/JuliaData/DataFrames.jl/blob/96839313f523e98b894459f4bba959c21febd7f3/src/abstractdataframe/reshape.jl#L619-L639">source</a></section></article></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../../man/comparisons/">« Comparison with Python/R/Stata</a><a class="docs-footer-nextpage" href="../functions/">Functions »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" 
id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.7.0 on <span class="colophon-date" title="Sunday 8 September 2024 08:54">Sunday 8 September 2024</span>. Using Julia version 1.10.5.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
diff --git a/dev/man/basics/index.html b/dev/man/basics/index.html
index da9a377ac..9fa89c053 100644
--- a/dev/man/basics/index.html
+++ b/dev/man/basics/index.html
@@ -1324,4 +1324,4 @@
   998 │    38      2     40
   999 │    23      2     25
  1000 │    27      2     29
-            985 rows omitted</code></pre><p>In the examples given in this introductory tutorial we did not cover all options of the transformation mini-language. More advanced examples, in particular showing how to pass or produce multiple columns using the <code>AsTable</code> operation (which you might have seen in some DataFrames.jl demos) are given in the later sections of the manual.</p></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../../">« Introduction</a><a class="docs-footer-nextpage" href="../getting_started/">Getting Started »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.7.0 on <span class="colophon-date" title="Saturday 7 September 2024 11:00">Saturday 7 September 2024</span>. Using Julia version 1.10.5.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
+            985 rows omitted</code></pre><p>In the examples given in this introductory tutorial we did not cover all options of the transformation mini-language. More advanced examples, in particular showing how to pass or produce multiple columns using the <code>AsTable</code> operation (which you might have seen in some DataFrames.jl demos) are given in the later sections of the manual.</p></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../../">« Introduction</a><a class="docs-footer-nextpage" href="../getting_started/">Getting Started »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.7.0 on <span class="colophon-date" title="Sunday 8 September 2024 08:54">Sunday 8 September 2024</span>. Using Julia version 1.10.5.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
diff --git a/dev/man/categorical/index.html b/dev/man/categorical/index.html
index 3b3e82684..23b76a367 100644
--- a/dev/man/categorical/index.html
+++ b/dev/man/categorical/index.html
@@ -79,4 +79,4 @@
 true
 
 julia&gt; cv1[1] &lt; cv1[2]
-true</code></pre></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../sorting/">« Sorting</a><a class="docs-footer-nextpage" href="../missing/">Missing Data »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.7.0 on <span class="colophon-date" title="Saturday 7 September 2024 11:00">Saturday 7 September 2024</span>. Using Julia version 1.10.5.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
+true</code></pre></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../sorting/">« Sorting</a><a class="docs-footer-nextpage" href="../missing/">Missing Data »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.7.0 on <span class="colophon-date" title="Sunday 8 September 2024 08:54">Sunday 8 September 2024</span>. Using Julia version 1.10.5.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
diff --git a/dev/man/comparisons/index.html b/dev/man/comparisons/index.html
index a23397183..c8493f23f 100644
--- a/dev/man/comparisons/index.html
+++ b/dev/man/comparisons/index.html
@@ -26,4 +26,4 @@
              z = c(3:7, NA), id = letters[1:6])</code></pre><table><tr><th style="text-align: left">Operation</th><th style="text-align: left">dplyr</th><th style="text-align: left">DataFrames.jl</th></tr><tr><td style="text-align: left">Reduce multiple values</td><td style="text-align: left"><code>summarize(df, mean(x))</code></td><td style="text-align: left"><code>combine(df, :x =&gt; mean)</code></td></tr><tr><td style="text-align: left">Add new columns</td><td style="text-align: left"><code>mutate(df, x_mean = mean(x))</code></td><td style="text-align: left"><code>transform(df, :x =&gt; mean =&gt; :x_mean)</code></td></tr><tr><td style="text-align: left">Rename columns</td><td style="text-align: left"><code>rename(df, x_new = x)</code></td><td style="text-align: left"><code>rename(df, :x =&gt; :x_new)</code></td></tr><tr><td style="text-align: left">Pick columns</td><td style="text-align: left"><code>select(df, x, y)</code></td><td style="text-align: left"><code>select(df, :x, :y)</code></td></tr><tr><td style="text-align: left">Pick &amp; transform columns</td><td style="text-align: left"><code>transmute(df, mean(x), y)</code></td><td style="text-align: left"><code>select(df, :x =&gt; mean, :y)</code></td></tr><tr><td style="text-align: left">Pick rows</td><td style="text-align: left"><code>filter(df, x &gt;= 1)</code></td><td style="text-align: left"><code>subset(df, :x =&gt; ByRow(x -&gt; x &gt;= 1))</code></td></tr><tr><td style="text-align: left">Sort rows</td><td style="text-align: left"><code>arrange(df, x)</code></td><td style="text-align: left"><code>sort(df, :x)</code></td></tr></table><p>As in dplyr, some of these functions can be applied to grouped data frames, in which case they operate by group:</p><table><tr><th style="text-align: left">Operation</th><th style="text-align: left">dplyr</th><th style="text-align: left">DataFrames.jl</th></tr><tr><td style="text-align: left">Reduce multiple values</td><td style="text-align: 
left"><code>summarize(group_by(df, grp), mean(x))</code></td><td style="text-align: left"><code>combine(groupby(df, :grp), :x =&gt; mean)</code></td></tr><tr><td style="text-align: left">Add new columns</td><td style="text-align: left"><code>mutate(group_by(df, grp), mean(x))</code></td><td style="text-align: left"><code>transform(groupby(df, :grp), :x =&gt; mean)</code></td></tr><tr><td style="text-align: left">Pick &amp; transform columns</td><td style="text-align: left"><code>transmute(group_by(df, grp), mean(x), y)</code></td><td style="text-align: left"><code>select(groupby(df, :grp), :x =&gt; mean, :y)</code></td></tr></table><p>The table below compares more advanced commands:</p><table><tr><th style="text-align: left">Operation</th><th style="text-align: left">dplyr</th><th style="text-align: left">DataFrames.jl</th></tr><tr><td style="text-align: left">Complex Function</td><td style="text-align: left"><code>summarize(df, mean(x, na.rm = T))</code></td><td style="text-align: left"><code>combine(df, :x =&gt; x -&gt; mean(skipmissing(x)))</code></td></tr><tr><td style="text-align: left">Transform several columns</td><td style="text-align: left"><code>summarize(df, max(x), min(y))</code></td><td style="text-align: left"><code>combine(df, :x =&gt; maximum,  :y =&gt; minimum)</code></td></tr><tr><td style="text-align: left"></td><td style="text-align: left"><code>summarize(df, across(c(x, y), mean))</code></td><td style="text-align: left"><code>combine(df, [:x, :y] .=&gt; mean)</code></td></tr><tr><td style="text-align: left"></td><td style="text-align: left"><code>summarize(df, across(starts_with(&quot;x&quot;), mean))</code></td><td style="text-align: left"><code>combine(df, names(df, r&quot;^x&quot;) .=&gt; mean)</code></td></tr><tr><td style="text-align: left"></td><td style="text-align: left"><code>summarize(df, across(c(x, y), list(max, min)))</code></td><td style="text-align: left"><code>combine(df, ([:x, :y] .=&gt; [maximum 
minimum])...)</code></td></tr><tr><td style="text-align: left">Multivariate function</td><td style="text-align: left"><code>mutate(df, cor(x, y))</code></td><td style="text-align: left"><code>transform(df, [:x, :y] =&gt; cor)</code></td></tr><tr><td style="text-align: left">Row-wise</td><td style="text-align: left"><code>mutate(rowwise(df), min(x, y))</code></td><td style="text-align: left"><code>transform(df, [:x, :y] =&gt; ByRow(min))</code></td></tr><tr><td style="text-align: left"></td><td style="text-align: left"><code>mutate(rowwise(df), which.max(c_across(matches(&quot;^x&quot;))))</code></td><td style="text-align: left"><code>transform(df, AsTable(r&quot;^x&quot;) =&gt; ByRow(argmax))</code></td></tr><tr><td style="text-align: left">DataFrame as input</td><td style="text-align: left"><code>summarize(df, head(across(), 2))</code></td><td style="text-align: left"><code>combine(d -&gt; first(d, 2), df)</code></td></tr><tr><td style="text-align: left">DataFrame as output</td><td style="text-align: left"><code>summarize(df, tibble(value = c(min(x), max(x))))</code></td><td style="text-align: left"><code>combine(df, :x =&gt; (x -&gt; (value = [minimum(x), maximum(x)],)) =&gt; AsTable)</code></td></tr></table><h2 id="Comparison-with-the-R-package-data.table"><a class="docs-heading-anchor" href="#Comparison-with-the-R-package-data.table">Comparison with the R package data.table</a><a id="Comparison-with-the-R-package-data.table-1"></a><a class="docs-heading-anchor-permalink" href="#Comparison-with-the-R-package-data.table" title="Permalink"></a></h2><p>The following table compares the main functions of DataFrames.jl with the R package data.table (version 1.14.1).</p><pre><code class="language-R hljs">library(data.table)
 df  &lt;- data.table(grp = rep(1:2, 3), x = 6:1, y = 4:9,
                   z = c(3:7, NA), id = letters[1:6])
-df2 &lt;- data.table(grp=c(1,3), w = c(10,11))</code></pre><table><tr><th style="text-align: left">Operation</th><th style="text-align: left">data.table</th><th style="text-align: left">DataFrames.jl</th></tr><tr><td style="text-align: left">Reduce multiple values</td><td style="text-align: left"><code>df[, .(mean(x))]</code></td><td style="text-align: left"><code>combine(df, :x =&gt; mean)</code></td></tr><tr><td style="text-align: left">Add new columns</td><td style="text-align: left"><code>df[, x_mean:=mean(x) ]</code></td><td style="text-align: left"><code>transform!(df, :x =&gt; mean =&gt; :x_mean)</code></td></tr><tr><td style="text-align: left">Rename column (in place)</td><td style="text-align: left"><code>setnames(df, &quot;x&quot;, &quot;x_new&quot;)</code></td><td style="text-align: left"><code>rename!(df, :x =&gt; :x_new)</code></td></tr><tr><td style="text-align: left">Rename multiple columns (in place)</td><td style="text-align: left"><code>setnames(df, c(&quot;x&quot;, &quot;y&quot;), c(&quot;x_new&quot;, &quot;y_new&quot;))</code></td><td style="text-align: left"><code>rename!(df, [:x, :y] .=&gt; [:x_new, :y_new])</code></td></tr><tr><td style="text-align: left">Pick columns as dataframe</td><td style="text-align: left"><code>df[, .(x, y)]</code></td><td style="text-align: left"><code>select(df, :x, :y)</code></td></tr><tr><td style="text-align: left">Pick column as a vector</td><td style="text-align: left"><code>df[, x]</code></td><td style="text-align: left"><code>df[!, :x]</code></td></tr><tr><td style="text-align: left">Remove columns</td><td style="text-align: left"><code>df[, -&quot;x&quot;]</code></td><td style="text-align: left"><code>select(df, Not(:x))</code></td></tr><tr><td style="text-align: left">Remove columns (in place)</td><td style="text-align: left"><code>df[, x:=NULL]</code></td><td style="text-align: left"><code>select!(df, Not(:x))</code></td></tr><tr><td style="text-align: left">Remove columns (in place)</td><td 
style="text-align: left"><code>df[, c(&quot;x&quot;, &quot;y&quot;):=NULL]</code></td><td style="text-align: left"><code>select!(df, Not([:x, :y]))</code></td></tr><tr><td style="text-align: left">Pick &amp; transform columns</td><td style="text-align: left"><code>df[, .(mean(x), y)]</code></td><td style="text-align: left"><code>select(df, :x =&gt; mean, :y)</code></td></tr><tr><td style="text-align: left">Pick rows</td><td style="text-align: left"><code>df[ x &gt;= 1 ]</code></td><td style="text-align: left"><code>filter(:x =&gt; &gt;=(1), df)</code></td></tr><tr><td style="text-align: left">Sort rows (in place)</td><td style="text-align: left"><code>setorder(df, x)</code></td><td style="text-align: left"><code>sort!(df, :x)</code></td></tr><tr><td style="text-align: left">Sort rows</td><td style="text-align: left"><code>df[ order(x) ]</code></td><td style="text-align: left"><code>sort(df, :x)</code></td></tr></table><h3 id="Grouping-data-and-aggregation-2"><a class="docs-heading-anchor" href="#Grouping-data-and-aggregation-2">Grouping data and aggregation</a><a class="docs-heading-anchor-permalink" href="#Grouping-data-and-aggregation-2" title="Permalink"></a></h3><table><tr><th style="text-align: left">Operation</th><th style="text-align: left">data.table</th><th style="text-align: left">DataFrames.jl</th></tr><tr><td style="text-align: left">Reduce multiple values</td><td style="text-align: left"><code>df[, mean(x), by=id ]</code></td><td style="text-align: left"><code>combine(groupby(df, :id), :x =&gt; mean)</code></td></tr><tr><td style="text-align: left">Add new columns (in place)</td><td style="text-align: left"><code>df[, x_mean:=mean(x), by=id]</code></td><td style="text-align: left"><code>transform!(groupby(df, :id), :x =&gt; mean)</code></td></tr><tr><td style="text-align: left">Pick &amp; transform columns</td><td style="text-align: left"><code>df[, .(x_mean = mean(x), y), by=id]</code></td><td style="text-align: left"><code>select(groupby(df, :id), :x 
=&gt; mean, :y)</code></td></tr></table><h3 id="More-advanced-commands-2"><a class="docs-heading-anchor" href="#More-advanced-commands-2">More advanced commands</a><a class="docs-heading-anchor-permalink" href="#More-advanced-commands-2" title="Permalink"></a></h3><table><tr><th style="text-align: left">Operation</th><th style="text-align: left">data.table</th><th style="text-align: left">DataFrames.jl</th></tr><tr><td style="text-align: left">Complex Function</td><td style="text-align: left"><code>df[, .(mean(x, na.rm=TRUE)) ]</code></td><td style="text-align: left"><code>combine(df, :x =&gt; x -&gt; mean(skipmissing(x)))</code></td></tr><tr><td style="text-align: left">Transform certain rows (in place)</td><td style="text-align: left"><code>df[x&lt;=0, x:=0]</code></td><td style="text-align: left"><code>df.x[df.x .&lt;= 0] .= 0</code></td></tr><tr><td style="text-align: left">Transform several columns</td><td style="text-align: left"><code>df[, .(max(x), min(y)) ]</code></td><td style="text-align: left"><code>combine(df, :x =&gt; maximum, :y =&gt; minimum)</code></td></tr><tr><td style="text-align: left"></td><td style="text-align: left"><code>df[, lapply(.SD, mean), .SDcols = c(&quot;x&quot;, &quot;y&quot;) ]</code></td><td style="text-align: left"><code>combine(df, [:x, :y] .=&gt; mean)</code></td></tr><tr><td style="text-align: left"></td><td style="text-align: left"><code>df[, lapply(.SD, mean), .SDcols = patterns(&quot;*x&quot;) ]</code></td><td style="text-align: left"><code>combine(df, names(df, r&quot;^x&quot;) .=&gt; mean)</code></td></tr><tr><td style="text-align: left"></td><td style="text-align: left"><code>df[, unlist(lapply(.SD, function(x) c(max=max(x), min=min(x)))), .SDcols = c(&quot;x&quot;, &quot;y&quot;) ]</code></td><td style="text-align: left"><code>combine(df, ([:x, :y] .=&gt; [maximum minimum])...)</code></td></tr><tr><td style="text-align: left">Multivariate function</td><td style="text-align: left"><code>df[, .(cor(x,y)) ]</code></td><td 
style="text-align: left"><code>transform(df, [:x, :y] =&gt; cor)</code></td></tr><tr><td style="text-align: left">Row-wise</td><td style="text-align: left"><code>df[, min_xy := min(x, y), by = 1:nrow(df)]</code></td><td style="text-align: left"><code>transform!(df, [:x, :y] =&gt; ByRow(min))</code></td></tr><tr><td style="text-align: left"></td><td style="text-align: left"><code>df[, argmax_xy := which.max(.SD) , .SDcols = patterns(&quot;*x&quot;), by = 1:nrow(df) ]</code></td><td style="text-align: left"><code>transform!(df, AsTable(r&quot;^x&quot;) =&gt; ByRow(argmax))</code></td></tr><tr><td style="text-align: left">DataFrame as output</td><td style="text-align: left"><code>df[, .SD[1], by=grp]</code></td><td style="text-align: left"><code>combine(groupby(df, :grp), first)</code></td></tr><tr><td style="text-align: left">DataFrame as output</td><td style="text-align: left"><code>df[, .SD[which.max(x)], by=grp]</code></td><td style="text-align: left"><code>combine(groupby(df, :grp), sdf -&gt; sdf[argmax(sdf.x), :])</code></td></tr></table><h3 id="Joining-data-frames-2"><a class="docs-heading-anchor" href="#Joining-data-frames-2">Joining data frames</a><a class="docs-heading-anchor-permalink" href="#Joining-data-frames-2" title="Permalink"></a></h3><table><tr><th style="text-align: left">Operation</th><th style="text-align: left">data.table</th><th style="text-align: left">DataFrames.jl</th></tr><tr><td style="text-align: left">Inner join</td><td style="text-align: left"><code>merge(df, df2, on = &quot;grp&quot;)</code></td><td style="text-align: left"><code>innerjoin(df, df2, on = :grp)</code></td></tr><tr><td style="text-align: left">Outer join</td><td style="text-align: left"><code>merge(df, df2, all = TRUE, on = &quot;grp&quot;)</code></td><td style="text-align: left"><code>outerjoin(df, df2, on = :grp)</code></td></tr><tr><td style="text-align: left">Left join</td><td style="text-align: left"><code>merge(df, df2, all.x = TRUE, on = 
&quot;grp&quot;)</code></td><td style="text-align: left"><code>leftjoin(df, df2, on = :grp)</code></td></tr><tr><td style="text-align: left">Right join</td><td style="text-align: left"><code>merge(df, df2, all.y = TRUE, on = &quot;grp&quot;)</code></td><td style="text-align: left"><code>rightjoin(df, df2, on = :grp)</code></td></tr><tr><td style="text-align: left">Anti join (filtering)</td><td style="text-align: left"><code>df[!df2, on = &quot;grp&quot; ]</code></td><td style="text-align: left"><code>antijoin(df, df2, on = :grp)</code></td></tr><tr><td style="text-align: left">Semi join (filtering)</td><td style="text-align: left"><code>merge(df1, df2[, .(grp)])</code></td><td style="text-align: left"><code>semijoin(df, df2, on = :grp)</code></td></tr></table><h2 id="Comparison-with-Stata-(version-8-and-above)"><a class="docs-heading-anchor" href="#Comparison-with-Stata-(version-8-and-above)">Comparison with Stata (version 8 and above)</a><a id="Comparison-with-Stata-(version-8-and-above)-1"></a><a class="docs-heading-anchor-permalink" href="#Comparison-with-Stata-(version-8-and-above)" title="Permalink"></a></h2><p>The following table compares the main functions of DataFrames.jl with Stata:</p><table><tr><th style="text-align: left">Operation</th><th style="text-align: left">Stata</th><th style="text-align: left">DataFrames.jl</th></tr><tr><td style="text-align: left">Reduce multiple values</td><td style="text-align: left"><code>collapse (mean) x</code></td><td style="text-align: left"><code>combine(df, :x =&gt; mean)</code></td></tr><tr><td style="text-align: left">Add new columns</td><td style="text-align: left"><code>egen x_mean = mean(x)</code></td><td style="text-align: left"><code>transform!(df, :x =&gt; mean =&gt; :x_mean)</code></td></tr><tr><td style="text-align: left">Rename columns</td><td style="text-align: left"><code>rename x x_new</code></td><td style="text-align: left"><code>rename!(df, :x =&gt; :x_new)</code></td></tr><tr><td style="text-align: 
left">Pick columns</td><td style="text-align: left"><code>keep x y</code></td><td style="text-align: left"><code>select!(df, :x, :y)</code></td></tr><tr><td style="text-align: left">Pick rows</td><td style="text-align: left"><code>keep if x &gt;= 1</code></td><td style="text-align: left"><code>subset!(df, :x =&gt; ByRow(x -&gt; x &gt;= 1))</code></td></tr><tr><td style="text-align: left">Sort rows</td><td style="text-align: left"><code>sort x</code></td><td style="text-align: left"><code>sort!(df, :x)</code></td></tr></table><p>Note that the suffix <code>!</code> (i.e. <code>transform!</code>, <code>select!</code>, etc) ensures that the operation transforms the dataframe in place, as in Stata</p><p>Some of these functions can be applied to grouped data frames, in which case they operate by group:</p><table><tr><th style="text-align: left">Operation</th><th style="text-align: left">Stata</th><th style="text-align: left">DataFrames.jl</th></tr><tr><td style="text-align: left">Add new columns</td><td style="text-align: left"><code>egen x_mean = mean(x), by(grp)</code></td><td style="text-align: left"><code>transform!(groupby(df, :grp), :x =&gt; mean)</code></td></tr><tr><td style="text-align: left">Reduce multiple values</td><td style="text-align: left"><code>collapse (mean) x, by(grp)</code></td><td style="text-align: left"><code>combine(groupby(df, :grp), :x =&gt; mean)</code></td></tr></table><p>The table below compares more advanced commands:</p><table><tr><th style="text-align: left">Operation</th><th style="text-align: left">Stata</th><th style="text-align: left">DataFrames.jl</th></tr><tr><td style="text-align: left">Transform certain rows</td><td style="text-align: left"><code>replace x = 0 if x &lt;= 0</code></td><td style="text-align: left"><code>transform(df, :x =&gt; (x -&gt; ifelse.(x .&lt;= 0, 0, x)) =&gt; :x)</code></td></tr><tr><td style="text-align: left">Transform several columns</td><td style="text-align: left"><code>collapse (max) x (min) 
y</code></td><td style="text-align: left"><code>combine(df, :x =&gt; maximum,  :y =&gt; minimum)</code></td></tr><tr><td style="text-align: left"></td><td style="text-align: left"><code>collapse (mean) x y</code></td><td style="text-align: left"><code>combine(df, [:x, :y] .=&gt; mean)</code></td></tr><tr><td style="text-align: left"></td><td style="text-align: left"><code>collapse (mean) x*</code></td><td style="text-align: left"><code>combine(df, names(df, r&quot;^x&quot;) .=&gt; mean)</code></td></tr><tr><td style="text-align: left"></td><td style="text-align: left"><code>collapse (max) x y (min) x y</code></td><td style="text-align: left"><code>combine(df, ([:x, :y] .=&gt; [maximum minimum])...)</code></td></tr><tr><td style="text-align: left">Multivariate function</td><td style="text-align: left"><code>egen z = corr(x y)</code></td><td style="text-align: left"><code>transform!(df, [:x, :y] =&gt; cor =&gt; :z)</code></td></tr><tr><td style="text-align: left">Row-wise</td><td style="text-align: left"><code>egen z = rowmin(x y)</code></td><td style="text-align: left"><code>transform!(df, [:x, :y] =&gt; ByRow(min) =&gt; :z)</code></td></tr></table></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../querying_frameworks/">« Data manipulation frameworks</a><a class="docs-footer-nextpage" href="../../lib/types/">Types »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option 
value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.7.0 on <span class="colophon-date" title="Saturday 7 September 2024 11:00">Saturday 7 September 2024</span>. Using Julia version 1.10.5.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
+df2 &lt;- data.table(grp=c(1,3), w = c(10,11))</code></pre><table><tr><th style="text-align: left">Operation</th><th style="text-align: left">data.table</th><th style="text-align: left">DataFrames.jl</th></tr><tr><td style="text-align: left">Reduce multiple values</td><td style="text-align: left"><code>df[, .(mean(x))]</code></td><td style="text-align: left"><code>combine(df, :x =&gt; mean)</code></td></tr><tr><td style="text-align: left">Add new columns</td><td style="text-align: left"><code>df[, x_mean:=mean(x) ]</code></td><td style="text-align: left"><code>transform!(df, :x =&gt; mean =&gt; :x_mean)</code></td></tr><tr><td style="text-align: left">Rename column (in place)</td><td style="text-align: left"><code>setnames(df, &quot;x&quot;, &quot;x_new&quot;)</code></td><td style="text-align: left"><code>rename!(df, :x =&gt; :x_new)</code></td></tr><tr><td style="text-align: left">Rename multiple columns (in place)</td><td style="text-align: left"><code>setnames(df, c(&quot;x&quot;, &quot;y&quot;), c(&quot;x_new&quot;, &quot;y_new&quot;))</code></td><td style="text-align: left"><code>rename!(df, [:x, :y] .=&gt; [:x_new, :y_new])</code></td></tr><tr><td style="text-align: left">Pick columns as dataframe</td><td style="text-align: left"><code>df[, .(x, y)]</code></td><td style="text-align: left"><code>select(df, :x, :y)</code></td></tr><tr><td style="text-align: left">Pick column as a vector</td><td style="text-align: left"><code>df[, x]</code></td><td style="text-align: left"><code>df[!, :x]</code></td></tr><tr><td style="text-align: left">Remove columns</td><td style="text-align: left"><code>df[, -&quot;x&quot;]</code></td><td style="text-align: left"><code>select(df, Not(:x))</code></td></tr><tr><td style="text-align: left">Remove columns (in place)</td><td style="text-align: left"><code>df[, x:=NULL]</code></td><td style="text-align: left"><code>select!(df, Not(:x))</code></td></tr><tr><td style="text-align: left">Remove columns (in place)</td><td 
style="text-align: left"><code>df[, c(&quot;x&quot;, &quot;y&quot;):=NULL]</code></td><td style="text-align: left"><code>select!(df, Not([:x, :y]))</code></td></tr><tr><td style="text-align: left">Pick &amp; transform columns</td><td style="text-align: left"><code>df[, .(mean(x), y)]</code></td><td style="text-align: left"><code>select(df, :x =&gt; mean, :y)</code></td></tr><tr><td style="text-align: left">Pick rows</td><td style="text-align: left"><code>df[ x &gt;= 1 ]</code></td><td style="text-align: left"><code>filter(:x =&gt; &gt;=(1), df)</code></td></tr><tr><td style="text-align: left">Sort rows (in place)</td><td style="text-align: left"><code>setorder(df, x)</code></td><td style="text-align: left"><code>sort!(df, :x)</code></td></tr><tr><td style="text-align: left">Sort rows</td><td style="text-align: left"><code>df[ order(x) ]</code></td><td style="text-align: left"><code>sort(df, :x)</code></td></tr></table><h3 id="Grouping-data-and-aggregation-2"><a class="docs-heading-anchor" href="#Grouping-data-and-aggregation-2">Grouping data and aggregation</a><a class="docs-heading-anchor-permalink" href="#Grouping-data-and-aggregation-2" title="Permalink"></a></h3><table><tr><th style="text-align: left">Operation</th><th style="text-align: left">data.table</th><th style="text-align: left">DataFrames.jl</th></tr><tr><td style="text-align: left">Reduce multiple values</td><td style="text-align: left"><code>df[, mean(x), by=id ]</code></td><td style="text-align: left"><code>combine(groupby(df, :id), :x =&gt; mean)</code></td></tr><tr><td style="text-align: left">Add new columns (in place)</td><td style="text-align: left"><code>df[, x_mean:=mean(x), by=id]</code></td><td style="text-align: left"><code>transform!(groupby(df, :id), :x =&gt; mean)</code></td></tr><tr><td style="text-align: left">Pick &amp; transform columns</td><td style="text-align: left"><code>df[, .(x_mean = mean(x), y), by=id]</code></td><td style="text-align: left"><code>select(groupby(df, :id), :x 
=&gt; mean, :y)</code></td></tr></table><h3 id="More-advanced-commands-2"><a class="docs-heading-anchor" href="#More-advanced-commands-2">More advanced commands</a><a class="docs-heading-anchor-permalink" href="#More-advanced-commands-2" title="Permalink"></a></h3><table><tr><th style="text-align: left">Operation</th><th style="text-align: left">data.table</th><th style="text-align: left">DataFrames.jl</th></tr><tr><td style="text-align: left">Complex Function</td><td style="text-align: left"><code>df[, .(mean(x, na.rm=TRUE)) ]</code></td><td style="text-align: left"><code>combine(df, :x =&gt; x -&gt; mean(skipmissing(x)))</code></td></tr><tr><td style="text-align: left">Transform certain rows (in place)</td><td style="text-align: left"><code>df[x&lt;=0, x:=0]</code></td><td style="text-align: left"><code>df.x[df.x .&lt;= 0] .= 0</code></td></tr><tr><td style="text-align: left">Transform several columns</td><td style="text-align: left"><code>df[, .(max(x), min(y)) ]</code></td><td style="text-align: left"><code>combine(df, :x =&gt; maximum, :y =&gt; minimum)</code></td></tr><tr><td style="text-align: left"></td><td style="text-align: left"><code>df[, lapply(.SD, mean), .SDcols = c(&quot;x&quot;, &quot;y&quot;) ]</code></td><td style="text-align: left"><code>combine(df, [:x, :y] .=&gt; mean)</code></td></tr><tr><td style="text-align: left"></td><td style="text-align: left"><code>df[, lapply(.SD, mean), .SDcols = patterns(&quot;*x&quot;) ]</code></td><td style="text-align: left"><code>combine(df, names(df, r&quot;^x&quot;) .=&gt; mean)</code></td></tr><tr><td style="text-align: left"></td><td style="text-align: left"><code>df[, unlist(lapply(.SD, function(x) c(max=max(x), min=min(x)))), .SDcols = c(&quot;x&quot;, &quot;y&quot;) ]</code></td><td style="text-align: left"><code>combine(df, ([:x, :y] .=&gt; [maximum minimum])...)</code></td></tr><tr><td style="text-align: left">Multivariate function</td><td style="text-align: left"><code>df[, .(cor(x,y)) ]</code></td><td 
style="text-align: left"><code>transform(df, [:x, :y] =&gt; cor)</code></td></tr><tr><td style="text-align: left">Row-wise</td><td style="text-align: left"><code>df[, min_xy := min(x, y), by = 1:nrow(df)]</code></td><td style="text-align: left"><code>transform!(df, [:x, :y] =&gt; ByRow(min))</code></td></tr><tr><td style="text-align: left"></td><td style="text-align: left"><code>df[, argmax_xy := which.max(.SD) , .SDcols = patterns(&quot;*x&quot;), by = 1:nrow(df) ]</code></td><td style="text-align: left"><code>transform!(df, AsTable(r&quot;^x&quot;) =&gt; ByRow(argmax))</code></td></tr><tr><td style="text-align: left">DataFrame as output</td><td style="text-align: left"><code>df[, .SD[1], by=grp]</code></td><td style="text-align: left"><code>combine(groupby(df, :grp), first)</code></td></tr><tr><td style="text-align: left">DataFrame as output</td><td style="text-align: left"><code>df[, .SD[which.max(x)], by=grp]</code></td><td style="text-align: left"><code>combine(groupby(df, :grp), sdf -&gt; sdf[argmax(sdf.x), :])</code></td></tr></table><h3 id="Joining-data-frames-2"><a class="docs-heading-anchor" href="#Joining-data-frames-2">Joining data frames</a><a class="docs-heading-anchor-permalink" href="#Joining-data-frames-2" title="Permalink"></a></h3><table><tr><th style="text-align: left">Operation</th><th style="text-align: left">data.table</th><th style="text-align: left">DataFrames.jl</th></tr><tr><td style="text-align: left">Inner join</td><td style="text-align: left"><code>merge(df, df2, on = &quot;grp&quot;)</code></td><td style="text-align: left"><code>innerjoin(df, df2, on = :grp)</code></td></tr><tr><td style="text-align: left">Outer join</td><td style="text-align: left"><code>merge(df, df2, all = TRUE, on = &quot;grp&quot;)</code></td><td style="text-align: left"><code>outerjoin(df, df2, on = :grp)</code></td></tr><tr><td style="text-align: left">Left join</td><td style="text-align: left"><code>merge(df, df2, all.x = TRUE, on = 
&quot;grp&quot;)</code></td><td style="text-align: left"><code>leftjoin(df, df2, on = :grp)</code></td></tr><tr><td style="text-align: left">Right join</td><td style="text-align: left"><code>merge(df, df2, all.y = TRUE, on = &quot;grp&quot;)</code></td><td style="text-align: left"><code>rightjoin(df, df2, on = :grp)</code></td></tr><tr><td style="text-align: left">Anti join (filtering)</td><td style="text-align: left"><code>df[!df2, on = &quot;grp&quot; ]</code></td><td style="text-align: left"><code>antijoin(df, df2, on = :grp)</code></td></tr><tr><td style="text-align: left">Semi join (filtering)</td><td style="text-align: left"><code>merge(df1, df2[, .(grp)])</code></td><td style="text-align: left"><code>semijoin(df, df2, on = :grp)</code></td></tr></table><h2 id="Comparison-with-Stata-(version-8-and-above)"><a class="docs-heading-anchor" href="#Comparison-with-Stata-(version-8-and-above)">Comparison with Stata (version 8 and above)</a><a id="Comparison-with-Stata-(version-8-and-above)-1"></a><a class="docs-heading-anchor-permalink" href="#Comparison-with-Stata-(version-8-and-above)" title="Permalink"></a></h2><p>The following table compares the main functions of DataFrames.jl with Stata:</p><table><tr><th style="text-align: left">Operation</th><th style="text-align: left">Stata</th><th style="text-align: left">DataFrames.jl</th></tr><tr><td style="text-align: left">Reduce multiple values</td><td style="text-align: left"><code>collapse (mean) x</code></td><td style="text-align: left"><code>combine(df, :x =&gt; mean)</code></td></tr><tr><td style="text-align: left">Add new columns</td><td style="text-align: left"><code>egen x_mean = mean(x)</code></td><td style="text-align: left"><code>transform!(df, :x =&gt; mean =&gt; :x_mean)</code></td></tr><tr><td style="text-align: left">Rename columns</td><td style="text-align: left"><code>rename x x_new</code></td><td style="text-align: left"><code>rename!(df, :x =&gt; :x_new)</code></td></tr><tr><td style="text-align: 
left">Pick columns</td><td style="text-align: left"><code>keep x y</code></td><td style="text-align: left"><code>select!(df, :x, :y)</code></td></tr><tr><td style="text-align: left">Pick rows</td><td style="text-align: left"><code>keep if x &gt;= 1</code></td><td style="text-align: left"><code>subset!(df, :x =&gt; ByRow(x -&gt; x &gt;= 1))</code></td></tr><tr><td style="text-align: left">Sort rows</td><td style="text-align: left"><code>sort x</code></td><td style="text-align: left"><code>sort!(df, :x)</code></td></tr></table><p>Note that the suffix <code>!</code> (i.e. <code>transform!</code>, <code>select!</code>, etc) ensures that the operation transforms the dataframe in place, as in Stata</p><p>Some of these functions can be applied to grouped data frames, in which case they operate by group:</p><table><tr><th style="text-align: left">Operation</th><th style="text-align: left">Stata</th><th style="text-align: left">DataFrames.jl</th></tr><tr><td style="text-align: left">Add new columns</td><td style="text-align: left"><code>egen x_mean = mean(x), by(grp)</code></td><td style="text-align: left"><code>transform!(groupby(df, :grp), :x =&gt; mean)</code></td></tr><tr><td style="text-align: left">Reduce multiple values</td><td style="text-align: left"><code>collapse (mean) x, by(grp)</code></td><td style="text-align: left"><code>combine(groupby(df, :grp), :x =&gt; mean)</code></td></tr></table><p>The table below compares more advanced commands:</p><table><tr><th style="text-align: left">Operation</th><th style="text-align: left">Stata</th><th style="text-align: left">DataFrames.jl</th></tr><tr><td style="text-align: left">Transform certain rows</td><td style="text-align: left"><code>replace x = 0 if x &lt;= 0</code></td><td style="text-align: left"><code>transform(df, :x =&gt; (x -&gt; ifelse.(x .&lt;= 0, 0, x)) =&gt; :x)</code></td></tr><tr><td style="text-align: left">Transform several columns</td><td style="text-align: left"><code>collapse (max) x (min) 
y</code></td><td style="text-align: left"><code>combine(df, :x =&gt; maximum,  :y =&gt; minimum)</code></td></tr><tr><td style="text-align: left"></td><td style="text-align: left"><code>collapse (mean) x y</code></td><td style="text-align: left"><code>combine(df, [:x, :y] .=&gt; mean)</code></td></tr><tr><td style="text-align: left"></td><td style="text-align: left"><code>collapse (mean) x*</code></td><td style="text-align: left"><code>combine(df, names(df, r&quot;^x&quot;) .=&gt; mean)</code></td></tr><tr><td style="text-align: left"></td><td style="text-align: left"><code>collapse (max) x y (min) x y</code></td><td style="text-align: left"><code>combine(df, ([:x, :y] .=&gt; [maximum minimum])...)</code></td></tr><tr><td style="text-align: left">Multivariate function</td><td style="text-align: left"><code>egen z = corr(x y)</code></td><td style="text-align: left"><code>transform!(df, [:x, :y] =&gt; cor =&gt; :z)</code></td></tr><tr><td style="text-align: left">Row-wise</td><td style="text-align: left"><code>egen z = rowmin(x y)</code></td><td style="text-align: left"><code>transform!(df, [:x, :y] =&gt; ByRow(min) =&gt; :z)</code></td></tr></table></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../querying_frameworks/">« Data manipulation frameworks</a><a class="docs-footer-nextpage" href="../../lib/types/">Types »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option 
value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.7.0 on <span class="colophon-date" title="Sunday 8 September 2024 08:54">Sunday 8 September 2024</span>. Using Julia version 1.10.5.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
diff --git a/dev/man/getting_started/index.html b/dev/man/getting_started/index.html
index e606f9516..c09be72b7 100644
--- a/dev/man/getting_started/index.html
+++ b/dev/man/getting_started/index.html
@@ -264,4 +264,4 @@
 julia&gt; Tables.rowtable(df)
 2-element Vector{@NamedTuple{a::Int64, b::Int64}}:
  (a = 1, b = 2)
- (a = 3, b = 4)</code></pre></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../basics/">« First Steps with DataFrames.jl</a><a class="docs-footer-nextpage" href="../working_with_dataframes/">Working with DataFrames »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.7.0 on <span class="colophon-date" title="Saturday 7 September 2024 11:00">Saturday 7 September 2024</span>. Using Julia version 1.10.5.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
+ (a = 3, b = 4)</code></pre></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../basics/">« First Steps with DataFrames.jl</a><a class="docs-footer-nextpage" href="../working_with_dataframes/">Working with DataFrames »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.7.0 on <span class="colophon-date" title="Sunday 8 September 2024 08:54">Sunday 8 September 2024</span>. Using Julia version 1.10.5.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
diff --git a/dev/man/importing_and_exporting/index.html b/dev/man/importing_and_exporting/index.html
index bbe7ef8bb..8f1a4eb1d 100644
--- a/dev/man/importing_and_exporting/index.html
+++ b/dev/man/importing_and_exporting/index.html
@@ -51,4 +51,4 @@
  148 │         6.5         3.0          5.2         2.0  Iris-virginica
  149 │         6.2         3.4          5.4         2.3  Iris-virginica
  150 │         5.9         3.0          5.1         1.8  Iris-virginica
-                                                        135 rows omitted</code></pre><p>Observe that in our example:</p><ul><li><code>header</code> is a <code>Matrix</code> therefore we had to pass <code>vec(header)</code> to the <code>DataFrame</code> constructor;</li><li>we broadcasted the <code>identity</code> function over the <code>iris_raw</code> data frame to perform narrowing of <code>eltype</code> of columns of <code>iris_raw</code>; the reason is that read in by the <code>readdlm</code> function is stored into a <code>data</code> <code>Matrix</code> so all columns in <code>iris_raw</code> initially have the same <code>eltype</code> – in this case it had to be <code>Any</code> as some of the columns are numeric and some are string.</li></ul><p>All such operations (and many more) are automatically handled by CSV.jl.</p><p>Similarly, you can use the <code>writedlm</code> function from the <code>DelimitedFiles</code> module to save a data frame like this:</p><pre><code class="language-julia hljs">writedlm(&quot;test.csv&quot;, Iterators.flatten(([names(iris)], eachrow(iris))), &#39;,&#39;)</code></pre><p>As you can see the code required to transform <code>iris</code> into a proper input to the <code>writedlm</code> function so that you can create the CSV file having the expected format is not easy. 
Therefore CSV.jl is the preferred package to write CSV files for data stored in data frames.</p><h2 id="Other-formats"><a class="docs-heading-anchor" href="#Other-formats">Other formats</a><a id="Other-formats-1"></a><a class="docs-heading-anchor-permalink" href="#Other-formats" title="Permalink"></a></h2><p>Other data formats are supported for reading and writing in the following packages (non exhaustive list):</p><ul><li>Apache Arrow (including Feather v2): <a href="https://github.com/JuliaData/Arrow.jl">Arrow.jl</a></li><li>Apache Feather (v1): <a href="https://github.com/JuliaData/Feather.jl">Feather.jl</a></li><li>Apache Avro: <a href="https://github.com/JuliaData/Avro.jl">Avro.jl</a></li><li>JSON: <a href="https://github.com/JuliaData/JSONTables.jl">JSONTables.jl</a></li><li>Parquet: <a href="https://gitlab.com/ExpandingMan/Parquet2.jl">Parquet2.jl</a></li><li>Stata, SAS and SPSS: <a href="https://github.com/junyuan-chen/ReadStatTables.jl">ReadStatTables.jl</a> (alternatively <a href="https://www.queryverse.org/">Queryverse</a>  users can choose <a href="https://github.com/queryverse/StatFiles.jl">StatFiles.jl</a>)</li><li>reading R data files (.rda, .RData): <a href="https://github.com/JuliaData/RData.jl">RData.jl</a></li><li>Microsoft Excel (XLSX): <a href="https://github.com/felipenoris/XLSX.jl">XLSX.jl</a></li><li>Copying/pasting to clipboard, for sending data to and from spreadsheets: <a href="https://github.com/pdeffebach/ClipData.jl">ClipData.jl</a></li></ul></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../working_with_dataframes/">« Working with DataFrames</a><a class="docs-footer-nextpage" href="../joins/">Joins »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div 
class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.7.0 on <span class="colophon-date" title="Saturday 7 September 2024 11:00">Saturday 7 September 2024</span>. Using Julia version 1.10.5.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
+                                                        135 rows omitted</code></pre><p>Observe that in our example:</p><ul><li><code>header</code> is a <code>Matrix</code> therefore we had to pass <code>vec(header)</code> to the <code>DataFrame</code> constructor;</li><li>we broadcasted the <code>identity</code> function over the <code>iris_raw</code> data frame to perform narrowing of <code>eltype</code> of columns of <code>iris_raw</code>; the reason is that read in by the <code>readdlm</code> function is stored into a <code>data</code> <code>Matrix</code> so all columns in <code>iris_raw</code> initially have the same <code>eltype</code> – in this case it had to be <code>Any</code> as some of the columns are numeric and some are string.</li></ul><p>All such operations (and many more) are automatically handled by CSV.jl.</p><p>Similarly, you can use the <code>writedlm</code> function from the <code>DelimitedFiles</code> module to save a data frame like this:</p><pre><code class="language-julia hljs">writedlm(&quot;test.csv&quot;, Iterators.flatten(([names(iris)], eachrow(iris))), &#39;,&#39;)</code></pre><p>As you can see the code required to transform <code>iris</code> into a proper input to the <code>writedlm</code> function so that you can create the CSV file having the expected format is not easy. 
Therefore CSV.jl is the preferred package to write CSV files for data stored in data frames.</p><h2 id="Other-formats"><a class="docs-heading-anchor" href="#Other-formats">Other formats</a><a id="Other-formats-1"></a><a class="docs-heading-anchor-permalink" href="#Other-formats" title="Permalink"></a></h2><p>Other data formats are supported for reading and writing in the following packages (non exhaustive list):</p><ul><li>Apache Arrow (including Feather v2): <a href="https://github.com/JuliaData/Arrow.jl">Arrow.jl</a></li><li>Apache Feather (v1): <a href="https://github.com/JuliaData/Feather.jl">Feather.jl</a></li><li>Apache Avro: <a href="https://github.com/JuliaData/Avro.jl">Avro.jl</a></li><li>JSON: <a href="https://github.com/JuliaData/JSONTables.jl">JSONTables.jl</a></li><li>Parquet: <a href="https://gitlab.com/ExpandingMan/Parquet2.jl">Parquet2.jl</a></li><li>Stata, SAS and SPSS: <a href="https://github.com/junyuan-chen/ReadStatTables.jl">ReadStatTables.jl</a> (alternatively <a href="https://www.queryverse.org/">Queryverse</a>  users can choose <a href="https://github.com/queryverse/StatFiles.jl">StatFiles.jl</a>)</li><li>reading R data files (.rda, .RData): <a href="https://github.com/JuliaData/RData.jl">RData.jl</a></li><li>Microsoft Excel (XLSX): <a href="https://github.com/felipenoris/XLSX.jl">XLSX.jl</a></li><li>Copying/pasting to clipboard, for sending data to and from spreadsheets: <a href="https://github.com/pdeffebach/ClipData.jl">ClipData.jl</a></li></ul></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../working_with_dataframes/">« Working with DataFrames</a><a class="docs-footer-nextpage" href="../joins/">Joins »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div 
class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.7.0 on <span class="colophon-date" title="Sunday 8 September 2024 08:54">Sunday 8 September 2024</span>. Using Julia version 1.10.5.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
diff --git a/dev/man/joins/index.html b/dev/man/joins/index.html
index 4a56b6156..15aad96b5 100644
--- a/dev/man/joins/index.html
+++ b/dev/man/joins/index.html
@@ -283,4 +283,4 @@
    2 │     2      2  a
    3 │     3      3  missing
    4 │     4      4  b</code></pre><p>Note that in this case the order and number of rows in the left table is not changed. Therefore, in particular, it is not allowed to have duplicate keys in the right table:</p><pre><code class="nohighlight hljs">julia&gt; leftjoin!(main, DataFrame(id=[2, 2], info_bad=[&quot;a&quot;, &quot;b&quot;]), on=:id)
-ERROR: ArgumentError: duplicate rows found in right table</code></pre></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../importing_and_exporting/">« Importing and Exporting Data (I/O)</a><a class="docs-footer-nextpage" href="../split_apply_combine/">Split-apply-combine »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.7.0 on <span class="colophon-date" title="Saturday 7 September 2024 11:00">Saturday 7 September 2024</span>. Using Julia version 1.10.5.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
+ERROR: ArgumentError: duplicate rows found in right table</code></pre></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../importing_and_exporting/">« Importing and Exporting Data (I/O)</a><a class="docs-footer-nextpage" href="../split_apply_combine/">Split-apply-combine »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.7.0 on <span class="colophon-date" title="Sunday 8 September 2024 08:54">Sunday 8 September 2024</span>. Using Julia version 1.10.5.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
diff --git a/dev/man/missing/index.html b/dev/man/missing/index.html
index 51c2ad743..7e2cec70a 100644
--- a/dev/man/missing/index.html
+++ b/dev/man/missing/index.html
@@ -137,4 +137,4 @@
 
 julia&gt; missings(Int, 1, 3)
 1×3 Matrix{Union{Missing, Int64}}:
- missing  missing  missing</code></pre><p>See the <a href="https://docs.julialang.org/en/v1/manual/missing/">Julia manual</a> for more information about missing values.</p></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../categorical/">« Categorical Data</a><a class="docs-footer-nextpage" href="../querying_frameworks/">Data manipulation frameworks »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.7.0 on <span class="colophon-date" title="Saturday 7 September 2024 11:00">Saturday 7 September 2024</span>. Using Julia version 1.10.5.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
+ missing  missing  missing</code></pre><p>See the <a href="https://docs.julialang.org/en/v1/manual/missing/">Julia manual</a> for more information about missing values.</p></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../categorical/">« Categorical Data</a><a class="docs-footer-nextpage" href="../querying_frameworks/">Data manipulation frameworks »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.7.0 on <span class="colophon-date" title="Sunday 8 September 2024 08:54">Sunday 8 September 2024</span>. Using Julia version 1.10.5.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
diff --git a/dev/man/querying_frameworks/index.html b/dev/man/querying_frameworks/index.html
index dcbb14701..bb095d2f9 100644
--- a/dev/man/querying_frameworks/index.html
+++ b/dev/man/querying_frameworks/index.html
@@ -242,4 +242,4 @@
        end
 1-element Vector{String}:
  &quot;Roger&quot;
-</code></pre><p>A query that ends with a <code>@collect</code> statement without a specific type will materialize the query results into an array. Note also the difference in the <code>@select</code> statement: The previous queries all used the <code>{}</code> syntax in the <code>@select</code> statement to project results into a tabular format. The last query instead just selects a single value from each row in the <code>@select</code> statement.</p><p>These examples only scratch the surface of what one can do with <a href="https://github.com/queryverse/Query.jl">Query.jl</a>, and the interested reader is referred to the <a href="http://www.queryverse.org/Query.jl/stable/">Query.jl documentation</a> for more information.</p></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../missing/">« Missing Data</a><a class="docs-footer-nextpage" href="../comparisons/">Comparison with Python/R/Stata »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a 
href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.7.0 on <span class="colophon-date" title="Saturday 7 September 2024 11:00">Saturday 7 September 2024</span>. Using Julia version 1.10.5.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
+</code></pre><p>A query that ends with a <code>@collect</code> statement without a specific type will materialize the query results into an array. Note also the difference in the <code>@select</code> statement: The previous queries all used the <code>{}</code> syntax in the <code>@select</code> statement to project results into a tabular format. The last query instead just selects a single value from each row in the <code>@select</code> statement.</p><p>These examples only scratch the surface of what one can do with <a href="https://github.com/queryverse/Query.jl">Query.jl</a>, and the interested reader is referred to the <a href="http://www.queryverse.org/Query.jl/stable/">Query.jl documentation</a> for more information.</p></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../missing/">« Missing Data</a><a class="docs-footer-nextpage" href="../comparisons/">Comparison with Python/R/Stata »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a 
href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.7.0 on <span class="colophon-date" title="Sunday 8 September 2024 08:54">Sunday 8 September 2024</span>. Using Julia version 1.10.5.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
diff --git a/dev/man/reshaping_and_pivoting/index.html b/dev/man/reshaping_and_pivoting/index.html
index cc286e551..101a13fb4 100644
--- a/dev/man/reshaping_and_pivoting/index.html
+++ b/dev/man/reshaping_and_pivoting/index.html
@@ -316,4 +316,4 @@
 ─────┼─────────────────────────────
    1 │ b               1     two
    2 │ c               3     4
-   3 │ d               true  false</code></pre></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../split_apply_combine/">« Split-apply-combine</a><a class="docs-footer-nextpage" href="../sorting/">Sorting »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.7.0 on <span class="colophon-date" title="Saturday 7 September 2024 11:00">Saturday 7 September 2024</span>. Using Julia version 1.10.5.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
+   3 │ d               true  false</code></pre></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../split_apply_combine/">« Split-apply-combine</a><a class="docs-footer-nextpage" href="../sorting/">Sorting »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.7.0 on <span class="colophon-date" title="Sunday 8 September 2024 08:54">Sunday 8 September 2024</span>. Using Julia version 1.10.5.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
diff --git a/dev/man/sorting/index.html b/dev/man/sorting/index.html
index fdee99250..5effcb4fa 100644
--- a/dev/man/sorting/index.html
+++ b/dev/man/sorting/index.html
@@ -158,4 +158,4 @@
  148 │         5.1         3.3          1.7         0.5  Iris-setosa
  149 │         5.1         3.8          1.9         0.4  Iris-setosa
  150 │         4.8         3.4          1.9         0.2  Iris-setosa
-                                                        135 rows omitted</code></pre></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../reshaping_and_pivoting/">« Reshaping</a><a class="docs-footer-nextpage" href="../categorical/">Categorical Data »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.7.0 on <span class="colophon-date" title="Saturday 7 September 2024 11:00">Saturday 7 September 2024</span>. Using Julia version 1.10.5.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
+                                                        135 rows omitted</code></pre></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../reshaping_and_pivoting/">« Reshaping</a><a class="docs-footer-nextpage" href="../categorical/">Categorical Data »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.7.0 on <span class="colophon-date" title="Sunday 8 September 2024 08:54">Sunday 8 September 2024</span>. Using Julia version 1.10.5.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
diff --git a/dev/man/split_apply_combine/index.html b/dev/man/split_apply_combine/index.html
index 86dce0935..2c514c214 100644
--- a/dev/man/split_apply_combine/index.html
+++ b/dev/man/split_apply_combine/index.html
@@ -814,4 +814,4 @@
 3-element DataFrames.GroupKeys{GroupedDataFrame{DataFrame}}:
  GroupKey: (customer_id = &quot;c&quot;,)
  GroupKey: (customer_id = &quot;b&quot;,)
- GroupKey: (customer_id = &quot;a&quot;,)</code></pre></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../joins/">« Joins</a><a class="docs-footer-nextpage" href="../reshaping_and_pivoting/">Reshaping »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.7.0 on <span class="colophon-date" title="Saturday 7 September 2024 11:00">Saturday 7 September 2024</span>. Using Julia version 1.10.5.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
+ GroupKey: (customer_id = &quot;a&quot;,)</code></pre></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../joins/">« Joins</a><a class="docs-footer-nextpage" href="../reshaping_and_pivoting/">Reshaping »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.7.0 on <span class="colophon-date" title="Sunday 8 September 2024 08:54">Sunday 8 September 2024</span>. Using Julia version 1.10.5.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
diff --git a/dev/man/working_with_dataframes/index.html b/dev/man/working_with_dataframes/index.html
index f11767165..3eaf06ac1 100644
--- a/dev/man/working_with_dataframes/index.html
+++ b/dev/man/working_with_dataframes/index.html
@@ -710,4 +710,4 @@
    1 │ a             1  missing  x
    2 │ missing       2  j        y
    3 │ b             3  k        missing
-   4 │ missing       4  h        z</code></pre></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../getting_started/">« Getting Started</a><a class="docs-footer-nextpage" href="../importing_and_exporting/">Importing and Exporting Data (I/O) »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.7.0 on <span class="colophon-date" title="Saturday 7 September 2024 11:00">Saturday 7 September 2024</span>. Using Julia version 1.10.5.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>
+   4 │ missing       4  h        z</code></pre></article><nav class="docs-footer"><a class="docs-footer-prevpage" href="../getting_started/">« Getting Started</a><a class="docs-footer-nextpage" href="../importing_and_exporting/">Importing and Exporting Data (I/O) »</a><div class="flexbox-break"></div><p class="footer-message">Powered by <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> and the <a href="https://julialang.org/">Julia Programming Language</a>.</p></nav></div><div class="modal" id="documenter-settings"><div class="modal-background"></div><div class="modal-card"><header class="modal-card-head"><p class="modal-card-title">Settings</p><button class="delete"></button></header><section class="modal-card-body"><p><label class="label">Theme</label><div class="select"><select id="documenter-themepicker"><option value="auto">Automatic (OS)</option><option value="documenter-light">documenter-light</option><option value="documenter-dark">documenter-dark</option><option value="catppuccin-latte">catppuccin-latte</option><option value="catppuccin-frappe">catppuccin-frappe</option><option value="catppuccin-macchiato">catppuccin-macchiato</option><option value="catppuccin-mocha">catppuccin-mocha</option></select></div></p><hr/><p>This document was generated with <a href="https://github.com/JuliaDocs/Documenter.jl">Documenter.jl</a> version 1.7.0 on <span class="colophon-date" title="Sunday 8 September 2024 08:54">Sunday 8 September 2024</span>. Using Julia version 1.10.5.</p></section><footer class="modal-card-foot"></footer></div></div></div></body></html>

Type	`names`	`propertynames`	`keys`	`length`	`ndims`
`AbstractDataFrame`	`Vector{String}`	`Vector{Symbol}`	undefined	undefined	`2`
`DataFrameRow`	`Vector{String}`	`Vector{Symbol}`	`Vector{Symbol}`	`Int`	`1`
`DataFrameRows`	`Vector{String}`	`Vector{Symbol}`	vector of `Int`	`Int`	`1`
`DataFrameColumns`	`Vector{String}`	`Vector{Symbol}`	`Vector{Symbol}`	`Int`	`1`
`GroupedDataFrame`	`Vector{String}`	tuple of fields	`GroupKeys`	`Int`	`1`
`GroupKeys`	undefined	tuple of fields	vector of `Int`	`Int`	`1`
`GroupKey`	`Vector{String}`	`Vector{Symbol}`	`Vector{Symbol}`	`Int`	`1`
Operation	dplyr	DataFrames.jl
Reduce multiple values	`summarize(df, mean(x))`	`combine(df, :x => mean)`
Add new columns	`mutate(df, x_mean = mean(x))`	`transform(df, :x => mean => :x_mean)`
Rename columns	`rename(df, x_new = x)`	`rename(df, :x => :x_new)`
Pick columns	`select(df, x, y)`	`select(df, :x, :y)`
Pick & transform columns	`transmute(df, mean(x), y)`	`select(df, :x => mean, :y)`
Pick rows	`filter(df, x >= 1)`	`subset(df, :x => ByRow(x -> x >= 1))`
Sort rows	`arrange(df, x)`	`sort(df, :x)`
Operation	dplyr	DataFrames.jl
Reduce multiple values	`summarize(group_by(df, grp), mean(x))`	`combine(groupby(df, :grp), :x => mean)`
Add new columns	`mutate(group_by(df, grp), mean(x))`	`transform(groupby(df, :grp), :x => mean)`
Pick & transform columns	`transmute(group_by(df, grp), mean(x), y)`	`select(groupby(df, :grp), :x => mean, :y)`
Operation	dplyr	DataFrames.jl
Complex Function	`summarize(df, mean(x, na.rm = T))`	`combine(df, :x => x -> mean(skipmissing(x)))`
Transform several columns	`summarize(df, max(x), min(y))`	`combine(df, :x => maximum, :y => minimum)`
	`summarize(df, across(c(x, y), mean))`	`combine(df, [:x, :y] .=> mean)`
	`summarize(df, across(starts_with("x"), mean))`	`combine(df, names(df, r"^x") .=> mean)`
	`summarize(df, across(c(x, y), list(max, min)))`	`combine(df, ([:x, :y] .=> [maximum minimum])...)`
Multivariate function	`mutate(df, cor(x, y))`	`transform(df, [:x, :y] => cor)`
Row-wise	`mutate(rowwise(df), min(x, y))`	`transform(df, [:x, :y] => ByRow(min))`
	`mutate(rowwise(df), which.max(c_across(matches("^x"))))`	`transform(df, AsTable(r"^x") => ByRow(argmax))`
DataFrame as input	`summarize(df, head(across(), 2))`	`combine(d -> first(d, 2), df)`
DataFrame as output	`summarize(df, tibble(value = c(min(x), max(x))))`	`combine(df, :x => (x -> (value = [minimum(x), maximum(x)],)) => AsTable)`
Operation	data.table	DataFrames.jl
Reduce multiple values	`df[, .(mean(x))]`	`combine(df, :x => mean)`
Add new columns	`df[, x_mean:=mean(x) ]`	`transform!(df, :x => mean => :x_mean)`
Rename column (in place)	`setnames(df, "x", "x_new")`	`rename!(df, :x => :x_new)`
Rename multiple columns (in place)	`setnames(df, c("x", "y"), c("x_new", "y_new"))`	`rename!(df, [:x, :y] .=> [:x_new, :y_new])`
Pick columns as dataframe	`df[, .(x, y)]`	`select(df, :x, :y)`
Pick column as a vector	`df[, x]`	`df[!, :x]`
Remove columns	`df[, -"x"]`	`select(df, Not(:x))`
Remove columns (in place)	`df[, x:=NULL]`	`select!(df, Not(:x))`
Remove columns (in place)	`df[, c("x", "y"):=NULL]`	`select!(df, Not([:x, :y]))`
Pick & transform columns	`df[, .(mean(x), y)]`	`select(df, :x => mean, :y)`
Pick rows	`df[ x >= 1 ]`	`filter(:x => >=(1), df)`
Sort rows (in place)	`setorder(df, x)`	`sort!(df, :x)`
Sort rows	`df[ order(x) ]`	`sort(df, :x)`
Operation	data.table	DataFrames.jl
Reduce multiple values	`df[, mean(x), by=id ]`	`combine(groupby(df, :id), :x => mean)`
Add new columns (in place)	`df[, x_mean:=mean(x), by=id]`	`transform!(groupby(df, :id), :x => mean)`
Pick & transform columns	`df[, .(x_mean = mean(x), y), by=id]`	`select(groupby(df, :id), :x => mean, :y)`
Operation	data.table	DataFrames.jl
Complex Function	`df[, .(mean(x, na.rm=TRUE)) ]`	`combine(df, :x => x -> mean(skipmissing(x)))`
Transform certain rows (in place)	`df[x<=0, x:=0]`	`df.x[df.x .<= 0] .= 0`
Transform several columns	`df[, .(max(x), min(y)) ]`	`combine(df, :x => maximum, :y => minimum)`
	`df[, lapply(.SD, mean), .SDcols = c("x", "y") ]`	`combine(df, [:x, :y] .=> mean)`
	`df[, lapply(.SD, mean), .SDcols = patterns("^x") ]`	`combine(df, names(df, r"^x") .=> mean)`
	`df[, unlist(lapply(.SD, function(x) c(max=max(x), min=min(x)))), .SDcols = c("x", "y") ]`	`combine(df, ([:x, :y] .=> [maximum minimum])...)`
Multivariate function	`df[, .(cor(x,y)) ]`	`transform(df, [:x, :y] => cor)`
Row-wise	`df[, min_xy := min(x, y), by = 1:nrow(df)]`	`transform!(df, [:x, :y] => ByRow(min))`
	`df[, argmax_xy := which.max(.SD) , .SDcols = patterns("^x"), by = 1:nrow(df) ]`	`transform!(df, AsTable(r"^x") => ByRow(argmax))`
DataFrame as output	`df[, .SD[1], by=grp]`	`combine(groupby(df, :grp), first)`
DataFrame as output	`df[, .SD[which.max(x)], by=grp]`	`combine(groupby(df, :grp), sdf -> sdf[argmax(sdf.x), :])`
Operation	data.table	DataFrames.jl
Inner join	`merge(df, df2, by = "grp")`	`innerjoin(df, df2, on = :grp)`
Outer join	`merge(df, df2, all = TRUE, by = "grp")`	`outerjoin(df, df2, on = :grp)`
Left join	`merge(df, df2, all.x = TRUE, by = "grp")`	`leftjoin(df, df2, on = :grp)`
Right join	`merge(df, df2, all.y = TRUE, by = "grp")`	`rightjoin(df, df2, on = :grp)`
Anti join (filtering)	`df[!df2, on = "grp" ]`	`antijoin(df, df2, on = :grp)`
Semi join (filtering)	`merge(df, df2[, .(grp)])`	`semijoin(df, df2, on = :grp)`
Operation	Stata	DataFrames.jl
Reduce multiple values	`collapse (mean) x`	`combine(df, :x => mean)`
Add new columns	`egen x_mean = mean(x)`	`transform!(df, :x => mean => :x_mean)`
Rename columns	`rename x x_new`	`rename!(df, :x => :x_new)`
Pick columns	`keep x y`	`select!(df, :x, :y)`
Pick rows	`keep if x >= 1`	`subset!(df, :x => ByRow(x -> x >= 1))`
Sort rows	`sort x`	`sort!(df, :x)`
Operation	Stata	DataFrames.jl
Add new columns	`egen x_mean = mean(x), by(grp)`	`transform!(groupby(df, :grp), :x => mean)`
Reduce multiple values	`collapse (mean) x, by(grp)`	`combine(groupby(df, :grp), :x => mean)`