From 7357907430b2fa782ceed954bbe83447a05e382c Mon Sep 17 00:00:00 2001 From: pwwang <1188067+pwwang@users.noreply.github.com> Date: Wed, 23 Mar 2022 12:31:44 -0500 Subject: [PATCH] =?UTF-8?q?=F0=9F=94=96=200.6.4=20(#95)?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit * 🔥 Remove unused code * 🩹 Change dtypes of `base.letters/LETTERS/month_abb/month_name` * 📝 Update reference maps * 📝 Add environment.yml for binder to work * Update environment.yml * 📝 Update styles for docs * 🐛 Fix order_by argument for `dplyr.lead-lag` * 📝 Update notebooks * 📝 Update README * 🔖 0.6.4 --- .gitignore | 2 +- README.md | 54 +- datar/__init__.py | 2 +- datar/base/constants.py | 8 +- datar/base/seq.py | 2 +- datar/base/string.py | 26 - datar/core/broadcast.py | 6 +- datar/dplyr/across.py | 20 +- datar/dplyr/lead_lag.py | 4 +- docs/CHANGELOG.md | 24 + docs/notebooks/across.ipynb | 33 +- docs/notebooks/add_column.ipynb | 4 +- docs/notebooks/add_row.ipynb | 4 +- docs/notebooks/arrange.ipynb | 22 +- docs/notebooks/base-arithmetic.ipynb | 172 +++---- docs/notebooks/base-funs.ipynb | 44 +- docs/notebooks/base.ipynb | 182 +++---- docs/notebooks/between.ipynb | 67 ++- docs/notebooks/bind.ipynb | 94 ++-- docs/notebooks/case_when.ipynb | 27 +- docs/notebooks/chop.ipynb | 47 +- docs/notebooks/coalesce.ipynb | 24 +- docs/notebooks/complete.ipynb | 22 +- docs/notebooks/context.ipynb | 238 ++++----- docs/notebooks/count.ipynb | 30 +- docs/notebooks/cumall.ipynb | 63 +-- docs/notebooks/datar.ipynb | 26 +- docs/notebooks/desc.ipynb | 18 +- docs/notebooks/distinct.ipynb | 322 ++++++------ docs/notebooks/drop_na.ipynb | 22 +- docs/notebooks/enframe.ipynb | 8 +- docs/notebooks/expand.ipynb | 74 ++- docs/notebooks/expand_grid.ipynb | 22 +- docs/notebooks/extract.ipynb | 22 +- docs/notebooks/fill.ipynb | 22 +- docs/notebooks/filter-joins.ipynb | 24 +- docs/notebooks/filter.ipynb | 22 +- docs/notebooks/forcats_fct_multi.ipynb | 25 +- 
docs/notebooks/forcats_lvl_addrm.ipynb | 35 +- docs/notebooks/forcats_lvl_order.ipynb | 64 +-- docs/notebooks/forcats_lvl_value.ipynb | 471 ++++++++--------- docs/notebooks/forcats_misc.ipynb | 599 ++++++++++------------ docs/notebooks/full_seq.ipynb | 22 +- docs/notebooks/group_by.ipynb | 27 +- docs/notebooks/group_map.ipynb | 22 +- docs/notebooks/group_split.ipynb | 37 +- docs/notebooks/group_trim.ipynb | 30 +- docs/notebooks/lead-lag.ipynb | 125 ++--- docs/notebooks/mutate-joins.ipynb | 29 +- docs/notebooks/mutate.ipynb | 57 +-- docs/notebooks/n_distinct.ipynb | 8 +- docs/notebooks/na_if.ipynb | 30 +- docs/notebooks/nb_helpers.py | 48 +- docs/notebooks/near.ipynb | 25 +- docs/notebooks/nest-join.ipynb | 26 +- docs/notebooks/nest.ipynb | 130 +---- docs/notebooks/nth.ipynb | 14 +- docs/notebooks/pack.ipynb | 121 ++--- docs/notebooks/pivot_longer.ipynb | 22 +- docs/notebooks/pivot_wider.ipynb | 22 +- docs/notebooks/pull.ipynb | 34 +- docs/notebooks/ranking.ipynb | 92 ++-- docs/notebooks/recode.ipynb | 82 +-- docs/notebooks/relocate.ipynb | 22 +- docs/notebooks/rename.ipynb | 28 +- docs/notebooks/replace_na.ipynb | 22 +- docs/notebooks/rownames.ipynb | 40 +- docs/notebooks/rows.ipynb | 46 +- docs/notebooks/rowwise.ipynb | 355 +++++++------ docs/notebooks/select.ipynb | 27 +- docs/notebooks/separate.ipynb | 122 +---- docs/notebooks/setops.ipynb | 30 +- docs/notebooks/slice.ipynb | 364 +++++++------- docs/notebooks/summarise.ipynb | 66 +-- docs/notebooks/tibble.ipynb | 174 +++---- docs/notebooks/uncount.ipynb | 22 +- docs/notebooks/unite.ipynb | 24 +- docs/notebooks/with_groups.ipynb | 132 +++-- docs/reference-maps/base.md | 240 ++++----- docs/reference-maps/datar.md | 7 +- docs/reference-maps/tibble.md | 5 +- docs/reference-maps/tidyr.md | 6 +- docs/style.css | 14 +- environment.yml | 9 + mkdocs.yml | 19 +- poetry.lock | 670 +++++++++++++++++++++++++ pyproject.toml | 2 +- tests/__init__.py | 4 +- tests/dplyr/test_funs.py | 7 +- 89 files changed, 2959 insertions(+), 
3498 deletions(-) create mode 100644 environment.yml create mode 100644 poetry.lock diff --git a/.gitignore b/.gitignore index 66e18286..d6c72971 100644 --- a/.gitignore +++ b/.gitignore @@ -101,7 +101,7 @@ export/ site/ # poetry -poetry.lock +# poetry.lock # backup files *.bak diff --git a/README.md b/README.md index 7f40cb2f..37a9207b 100644 --- a/README.md +++ b/README.md @@ -1,6 +1,6 @@ # datar -Port of [dplyr][2] and other related R packages in python, using [pipda][3]. +A Grammar of Data Manipulation in python [![Pypi][6]][7] [![Github][8]][9] ![Building][10] [![Docs and API][11]][5] [![Codacy][12]][13] [![Codacy coverage][14]][13] @@ -9,18 +9,20 @@ Port of [dplyr][2] and other related R packages in python, using [pipda][3]. -Unlike other similar packages in python that just mimic the piping syntax, `datar` follows the API designs from the original packages as much as possible, and is tested thoroughly with the cases from the original packages. So that minimal effort is needed for those who are familar with those R packages to transition to python. +`datar` is a re-imagining of APIs of data manipulation libraries in python (currently only `pandas` supported) so that you can manipulate your data with it like with `dplyr` in `R`. +`datar` is an in-depth port of `tidyverse` packages, such as `dplyr`, `tidyr`, `forcats` and `tibble`, as well as some functions from `R` itself. ## Installtion ```shell pip install -U datar -# to make sure dependencies to be up-to-date -# pip install -U varname pipda datar ``` - -`datar` requires python 3.7.1+ and is backended by `pandas (1.3+)`. 
+or +```shell +conda install -c conda-forge datar +# mamba install -c conda-forge datar +``` ## Example usage @@ -103,6 +105,46 @@ iris >> pull(f.Sepal_Length) >> dist_plot() ![example](./example2.png) +See also some advanced examples from my answers on StackOverflow: + +- [Compare 2 DataFrames and drop rows that do not contain corresponding ID variables](https://stackoverflow.com/a/71532167/5088165) +- [count by id with dynamic criteria](https://stackoverflow.com/a/71519157/5088165) +- [counting the frequency in python size vs count](https://stackoverflow.com/a/71516503/5088165) +- [Pandas equivalent of R/dplyr group_by summarise concatenation](https://stackoverflow.com/a/71490832/5088165) +- [ntiles over columns in python using R's "mutate(across(cols = ..."](https://stackoverflow.com/a/71490501/5088165) +- [Replicate R Solution in Python for Calculating Monthly CRR](https://stackoverflow.com/a/71490194/5088165) +- [Best/Concise Way to Conditionally Concat two Columns in Pandas DataFrame](https://stackoverflow.com/a/71443587/5088165) +- [how to transform R dataframe to rows of indicator values](https://stackoverflow.com/a/71443515/5088165) +- [Left join on multiple columns](https://stackoverflow.com/a/71443441/5088165) +- [Python: change column of strings with None to 0/1](https://stackoverflow.com/a/71429016/5088165) +- [Comparing 2 data frames and finding values are not in 2nd data frame](https://stackoverflow.com/a/71415818/5088165) +- [How to compare two Pandas DataFrames based on specific columns in Python?](https://stackoverflow.com/a/71413499/5088165) +- [expand.grid equivalent to get pandas data frame for prediction in Python](https://stackoverflow.com/a/71376414/5088165) +- [Python pandas equivalent to R's group_by, mutate, and ifelse](https://stackoverflow.com/a/70387267/5088165) +- [How to convert a list of dictionaries to a Pandas Dataframe with one of the values as column name?](https://stackoverflow.com/a/69094005/5088165) +- [Moving window on a 
Standard Deviation & Mean calculation](https://stackoverflow.com/a/69093067/5088165) +- [Python: creating new "interpolated" rows based on a specific field in Pandas](https://stackoverflow.com/a/69092696/5088165) +- [How would I extend a Pandas DataFrame such as this?](https://stackoverflow.com/a/69092067/5088165) +- [How to define new variable based on multiple conditions in Pandas - dplyr case_when equivalent](https://stackoverflow.com/a/69080870/5088165) +- [What is the Pandas equivalent of top_n() in dplyr?](https://stackoverflow.com/a/69080806/5088165) +- [Equivalent of fct_lump in pandas](https://stackoverflow.com/a/69080727/5088165) +- [pandas equivalent of fct_reorder](https://stackoverflow.com/a/69080638/5088165) +- [Is there a way to find out the 2 X 2 contingency table consisting of the count of values by applying a condition from two dataframe](https://stackoverflow.com/a/68674345/5088165) +- [Count if array in pandas](https://stackoverflow.com/a/68659334/5088165) +- [How to create a new column for transposed data](https://stackoverflow.com/a/68642891/5088165) +- [How to create new DataFrame based on conditions from another DataFrame](https://stackoverflow.com/a/68640494/5088165) +- [Refer to column of a data frame that is being defined](https://stackoverflow.com/a/68308077/5088165) +- [How to use regex in mutate dplython to add new column](https://stackoverflow.com/a/68308033/5088165) +- [Multiplying a row by the previous row (with a certain name) in Pandas](https://stackoverflow.com/a/68137136/5088165) +- [Create dataframe from rows under a row with a certain condition](https://stackoverflow.com/a/68137089/5088165) +- [pandas data frame, group by multiple cols and put other columns' contents in one](https://stackoverflow.com/a/68136982/5088165) +- [Pandas custom aggregate function with condition on group, is it possible?](https://stackoverflow.com/a/68136704/5088165) +- [multiply different values to pandas column with combination of other 
columns](https://stackoverflow.com/a/68136300/5088165) +- [Vectorized column-wise regex matching in pandas](https://stackoverflow.com/a/68124082/5088165) +- [Iterate through and conditionally append string values in a Pandas dataframe](https://stackoverflow.com/a/68123912/5088165) +- [Groupby mutate equivalent in pandas/python using tidydata principles](https://stackoverflow.com/a/68123753/5088165) +- [More ...](https://stackoverflow.com/search?q=user%3A5088165+and+%5Bpandas%5D) + [1]: https://tidyr.tidyverse.org/index.html [2]: https://dplyr.tidyverse.org/index.html diff --git a/datar/__init__.py b/datar/__init__.py index ea32249b..147b2da1 100644 --- a/datar/__init__.py +++ b/datar/__init__.py @@ -30,7 +30,7 @@ ) __all__ = ("f", "get_versions") -__version__ = "0.6.3" +__version__ = "0.6.4" def get_versions(prnt: bool = True) -> _VersionsTuple: diff --git a/datar/base/constants.py b/datar/base/constants.py index d8385066..81ef4157 100644 --- a/datar/base/constants.py +++ b/datar/base/constants.py @@ -7,8 +7,8 @@ pi = math.pi -letters = np.array(list(ascii_letters[:26]), dtype=object) -LETTERS = np.array(list(ascii_letters[26:]), dtype=object) +letters = np.array(list(ascii_letters[:26]), dtype=' 0 and size % value.size != 0: - raise ValueError( - f"Cannot recycle {name} (size={value.size}) to size {size}." 
- ) - - if value.size == size == 0: - return np.array([], dtype=object) - - if value.size == 0: - value = np.array([np.nan], dtype=object) - - return value.repeat(size // value.size) - - @register_func(None, context=Context.EVAL) def as_character( x, diff --git a/datar/core/broadcast.py b/datar/core/broadcast.py index 6ed093d3..29218a36 100644 --- a/datar/core/broadcast.py +++ b/datar/core/broadcast.py @@ -525,7 +525,10 @@ def _( if isinstance(value, DataFrame) and value.index.size == 0: value.index = index - if not value.index.equals(index): + # if not value.index.equals(index): + if not value.index.equals(index) and frozenset( + value.index + ) != frozenset(index): raise ValueError("Value has incompatible index.") if isinstance(value, Series): @@ -716,6 +719,7 @@ def _(value: SeriesGroupBy, name: str) -> Tibble: @init_tibble_from.register(DataFrameGroupBy) def _(value: Union[DataFrame, DataFrameGroupBy], name: str) -> Tibble: from ..tibble import as_tibble + result = regcall(as_tibble, value) if name: diff --git a/datar/dplyr/across.py b/datar/dplyr/across.py index 3427270c..29635de1 100644 --- a/datar/dplyr/across.py +++ b/datar/dplyr/across.py @@ -165,6 +165,24 @@ def across( The original API: https://dplyr.tidyverse.org/reference/across.html + Examples: + # + >>> iris >> mutate(across(c(f.Sepal_Length, f.Sepal_Width), round)) + Sepal_Length Sepal_Width Petal_Length Petal_Width Species + + 0 5.0 4.0 1.4 0.2 setosa + 1 5.0 3.0 1.4 0.2 setosa + .. ... ... ... ... ... + + >>> iris >> group_by(f.Species) >> summarise( + >>> across(starts_with("Sepal"), mean) + >>> ) + Species Sepal_Length Sepal_Width + + 0 setosa 5.006 3.428 + 1 versicolor 5.936 2.770 + 2 virginica 6.588 2.974 + Args: _data: The dataframe. 
*args: If given, the first 2 elements should be columns and functions @@ -218,7 +236,7 @@ def c_across( _cols: The columns Returns: - A series + A rowwise tibble """ _data = _context.meta.get("input_data", _data) diff --git a/datar/dplyr/lead_lag.py b/datar/dplyr/lead_lag.py index a78939e2..bc6f524f 100644 --- a/datar/dplyr/lead_lag.py +++ b/datar/dplyr/lead_lag.py @@ -28,12 +28,12 @@ def _shift(x, n, default=None, order_by=None): newx = Series(x) if order_by is not None: - newx = newx.reset_index(drop=True) + # newx = newx.reset_index(drop=True) out = with_order(order_by, Series.shift, newx, n, fill_value=default) else: out = newx.shift(n, fill_value=default) - return out + return out if isinstance(x, Series) else out.values @register_func(None, context=Context.EVAL) diff --git a/docs/CHANGELOG.md b/docs/CHANGELOG.md index 56c3cb89..50c600c1 100644 --- a/docs/CHANGELOG.md +++ b/docs/CHANGELOG.md @@ -1,3 +1,27 @@ +## 0.6.4 + +### Breaking changes + +- 🩹 Make `base.ntile()` labels 1-based (#92) + +### Fixes + +- 🐛 Fix `order_by` argument for `dplyr.lead-lag` + +### Enhancements + +- 🚑 Allow `base.paste/paste0()` to work with grouped data +- 🩹 Change dtypes of `base.letters/LETTERS/month_abb/month_name` + +### Housekeeping + +- 📝 Update and fix reference maps +- 📝 Add `environment.yml` for binder to work +- 📝 Update styles for docs +- 📝 Update styles for API doc in notebooks +- 📝 Update README for new description about the project and add examples from StackOverflow + + ## 0.6.3 - ✨ Allow `base.c()` to handle groupby data diff --git a/docs/notebooks/across.ipynb b/docs/notebooks/across.ipynb index df49b8ce..141b5cd7 100644 --- a/docs/notebooks/across.ipynb +++ b/docs/notebooks/across.ipynb @@ -2,7 +2,7 @@ "cells": [ { "cell_type": "code", - "execution_count": 1, + "execution_count": 5, "metadata": { "execution": { "iopub.execute_input": "2021-07-16T22:27:57.831736Z", @@ -12,26 +12,10 @@ } }, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ 
- "[2022-03-06 00:17:06][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 00:17:06][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 00:17:06][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 00:17:06][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 00:17:06][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 00:17:06][datar][WARNING] Builtin name \"all\" has been overriden by datar.\n", - "[2022-03-06 00:17:06][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-06 00:17:06][datar][WARNING] Builtin name \"re\" has been overriden by datar.\n", - "[2022-03-06 00:17:06][datar][WARNING] Builtin name \"filter\" has been overriden by datar.\n", - "[2022-03-06 00:17:06][datar][WARNING] Builtin name \"slice\" has been overriden by datar.\n" - ] - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -43,7 +27,7 @@ { "data": { "text/markdown": [ - "### # across " + "###
★ across
" ], "text/plain": [ "" @@ -94,7 +78,7 @@ { "data": { "text/markdown": [ - "### # if_any " + "###
★ if_any
" ], "text/plain": [ "" @@ -122,7 +106,7 @@ { "data": { "text/markdown": [ - "### # if_all " + "###
★ if_all
" ], "text/plain": [ "" @@ -150,7 +134,7 @@ { "data": { "text/markdown": [ - "### # c_across " + "###
★ c_across
" ], "text/plain": [ "" @@ -169,7 +153,7 @@ "  `_cols`: The columns \n", "\n", "##### Returns:\n", - "  A series \n" + "  A rowwise tibble \n" ], "text/plain": [ "" @@ -180,10 +164,11 @@ } ], "source": [ + "%run nb_helpers.py\n", + "\n", "from datar.datasets import iris\n", "from datar.all import *\n", "\n", - "%run nb_helpers.py\n", "nb_header(across, if_any, if_all, c_across)" ] }, diff --git a/docs/notebooks/add_column.ipynb b/docs/notebooks/add_column.ipynb index d7033309..877f0b41 100644 --- a/docs/notebooks/add_column.ipynb +++ b/docs/notebooks/add_column.ipynb @@ -15,7 +15,7 @@ { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -27,7 +27,7 @@ { "data": { "text/markdown": [ - "### # add_column " + "###
★ add_column
" ], "text/plain": [ "" diff --git a/docs/notebooks/add_row.ipynb b/docs/notebooks/add_row.ipynb index 288fb0cd..edc98b0a 100644 --- a/docs/notebooks/add_row.ipynb +++ b/docs/notebooks/add_row.ipynb @@ -15,7 +15,7 @@ { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -27,7 +27,7 @@ { "data": { "text/markdown": [ - "### # add_row " + "###
★ add_row
" ], "text/plain": [ "" diff --git a/docs/notebooks/arrange.ipynb b/docs/notebooks/arrange.ipynb index cf03f644..03a853fa 100644 --- a/docs/notebooks/arrange.ipynb +++ b/docs/notebooks/arrange.ipynb @@ -13,26 +13,10 @@ "tags": [] }, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[2022-03-06 00:29:30][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 00:29:30][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 00:29:30][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 00:29:30][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 00:29:30][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 00:29:30][datar][WARNING] Builtin name \"all\" has been overriden by datar.\n", - "[2022-03-06 00:29:30][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-06 00:29:30][datar][WARNING] Builtin name \"re\" has been overriden by datar.\n", - "[2022-03-06 00:29:30][datar][WARNING] Builtin name \"filter\" has been overriden by datar.\n", - "[2022-03-06 00:29:30][datar][WARNING] Builtin name \"slice\" has been overriden by datar.\n" - ] - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -44,7 +28,7 @@ { "data": { "text/markdown": [ - "### # arrange " + "###
★ arrange
" ], "text/plain": [ "" @@ -88,10 +72,10 @@ } ], "source": [ + "%run nb_helpers.py\n", "from datar.datasets import mtcars, iris\n", "from datar.all import *\n", "\n", - "%run nb_helpers.py\n", "nb_header(arrange)" ] }, diff --git a/docs/notebooks/base-arithmetic.ipynb b/docs/notebooks/base-arithmetic.ipynb index bd5d2e8c..f0d5252b 100644 --- a/docs/notebooks/base-arithmetic.ipynb +++ b/docs/notebooks/base-arithmetic.ipynb @@ -2,23 +2,13 @@ "cells": [ { "cell_type": "code", - "execution_count": 3, + "execution_count": 1, "metadata": {}, "outputs": [ - { - "data": { - "text/plain": [ - "Diot({'warn_builtin_names': False}, diot_transform= at 0x7fad66f3b790>)" - ] - }, - "execution_count": 3, - "metadata": {}, - "output_type": "execute_result" - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -30,7 +20,7 @@ { "data": { "text/markdown": [ - "### # sum " + "###
★ sum
" ], "text/plain": [ "" @@ -65,7 +55,7 @@ { "data": { "text/markdown": [ - "### # prod " + "###
★ prod
" ], "text/plain": [ "" @@ -100,7 +90,7 @@ { "data": { "text/markdown": [ - "### # mean " + "###
★ mean
" ], "text/plain": [ "" @@ -134,7 +124,7 @@ { "data": { "text/markdown": [ - "### # median " + "###
★ median
" ], "text/plain": [ "" @@ -168,7 +158,7 @@ { "data": { "text/markdown": [ - "### # min " + "###
★ min
" ], "text/plain": [ "" @@ -203,7 +193,7 @@ { "data": { "text/markdown": [ - "### # max " + "###
★ max
" ], "text/plain": [ "" @@ -238,7 +228,7 @@ { "data": { "text/markdown": [ - "### # var " + "###
★ var
" ], "text/plain": [ "" @@ -274,7 +264,7 @@ { "data": { "text/markdown": [ - "### # pmin " + "###
★ pmin
" ], "text/plain": [ "" @@ -305,7 +295,7 @@ { "data": { "text/markdown": [ - "### # pmax " + "###
★ pmax
" ], "text/plain": [ "" @@ -336,7 +326,7 @@ { "data": { "text/markdown": [ - "### # round_ " + "###
★ round_
" ], "text/plain": [ "" @@ -367,7 +357,7 @@ { "data": { "text/markdown": [ - "### # sqrt " + "###
★ sqrt
" ], "text/plain": [ "" @@ -397,7 +387,7 @@ { "data": { "text/markdown": [ - "### # absolute " + "###
★ absolute
" ], "text/plain": [ "" @@ -427,7 +417,7 @@ { "data": { "text/markdown": [ - "### # sign " + "###
★ sign
" ], "text/plain": [ "" @@ -457,7 +447,7 @@ { "data": { "text/markdown": [ - "### # trunc " + "###
★ trunc
" ], "text/plain": [ "" @@ -488,7 +478,7 @@ { "data": { "text/markdown": [ - "### # ceiling " + "###
★ ceiling
" ], "text/plain": [ "" @@ -518,7 +508,7 @@ { "data": { "text/markdown": [ - "### # floor " + "###
★ floor
" ], "text/plain": [ "" @@ -548,7 +538,7 @@ { "data": { "text/markdown": [ - "### # signif " + "###
★ signif
" ], "text/plain": [ "" @@ -580,7 +570,7 @@ { "data": { "text/markdown": [ - "### # log " + "###
★ log
" ], "text/plain": [ "" @@ -612,7 +602,7 @@ { "data": { "text/markdown": [ - "### # exp " + "###
★ exp
" ], "text/plain": [ "" @@ -642,7 +632,7 @@ { "data": { "text/markdown": [ - "### # log2 " + "###
★ log2
" ], "text/plain": [ "" @@ -673,7 +663,7 @@ { "data": { "text/markdown": [ - "### # log10 " + "###
★ log10
" ], "text/plain": [ "" @@ -704,7 +694,7 @@ { "data": { "text/markdown": [ - "### # log1p " + "###
★ log1p
" ], "text/plain": [ "" @@ -735,7 +725,7 @@ { "data": { "text/markdown": [ - "### # cov " + "###
★ cov
" ], "text/plain": [ "" @@ -760,7 +750,7 @@ { "data": { "text/markdown": [ - "### # _scale " + "###
★ _scale
" ], "text/plain": [ "" @@ -797,7 +787,7 @@ { "data": { "text/markdown": [ - "### # col_sums " + "###
★ col_sums
" ], "text/plain": [ "" @@ -828,7 +818,7 @@ { "data": { "text/markdown": [ - "### # row_sums " + "###
★ row_sums
" ], "text/plain": [ "" @@ -859,7 +849,7 @@ { "data": { "text/markdown": [ - "### # col_means " + "###
★ col_means
" ], "text/plain": [ "" @@ -890,7 +880,7 @@ { "data": { "text/markdown": [ - "### # row_means " + "###
★ row_means
" ], "text/plain": [ "" @@ -921,7 +911,7 @@ { "data": { "text/markdown": [ - "### # col_sds " + "###
★ col_sds
" ], "text/plain": [ "" @@ -953,7 +943,7 @@ { "data": { "text/markdown": [ - "### # row_sds " + "###
★ row_sds
" ], "text/plain": [ "" @@ -985,7 +975,7 @@ { "data": { "text/markdown": [ - "### # col_medians " + "###
★ col_medians
" ], "text/plain": [ "" @@ -1016,7 +1006,7 @@ { "data": { "text/markdown": [ - "### # row_medians " + "###
★ row_medians
" ], "text/plain": [ "" @@ -1047,7 +1037,7 @@ { "data": { "text/markdown": [ - "### # quantile " + "###
★ quantile
" ], "text/plain": [ "" @@ -1093,7 +1083,7 @@ { "data": { "text/markdown": [ - "### # std " + "###
★ std
" ], "text/plain": [ "" @@ -1117,7 +1107,7 @@ { "data": { "text/markdown": [ - "### # weighted_mean " + "###
★ weighted_mean
" ], "text/plain": [ "" @@ -1140,12 +1130,10 @@ } ], "source": [ - "from datar import options\n", - "options(warn_builtin_names=False)\n", + "%run nb_helpers.py\n", "\n", "from datar.all import *\n", "\n", - "%run nb_helpers.py\n", "debug_kwargs = {'prefix': '\\n', 'sep': f'\\n{\"-\" * 20}\\n'}\n", "nb_header(\n", " sum, prod, mean, median, min, max, var, pmin, pmax,\n", @@ -1158,7 +1146,7 @@ }, { "cell_type": "code", - "execution_count": 7, + "execution_count": 2, "metadata": {}, "outputs": [ { @@ -1226,7 +1214,7 @@ }, { "cell_type": "code", - "execution_count": 9, + "execution_count": 3, "metadata": {}, "outputs": [ { @@ -1284,7 +1272,7 @@ }, { "cell_type": "code", - "execution_count": 15, + "execution_count": 4, "metadata": {}, "outputs": [ { @@ -1340,7 +1328,7 @@ }, { "cell_type": "code", - "execution_count": 30, + "execution_count": 5, "metadata": {}, "outputs": [ { @@ -1352,74 +1340,74 @@ "--------------------\n", " v1 v2 v3\n", " \n", - "0 -0.527205 -0.563083 -1.030619\n", - "1 -0.652748 -0.620141 -0.410482\n", - "2 -1.464778 1.274939 0.505686\n", - "3 0.505498 -0.103748 0.805596\n", - "4 1.431942 -0.759830 -0.755049\n", + "0 -0.562974 0.260601 0.021010\n", + "1 -0.880938 -0.658334 0.716204\n", + "2 0.354143 -0.313041 -1.183404\n", + "3 -1.073970 -0.394479 -0.337136\n", + "4 1.063941 1.128986 -0.747481\n", "\n", "col_sums(df)\n", "--------------------\n", - "v1 -0.707291\n", - "v2 -0.771863\n", - "v3 -0.884868\n", + "v1 -1.099799\n", + "v2 0.023733\n", + "v3 -1.530807\n", "dtype: float64\n", "\n", "row_sums(df)\n", "--------------------\n", - "0 -2.120907\n", - "1 -1.683371\n", - "2 0.315848\n", - "3 1.207346\n", - "4 -0.082938\n", + "0 -0.281364\n", + "1 -0.823068\n", + "2 -1.142302\n", + "3 -1.805586\n", + "4 1.445446\n", "dtype: float64\n", "\n", "col_means(df)\n", "--------------------\n", - "v1 -0.141458\n", - "v2 -0.154373\n", - "v3 -0.176974\n", + "v1 -0.219960\n", + "v2 0.004747\n", + "v3 -0.306161\n", "dtype: float64\n", "\n", "row_means(df)\n", 
"--------------------\n", - "0 -0.706969\n", - "1 -0.561124\n", - "2 0.105283\n", - "3 0.402449\n", - "4 -0.027646\n", + "0 -0.093788\n", + "1 -0.274356\n", + "2 -0.380767\n", + "3 -0.601862\n", + "4 0.481815\n", "dtype: float64\n", "\n", "col_sds(df)\n", "--------------------\n", - "v1 1.124226\n", - "v2 0.836071\n", - "v3 0.798260\n", + "v1 0.903034\n", + "v2 0.712289\n", + "v3 0.727590\n", "dtype: float64\n", "\n", "row_sds(df)\n", "--------------------\n", - "0 0.280863\n", - "1 0.131475\n", - "2 1.413066\n", - "3 0.463348\n", - "4 1.264042\n", + "0 0.423619\n", + "1 0.865041\n", + "2 0.771008\n", + "3 0.409862\n", + "4 1.065098\n", "dtype: float64\n", "\n", "col_medians(df)\n", "--------------------\n", - "v1 -0.527205\n", - "v2 -0.563083\n", - "v3 -0.410482\n", + "v1 -0.562974\n", + "v2 -0.313041\n", + "v3 -0.337136\n", "dtype: float64\n", "\n", "row_medians(df)\n", "--------------------\n", - "0 -0.563083\n", - "1 -0.620141\n", - "2 0.505686\n", - "3 0.505498\n", - "4 -0.755049\n", + "0 0.021010\n", + "1 -0.658334\n", + "2 -0.313041\n", + "3 -0.394479\n", + "4 1.063941\n", "dtype: float64\n" ] } @@ -1444,7 +1432,7 @@ }, { "cell_type": "code", - "execution_count": 35, + "execution_count": 6, "metadata": {}, "outputs": [ { diff --git a/docs/notebooks/base-funs.ipynb b/docs/notebooks/base-funs.ipynb index 6b8dd737..f6ade545 100644 --- a/docs/notebooks/base-funs.ipynb +++ b/docs/notebooks/base-funs.ipynb @@ -8,7 +8,7 @@ { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -20,7 +20,7 @@ { "data": { "text/markdown": [ - "### # cut " + "###
★ cut
" ], "text/plain": [ "" @@ -71,7 +71,7 @@ { "data": { "text/markdown": [ - "### # diff " + "###
★ diff
" ], "text/plain": [ "" @@ -89,14 +89,6 @@ "result is equal to the successive differences \n", "`x[lag:] – x[:-lag]`. \n", "\n", - "##### Examples:\n", - "  >>> rv = [52, 21, 10, 11, 19] \n", - "  >>> data = diff(rv) \n", - "  >>> # -31 -11 1 8 \n", - "  >>> # rv[1:] - rv[:-1] \n", - "  >>> # rv[1:] [21, 10, 11, 19] \n", - "  >>> # rv[:-1] [52, 21, 10, 11] \n", - "\n", "##### Args:\n", "  `x`: The data \n", "  `lag`: The lag to use. Could be negative. \n", @@ -118,7 +110,7 @@ { "data": { "text/markdown": [ - "### # identity " + "###
★ identity
" ], "text/plain": [ "" @@ -144,7 +136,7 @@ { "data": { "text/markdown": [ - "### # expandgrid " + "###
★ expandgrid
" ], "text/plain": [ "" @@ -168,7 +160,7 @@ { "data": { "text/markdown": [ - "### # outer " + "###
★ outer
" ], "text/plain": [ "" @@ -203,7 +195,7 @@ { "data": { "text/markdown": [ - "### # make_names " + "###
★ make_names
" ], "text/plain": [ "" @@ -244,7 +236,7 @@ { "data": { "text/markdown": [ - "### # make_unique " + "###
★ make_unique
" ], "text/plain": [ "" @@ -278,7 +270,7 @@ { "data": { "text/markdown": [ - "### # rank " + "###
★ rank
" ], "text/plain": [ "" @@ -317,7 +309,7 @@ { "data": { "text/markdown": [ - "### # data_context " + "###
★ data_context
" ], "text/plain": [ "" @@ -356,12 +348,10 @@ } ], "source": [ - "from datar import options\n", - "options(warn_builtin_names=False)\n", + "%run nb_helpers.py\n", "\n", "from datar.all import *\n", "\n", - "%run nb_helpers.py\n", "debug_kwargs = {'prefix': '\\n', 'sep': f'\\n{\"-\" * 20}\\n'}\n", "nb_header(\n", " cut, diff, identity, expandgrid, outer, \n", @@ -371,17 +361,17 @@ }, { "cell_type": "code", - "execution_count": 3, + "execution_count": 2, "metadata": {}, "outputs": [ { "name": "stderr", "output_type": "stream", "text": [ - "[2022-03-11 21:23:06][datar][WARNING] New names:\n", - "[2022-03-11 21:23:06][datar][WARNING] * '_1' -> '__0'\n", - "[2022-03-11 21:23:06][datar][WARNING] * '_1' -> '__1'\n", - "[2022-03-11 21:23:06][datar][WARNING] * '_1' -> '__2'\n" + "[2022-03-18 17:15:21][datar][WARNING] New names:\n", + "[2022-03-18 17:15:21][datar][WARNING] * '_1' -> '__0'\n", + "[2022-03-18 17:15:21][datar][WARNING] * '_1' -> '__1'\n", + "[2022-03-18 17:15:21][datar][WARNING] * '_1' -> '__2'\n" ] }, { @@ -495,7 +485,7 @@ "3 2 4" ] }, - "execution_count": 3, + "execution_count": 2, "metadata": {}, "output_type": "execute_result" } diff --git a/docs/notebooks/base.ipynb b/docs/notebooks/base.ipynb index 47c5727c..edb60d51 100644 --- a/docs/notebooks/base.ipynb +++ b/docs/notebooks/base.ipynb @@ -12,29 +12,14 @@ "shell.execute_reply": "2021-07-16T22:27:46.079498Z" } }, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[2022-03-06 00:29:39][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 00:29:39][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 00:29:39][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 00:29:39][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 00:29:39][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 00:29:39][datar][WARNING] Builtin 
name \"all\" has been overriden by datar.\n", - "[2022-03-06 00:29:39][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-06 00:29:39][datar][WARNING] Builtin name \"re\" has been overriden by datar.\n" - ] - } - ], + "outputs": [], "source": [ + "%run nb_helpers.py\n", "import numpy\n", "from datar import f\n", "from datar.base import *\n", "from datar.tibble import tibble\n", "\n", - "%run nb_helpers.py\n", "debug_kwargs = {'prefix': '\\n', 'sep': f'\\n{\"-\" * 20}\\n'}" ] }, @@ -68,24 +53,23 @@ "--------------------\n", "array(['a', 'b', 'c', 'd', 'e', 'f', 'g', 'h', 'i', 'j', 'k', 'l', 'm',\n", " 'n', 'o', 'p', 'q', 'r', 's', 't', 'u', 'v', 'w', 'x', 'y', 'z'],\n", - " dtype=object)\n", + " dtype='Try this notebook on binder." + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -28,7 +28,7 @@ { "data": { "text/markdown": [ - "### # between " + "###
★ between
" ], "text/plain": [ "" @@ -66,17 +66,17 @@ ], "source": [ "# https://dplyr.tidyverse.org/reference/between.html\n", + "%run nb_helpers.py\n", "\n", "from datar.datasets import starwars\n", "from datar.all import *\n", "\n", - "%run nb_helpers.py\n", "nb_header(between)" ] }, { "cell_type": "code", - "execution_count": 7, + "execution_count": 2, "id": "6b3effe3", "metadata": { "execution": { @@ -90,22 +90,11 @@ { "data": { "text/plain": [ - "0 False\n", - "1 False\n", - "2 False\n", - "3 False\n", - "4 False\n", - "5 False\n", - "6 True\n", - "7 True\n", - "8 True\n", - "9 False\n", - "10 False\n", - "11 False\n", - "Name: x, dtype: bool" + "array([False, False, False, False, False, False, True, True, True,\n", + " False, False, False])" ] }, - "execution_count": 7, + "execution_count": 2, "metadata": {}, "output_type": "execute_result" } @@ -116,7 +105,7 @@ }, { "cell_type": "code", - "execution_count": 8, + "execution_count": 3, "id": "302aa8fc", "metadata": { "execution": { @@ -130,23 +119,23 @@ { "data": { "text/plain": [ - "array([-0.62317072, 0.65948569, -0.54024359, -0.82184473, -0.1764757 ,\n", - " 0.18213228, 0.79855673, -0.24855138, 0.01262424, -0.84894048,\n", - " 0.37285632, 0.22835416, 0.42217402, -0.87096832, -0.66171351,\n", - " 0.66683691, -0.45817378, 0.70713136, 0.47549812, 0.76217418,\n", - " -0.0998089 , -0.40394027, -0.47139879, 0.23089977, -0.90173509,\n", - " -0.42211495, -0.47364465, -0.53518737, 0.11029949, 0.63746745,\n", - " 0.18128595, 0.4488157 , -0.94351625, 0.16476352, -0.02417968,\n", - " 0.13975003, 0.98128978, 0.03124932, 0.42528095, -0.44302586,\n", - " -0.26502179, -0.22858774, -0.93915892, -0.60314281, -0.35186847,\n", - " -0.07903075, -0.41372665, -0.32182693, -0.70112294, -0.99253387,\n", - " -0.576679 , -0.05485442, 0.30572563, -0.53975388, 0.01075027,\n", - " 0.13986945, 0.19666611, -0.11363934, -0.44002343, -0.36146865,\n", - " -0.13858168, 0.1501186 , 0.11285687, 0.60659002, 0.5742983 ,\n", - " 0.65033481, 0.94642001, 
0.64107236, -0.86960338])" + "array([-0.65386489, 0.18885862, -0.61516756, -0.69568368, -0.70885902,\n", + " 0.26602314, -0.35391689, -0.52768408, -0.73553316, -0.79054691,\n", + " 0.08399462, 0.07164568, 0.09310497, 0.86196196, 0.4187352 ,\n", + " -0.17829678, 0.55933483, -0.43936161, -0.4501368 , -0.07061945,\n", + " -0.68175617, -0.39724819, -0.33263432, 0.3349741 , -0.08515872,\n", + " -0.68384246, -0.53988212, -0.35831946, -0.97737568, -0.53775482,\n", + " -0.23827599, -0.51523472, 0.0303137 , 0.40593 , 0.61505644,\n", + " 0.67219774, 0.4803338 , -0.80846003, -0.04245792, 0.30025567,\n", + " 0.68137426, -0.86946604, 0.69392051, 0.91926884, -0.92290023,\n", + " 0.38203131, 0.01162034, -0.2835221 , 0.02245063, 0.42526291,\n", + " 0.15444326, 0.59198204, -0.17717905, -0.4154278 , 0.27511335,\n", + " -0.3062066 , -0.18671645, 0.2090275 , 0.15432189, -0.42519021,\n", + " -0.86684503, 0.02594608, 0.68585011, 0.99557676, 0.571366 ,\n", + " -0.81727091, -0.18650605, 0.27366826])" ] }, - "execution_count": 8, + "execution_count": 3, "metadata": {}, "output_type": "execute_result" } @@ -158,7 +147,7 @@ }, { "cell_type": "code", - "execution_count": 9, + "execution_count": 4, "id": "d1b79572", "metadata": { "execution": { @@ -310,7 +299,7 @@ "45 NaN male masculine Troiken Xexto " ] }, - "execution_count": 9, + "execution_count": 4, "metadata": {}, "output_type": "execute_result" } @@ -321,7 +310,7 @@ }, { "cell_type": "code", - "execution_count": 10, + "execution_count": 5, "id": "1e52d002", "metadata": { "execution": { @@ -585,7 +574,7 @@ "72 red, blue NaN none feminine NaN Droid " ] }, - "execution_count": 10, + "execution_count": 5, "metadata": {}, "output_type": "execute_result" } diff --git a/docs/notebooks/bind.ipynb b/docs/notebooks/bind.ipynb index 4f8d119e..9d4205f2 100644 --- a/docs/notebooks/bind.ipynb +++ b/docs/notebooks/bind.ipynb @@ -13,26 +13,10 @@ } }, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[2022-03-06 
00:30:01][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 00:30:01][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 00:30:01][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 00:30:01][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 00:30:01][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 00:30:01][datar][WARNING] Builtin name \"all\" has been overriden by datar.\n", - "[2022-03-06 00:30:01][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-06 00:30:01][datar][WARNING] Builtin name \"re\" has been overriden by datar.\n", - "[2022-03-06 00:30:01][datar][WARNING] Builtin name \"filter\" has been overriden by datar.\n", - "[2022-03-06 00:30:01][datar][WARNING] Builtin name \"slice\" has been overriden by datar.\n" - ] - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -44,7 +28,7 @@ { "data": { "text/markdown": [ - "### # bind_rows " + "###
★ bind_rows
" ], "text/plain": [ "" @@ -85,7 +69,7 @@ { "data": { "text/markdown": [ - "### # bind_cols " + "###
★ bind_cols
" ], "text/plain": [ "" @@ -136,11 +120,11 @@ ], "source": [ "# https://dplyr.tidyverse.org/reference/bind.html\n", + "%run nb_helpers.py\n", "\n", "from datar.datasets import starwars\n", "from datar.all import *\n", "\n", - "%run nb_helpers.py\n", "nb_header(bind_rows, bind_cols, book='bind')" ] }, @@ -1213,7 +1197,7 @@ }, { "cell_type": "code", - "execution_count": 9, + "execution_count": 8, "id": "fd18f54b", "metadata": { "execution": { @@ -1406,7 +1390,7 @@ "6 blue 64.0 male masculine Eriadu Human " ] }, - "execution_count": 9, + "execution_count": 8, "metadata": {}, "output_type": "execute_result" } @@ -1418,7 +1402,7 @@ }, { "cell_type": "code", - "execution_count": 10, + "execution_count": 9, "id": "85f9ae65", "metadata": { "execution": { @@ -1611,7 +1595,7 @@ "6 blue 64.0 male masculine Eriadu Human " ] }, - "execution_count": 10, + "execution_count": 9, "metadata": {}, "output_type": "execute_result" } @@ -1622,7 +1606,7 @@ }, { "cell_type": "code", - "execution_count": 11, + "execution_count": 10, "id": "203c53a8", "metadata": { "execution": { @@ -1715,7 +1699,7 @@ "6 NaN 3.0" ] }, - "execution_count": 11, + "execution_count": 10, "metadata": {}, "output_type": "execute_result" } @@ -1728,7 +1712,7 @@ }, { "cell_type": "code", - "execution_count": 12, + "execution_count": 11, "id": "0aeecbc1", "metadata": { "execution": { @@ -1797,7 +1781,7 @@ "2 2 NaN" ] }, - "execution_count": 12, + "execution_count": 11, "metadata": {}, "output_type": "execute_result" } @@ -1811,7 +1795,7 @@ }, { "cell_type": "code", - "execution_count": 13, + "execution_count": 12, "id": "655c5124", "metadata": { "execution": { @@ -1875,7 +1859,7 @@ "2 2" ] }, - "execution_count": 13, + "execution_count": 12, "metadata": {}, "output_type": "execute_result" } @@ -1886,7 +1870,7 @@ }, { "cell_type": "code", - "execution_count": 14, + "execution_count": 13, "id": "f9281c6c", "metadata": { "execution": { @@ -1901,29 +1885,29 @@ "name": "stderr", "output_type": "stream", "text": [ - 
"[2022-03-06 00:38:01][datar][WARNING] New names:\n", - "[2022-03-06 00:38:01][datar][WARNING] * 'name' -> 'name__0'\n", - "[2022-03-06 00:38:01][datar][WARNING] * 'height' -> 'height__1'\n", - "[2022-03-06 00:38:01][datar][WARNING] * 'mass' -> 'mass__2'\n", - "[2022-03-06 00:38:01][datar][WARNING] * 'hair_color' -> 'hair_color__3'\n", - "[2022-03-06 00:38:01][datar][WARNING] * 'skin_color' -> 'skin_color__4'\n", - "[2022-03-06 00:38:01][datar][WARNING] * 'eye_color' -> 'eye_color__5'\n", - "[2022-03-06 00:38:01][datar][WARNING] * 'birth_year' -> 'birth_year__6'\n", - "[2022-03-06 00:38:01][datar][WARNING] * 'sex' -> 'sex__7'\n", - "[2022-03-06 00:38:01][datar][WARNING] * 'gender' -> 'gender__8'\n", - "[2022-03-06 00:38:01][datar][WARNING] * 'homeworld' -> 'homeworld__9'\n", - "[2022-03-06 00:38:01][datar][WARNING] * 'species' -> 'species__10'\n", - "[2022-03-06 00:38:01][datar][WARNING] * 'name' -> 'name__11'\n", - "[2022-03-06 00:38:01][datar][WARNING] * 'height' -> 'height__12'\n", - "[2022-03-06 00:38:01][datar][WARNING] * 'mass' -> 'mass__13'\n", - "[2022-03-06 00:38:01][datar][WARNING] * 'hair_color' -> 'hair_color__14'\n", - "[2022-03-06 00:38:01][datar][WARNING] * 'skin_color' -> 'skin_color__15'\n", - "[2022-03-06 00:38:01][datar][WARNING] * 'eye_color' -> 'eye_color__16'\n", - "[2022-03-06 00:38:01][datar][WARNING] * 'birth_year' -> 'birth_year__17'\n", - "[2022-03-06 00:38:01][datar][WARNING] * 'sex' -> 'sex__18'\n", - "[2022-03-06 00:38:01][datar][WARNING] * 'gender' -> 'gender__19'\n", - "[2022-03-06 00:38:01][datar][WARNING] * 'homeworld' -> 'homeworld__20'\n", - "[2022-03-06 00:38:01][datar][WARNING] * 'species' -> 'species__21'\n" + "[2022-03-18 17:26:56][datar][WARNING] New names:\n", + "[2022-03-18 17:26:56][datar][WARNING] * 'name' -> 'name__0'\n", + "[2022-03-18 17:26:56][datar][WARNING] * 'height' -> 'height__1'\n", + "[2022-03-18 17:26:56][datar][WARNING] * 'mass' -> 'mass__2'\n", + "[2022-03-18 17:26:56][datar][WARNING] * 'hair_color' -> 
'hair_color__3'\n", + "[2022-03-18 17:26:56][datar][WARNING] * 'skin_color' -> 'skin_color__4'\n", + "[2022-03-18 17:26:56][datar][WARNING] * 'eye_color' -> 'eye_color__5'\n", + "[2022-03-18 17:26:56][datar][WARNING] * 'birth_year' -> 'birth_year__6'\n", + "[2022-03-18 17:26:56][datar][WARNING] * 'sex' -> 'sex__7'\n", + "[2022-03-18 17:26:56][datar][WARNING] * 'gender' -> 'gender__8'\n", + "[2022-03-18 17:26:56][datar][WARNING] * 'homeworld' -> 'homeworld__9'\n", + "[2022-03-18 17:26:56][datar][WARNING] * 'species' -> 'species__10'\n", + "[2022-03-18 17:26:56][datar][WARNING] * 'name' -> 'name__11'\n", + "[2022-03-18 17:26:56][datar][WARNING] * 'height' -> 'height__12'\n", + "[2022-03-18 17:26:56][datar][WARNING] * 'mass' -> 'mass__13'\n", + "[2022-03-18 17:26:56][datar][WARNING] * 'hair_color' -> 'hair_color__14'\n", + "[2022-03-18 17:26:56][datar][WARNING] * 'skin_color' -> 'skin_color__15'\n", + "[2022-03-18 17:26:56][datar][WARNING] * 'eye_color' -> 'eye_color__16'\n", + "[2022-03-18 17:26:56][datar][WARNING] * 'birth_year' -> 'birth_year__17'\n", + "[2022-03-18 17:26:56][datar][WARNING] * 'sex' -> 'sex__18'\n", + "[2022-03-18 17:26:56][datar][WARNING] * 'gender' -> 'gender__19'\n", + "[2022-03-18 17:26:56][datar][WARNING] * 'homeworld' -> 'homeworld__20'\n", + "[2022-03-18 17:26:56][datar][WARNING] * 'species' -> 'species__21'\n" ] }, { @@ -2212,7 +2196,7 @@ "[7 rows x 22 columns]" ] }, - "execution_count": 14, + "execution_count": 13, "metadata": {}, "output_type": "execute_result" } diff --git a/docs/notebooks/case_when.ipynb b/docs/notebooks/case_when.ipynb index 686bb74d..c22ad4c2 100644 --- a/docs/notebooks/case_when.ipynb +++ b/docs/notebooks/case_when.ipynb @@ -13,26 +13,10 @@ } }, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[2022-03-10 12:56:17][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-10 12:56:17][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - 
"[2022-03-10 12:56:17][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-10 12:56:17][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-10 12:56:17][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-10 12:56:17][datar][WARNING] Builtin name \"all\" has been overriden by datar.\n", - "[2022-03-10 12:56:17][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-10 12:56:17][datar][WARNING] Builtin name \"re\" has been overriden by datar.\n", - "[2022-03-10 12:56:17][datar][WARNING] Builtin name \"filter\" has been overriden by datar.\n", - "[2022-03-10 12:56:17][datar][WARNING] Builtin name \"slice\" has been overriden by datar.\n" - ] - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -44,7 +28,7 @@ { "data": { "text/markdown": [ - "### # case_when " + "###
★ case_when
" ], "text/plain": [ "" @@ -77,10 +61,11 @@ ], "source": [ "# https://dplyr.tidyverse.org/reference/case_when.html\n", + "%run nb_helpers.py\n", + "\n", "from datar.datasets import starwars \n", "from datar.all import *\n", "\n", - "%run nb_helpers.py\n", "nb_header(case_when)" ] }, @@ -356,7 +341,7 @@ }, { "cell_type": "code", - "execution_count": 11, + "execution_count": 9, "id": "intermediate-edmonton", "metadata": { "execution": { @@ -528,7 +513,7 @@ "[87 rows x 6 columns]" ] }, - "execution_count": 11, + "execution_count": 9, "metadata": {}, "output_type": "execute_result" } diff --git a/docs/notebooks/chop.ipynb b/docs/notebooks/chop.ipynb index ad5f73f6..48af88f5 100644 --- a/docs/notebooks/chop.ipynb +++ b/docs/notebooks/chop.ipynb @@ -12,26 +12,10 @@ } }, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[2022-03-06 01:13:18][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 01:13:18][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 01:13:18][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 01:13:18][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 01:13:18][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 01:13:18][datar][WARNING] Builtin name \"all\" has been overriden by datar.\n", - "[2022-03-06 01:13:18][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-06 01:13:18][datar][WARNING] Builtin name \"re\" has been overriden by datar.\n", - "[2022-03-06 01:13:18][datar][WARNING] Builtin name \"filter\" has been overriden by datar.\n", - "[2022-03-06 01:13:18][datar][WARNING] Builtin name \"slice\" has been overriden by datar.\n" - ] - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -43,7 +27,7 @@ { "data": { "text/markdown": [ - "### # chop " + "###
★ chop
" ], "text/plain": [ "" @@ -75,7 +59,7 @@ { "data": { "text/markdown": [ - "### # unchop " + "###
★ unchop
" ], "text/plain": [ "" @@ -130,10 +114,9 @@ } ], "source": [ - "from datar.datasets import iris, fish_encounters\n", + "%run nb_helpers.py\n", "from datar.all import *\n", "\n", - "%run nb_helpers.py\n", "nb_header(chop, unchop)" ] }, @@ -303,7 +286,7 @@ }, { "cell_type": "code", - "execution_count": 5, + "execution_count": 4, "metadata": { "execution": { "iopub.execute_input": "2021-07-16T22:27:29.135078Z", @@ -389,7 +372,7 @@ "5 4 3.0" ] }, - "execution_count": 5, + "execution_count": 4, "metadata": {}, "output_type": "execute_result" } @@ -402,7 +385,7 @@ }, { "cell_type": "code", - "execution_count": 7, + "execution_count": 5, "metadata": { "execution": { "iopub.execute_input": "2021-07-16T22:27:29.195709Z", @@ -488,7 +471,7 @@ "5 4 3" ] }, - "execution_count": 7, + "execution_count": 5, "metadata": {}, "output_type": "execute_result" } @@ -499,7 +482,7 @@ }, { "cell_type": "code", - "execution_count": 8, + "execution_count": 6, "metadata": { "execution": { "iopub.execute_input": "2021-07-16T22:27:29.210591Z", @@ -573,7 +556,7 @@ "3 1 3" ] }, - "execution_count": 8, + "execution_count": 6, "metadata": {}, "output_type": "execute_result" } @@ -585,7 +568,7 @@ }, { "cell_type": "code", - "execution_count": 9, + "execution_count": 7, "metadata": { "execution": { "iopub.execute_input": "2021-07-16T22:27:29.251668Z", @@ -610,7 +593,7 @@ }, { "cell_type": "code", - "execution_count": 11, + "execution_count": 8, "metadata": { "execution": { "iopub.execute_input": "2021-07-16T22:27:29.265947Z", @@ -683,7 +666,7 @@ "2 3 NaN 2.0" ] }, - "execution_count": 11, + "execution_count": 8, "metadata": {}, "output_type": "execute_result" } @@ -695,7 +678,7 @@ }, { "cell_type": "code", - "execution_count": 12, + "execution_count": 9, "metadata": { "execution": { "iopub.execute_input": "2021-07-16T22:27:29.376449Z", @@ -775,7 +758,7 @@ "3 3 NaN 2.0" ] }, - "execution_count": 12, + "execution_count": 9, "metadata": {}, "output_type": "execute_result" } diff --git 
a/docs/notebooks/coalesce.ipynb b/docs/notebooks/coalesce.ipynb index 2a8f2c05..504a555a 100644 --- a/docs/notebooks/coalesce.ipynb +++ b/docs/notebooks/coalesce.ipynb @@ -13,26 +13,10 @@ } }, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[2022-03-06 00:31:06][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 00:31:06][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 00:31:06][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 00:31:06][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 00:31:06][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 00:31:06][datar][WARNING] Builtin name \"all\" has been overriden by datar.\n", - "[2022-03-06 00:31:06][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-06 00:31:06][datar][WARNING] Builtin name \"re\" has been overriden by datar.\n", - "[2022-03-06 00:31:06][datar][WARNING] Builtin name \"filter\" has been overriden by datar.\n", - "[2022-03-06 00:31:06][datar][WARNING] Builtin name \"slice\" has been overriden by datar.\n" - ] - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -44,7 +28,7 @@ { "data": { "text/markdown": [ - "### # coalesce " + "###
★ coalesce
" ], "text/plain": [ "" @@ -78,10 +62,10 @@ ], "source": [ "# https://dplyr.tidyverse.org/reference/coalesce.html\n", - "from datar.datasets import starwars \n", + "%run nb_helpers.py\n", + "\n", "from datar.all import *\n", "\n", - "%run nb_helpers.py\n", "nb_header(coalesce)" ] }, diff --git a/docs/notebooks/complete.ipynb b/docs/notebooks/complete.ipynb index a9182ef4..f3521729 100644 --- a/docs/notebooks/complete.ipynb +++ b/docs/notebooks/complete.ipynb @@ -12,26 +12,10 @@ } }, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[2022-03-06 00:44:34][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 00:44:34][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 00:44:34][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 00:44:34][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 00:44:34][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 00:44:34][datar][WARNING] Builtin name \"all\" has been overriden by datar.\n", - "[2022-03-06 00:44:34][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-06 00:44:34][datar][WARNING] Builtin name \"re\" has been overriden by datar.\n", - "[2022-03-06 00:44:34][datar][WARNING] Builtin name \"filter\" has been overriden by datar.\n", - "[2022-03-06 00:44:34][datar][WARNING] Builtin name \"slice\" has been overriden by datar.\n" - ] - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -43,7 +27,7 @@ { "data": { "text/markdown": [ - "### # complete " + "###
★ complete
" ], "text/plain": [ "" @@ -84,9 +68,9 @@ } ], "source": [ + "%run nb_helpers.py\n", "from datar.all import *\n", "\n", - "%run nb_helpers.py\n", "nb_header(complete)" ] }, diff --git a/docs/notebooks/context.ipynb b/docs/notebooks/context.ipynb index e16bec7f..9c2b0842 100644 --- a/docs/notebooks/context.ipynb +++ b/docs/notebooks/context.ipynb @@ -13,26 +13,10 @@ } }, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[2022-03-06 00:31:25][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 00:31:25][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 00:31:25][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 00:31:25][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 00:31:25][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 00:31:25][datar][WARNING] Builtin name \"all\" has been overriden by datar.\n", - "[2022-03-06 00:31:25][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-06 00:31:25][datar][WARNING] Builtin name \"re\" has been overriden by datar.\n", - "[2022-03-06 00:31:25][datar][WARNING] Builtin name \"filter\" has been overriden by datar.\n", - "[2022-03-06 00:31:25][datar][WARNING] Builtin name \"slice\" has been overriden by datar.\n" - ] - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -44,7 +28,7 @@ { "data": { "text/markdown": [ - "### # cur_group_id " + "###
★ cur_group_id
" ], "text/plain": [ "" @@ -68,7 +52,7 @@ { "data": { "text/markdown": [ - "### # cur_group_rows " + "###
★ cur_group_rows
" ], "text/plain": [ "" @@ -98,7 +82,7 @@ { "data": { "text/markdown": [ - "### # cur_data " + "###
★ cur_data
" ], "text/plain": [ "" @@ -123,7 +107,7 @@ { "data": { "text/markdown": [ - "### # cur_data_all " + "###
★ cur_data_all
" ], "text/plain": [ "" @@ -148,7 +132,7 @@ { "data": { "text/markdown": [ - "### # cur_column " + "###
★ cur_column
" ], "text/plain": [ "" @@ -172,9 +156,9 @@ ], "source": [ "# https://dplyr.tidyverse.org/reference/context.html\n", + "%run nb_helpers.py\n", "from datar.all import *\n", "\n", - "%run nb_helpers.py\n", "nb_header(cur_group_id, cur_group_rows, cur_data, cur_data_all, cur_column, book='context')" ] }, @@ -314,38 +298,38 @@ " \n", " 0\n", " a\n", - " 0.006538\n", - " 0.421710\n", + " 0.276842\n", + " 0.639718\n", " \n", " \n", " 1\n", " b\n", - " 0.480888\n", - " 0.103287\n", + " 0.333175\n", + " 0.149536\n", " \n", " \n", " 2\n", " b\n", - " 0.763029\n", - " 0.543031\n", + " 0.728975\n", + " 0.400257\n", " \n", " \n", " 3\n", " c\n", - " 0.201200\n", - " 0.207406\n", + " 0.116262\n", + " 0.087035\n", " \n", " \n", " 4\n", " c\n", - " 0.508855\n", - " 0.315907\n", + " 0.541848\n", + " 0.312297\n", " \n", " \n", " 5\n", " c\n", - " 0.610592\n", - " 0.650160\n", + " 0.495865\n", + " 0.114572\n", " \n", " \n", "\n", @@ -355,12 +339,12 @@ "text/plain": [ " g x y\n", " \n", - "0 a 0.006538 0.421710\n", - "1 b 0.480888 0.103287\n", - "2 b 0.763029 0.543031\n", - "3 c 0.201200 0.207406\n", - "4 c 0.508855 0.315907\n", - "5 c 0.610592 0.650160\n", + "0 a 0.276842 0.639718\n", + "1 b 0.333175 0.149536\n", + "2 b 0.728975 0.400257\n", + "3 c 0.116262 0.087035\n", + "4 c 0.541848 0.312297\n", + "5 c 0.495865 0.114572\n", "[TibbleGrouped: g (n=3)]" ] }, @@ -424,43 +408,43 @@ " \n", " 0\n", " a\n", - " 0.006538\n", - " 0.421710\n", + " 0.276842\n", + " 0.639718\n", " 0\n", " \n", " \n", " 1\n", " b\n", - " 0.480888\n", - " 0.103287\n", + " 0.333175\n", + " 0.149536\n", " 1\n", " \n", " \n", " 2\n", " b\n", - " 0.763029\n", - " 0.543031\n", + " 0.728975\n", + " 0.400257\n", " 1\n", " \n", " \n", " 3\n", " c\n", - " 0.201200\n", - " 0.207406\n", + " 0.116262\n", + " 0.087035\n", " 2\n", " \n", " \n", " 4\n", " c\n", - " 0.508855\n", - " 0.315907\n", + " 0.541848\n", + " 0.312297\n", " 2\n", " \n", " \n", " 5\n", " c\n", - " 0.610592\n", - " 0.650160\n", + " 0.495865\n", + " 
0.114572\n", " 2\n", " \n", " \n", @@ -471,12 +455,12 @@ "text/plain": [ " g x y id\n", " \n", - "0 a 0.006538 0.421710 0\n", - "1 b 0.480888 0.103287 1\n", - "2 b 0.763029 0.543031 1\n", - "3 c 0.201200 0.207406 2\n", - "4 c 0.508855 0.315907 2\n", - "5 c 0.610592 0.650160 2\n", + "0 a 0.276842 0.639718 0\n", + "1 b 0.333175 0.149536 1\n", + "2 b 0.728975 0.400257 1\n", + "3 c 0.116262 0.087035 2\n", + "4 c 0.541848 0.312297 2\n", + "5 c 0.495865 0.114572 2\n", "[TibbleGrouped: g (n=3)]" ] }, @@ -571,7 +555,7 @@ }, { "cell_type": "code", - "execution_count": 9, + "execution_count": 6, "id": "cb760a8a", "metadata": { "execution": { @@ -640,7 +624,7 @@ "2 c " ] }, - "execution_count": 9, + "execution_count": 6, "metadata": {}, "output_type": "execute_result" } @@ -652,7 +636,7 @@ }, { "cell_type": "code", - "execution_count": 10, + "execution_count": 7, "id": "4c25f162", "metadata": { "execution": { @@ -672,7 +656,7 @@ "Name: data, dtype: object" ] }, - "execution_count": 10, + "execution_count": 7, "metadata": {}, "output_type": "execute_result" } @@ -683,7 +667,7 @@ }, { "cell_type": "code", - "execution_count": 11, + "execution_count": 8, "id": "71996f23", "metadata": { "execution": { @@ -752,7 +736,7 @@ "2 c " ] }, - "execution_count": 11, + "execution_count": 8, "metadata": {}, "output_type": "execute_result" } @@ -764,7 +748,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 9, "id": "9b37d097", "metadata": { "execution": { @@ -780,19 +764,19 @@ "text/plain": [ "[ x y\n", " \n", - " 0 0.355023 0.000239,\n", + " 0 0.276842 0.639718,\n", " x y\n", " \n", - " 0 0.880160 0.685917\n", - " 1 0.346984 0.925864,\n", + " 1 0.333175 0.149536\n", + " 2 0.728975 0.400257,\n", " x y\n", " \n", - " 0 0.235711 0.701329\n", - " 1 0.320924 0.903383\n", - " 2 0.517224 0.223750]" + " 3 0.116262 0.087035\n", + " 4 0.541848 0.312297\n", + " 5 0.495865 0.114572]" ] }, - "execution_count": 1, + "execution_count": 9, "metadata": {}, "output_type": 
"execute_result" } @@ -803,7 +787,7 @@ }, { "cell_type": "code", - "execution_count": 12, + "execution_count": 10, "id": "03c07299", "metadata": { "execution": { @@ -872,7 +856,7 @@ "2 c " ] }, - "execution_count": 12, + "execution_count": 10, "metadata": {}, "output_type": "execute_result" } @@ -884,7 +868,7 @@ }, { "cell_type": "code", - "execution_count": 13, + "execution_count": 11, "id": "4cc41680", "metadata": { "execution": { @@ -900,19 +884,19 @@ "text/plain": [ "[ g x y\n", " \n", - " 0 a 0.006538 0.42171,\n", + " 0 a 0.276842 0.639718,\n", " g x y\n", " \n", - " 1 b 0.480888 0.103287\n", - " 2 b 0.763029 0.543031,\n", + " 1 b 0.333175 0.149536\n", + " 2 b 0.728975 0.400257,\n", " g x y\n", " \n", - " 3 c 0.201200 0.207406\n", - " 4 c 0.508855 0.315907\n", - " 5 c 0.610592 0.650160]" + " 3 c 0.116262 0.087035\n", + " 4 c 0.541848 0.312297\n", + " 5 c 0.495865 0.114572]" ] }, - "execution_count": 13, + "execution_count": 11, "metadata": {}, "output_type": "execute_result" } @@ -923,7 +907,7 @@ }, { "cell_type": "code", - "execution_count": 14, + "execution_count": 12, "id": "fe4097d2", "metadata": { "execution": { @@ -967,50 +951,50 @@ " \n", " \n", " 0\n", - " x 4.275181839861608e-05\n", - " y 0.17783898820060154\n", + " x 0.07664148433958724\n", + " y 0.4092387034410027\n", " \n", " \n", " 1\n", - " x 0.2312531724845601\n", - " y 0.01066819823473873\n", + " x 0.11100534084266422\n", + " y 0.02236109719928575\n", " \n", " \n", " 2\n", - " x 0.5822139970696143\n", - " y 0.2948830834486957\n", + " x 0.5314038334653144\n", + " y 0.16020604530995483\n", " \n", " \n", " 3\n", - " x 0.04048149826262316\n", - " y 0.04301741953459272\n", + " x 0.013516938415598222\n", + " y 0.007575071702234481\n", " \n", " \n", " 4\n", - " x 0.25893300858833146\n", - " y 0.09979740403309767\n", + " x 0.2935994793280256\n", + " y 0.0975293132771369\n", " \n", " \n", " 5\n", - " x 0.37282240541087586\n", - " y 0.4227077348376767\n", + " x 0.24588211859358594\n", + " y 
0.013126717677172012\n", " \n", " \n", "\n", "\n" ], "text/plain": [ - " x y\n", - " \n", - "0 x 4.275181839861608e-05 y 0.17783898820060154\n", - "1 x 0.2312531724845601 y 0.01066819823473873\n", - "2 x 0.5822139970696143 y 0.2948830834486957\n", - "3 x 0.04048149826262316 y 0.04301741953459272\n", - "4 x 0.25893300858833146 y 0.09979740403309767\n", - "5 x 0.37282240541087586 y 0.4227077348376767" + " x y\n", + " \n", + "0 x 0.07664148433958724 y 0.4092387034410027\n", + "1 x 0.11100534084266422 y 0.02236109719928575\n", + "2 x 0.5314038334653144 y 0.16020604530995483\n", + "3 x 0.013516938415598222 y 0.007575071702234481\n", + "4 x 0.2935994793280256 y 0.0975293132771369\n", + "5 x 0.24588211859358594 y 0.013126717677172012" ] }, - "execution_count": 14, + "execution_count": 12, "metadata": {}, "output_type": "execute_result" } @@ -1026,7 +1010,7 @@ }, { "cell_type": "code", - "execution_count": 15, + "execution_count": 13, "id": "c99b8dee", "metadata": { "execution": { @@ -1073,55 +1057,55 @@ " \n", " 0\n", " a\n", - " x 4.275181839861608e-05\n", - " y 0.17783898820060154\n", + " x 0.07664148433958724\n", + " y 0.4092387034410027\n", " \n", " \n", " 1\n", " b\n", - " x 0.2312531724845601\n", - " y 0.01066819823473873\n", + " x 0.11100534084266422\n", + " y 0.02236109719928575\n", " \n", " \n", " 2\n", " b\n", - " x 0.5822139970696143\n", - " y 0.2948830834486957\n", + " x 0.5314038334653144\n", + " y 0.16020604530995483\n", " \n", " \n", " 3\n", " c\n", - " x 0.04048149826262316\n", - " y 0.04301741953459272\n", + " x 0.013516938415598222\n", + " y 0.007575071702234481\n", " \n", " \n", " 4\n", " c\n", - " x 0.25893300858833146\n", - " y 0.09979740403309767\n", + " x 0.2935994793280256\n", + " y 0.0975293132771369\n", " \n", " \n", " 5\n", " c\n", - " x 0.37282240541087586\n", - " y 0.4227077348376767\n", + " x 0.24588211859358594\n", + " y 0.013126717677172012\n", " \n", " \n", "\n", "\n" ], "text/plain": [ - " g x y\n", - " \n", - "0 a x 4.275181839861608e-05 
y 0.17783898820060154\n", - "1 b x 0.2312531724845601 y 0.01066819823473873\n", - "2 b x 0.5822139970696143 y 0.2948830834486957\n", - "3 c x 0.04048149826262316 y 0.04301741953459272\n", - "4 c x 0.25893300858833146 y 0.09979740403309767\n", - "5 c x 0.37282240541087586 y 0.4227077348376767" + " g x y\n", + " \n", + "0 a x 0.07664148433958724 y 0.4092387034410027\n", + "1 b x 0.11100534084266422 y 0.02236109719928575\n", + "2 b x 0.5314038334653144 y 0.16020604530995483\n", + "3 c x 0.013516938415598222 y 0.007575071702234481\n", + "4 c x 0.2935994793280256 y 0.0975293132771369\n", + "5 c x 0.24588211859358594 y 0.013126717677172012" ] }, - "execution_count": 15, + "execution_count": 13, "metadata": {}, "output_type": "execute_result" } diff --git a/docs/notebooks/count.ipynb b/docs/notebooks/count.ipynb index 87bbbaee..b38b5192 100644 --- a/docs/notebooks/count.ipynb +++ b/docs/notebooks/count.ipynb @@ -13,26 +13,10 @@ } }, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[2022-03-06 01:34:00][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 01:34:00][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 01:34:00][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 01:34:00][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 01:34:00][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 01:34:00][datar][WARNING] Builtin name \"all\" has been overriden by datar.\n", - "[2022-03-06 01:34:00][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-06 01:34:00][datar][WARNING] Builtin name \"re\" has been overriden by datar.\n", - "[2022-03-06 01:34:00][datar][WARNING] Builtin name \"filter\" has been overriden by datar.\n", - "[2022-03-06 01:34:00][datar][WARNING] Builtin name \"slice\" has been overriden by datar.\n" - ] - }, { "data": { 
"text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -44,7 +28,7 @@ { "data": { "text/markdown": [ - "### # count " + "###
★ count
" ], "text/plain": [ "" @@ -84,7 +68,7 @@ { "data": { "text/markdown": [ - "### # tally " + "###
★ tally
" ], "text/plain": [ "" @@ -110,7 +94,7 @@ { "data": { "text/markdown": [ - "### # add_count " + "###
★ add_count
" ], "text/plain": [ "" @@ -136,7 +120,7 @@ { "data": { "text/markdown": [ - "### # add_tally " + "###
★ add_tally
" ], "text/plain": [ "" @@ -162,11 +146,11 @@ ], "source": [ "# https://dplyr.tidyverse.org/reference/count.html\n", - "from pandas import DataFrame\n", + "%run nb_helpers.py\n", + "\n", "from datar.datasets import starwars\n", "from datar.all import *\n", "\n", - "%run nb_helpers.py\n", "nb_header(count, tally, add_count, add_tally)" ] }, diff --git a/docs/notebooks/cumall.ipynb b/docs/notebooks/cumall.ipynb index 889a23a3..589d2873 100644 --- a/docs/notebooks/cumall.ipynb +++ b/docs/notebooks/cumall.ipynb @@ -13,26 +13,10 @@ } }, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[2022-03-06 01:35:10][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 01:35:10][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 01:35:10][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 01:35:10][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 01:35:10][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 01:35:10][datar][WARNING] Builtin name \"all\" has been overriden by datar.\n", - "[2022-03-06 01:35:10][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-06 01:35:10][datar][WARNING] Builtin name \"re\" has been overriden by datar.\n", - "[2022-03-06 01:35:10][datar][WARNING] Builtin name \"filter\" has been overriden by datar.\n", - "[2022-03-06 01:35:10][datar][WARNING] Builtin name \"slice\" has been overriden by datar.\n" - ] - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -44,7 +28,7 @@ { "data": { "text/markdown": [ - "### # cummean " + "###
★ cummean
" ], "text/plain": [ "" @@ -68,7 +52,7 @@ { "data": { "text/markdown": [ - "### # cumsum " + "###
★ cumsum
" ], "text/plain": [ "" @@ -98,7 +82,7 @@ { "data": { "text/markdown": [ - "### # cumall " + "###
★ cumall
" ], "text/plain": [ "" @@ -122,7 +106,7 @@ { "data": { "text/markdown": [ - "### # cumany " + "###
★ cumany
" ], "text/plain": [ "" @@ -146,7 +130,7 @@ { "data": { "text/markdown": [ - "### # cumany " + "###
★ cumany
" ], "text/plain": [ "" @@ -170,11 +154,12 @@ ], "source": [ "# https://dplyr.tidyverse.org/reference/cumall.html\n", + "%run nb_helpers.py\n", + "\n", "import numpy\n", "\n", "from datar.all import *\n", "\n", - "%run nb_helpers.py\n", "nb_header(cummean, cumsum, cumall, cumany, cumany, book='cumall')" ] }, @@ -194,12 +179,7 @@ { "data": { "text/plain": [ - "0 1.00\n", - "1 2.00\n", - "2 3.00\n", - "3 2.75\n", - "4 2.60\n", - "Name: x, dtype: float64" + "array([1. , 2. , 3. , 2.75, 2.6 ])" ] }, "execution_count": 2, @@ -214,7 +194,7 @@ }, { "cell_type": "code", - "execution_count": 8, + "execution_count": 3, "id": "religious-voltage", "metadata": { "execution": { @@ -228,15 +208,10 @@ { "data": { "text/plain": [ - "0 1.00\n", - "1 2.00\n", - "2 3.00\n", - "3 2.75\n", - "4 2.60\n", - "Name: x, dtype: float64" + "array([1. , 2. , 3. , 2.75, 2.6 ])" ] }, - "execution_count": 8, + "execution_count": 3, "metadata": {}, "output_type": "execute_result" } @@ -261,12 +236,7 @@ { "data": { "text/plain": [ - "0 True\n", - "1 True\n", - "2 False\n", - "3 False\n", - "4 False\n", - "Name: x, dtype: bool" + "array([ True, True, False, False, False])" ] }, "execution_count": 4, @@ -294,12 +264,7 @@ { "data": { "text/plain": [ - "0 False\n", - "1 True\n", - "2 True\n", - "3 True\n", - "4 True\n", - "Name: x, dtype: bool" + "array([False, True, True, True, True])" ] }, "execution_count": 5, diff --git a/docs/notebooks/datar.ipynb b/docs/notebooks/datar.ipynb index df8c1bee..9e7e2dd1 100644 --- a/docs/notebooks/datar.ipynb +++ b/docs/notebooks/datar.ipynb @@ -2,7 +2,7 @@ "cells": [ { "cell_type": "code", - "execution_count": 15, + "execution_count": 1, "id": "5ddd5613", "metadata": { "execution": { @@ -16,7 +16,7 @@ { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -28,7 +28,7 @@ { "data": { "text/markdown": [ - "### # get " + "###
★ get
" ], "text/plain": [ "" @@ -63,7 +63,7 @@ { "data": { "text/markdown": [ - "### # flatten " + "###
★ flatten
" ], "text/plain": [ "" @@ -93,7 +93,7 @@ { "data": { "text/markdown": [ - "### # itemgetter " + "###
★ itemgetter
" ], "text/plain": [ "" @@ -128,7 +128,7 @@ { "data": { "text/markdown": [ - "### # attrgetter " + "###
★ attrgetter
" ], "text/plain": [ "" @@ -155,7 +155,7 @@ { "data": { "text/markdown": [ - "### # pd_str " + "###
★ pd_str
" ], "text/plain": [ "" @@ -181,7 +181,7 @@ { "data": { "text/markdown": [ - "### # pd_cat " + "###
★ pd_cat
" ], "text/plain": [ "" @@ -207,7 +207,7 @@ { "data": { "text/markdown": [ - "### # pd_dt " + "###
★ pd_dt
" ], "text/plain": [ "" @@ -976,7 +976,7 @@ }, { "cell_type": "code", - "execution_count": 14, + "execution_count": 12, "id": "081a9d1e", "metadata": {}, "outputs": [ @@ -1038,7 +1038,7 @@ "[TibbleGrouped: g (n=2)]" ] }, - "execution_count": 14, + "execution_count": 12, "metadata": {}, "output_type": "execute_result" } @@ -1054,7 +1054,7 @@ }, { "cell_type": "code", - "execution_count": 16, + "execution_count": 13, "id": "b2aaa7f0", "metadata": {}, "outputs": [ @@ -1116,7 +1116,7 @@ "[TibbleGrouped: g (n=2)]" ] }, - "execution_count": 16, + "execution_count": 13, "metadata": {}, "output_type": "execute_result" } diff --git a/docs/notebooks/desc.ipynb b/docs/notebooks/desc.ipynb index c2093807..33099551 100644 --- a/docs/notebooks/desc.ipynb +++ b/docs/notebooks/desc.ipynb @@ -16,7 +16,7 @@ { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -28,7 +28,7 @@ { "data": { "text/markdown": [ - "### # desc " + "###
★ desc
" ], "text/plain": [ "" @@ -62,10 +62,10 @@ } ], "source": [ + "%run nb_helpers.py\n", "from datar.base import factor, letters\n", "from datar.dplyr import desc\n", "\n", - "%run nb_helpers.py\n", "nb_header(desc)" ] }, @@ -85,17 +85,7 @@ { "data": { "text/plain": [ - "0 -1\n", - "1 -2\n", - "2 -3\n", - "3 -4\n", - "4 -5\n", - "5 -6\n", - "6 -7\n", - "7 -8\n", - "8 -9\n", - "9 -10\n", - "dtype: int64" + "array([ -1, -2, -3, -4, -5, -6, -7, -8, -9, -10])" ] }, "execution_count": 2, diff --git a/docs/notebooks/distinct.ipynb b/docs/notebooks/distinct.ipynb index 0cd322e2..ff7a1cdc 100644 --- a/docs/notebooks/distinct.ipynb +++ b/docs/notebooks/distinct.ipynb @@ -13,26 +13,10 @@ } }, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[2022-03-06 01:35:44][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 01:35:44][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 01:35:44][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 01:35:44][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 01:35:44][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 01:35:44][datar][WARNING] Builtin name \"all\" has been overriden by datar.\n", - "[2022-03-06 01:35:44][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-06 01:35:44][datar][WARNING] Builtin name \"re\" has been overriden by datar.\n", - "[2022-03-06 01:35:44][datar][WARNING] Builtin name \"filter\" has been overriden by datar.\n", - "[2022-03-06 01:35:44][datar][WARNING] Builtin name \"slice\" has been overriden by datar.\n" - ] - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -44,7 +28,7 @@ { "data": { "text/markdown": [ - "### # distinct " + "###
★ distinct
" ], "text/plain": [ "" @@ -82,7 +66,7 @@ { "data": { "text/markdown": [ - "### # n_distinct " + "###
★ n_distinct
" ], "text/plain": [ "" @@ -106,10 +90,10 @@ ], "source": [ "# https://dplyr.tidyverse.org/reference/distinct.html\n", + "%run nb_helpers.py\n", "from datar.datasets import starwars\n", "from datar.all import *\n", "\n", - "%run nb_helpers.py\n", "nb_header(distinct, n_distinct, book='distinct')" ] }, @@ -161,7 +145,7 @@ { "data": { "text/plain": [ - "60" + "61" ] }, "execution_count": 3, @@ -189,7 +173,7 @@ { "data": { "text/plain": [ - "60" + "61" ] }, "execution_count": 4, @@ -245,43 +229,43 @@ " \n", " \n", " 0\n", - " 0\n", + " 8\n", " \n", " \n", - " 2\n", - " 2\n", + " 1\n", + " 5\n", " \n", " \n", " 3\n", - " 3\n", + " 4\n", " \n", " \n", " 4\n", - " 4\n", + " 0\n", " \n", " \n", - " 7\n", - " 1\n", + " 6\n", + " 7\n", " \n", " \n", - " 8\n", - " 6\n", + " 12\n", + " 2\n", " \n", " \n", - " 11\n", - " 5\n", + " 13\n", + " 1\n", " \n", " \n", - " 13\n", - " 8\n", + " 14\n", + " 3\n", " \n", " \n", " 15\n", - " 9\n", + " 6\n", " \n", " \n", - " 27\n", - " 7\n", + " 21\n", + " 9\n", " \n", " \n", "\n", @@ -290,16 +274,16 @@ "text/plain": [ " x\n", " \n", - "0 0\n", - "2 2\n", - "3 3\n", - "4 4\n", - "7 1\n", - "8 6\n", - "11 5\n", - "13 8\n", - "15 9\n", - "27 7" + "0 8\n", + "1 5\n", + "3 4\n", + "4 0\n", + "6 7\n", + "12 2\n", + "13 1\n", + "14 3\n", + "15 6\n", + "21 9" ] }, "execution_count": 5, @@ -355,43 +339,43 @@ " \n", " \n", " 0\n", - " 1\n", + " 5\n", " \n", " \n", " 1\n", - " 5\n", + " 7\n", " \n", " \n", - " 4\n", - " 2\n", + " 2\n", + " 9\n", " \n", " \n", - " 5\n", - " 7\n", + " 3\n", + " 4\n", " \n", " \n", - " 6\n", - " 0\n", + " 4\n", + " 6\n", " \n", " \n", - " 9\n", - " 8\n", + " 5\n", + " 1\n", " \n", " \n", - " 12\n", - " 6\n", + " 13\n", + " 0\n", " \n", " \n", - " 13\n", - " 3\n", + " 14\n", + " 2\n", " \n", " \n", - " 15\n", - " 9\n", + " 17\n", + " 3\n", " \n", " \n", - " 25\n", - " 4\n", + " 18\n", + " 8\n", " \n", " \n", "\n", @@ -400,16 +384,16 @@ "text/plain": [ " y\n", " \n", - "0 1\n", - "1 5\n", - "4 2\n", - "5 7\n", - "6 0\n", 
- "9 8\n", - "12 6\n", - "13 3\n", - "15 9\n", - "25 4" + "0 5\n", + "1 7\n", + "2 9\n", + "3 4\n", + "4 6\n", + "5 1\n", + "13 0\n", + "14 2\n", + "17 3\n", + "18 8" ] }, "execution_count": 6, @@ -467,53 +451,53 @@ " \n", " \n", " 0\n", - " 0\n", - " 1\n", + " 8\n", + " 5\n", " \n", " \n", - " 2\n", - " 2\n", - " 1\n", + " 1\n", + " 5\n", + " 7\n", " \n", " \n", " 3\n", - " 3\n", - " 5\n", + " 4\n", + " 4\n", " \n", " \n", " 4\n", - " 4\n", - " 2\n", + " 0\n", + " 6\n", " \n", " \n", - " 7\n", - " 1\n", + " 6\n", " 7\n", + " 4\n", " \n", " \n", - " 8\n", - " 6\n", - " 7\n", + " 12\n", + " 2\n", + " 5\n", " \n", " \n", - " 11\n", - " 5\n", + " 13\n", + " 1\n", " 0\n", " \n", " \n", - " 13\n", - " 8\n", + " 14\n", " 3\n", + " 2\n", " \n", " \n", " 15\n", - " 9\n", - " 9\n", + " 6\n", + " 0\n", " \n", " \n", - " 27\n", - " 7\n", - " 8\n", + " 21\n", + " 9\n", + " 6\n", " \n", " \n", "\n", @@ -522,16 +506,16 @@ "text/plain": [ " x y\n", " \n", - "0 0 1\n", - "2 2 1\n", - "3 3 5\n", - "4 4 2\n", - "7 1 7\n", - "8 6 7\n", - "11 5 0\n", - "13 8 3\n", - "15 9 9\n", - "27 7 8" + "0 8 5\n", + "1 5 7\n", + "3 4 4\n", + "4 0 6\n", + "6 7 4\n", + "12 2 5\n", + "13 1 0\n", + "14 3 2\n", + "15 6 0\n", + "21 9 6" ] }, "execution_count": 7, @@ -589,53 +573,53 @@ " \n", " \n", " 0\n", - " 0\n", - " 1\n", + " 8\n", + " 5\n", " \n", " \n", " 1\n", - " 0\n", " 5\n", + " 7\n", " \n", " \n", - " 4\n", - " 4\n", - " 2\n", + " 2\n", + " 5\n", + " 9\n", " \n", " \n", - " 5\n", - " 0\n", - " 7\n", + " 3\n", + " 4\n", + " 4\n", " \n", " \n", - " 6\n", - " 0\n", + " 4\n", " 0\n", - " \n", - " \n", - " 9\n", " 6\n", - " 8\n", " \n", " \n", - " 12\n", - " 2\n", - " 6\n", + " 5\n", + " 5\n", + " 1\n", " \n", " \n", " 13\n", - " 8\n", + " 1\n", + " 0\n", + " \n", + " \n", + " 14\n", " 3\n", + " 2\n", " \n", " \n", - " 15\n", - " 9\n", - " 9\n", + " 17\n", + " 7\n", + " 3\n", " \n", " \n", - " 25\n", - " 1\n", + " 18\n", " 4\n", + " 8\n", " \n", " \n", "\n", @@ -644,16 +628,16 @@ "text/plain": [ " 
x y\n", " \n", - "0 0 1\n", - "1 0 5\n", - "4 4 2\n", - "5 0 7\n", - "6 0 0\n", - "9 6 8\n", - "12 2 6\n", - "13 8 3\n", - "15 9 9\n", - "25 1 4" + "0 8 5\n", + "1 5 7\n", + "2 5 9\n", + "3 4 4\n", + "4 0 6\n", + "5 5 1\n", + "13 1 0\n", + "14 3 2\n", + "17 7 3\n", + "18 4 8" ] }, "execution_count": 8, @@ -709,44 +693,44 @@ " \n", " \n", " 0\n", - " 1\n", + " 3\n", " \n", " \n", " 1\n", - " 5\n", - " \n", - " \n", - " 3\n", " 2\n", " \n", " \n", - " 5\n", - " 7\n", + " 2\n", + " 4\n", " \n", " \n", - " 6\n", + " 3\n", " 0\n", " \n", " \n", - " 7\n", + " 4\n", " 6\n", " \n", " \n", - " 10\n", - " 4\n", + " 7\n", + " 7\n", " \n", " \n", - " 23\n", - " 3\n", + " 10\n", + " 1\n", " \n", " \n", - " 26\n", - " 9\n", + " 16\n", + " 5\n", " \n", " \n", - " 47\n", + " 44\n", " 8\n", " \n", + " \n", + " 53\n", + " 9\n", + " \n", " \n", "\n", "\n" @@ -754,16 +738,16 @@ "text/plain": [ " diff\n", " \n", - "0 1\n", - "1 5\n", - "3 2\n", - "5 7\n", - "6 0\n", - "7 6\n", - "10 4\n", - "23 3\n", - "26 9\n", - "47 8" + "0 3\n", + "1 2\n", + "2 4\n", + "3 0\n", + "4 6\n", + "7 7\n", + "10 1\n", + "16 5\n", + "44 8\n", + "53 9" ] }, "execution_count": 9, diff --git a/docs/notebooks/drop_na.ipynb b/docs/notebooks/drop_na.ipynb index 8cfa336f..49245d87 100644 --- a/docs/notebooks/drop_na.ipynb +++ b/docs/notebooks/drop_na.ipynb @@ -13,26 +13,10 @@ } }, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[2022-03-06 01:36:59][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 01:36:59][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 01:36:59][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 01:36:59][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 01:36:59][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 01:36:59][datar][WARNING] Builtin name \"all\" has been overriden by 
datar.\n", - "[2022-03-06 01:36:59][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-06 01:36:59][datar][WARNING] Builtin name \"re\" has been overriden by datar.\n", - "[2022-03-06 01:36:59][datar][WARNING] Builtin name \"filter\" has been overriden by datar.\n", - "[2022-03-06 01:36:59][datar][WARNING] Builtin name \"slice\" has been overriden by datar.\n" - ] - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -44,7 +28,7 @@ { "data": { "text/markdown": [ - "### # drop_na " + "###
★ drop_na
" ], "text/plain": [ "" @@ -83,10 +67,10 @@ ], "source": [ "# https://tidyr.tidyverse.org/reference/drop_na.html\n", + "%run nb_helpers.py\n", "\n", "from datar.all import *\n", "\n", - "%run nb_helpers.py\n", "nb_header(drop_na)" ] }, diff --git a/docs/notebooks/enframe.ipynb b/docs/notebooks/enframe.ipynb index 05ff86f0..96551a5e 100644 --- a/docs/notebooks/enframe.ipynb +++ b/docs/notebooks/enframe.ipynb @@ -15,7 +15,7 @@ { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -27,7 +27,7 @@ { "data": { "text/markdown": [ - "### # enframe " + "###
★ enframe
" ], "text/plain": [ "" @@ -62,7 +62,7 @@ { "data": { "text/markdown": [ - "### # deframe " + "###
★ deframe
" ], "text/plain": [ "" @@ -94,11 +94,11 @@ ], "source": [ "# https://tibble.tidyverse.org/reference/enframe.html\n", + "%run nb_helpers.py\n", "\n", "from datar.tibble import *\n", "from datar.base import seq\n", "\n", - "%run nb_helpers.py\n", "nb_header(enframe, deframe, book='enframe')" ] }, diff --git a/docs/notebooks/expand.ipynb b/docs/notebooks/expand.ipynb index 9ef9d710..58055ecb 100644 --- a/docs/notebooks/expand.ipynb +++ b/docs/notebooks/expand.ipynb @@ -13,26 +13,10 @@ } }, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[2022-03-06 01:39:34][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 01:39:34][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 01:39:34][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 01:39:34][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 01:39:34][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 01:39:34][datar][WARNING] Builtin name \"all\" has been overriden by datar.\n", - "[2022-03-06 01:39:34][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-06 01:39:34][datar][WARNING] Builtin name \"re\" has been overriden by datar.\n", - "[2022-03-06 01:39:34][datar][WARNING] Builtin name \"filter\" has been overriden by datar.\n", - "[2022-03-06 01:39:34][datar][WARNING] Builtin name \"slice\" has been overriden by datar.\n" - ] - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -44,7 +28,7 @@ { "data": { "text/markdown": [ - "### # expand " + "###
★ expand
" ], "text/plain": [ "" @@ -99,7 +83,7 @@ { "data": { "text/markdown": [ - "### # nesting " + "###
★ nesting
" ], "text/plain": [ "" @@ -153,7 +137,7 @@ { "data": { "text/markdown": [ - "### # crossing " + "###
★ crossing
" ], "text/plain": [ "" @@ -209,10 +193,10 @@ ], "source": [ "# https://tidyr.tidyverse.org/reference/expand.html\n", + "%run nb_helpers.py\n", "\n", "from datar.all import *\n", "\n", - "%run nb_helpers.py\n", "nb_header(expand, nesting, crossing)" ] }, @@ -269,42 +253,42 @@ " apple\n", " 2010\n", " XS\n", - " 0.110248\n", + " 0.834311\n", " \n", " \n", " 1\n", " orange\n", " 2010\n", " S\n", - " 0.032335\n", + " 0.611588\n", " \n", " \n", " 2\n", " apple\n", " 2012\n", " M\n", - " 0.096288\n", + " 1.153312\n", " \n", " \n", " 3\n", " orange\n", " 2010\n", " S\n", - " 0.850895\n", + " -0.929683\n", " \n", " \n", " 4\n", " orange\n", " 2010\n", " S\n", - " 0.277872\n", + " 0.908996\n", " \n", " \n", " 5\n", " orange\n", " 2012\n", " M\n", - " -1.816750\n", + " -0.228062\n", " \n", " \n", "\n", @@ -313,12 +297,12 @@ "text/plain": [ " type year size weights\n", " \n", - "0 apple 2010 XS 0.110248\n", - "1 orange 2010 S 0.032335\n", - "2 apple 2012 M 0.096288\n", - "3 orange 2010 S 0.850895\n", - "4 orange 2010 S 0.277872\n", - "5 orange 2012 M -1.816750" + "0 apple 2010 XS 0.834311\n", + "1 orange 2010 S 0.611588\n", + "2 apple 2012 M 1.153312\n", + "3 orange 2010 S -0.929683\n", + "4 orange 2010 S 0.908996\n", + "5 orange 2012 M -0.228062" ] }, "execution_count": 2, @@ -2018,7 +2002,7 @@ " apple\n", " 2010\n", " XS\n", - " 0.110248\n", + " 0.834311\n", " \n", " \n", " 1\n", @@ -2053,7 +2037,7 @@ " apple\n", " 2012\n", " M\n", - " 0.096288\n", + " 1.153312\n", " \n", " \n", " 6\n", @@ -2088,21 +2072,21 @@ " orange\n", " 2010\n", " S\n", - " 0.032335\n", + " 0.611588\n", " \n", " \n", " 11\n", " orange\n", " 2010\n", " S\n", - " 0.850895\n", + " -0.929683\n", " \n", " \n", " 12\n", " orange\n", " 2010\n", " S\n", - " 0.277872\n", + " 0.908996\n", " \n", " \n", " 13\n", @@ -2123,7 +2107,7 @@ " orange\n", " 2012\n", " M\n", - " -1.816750\n", + " -0.228062\n", " \n", " \n", " 16\n", @@ -2146,22 +2130,22 @@ "text/plain": [ " type year size weights\n", " \n", - "0 apple 
2010 XS 0.110248\n", + "0 apple 2010 XS 0.834311\n", "1 apple 2012 XS NaN\n", "2 apple 2010 S NaN\n", "3 apple 2012 S NaN\n", "4 apple 2010 M NaN\n", - "5 apple 2012 M 0.096288\n", + "5 apple 2012 M 1.153312\n", "6 apple 2010 L NaN\n", "7 apple 2012 L NaN\n", "8 orange 2010 XS NaN\n", "9 orange 2012 XS NaN\n", - "10 orange 2010 S 0.032335\n", - "11 orange 2010 S 0.850895\n", - "12 orange 2010 S 0.277872\n", + "10 orange 2010 S 0.611588\n", + "11 orange 2010 S -0.929683\n", + "12 orange 2010 S 0.908996\n", "13 orange 2012 S NaN\n", "14 orange 2010 M NaN\n", - "15 orange 2012 M -1.816750\n", + "15 orange 2012 M -0.228062\n", "16 orange 2010 L NaN\n", "17 orange 2012 L NaN" ] diff --git a/docs/notebooks/expand_grid.ipynb b/docs/notebooks/expand_grid.ipynb index 46f36e8d..839a4a09 100644 --- a/docs/notebooks/expand_grid.ipynb +++ b/docs/notebooks/expand_grid.ipynb @@ -13,26 +13,10 @@ } }, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[2022-03-06 01:38:35][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 01:38:35][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 01:38:35][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 01:38:35][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 01:38:35][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 01:38:35][datar][WARNING] Builtin name \"all\" has been overriden by datar.\n", - "[2022-03-06 01:38:35][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-06 01:38:35][datar][WARNING] Builtin name \"re\" has been overriden by datar.\n", - "[2022-03-06 01:38:35][datar][WARNING] Builtin name \"filter\" has been overriden by datar.\n", - "[2022-03-06 01:38:35][datar][WARNING] Builtin name \"slice\" has been overriden by datar.\n" - ] - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -44,7 +28,7 @@ { "data": { "text/markdown": [ - "### # expand_grid " + "###
★ expand_grid
" ], "text/plain": [ "" @@ -93,10 +77,10 @@ ], "source": [ "# https://tidyr.tidyverse.org/reference/expand_grid.html\n", + "%run nb_helpers.py\n", "\n", "from datar.all import *\n", "\n", - "%run nb_helpers.py\n", "nb_header(expand_grid)" ] }, diff --git a/docs/notebooks/extract.ipynb b/docs/notebooks/extract.ipynb index e92def06..a674d41b 100644 --- a/docs/notebooks/extract.ipynb +++ b/docs/notebooks/extract.ipynb @@ -13,26 +13,10 @@ } }, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[2022-03-06 01:39:44][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 01:39:44][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 01:39:44][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 01:39:44][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 01:39:44][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 01:39:44][datar][WARNING] Builtin name \"all\" has been overriden by datar.\n", - "[2022-03-06 01:39:44][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-06 01:39:44][datar][WARNING] Builtin name \"re\" has been overriden by datar.\n", - "[2022-03-06 01:39:44][datar][WARNING] Builtin name \"filter\" has been overriden by datar.\n", - "[2022-03-06 01:39:44][datar][WARNING] Builtin name \"slice\" has been overriden by datar.\n" - ] - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -44,7 +28,7 @@ { "data": { "text/markdown": [ - "### # extract " + "###
★ extract
" ], "text/plain": [ "" @@ -88,10 +72,10 @@ ], "source": [ "# https://tidyr.tidyverse.org/reference/extract.html\n", + "%run nb_helpers.py\n", "\n", "from datar.all import *\n", "\n", - "%run nb_helpers.py\n", "nb_header(extract)" ] }, diff --git a/docs/notebooks/fill.ipynb b/docs/notebooks/fill.ipynb index 208106ae..35cf603b 100644 --- a/docs/notebooks/fill.ipynb +++ b/docs/notebooks/fill.ipynb @@ -13,26 +13,10 @@ } }, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[2022-03-06 01:39:59][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 01:39:59][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 01:39:59][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 01:39:59][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 01:39:59][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 01:39:59][datar][WARNING] Builtin name \"all\" has been overriden by datar.\n", - "[2022-03-06 01:39:59][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-06 01:39:59][datar][WARNING] Builtin name \"re\" has been overriden by datar.\n", - "[2022-03-06 01:39:59][datar][WARNING] Builtin name \"filter\" has been overriden by datar.\n", - "[2022-03-06 01:39:59][datar][WARNING] Builtin name \"slice\" has been overriden by datar.\n" - ] - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -44,7 +28,7 @@ { "data": { "text/markdown": [ - "### # fill " + "###
★ fill
" ], "text/plain": [ "" @@ -82,10 +66,10 @@ ], "source": [ "# https://tidyr.tidyverse.org/reference/fill.html\n", + "%run nb_helpers.py\n", "\n", "from datar.all import *\n", "\n", - "%run nb_helpers.py\n", "nb_header(fill)" ] }, diff --git a/docs/notebooks/filter-joins.ipynb b/docs/notebooks/filter-joins.ipynb index b361864f..adb8fae0 100644 --- a/docs/notebooks/filter-joins.ipynb +++ b/docs/notebooks/filter-joins.ipynb @@ -12,26 +12,10 @@ } }, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[2022-03-06 01:40:07][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 01:40:07][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 01:40:07][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 01:40:07][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 01:40:07][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 01:40:07][datar][WARNING] Builtin name \"all\" has been overriden by datar.\n", - "[2022-03-06 01:40:07][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-06 01:40:07][datar][WARNING] Builtin name \"re\" has been overriden by datar.\n", - "[2022-03-06 01:40:07][datar][WARNING] Builtin name \"filter\" has been overriden by datar.\n", - "[2022-03-06 01:40:07][datar][WARNING] Builtin name \"slice\" has been overriden by datar.\n" - ] - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -43,7 +27,7 @@ { "data": { "text/markdown": [ - "### # semi_join " + "###
★ semi_join
" ], "text/plain": [ "" @@ -70,7 +54,7 @@ { "data": { "text/markdown": [ - "### # anti_join " + "###
★ anti_join
" ], "text/plain": [ "" @@ -97,11 +81,11 @@ ], "source": [ "# https://dplyr.tidyverse.org/reference/filter-joins.html\n", + "%run nb_helpers.py\n", "\n", "from datar.datasets import band_members, band_instruments\n", "from datar.all import *\n", "\n", - "%run nb_helpers.py\n", "nb_header(semi_join, anti_join, book='filter-joins')" ] }, diff --git a/docs/notebooks/filter.ipynb b/docs/notebooks/filter.ipynb index 78a53f05..24cffdf0 100644 --- a/docs/notebooks/filter.ipynb +++ b/docs/notebooks/filter.ipynb @@ -12,26 +12,10 @@ } }, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[2022-03-06 01:45:09][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 01:45:09][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 01:45:09][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 01:45:09][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 01:45:09][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 01:45:09][datar][WARNING] Builtin name \"all\" has been overriden by datar.\n", - "[2022-03-06 01:45:09][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-06 01:45:09][datar][WARNING] Builtin name \"re\" has been overriden by datar.\n", - "[2022-03-06 01:45:09][datar][WARNING] Builtin name \"filter\" has been overriden by datar.\n", - "[2022-03-06 01:45:09][datar][WARNING] Builtin name \"slice\" has been overriden by datar.\n" - ] - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -43,7 +27,7 @@ { "data": { "text/markdown": [ - "### # filter " + "###
★ filter
" ], "text/plain": [ "" @@ -75,10 +59,10 @@ ], "source": [ "# https://dplyr.tidyverse.org/reference/filter.html\n", + "%run nb_helpers.py\n", "from datar.datasets import starwars\n", "from datar.all import *\n", "\n", - "%run nb_helpers.py\n", "nb_header(filter)" ] }, diff --git a/docs/notebooks/forcats_fct_multi.ipynb b/docs/notebooks/forcats_fct_multi.ipynb index ef32f183..7256146e 100644 --- a/docs/notebooks/forcats_fct_multi.ipynb +++ b/docs/notebooks/forcats_fct_multi.ipynb @@ -5,26 +5,10 @@ "execution_count": 1, "metadata": {}, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[2022-03-06 01:45:24][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 01:45:24][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 01:45:24][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 01:45:24][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 01:45:24][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 01:45:24][datar][WARNING] Builtin name \"all\" has been overriden by datar.\n", - "[2022-03-06 01:45:24][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-06 01:45:24][datar][WARNING] Builtin name \"re\" has been overriden by datar.\n", - "[2022-03-06 01:45:24][datar][WARNING] Builtin name \"filter\" has been overriden by datar.\n", - "[2022-03-06 01:45:24][datar][WARNING] Builtin name \"slice\" has been overriden by datar.\n" - ] - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -36,7 +20,7 @@ { "data": { "text/markdown": [ - "### # fct_c " + "###
★ fct_c
" ], "text/plain": [ "" @@ -69,7 +53,7 @@ { "data": { "text/markdown": [ - "### # fct_cross " + "###
★ fct_cross
" ], "text/plain": [ "" @@ -103,9 +87,8 @@ } ], "source": [ - "from datar.all import *\n", - "\n", "%run nb_helpers.py\n", + "from datar.all import *\n", "\n", "nb_header(\n", " fct_c,\n", diff --git a/docs/notebooks/forcats_lvl_addrm.ipynb b/docs/notebooks/forcats_lvl_addrm.ipynb index 6d263272..2ce5153d 100644 --- a/docs/notebooks/forcats_lvl_addrm.ipynb +++ b/docs/notebooks/forcats_lvl_addrm.ipynb @@ -5,26 +5,10 @@ "execution_count": 1, "metadata": {}, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[2022-03-06 01:45:37][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 01:45:37][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 01:45:37][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 01:45:37][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 01:45:37][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 01:45:37][datar][WARNING] Builtin name \"all\" has been overriden by datar.\n", - "[2022-03-06 01:45:37][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-06 01:45:37][datar][WARNING] Builtin name \"re\" has been overriden by datar.\n", - "[2022-03-06 01:45:37][datar][WARNING] Builtin name \"filter\" has been overriden by datar.\n", - "[2022-03-06 01:45:37][datar][WARNING] Builtin name \"slice\" has been overriden by datar.\n" - ] - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -36,7 +20,7 @@ { "data": { "text/markdown": [ - "### # fct_expand " + "###
★ fct_expand
" ], "text/plain": [ "" @@ -68,7 +52,7 @@ { "data": { "text/markdown": [ - "### # fct_explicit_na " + "###
★ fct_explicit_na
" ], "text/plain": [ "" @@ -103,7 +87,7 @@ { "data": { "text/markdown": [ - "### # fct_drop " + "###
★ fct_drop
" ], "text/plain": [ "" @@ -136,7 +120,7 @@ { "data": { "text/markdown": [ - "### # fct_unify " + "###
★ fct_unify
" ], "text/plain": [ "" @@ -167,9 +151,8 @@ } ], "source": [ - "from datar.all import *\n", - "\n", "%run nb_helpers.py\n", + "from datar.all import *\n", "\n", "nb_header(\n", " fct_expand,\n", @@ -195,7 +178,7 @@ { "data": { "text/plain": [ - "['b', 'b', 'c', 'a', 'c', ..., 'a', 'c', 'b', 'a', 'c']\n", + "['c', 'a', 'a', 'c', 'b', ..., 'c', 'a', 'c', 'a', 'b']\n", "Length: 20\n", "Categories (3, object): ['a', 'b', 'c']" ] @@ -218,7 +201,7 @@ { "data": { "text/plain": [ - "['b', 'b', 'c', 'a', 'c', ..., 'a', 'c', 'b', 'a', 'c']\n", + "['c', 'a', 'a', 'c', 'b', ..., 'c', 'a', 'c', 'a', 'b']\n", "Length: 20\n", "Categories (6, object): ['a', 'b', 'c', 'd', 'e', 'f']" ] @@ -240,7 +223,7 @@ { "data": { "text/plain": [ - "['b', 'b', 'c', 'a', 'c', ..., 'a', 'c', 'b', 'a', 'c']\n", + "['c', 'a', 'a', 'c', 'b', ..., 'c', 'a', 'c', 'a', 'b']\n", "Length: 20\n", "Categories (6, object): ['a', 'b', 'c', 'd', 'e', 'f']" ] diff --git a/docs/notebooks/forcats_lvl_order.ipynb b/docs/notebooks/forcats_lvl_order.ipynb index 7c9cdf84..f6c92c6c 100644 --- a/docs/notebooks/forcats_lvl_order.ipynb +++ b/docs/notebooks/forcats_lvl_order.ipynb @@ -5,26 +5,10 @@ "execution_count": 1, "metadata": {}, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[2022-03-06 01:52:56][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 01:52:56][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 01:52:56][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 01:52:56][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 01:52:56][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 01:52:56][datar][WARNING] Builtin name \"all\" has been overriden by datar.\n", - "[2022-03-06 01:52:56][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-06 01:52:56][datar][WARNING] Builtin name 
\"re\" has been overriden by datar.\n", - "[2022-03-06 01:52:56][datar][WARNING] Builtin name \"filter\" has been overriden by datar.\n", - "[2022-03-06 01:52:56][datar][WARNING] Builtin name \"slice\" has been overriden by datar.\n" - ] - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -36,7 +20,7 @@ { "data": { "text/markdown": [ - "### # fct_relevel " + "###
★ fct_relevel
" ], "text/plain": [ "" @@ -75,7 +59,7 @@ { "data": { "text/markdown": [ - "### # fct_inorder " + "###
★ fct_inorder
" ], "text/plain": [ "" @@ -107,7 +91,7 @@ { "data": { "text/markdown": [ - "### # fct_infreq " + "###
★ fct_infreq
" ], "text/plain": [ "" @@ -139,7 +123,7 @@ { "data": { "text/markdown": [ - "### # fct_inseq " + "###
★ fct_inseq
" ], "text/plain": [ "" @@ -171,7 +155,7 @@ { "data": { "text/markdown": [ - "### # fct_reorder " + "###
★ fct_reorder
" ], "text/plain": [ "" @@ -208,7 +192,7 @@ { "data": { "text/markdown": [ - "### # fct_reorder2 " + "###
★ fct_reorder2
" ], "text/plain": [ "" @@ -246,7 +230,7 @@ { "data": { "text/markdown": [ - "### # fct_rev " + "###
★ fct_rev
" ], "text/plain": [ "" @@ -276,7 +260,7 @@ { "data": { "text/markdown": [ - "### # fct_shift " + "###
★ fct_shift
" ], "text/plain": [ "" @@ -308,7 +292,7 @@ { "data": { "text/markdown": [ - "### # fct_shuffle " + "###
★ fct_shuffle
" ], "text/plain": [ "" @@ -338,7 +322,7 @@ { "data": { "text/markdown": [ - "### # first2 " + "###
★ first2
" ], "text/plain": [ "" @@ -369,7 +353,7 @@ { "data": { "text/markdown": [ - "### # last2 " + "###
★ last2
" ], "text/plain": [ "" @@ -399,12 +383,12 @@ } ], "source": [ + "%run nb_helpers.py\n", + "\n", "import plotnine as p9\n", "from datar.all import *\n", "from datar.datasets import gss_cat, iris, ChickWeight\n", "\n", - "%run nb_helpers.py\n", - "\n", "nb_header(\n", " fct_relevel,\n", " fct_inorder,\n", @@ -586,7 +570,7 @@ "data": { "text/plain": [ "['a', 'b', 'c', 'd']\n", - "Categories (4, object): ['a', 'd', 'c', 'b']" + "Categories (4, object): ['a', 'd', 'b', 'c']" ] }, "execution_count": 9, @@ -773,7 +757,7 @@ "name": "stderr", "output_type": "stream", "text": [ - "[2022-03-06 01:53:12][datar][WARNING] [fct_relevel] Unknown levels in `_f`: ['e']\n" + "[2022-03-18 17:46:13][datar][WARNING] [fct_relevel] Unknown levels in `_f`: ['e']\n" ] }, { @@ -961,7 +945,7 @@ { "data": { "text/plain": [ - "" + "" ] }, "execution_count": 20, @@ -993,7 +977,7 @@ { "data": { "text/plain": [ - "" + "" ] }, "execution_count": 21, @@ -1027,7 +1011,7 @@ { "data": { "text/plain": [ - "" + "" ] }, "execution_count": 22, @@ -1050,7 +1034,7 @@ "outputs": [ { "data": { - "image/png": "", + "image/png": "", "text/plain": [ "
" ] @@ -1061,7 +1045,7 @@ { "data": { "text/plain": [ - "" + "" ] }, "execution_count": 23, @@ -1091,7 +1075,7 @@ "outputs": [ { "data": { - "image/png": "", + "image/png": "", "text/plain": [ "
" ] @@ -1102,7 +1086,7 @@ { "data": { "text/plain": [ - "" + "" ] }, "execution_count": 24, @@ -1160,7 +1144,7 @@ "data": { "text/plain": [ "['a', 'b', 'c']\n", - "Categories (3, object): ['b', 'c', 'a']" + "Categories (3, object): ['c', 'a', 'b']" ] }, "execution_count": 26, diff --git a/docs/notebooks/forcats_lvl_value.ipynb b/docs/notebooks/forcats_lvl_value.ipynb index 9724efb1..8718da5a 100644 --- a/docs/notebooks/forcats_lvl_value.ipynb +++ b/docs/notebooks/forcats_lvl_value.ipynb @@ -5,26 +5,10 @@ "execution_count": 1, "metadata": {}, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[2022-03-06 01:55:37][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 01:55:37][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 01:55:37][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 01:55:37][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 01:55:37][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 01:55:37][datar][WARNING] Builtin name \"all\" has been overriden by datar.\n", - "[2022-03-06 01:55:37][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-06 01:55:37][datar][WARNING] Builtin name \"re\" has been overriden by datar.\n", - "[2022-03-06 01:55:37][datar][WARNING] Builtin name \"filter\" has been overriden by datar.\n", - "[2022-03-06 01:55:37][datar][WARNING] Builtin name \"slice\" has been overriden by datar.\n" - ] - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -36,7 +20,7 @@ { "data": { "text/markdown": [ - "### # fct_anon " + "###
★ fct_anon
" ], "text/plain": [ "" @@ -67,7 +51,7 @@ { "data": { "text/markdown": [ - "### # fct_collapse " + "###
★ fct_collapse
" ], "text/plain": [ "" @@ -103,7 +87,7 @@ { "data": { "text/markdown": [ - "### # fct_lump " + "###
★ fct_lump
" ], "text/plain": [ "" @@ -149,7 +133,7 @@ { "data": { "text/markdown": [ - "### # fct_lump_min " + "###
★ fct_lump_min
" ], "text/plain": [ "" @@ -185,7 +169,7 @@ { "data": { "text/markdown": [ - "### # fct_lump_prop " + "###
★ fct_lump_prop
" ], "text/plain": [ "" @@ -224,7 +208,7 @@ { "data": { "text/markdown": [ - "### # fct_lump_n " + "###
★ fct_lump_n
" ], "text/plain": [ "" @@ -266,7 +250,7 @@ { "data": { "text/markdown": [ - "### # fct_lump_lowfreq " + "###
★ fct_lump_lowfreq
" ], "text/plain": [ "" @@ -299,7 +283,7 @@ { "data": { "text/markdown": [ - "### # fct_other " + "###
★ fct_other
" ], "text/plain": [ "" @@ -339,7 +323,7 @@ { "data": { "text/markdown": [ - "### # fct_recode " + "###
★ fct_recode
" ], "text/plain": [ "" @@ -386,7 +370,7 @@ { "data": { "text/markdown": [ - "### # fct_relabel " + "###
★ fct_relabel
" ], "text/plain": [ "" @@ -421,13 +405,13 @@ } ], "source": [ + "%run nb_helpers.py\n", + "\n", "from datar.all import *\n", "from datar.datasets import gss_cat\n", "\n", "gss_cat >>= mutate(rincome=as_factor(f.rincome))\n", "\n", - "%run nb_helpers.py\n", - "\n", "nb_header(\n", " fct_anon,\n", " fct_collapse,\n", @@ -633,52 +617,52 @@ " \n", " 0\n", " 00\n", - " 95\n", + " 104\n", " \n", " \n", " 1\n", " 01\n", - " 15\n", + " 147\n", " \n", " \n", " 2\n", " 02\n", - " 689\n", + " 388\n", " \n", " \n", " 3\n", " 03\n", - " 388\n", + " 32\n", " \n", " \n", " 4\n", " 04\n", - " 5124\n", + " 689\n", " \n", " \n", " 5\n", " 05\n", - " 32\n", + " 109\n", " \n", " \n", " 6\n", " 06\n", - " 147\n", + " 5124\n", " \n", " \n", " 7\n", " 07\n", - " 23\n", + " 3523\n", " \n", " \n", " 8\n", " 08\n", - " 109\n", + " 23\n", " \n", " \n", " 9\n", " 09\n", - " 224\n", + " 10846\n", " \n", " \n", " 10\n", @@ -688,22 +672,22 @@ " \n", " 11\n", " 11\n", - " 104\n", + " 224\n", " \n", " \n", " 12\n", " 12\n", - " 71\n", + " 15\n", " \n", " \n", " 13\n", " 13\n", - " 3523\n", + " 71\n", " \n", " \n", " 14\n", " 14\n", - " 10846\n", + " 95\n", " \n", " \n", "\n", @@ -712,21 +696,21 @@ "text/plain": [ " f n\n", " \n", - "0 00 95\n", - "1 01 15\n", - "2 02 689\n", - "3 03 388\n", - "4 04 5124\n", - "5 05 32\n", - "6 06 147\n", - "7 07 23\n", - "8 08 109\n", - "9 09 224\n", + "0 00 104\n", + "1 01 147\n", + "2 02 388\n", + "3 03 32\n", + "4 04 689\n", + "5 05 109\n", + "6 06 5124\n", + "7 07 3523\n", + "8 08 23\n", + "9 09 10846\n", "10 10 93\n", - "11 11 104\n", - "12 12 71\n", - "13 13 3523\n", - "14 14 10846" + "11 11 224\n", + "12 12 15\n", + "13 13 71\n", + "14 14 95" ] }, "execution_count": 3, @@ -777,77 +761,77 @@ " \n", " 0\n", " X00\n", - " 388\n", + " 224\n", " \n", " \n", " 1\n", " X01\n", - " 5124\n", + " 71\n", " \n", " \n", " 2\n", " X02\n", - " 32\n", + " 104\n", " \n", " \n", " 3\n", " X03\n", - " 93\n", + " 109\n", " \n", " \n", " 4\n", " X04\n", - " 104\n", + " 689\n", 
" \n", " \n", " 5\n", " X05\n", - " 71\n", + " 147\n", " \n", " \n", " 6\n", " X06\n", - " 23\n", + " 3523\n", " \n", " \n", " 7\n", " X07\n", - " 147\n", + " 93\n", " \n", " \n", " 8\n", " X08\n", - " 10846\n", + " 15\n", " \n", " \n", " 9\n", " X09\n", - " 95\n", + " 10846\n", " \n", " \n", " 10\n", " X10\n", - " 109\n", + " 5124\n", " \n", " \n", " 11\n", " X11\n", - " 15\n", + " 95\n", " \n", " \n", " 12\n", " X12\n", - " 224\n", + " 23\n", " \n", " \n", " 13\n", " X13\n", - " 3523\n", + " 32\n", " \n", " \n", " 14\n", " X14\n", - " 689\n", + " 388\n", " \n", " \n", "\n", @@ -856,21 +840,21 @@ "text/plain": [ " f n\n", " \n", - "0 X00 388\n", - "1 X01 5124\n", - "2 X02 32\n", - "3 X03 93\n", - "4 X04 104\n", - "5 X05 71\n", - "6 X06 23\n", - "7 X07 147\n", - "8 X08 10846\n", - "9 X09 95\n", - "10 X10 109\n", - "11 X11 15\n", - "12 X12 224\n", - "13 X13 3523\n", - "14 X14 689" + "0 X00 224\n", + "1 X01 71\n", + "2 X02 104\n", + "3 X03 109\n", + "4 X04 689\n", + "5 X05 147\n", + "6 X06 3523\n", + "7 X07 93\n", + "8 X08 15\n", + "9 X09 10846\n", + "10 X10 5124\n", + "11 X11 95\n", + "12 X12 23\n", + "13 X13 32\n", + "14 X14 388" ] }, "execution_count": 4, @@ -1133,7 +1117,7 @@ "name": "stderr", "output_type": "stream", "text": [ - "[2022-03-06 01:55:55][datar][WARNING] [fct_recode] Unknown levels in `_f`: {'bananana'}\n" + "[2022-03-18 17:45:57][datar][WARNING] [fct_recode] Unknown levels in `_f`: {'bananana'}\n" ] }, { @@ -1205,7 +1189,7 @@ }, { "cell_type": "code", - "execution_count": 12, + "execution_count": 11, "metadata": {}, "outputs": [ { @@ -1275,7 +1259,7 @@ "count 40 10 5 27 1 1 1 1 1" ] }, - "execution_count": 12, + "execution_count": 11, "metadata": {}, "output_type": "execute_result" } @@ -1287,7 +1271,7 @@ }, { "cell_type": "code", - "execution_count": 14, + "execution_count": 12, "metadata": {}, "outputs": [ { @@ -1298,7 +1282,7 @@ "Categories (4, object): ['A', 'B', 'D', 'Other']" ] }, - "execution_count": 14, + "execution_count": 12, "metadata": 
{}, "output_type": "execute_result" }, @@ -1323,38 +1307,29 @@ " \n", " \n", " \n", - " A\n", - " B\n", - " D\n", - " Other\n", + " warn_builtin_names\n", " \n", " \n", " \n", " \n", " \n", " <int64>\n", - " <int64>\n", - " <int64>\n", - " <int64>\n", " \n", " \n", " count\n", - " 40\n", - " 10\n", - " 27\n", - " 10\n", + " 1\n", " \n", " \n", "\n", "\n" ], "text/plain": [ - " A B D Other\n", - " \n", - "count 40 10 27 10" + " warn_builtin_names\n", + " \n", + "count 1" ] }, - "execution_count": 14, + "execution_count": 12, "metadata": {}, "output_type": "execute_result" } @@ -1366,7 +1341,7 @@ }, { "cell_type": "code", - "execution_count": 15, + "execution_count": 13, "metadata": {}, "outputs": [ { @@ -1377,7 +1352,7 @@ "Categories (4, object): ['A', 'B', 'D', 'Other']" ] }, - "execution_count": 15, + "execution_count": 13, "metadata": {}, "output_type": "execute_result" }, @@ -1402,38 +1377,29 @@ " \n", " \n", " \n", - " A\n", - " B\n", - " D\n", - " Other\n", + " warn_builtin_names\n", " \n", " \n", " \n", " \n", " \n", " <int64>\n", - " <int64>\n", - " <int64>\n", - " <int64>\n", " \n", " \n", " count\n", - " 40\n", - " 10\n", - " 27\n", - " 10\n", + " 1\n", " \n", " \n", "\n", "\n" ], "text/plain": [ - " A B D Other\n", - " \n", - "count 40 10 27 10" + " warn_builtin_names\n", + " \n", + "count 1" ] }, - "execution_count": 15, + "execution_count": 13, "metadata": {}, "output_type": "execute_result" } @@ -1445,7 +1411,7 @@ }, { "cell_type": "code", - "execution_count": 16, + "execution_count": 14, "metadata": {}, "outputs": [ { @@ -1456,7 +1422,7 @@ "Categories (5, object): ['A', 'B', 'C', 'D', 'Other']" ] }, - "execution_count": 16, + "execution_count": 14, "metadata": {}, "output_type": "execute_result" }, @@ -1481,41 +1447,29 @@ " \n", " \n", " \n", - " A\n", - " B\n", - " C\n", - " D\n", - " Other\n", + " warn_builtin_names\n", " \n", " \n", " \n", " \n", " \n", " <int64>\n", - " <int64>\n", - " <int64>\n", - " <int64>\n", - " <int64>\n", " \n", " \n", " 
count\n", - " 40\n", - " 10\n", - " 5\n", - " 27\n", - " 5\n", + " 1\n", " \n", " \n", "\n", "\n" ], "text/plain": [ - " A B C D Other\n", - " \n", - "count 40 10 5 27 5" + " warn_builtin_names\n", + " \n", + "count 1" ] }, - "execution_count": 16, + "execution_count": 14, "metadata": {}, "output_type": "execute_result" } @@ -1527,7 +1481,7 @@ }, { "cell_type": "code", - "execution_count": 17, + "execution_count": 15, "metadata": {}, "outputs": [ { @@ -1538,7 +1492,7 @@ "Categories (3, object): ['A', 'D', 'Other']" ] }, - "execution_count": 17, + "execution_count": 15, "metadata": {}, "output_type": "execute_result" }, @@ -1563,35 +1517,29 @@ " \n", " \n", " \n", - " A\n", - " D\n", - " Other\n", + " warn_builtin_names\n", " \n", " \n", " \n", " \n", " \n", " <int64>\n", - " <int64>\n", - " <int64>\n", " \n", " \n", " count\n", - " 40\n", - " 27\n", - " 20\n", + " 1\n", " \n", " \n", "\n", "\n" ], "text/plain": [ - " A D Other\n", - " \n", - "count 40 27 20" + " warn_builtin_names\n", + " \n", + "count 1" ] }, - "execution_count": 17, + "execution_count": 15, "metadata": {}, "output_type": "execute_result" } @@ -1603,18 +1551,18 @@ }, { "cell_type": "code", - "execution_count": 18, + "execution_count": 16, "metadata": {}, "outputs": [ { "data": { "text/plain": [ - "['H', 'I', 'I', 'D', 'G', ..., 'E', 'H', 'I', 'F', 'E']\n", + "['F', 'F', 'D', 'G', 'K', ..., 'H', 'G', 'E', 'E', 'J']\n", "Length: 100\n", - "Categories (12, object): ['A', 'B', 'C', 'D', ..., 'I', 'J', 'K', 'L']" + "Categories (11, object): ['A', 'B', 'C', 'D', ..., 'H', 'I', 'J', 'K']" ] }, - "execution_count": 18, + "execution_count": 16, "metadata": {}, "output_type": "execute_result" } @@ -1626,7 +1574,7 @@ }, { "cell_type": "code", - "execution_count": 19, + "execution_count": 17, "metadata": {}, "outputs": [ { @@ -1661,7 +1609,6 @@ " I\n", " J\n", " K\n", - " L\n", " \n", " \n", " \n", @@ -1678,22 +1625,20 @@ " <int64>\n", " <int64>\n", " <int64>\n", - " <int64>\n", " \n", " \n", " count\n", - " 
2\n", " 1\n", - " 9\n", - " 14\n", - " 14\n", - " 18\n", + " 4\n", " 12\n", + " 13\n", + " 27\n", " 12\n", + " 8\n", " 12\n", " 3\n", - " 1\n", - " 2\n", + " 4\n", + " 4\n", " \n", " \n", "\n", @@ -1702,14 +1647,14 @@ "text/plain": [ " A B C D E F G H I \\\n", " \n", - "count 2 1 9 14 14 18 12 12 12 \n", + "count 1 4 12 13 27 12 8 12 3 \n", "\n", - " J K L \n", - " \n", - "count 3 1 2 " + " J K \n", + " \n", + "count 4 4 " ] }, - "execution_count": 19, + "execution_count": 17, "metadata": {}, "output_type": "execute_result" } @@ -1720,7 +1665,7 @@ }, { "cell_type": "code", - "execution_count": 20, + "execution_count": 18, "metadata": {}, "outputs": [ { @@ -1744,7 +1689,6 @@ " \n", " \n", " \n", - " A\n", " B\n", " C\n", " D\n", @@ -1755,7 +1699,7 @@ " I\n", " J\n", " K\n", - " L\n", + " Other\n", " \n", " \n", " \n", @@ -1772,38 +1716,36 @@ " <int64>\n", " <int64>\n", " <int64>\n", - " <int64>\n", " \n", " \n", " count\n", - " 2\n", - " 1\n", - " 9\n", - " 14\n", - " 14\n", - " 18\n", + " 4\n", " 12\n", + " 13\n", + " 27\n", " 12\n", + " 8\n", " 12\n", " 3\n", + " 4\n", + " 4\n", " 1\n", - " 2\n", " \n", " \n", "\n", "\n" ], "text/plain": [ - " A B C D E F G H I \\\n", + " B C D E F G H I J \\\n", " \n", - "count 2 1 9 14 14 18 12 12 12 \n", + "count 4 12 13 27 12 8 12 3 4 \n", "\n", - " J K L \n", - " \n", - "count 3 1 2 " + " K Other \n", + " \n", + "count 4 1 " ] }, - "execution_count": 20, + "execution_count": 18, "metadata": {}, "output_type": "execute_result" } @@ -1814,18 +1756,18 @@ }, { "cell_type": "code", - "execution_count": 21, + "execution_count": 19, "metadata": {}, "outputs": [ { "data": { "text/plain": [ - "['Other', 'Other', 'Other', 'D', 'Other', ..., 'E', 'Other', 'Other', 'F', 'E']\n", + "['F', 'F', 'D', 'Other', 'Other', ..., 'H', 'Other', 'E', 'E', 'Other']\n", "Length: 100\n", - "Categories (4, object): ['D', 'E', 'F', 'Other']" + "Categories (6, object): ['C', 'D', 'E', 'F', 'H', 'Other']" ] }, - "execution_count": 21, + "execution_count": 
19, "metadata": {}, "output_type": "execute_result" } @@ -1836,18 +1778,18 @@ }, { "cell_type": "code", - "execution_count": 22, + "execution_count": 20, "metadata": {}, "outputs": [ { "data": { "text/plain": [ - "['H', 'I', 'I', 'D', 'G', ..., 'E', 'H', 'I', 'F', 'E']\n", + "['F', 'F', 'D', 'Other', 'Other', ..., 'H', 'Other', 'E', 'E', 'Other']\n", "Length: 100\n", - "Categories (7, object): ['D', 'E', 'F', 'G', 'H', 'I', 'Other']" + "Categories (6, object): ['C', 'D', 'E', 'F', 'H', 'Other']" ] }, - "execution_count": 22, + "execution_count": 20, "metadata": {}, "output_type": "execute_result" } @@ -1858,18 +1800,18 @@ }, { "cell_type": "code", - "execution_count": 23, + "execution_count": 21, "metadata": {}, "outputs": [ { "data": { "text/plain": [ - "['Other', 'Other', 'Other', 'Other', 'Other', ..., 'Other', 'Other', 'Other', 'Other', 'Other']\n", + "['Other', 'Other', 'Other', 'Other', 'K', ..., 'Other', 'Other', 'Other', 'Other', 'J']\n", "Length: 100\n", - "Categories (5, object): ['A', 'B', 'K', 'L', 'Other']" + "Categories (6, object): ['A', 'B', 'I', 'J', 'K', 'Other']" ] }, - "execution_count": 23, + "execution_count": 21, "metadata": {}, "output_type": "execute_result" } @@ -1881,18 +1823,18 @@ }, { "cell_type": "code", - "execution_count": 24, + "execution_count": 22, "metadata": {}, "outputs": [ { "data": { "text/plain": [ - "['Other', 'Other', 'Other', 'Other', 'Other', ..., 'Other', 'Other', 'Other', 'Other', 'Other']\n", + "['Other', 'Other', 'Other', 'G', 'K', ..., 'Other', 'G', 'Other', 'Other', 'J']\n", "Length: 100\n", - "Categories (7, object): ['A', 'B', 'C', 'J', 'K', 'L', 'Other']" + "Categories (7, object): ['A', 'B', 'G', 'I', 'J', 'K', 'Other']" ] }, - "execution_count": 24, + "execution_count": 22, "metadata": {}, "output_type": "execute_result" } @@ -1903,18 +1845,18 @@ }, { "cell_type": "code", - "execution_count": 25, + "execution_count": 23, "metadata": {}, "outputs": [ { "data": { "text/plain": [ - "['Other', 'I', 'I', 'D', 'G', 
..., 'E', 'Other', 'I', 'F', 'E']\n", + "['F', 'F', 'D', 'Other', 'Other', ..., 'H', 'Other', 'E', 'E', 'Other']\n", "Length: 100\n", - "Categories (6, object): ['D', 'E', 'F', 'G', 'I', 'Other']" + "Categories (6, object): ['C', 'D', 'E', 'F', 'H', 'Other']" ] }, - "execution_count": 25, + "execution_count": 23, "metadata": {}, "output_type": "execute_result" } @@ -1926,18 +1868,18 @@ }, { "cell_type": "code", - "execution_count": 26, + "execution_count": 24, "metadata": {}, "outputs": [ { "data": { "text/plain": [ - "['H', 'I', 'I', 'D', 'G', ..., 'E', 'H', 'I', 'F', 'E']\n", + "['F', 'F', 'D', 'G', 'Other', ..., 'H', 'G', 'E', 'E', 'Other']\n", "Length: 100\n", - "Categories (7, object): ['D', 'E', 'F', 'G', 'H', 'I', 'Other']" + "Categories (7, object): ['C', 'D', 'E', 'F', 'G', 'H', 'Other']" ] }, - "execution_count": 26, + "execution_count": 24, "metadata": {}, "output_type": "execute_result" } @@ -1948,18 +1890,18 @@ }, { "cell_type": "code", - "execution_count": 27, + "execution_count": 25, "metadata": {}, "outputs": [ { "data": { "text/plain": [ - "['H', 'I', 'I', 'D', 'G', ..., 'E', 'H', 'I', 'F', 'E']\n", + "['F', 'F', 'D', 'G', 'Other', ..., 'H', 'G', 'E', 'E', 'Other']\n", "Length: 100\n", - "Categories (7, object): ['D', 'E', 'F', 'G', 'H', 'I', 'Other']" + "Categories (7, object): ['C', 'D', 'E', 'F', 'G', 'H', 'Other']" ] }, - "execution_count": 27, + "execution_count": 25, "metadata": {}, "output_type": "execute_result" } @@ -1970,7 +1912,7 @@ }, { "cell_type": "code", - "execution_count": 28, + "execution_count": 26, "metadata": {}, "outputs": [ { @@ -1994,12 +1936,11 @@ " \n", " \n", " \n", + " C\n", " D\n", " E\n", " F\n", - " G\n", " H\n", - " I\n", " Other\n", " \n", " \n", @@ -2012,29 +1953,27 @@ " <int64>\n", " <int64>\n", " <int64>\n", - " <int64>\n", " \n", " \n", " count\n", - " 14\n", - " 14\n", - " 18\n", " 12\n", + " 13\n", + " 27\n", " 12\n", " 12\n", - " 18\n", + " 24\n", " \n", " \n", "\n", "\n" ], "text/plain": [ - " D E F G H I 
Other\n", - " \n", - "count 14 14 18 12 12 12 18" + " C D E F H Other\n", + " \n", + "count 12 13 27 12 12 24" ] }, - "execution_count": 28, + "execution_count": 26, "metadata": {}, "output_type": "execute_result" } @@ -2046,7 +1985,7 @@ }, { "cell_type": "code", - "execution_count": 29, + "execution_count": 27, "metadata": {}, "outputs": [ { @@ -2070,7 +2009,7 @@ " \n", " \n", " \n", - " F\n", + " E\n", " Other\n", " \n", " \n", @@ -2082,20 +2021,20 @@ " \n", " \n", " count\n", - " 18\n", - " 82\n", + " 27\n", + " 73\n", " \n", " \n", "\n", "\n" ], "text/plain": [ - " F Other\n", + " E Other\n", " \n", - "count 18 82" + "count 27 73" ] }, - "execution_count": 29, + "execution_count": 27, "metadata": {}, "output_type": "execute_result" } @@ -2113,7 +2052,7 @@ }, { "cell_type": "code", - "execution_count": 30, + "execution_count": 28, "metadata": {}, "outputs": [ { @@ -2124,7 +2063,7 @@ "Categories (3, object): ['A', 'B', 'Other']" ] }, - "execution_count": 30, + "execution_count": 28, "metadata": {}, "output_type": "execute_result" } @@ -2135,18 +2074,18 @@ }, { "cell_type": "code", - "execution_count": 31, + "execution_count": 29, "metadata": {}, "outputs": [ { "data": { "text/plain": [ - "['I', 'J', 'J', 'E', 'H', ..., 'F', 'I', 'J', 'G', 'F']\n", + "['F', 'F', 'D', 'G', 'K', ..., 'H', 'G', 'E', 'E', 'J']\n", "Length: 100\n", - "Categories (11, object): ['C', 'D', 'E', 'F', ..., 'J', 'K', 'L', 'Other']" + "Categories (10, object): ['C', 'D', 'E', 'F', ..., 'I', 'J', 'K', 'Other']" ] }, - "execution_count": 31, + "execution_count": 29, "metadata": {}, "output_type": "execute_result" } @@ -2164,7 +2103,7 @@ }, { "cell_type": "code", - "execution_count": 32, + "execution_count": 30, "metadata": {}, "outputs": [ { @@ -2174,7 +2113,7 @@ "Categories (3, object): ['fruit', 'bear', 'dear']" ] }, - "execution_count": 32, + "execution_count": 30, "metadata": {}, "output_type": "execute_result" } @@ -2186,14 +2125,14 @@ }, { "cell_type": "code", - "execution_count": 33, + 
"execution_count": 31, "metadata": {}, "outputs": [ { "name": "stderr", "output_type": "stream", "text": [ - "[2022-03-06 01:59:10][datar][WARNING] [fct_recode] Unknown levels in `_f`: {'bananana'}\n" + "[2022-03-18 17:46:03][datar][WARNING] [fct_recode] Unknown levels in `_f`: {'bananana'}\n" ] }, { @@ -2203,7 +2142,7 @@ "Categories (4, object): ['fruit', 'banana', 'bear', 'dear']" ] }, - "execution_count": 33, + "execution_count": 31, "metadata": {}, "output_type": "execute_result" } @@ -2215,7 +2154,7 @@ }, { "cell_type": "code", - "execution_count": 34, + "execution_count": 32, "metadata": {}, "outputs": [ { @@ -2225,7 +2164,7 @@ "Categories (3, object): ['fruit', 'bear', 'dear']" ] }, - "execution_count": 34, + "execution_count": 32, "metadata": {}, "output_type": "execute_result" } @@ -2237,7 +2176,7 @@ }, { "cell_type": "code", - "execution_count": 35, + "execution_count": 33, "metadata": {}, "outputs": [ { @@ -2247,7 +2186,7 @@ "Categories (4, object): ['an apple', 'banana', 'a bear', 'dear']" ] }, - "execution_count": 35, + "execution_count": 33, "metadata": {}, "output_type": "execute_result" } @@ -2265,7 +2204,7 @@ }, { "cell_type": "code", - "execution_count": 36, + "execution_count": 34, "metadata": {}, "outputs": [ { @@ -2368,7 +2307,7 @@ "9 Strong republican 2314" ] }, - "execution_count": 36, + "execution_count": 34, "metadata": {}, "output_type": "execute_result" } @@ -2379,7 +2318,7 @@ }, { "cell_type": "code", - "execution_count": 37, + "execution_count": 35, "metadata": {}, "outputs": [ { @@ -2482,7 +2421,7 @@ "9 Strong republican 2314" ] }, - "execution_count": 37, + "execution_count": 35, "metadata": {}, "output_type": "execute_result" } @@ -2493,7 +2432,7 @@ }, { "cell_type": "code", - "execution_count": 38, + "execution_count": 36, "metadata": {}, "outputs": [ { @@ -2632,7 +2571,7 @@ "15 $4000 to 4999 226" ] }, - "execution_count": 38, + "execution_count": 36, "metadata": {}, "output_type": "execute_result" } @@ -2643,7 +2582,7 @@ }, { 
"cell_type": "code", - "execution_count": 39, + "execution_count": 37, "metadata": {}, "outputs": [ { @@ -2655,7 +2594,7 @@ " 'Gt $5000.0', 'Gt $0.0'], dtype=object)" ] }, - "execution_count": 39, + "execution_count": 37, "metadata": {}, "output_type": "execute_result" } @@ -2674,7 +2613,7 @@ }, { "cell_type": "code", - "execution_count": 40, + "execution_count": 38, "metadata": {}, "outputs": [ { @@ -2777,7 +2716,7 @@ "9 No answer 183" ] }, - "execution_count": 40, + "execution_count": 38, "metadata": {}, "output_type": "execute_result" } diff --git a/docs/notebooks/forcats_misc.ipynb b/docs/notebooks/forcats_misc.ipynb index dad038d9..515445c9 100644 --- a/docs/notebooks/forcats_misc.ipynb +++ b/docs/notebooks/forcats_misc.ipynb @@ -5,26 +5,10 @@ "execution_count": 1, "metadata": {}, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[2022-03-06 01:55:37][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 01:55:37][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 01:55:37][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 01:55:37][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 01:55:37][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 01:55:37][datar][WARNING] Builtin name \"all\" has been overriden by datar.\n", - "[2022-03-06 01:55:37][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-06 01:55:37][datar][WARNING] Builtin name \"re\" has been overriden by datar.\n", - "[2022-03-06 01:55:37][datar][WARNING] Builtin name \"filter\" has been overriden by datar.\n", - "[2022-03-06 01:55:37][datar][WARNING] Builtin name \"slice\" has been overriden by datar.\n" - ] - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -36,7 +20,7 @@ { "data": { "text/markdown": [ - "### # fct_inorder " + "###
★ fct_inorder
" ], "text/plain": [ "" @@ -68,7 +52,7 @@ { "data": { "text/markdown": [ - "### # fct_count " + "###
★ fct_count
" ], "text/plain": [ "" @@ -102,7 +86,7 @@ { "data": { "text/markdown": [ - "### # fct_match " + "###
★ fct_match
" ], "text/plain": [ "" @@ -135,7 +119,7 @@ { "data": { "text/markdown": [ - "### # fct_unique " + "###
★ fct_unique
" ], "text/plain": [ "" @@ -165,7 +149,7 @@ { "data": { "text/markdown": [ - "### # lvls_reorder " + "###
★ lvls_reorder
" ], "text/plain": [ "" @@ -200,7 +184,7 @@ { "data": { "text/markdown": [ - "### # lvls_revalue " + "###
★ lvls_revalue
" ], "text/plain": [ "" @@ -232,7 +216,7 @@ { "data": { "text/markdown": [ - "### # lvls_expand " + "###
★ lvls_expand
" ], "text/plain": [ "" @@ -264,7 +248,7 @@ { "data": { "text/markdown": [ - "### # lvls_union " + "###
★ lvls_union
" ], "text/plain": [ "" @@ -293,11 +277,12 @@ } ], "source": [ + "%run nb_helpers.py\n", + "\n", "import numpy\n", "from datar.all import *\n", "from datar.datasets import gss_cat\n", "\n", - "%run nb_helpers.py\n", "\n", "nb_header(\n", " as_factor,\n", @@ -372,7 +357,7 @@ "name": "stderr", "output_type": "stream", "text": [ - "/home/pwwang/miniconda3/lib/python3.9/site-packages/IPython/lib/pretty.py:700: FutureWarning: Index.ravel returning ndarray is deprecated; in a future version this will return a view on self.\n", + "/home/pwwang/miniconda3/lib/python3.9/site-packages/IPython/lib/pretty.py:778: FutureWarning: Index.ravel returning ndarray is deprecated; in a future version this will return a view on self.\n", " output = repr(obj)\n" ] }, @@ -427,25 +412,24 @@ " \n", " \n", " a\n", + " b\n", " c\n", " d\n", " e\n", " f\n", - " g\n", " h\n", - " i\n", " j\n", " k\n", - " ...\n", + " l\n", + " m\n", + " n\n", + " o\n", " p\n", - " q\n", " r\n", " s\n", " t\n", " u\n", - " v\n", - " w\n", - " y\n", + " x\n", " z\n", " \n", " \n", @@ -462,7 +446,6 @@ " <int64>\n", " <int64>\n", " <int64>\n", - " ...\n", " <int64>\n", " <int64>\n", " <int64>\n", @@ -476,47 +459,43 @@ " \n", " \n", " count\n", - " 22\n", - " 26\n", - " 4\n", - " 5\n", - " 1\n", - " 71\n", - " 41\n", - " 91\n", - " 12\n", - " 78\n", - " ...\n", - " 1\n", + " 113\n", + " 110\n", + " 19\n", + " 37\n", + " 76\n", + " 38\n", + " 11\n", + " 98\n", + " 14\n", " 2\n", - " 119\n", - " 90\n", - " 8\n", + " 101\n", + " 92\n", + " 6\n", + " 10\n", + " 84\n", + " 11\n", + " 49\n", + " 2\n", + " 126\n", " 1\n", - " 3\n", - " 25\n", - " 125\n", - " 99\n", " \n", " \n", "\n", - "

1 rows × 22 columns

\n", "\n" ], "text/plain": [ - " a c d e f g h i j \\\n", + " a b c d e f h j k \\\n", " \n", - "count 22 26 4 5 1 71 41 91 12 \n", - "\n", - " k ... p q r s t u v \\\n", - " ... \n", - "count 78 1 2 119 90 8 1 3 \n", + "count 113 110 19 37 76 38 11 98 14 \n", "\n", - " w y z \n", - " \n", - "count 25 125 99 \n", + " l m n o p r s t u \\\n", + " \n", + "count 2 101 92 6 10 84 11 49 2 \n", "\n", - "[1 rows x 22 columns]" + " x z \n", + " \n", + "count 126 1 " ] }, "execution_count": 5, @@ -568,112 +547,102 @@ " \n", " 0\n", " a\n", - " 22\n", + " 113\n", " \n", " \n", " 1\n", - " c\n", - " 26\n", + " b\n", + " 110\n", " \n", " \n", " 2\n", - " d\n", - " 4\n", + " c\n", + " 19\n", " \n", " \n", " 3\n", - " e\n", - " 5\n", + " d\n", + " 37\n", " \n", " \n", " 4\n", - " f\n", - " 1\n", + " e\n", + " 76\n", " \n", " \n", " 5\n", - " g\n", - " 71\n", + " f\n", + " 38\n", " \n", " \n", " 6\n", " h\n", - " 41\n", + " 11\n", " \n", " \n", " 7\n", - " i\n", - " 91\n", + " j\n", + " 98\n", " \n", " \n", " 8\n", - " j\n", - " 12\n", + " k\n", + " 14\n", " \n", " \n", " 9\n", - " k\n", - " 78\n", + " l\n", + " 2\n", " \n", " \n", " 10\n", " m\n", - " 125\n", + " 101\n", " \n", " \n", " 11\n", - " o\n", - " 51\n", + " n\n", + " 92\n", " \n", " \n", " 12\n", - " p\n", - " 1\n", + " o\n", + " 6\n", " \n", " \n", " 13\n", - " q\n", - " 2\n", + " p\n", + " 10\n", " \n", " \n", " 14\n", " r\n", - " 119\n", + " 84\n", " \n", " \n", " 15\n", " s\n", - " 90\n", + " 11\n", " \n", " \n", " 16\n", " t\n", - " 8\n", + " 49\n", " \n", " \n", " 17\n", " u\n", - " 1\n", + " 2\n", " \n", " \n", " 18\n", - " v\n", - " 3\n", + " x\n", + " 126\n", " \n", " \n", " 19\n", - " w\n", - " 25\n", - " \n", - " \n", - " 20\n", - " y\n", - " 125\n", - " \n", - " \n", - " 21\n", " z\n", - " 99\n", + " 1\n", " \n", " \n", "\n", @@ -682,28 +651,26 @@ "text/plain": [ " f n\n", " \n", - "0 a 22\n", - "1 c 26\n", - "2 d 4\n", - "3 e 5\n", - "4 f 1\n", - "5 g 71\n", - "6 h 41\n", - "7 i 91\n", - "8 j 12\n", - "9 
k 78\n", - "10 m 125\n", - "11 o 51\n", - "12 p 1\n", - "13 q 2\n", - "14 r 119\n", - "15 s 90\n", - "16 t 8\n", - "17 u 1\n", - "18 v 3\n", - "19 w 25\n", - "20 y 125\n", - "21 z 99" + "0 a 113\n", + "1 b 110\n", + "2 c 19\n", + "3 d 37\n", + "4 e 76\n", + "5 f 38\n", + "6 h 11\n", + "7 j 98\n", + "8 k 14\n", + "9 l 2\n", + "10 m 101\n", + "11 n 92\n", + "12 o 6\n", + "13 p 10\n", + "14 r 84\n", + "15 s 11\n", + "16 t 49\n", + "17 u 2\n", + "18 x 126\n", + "19 z 1" ] }, "execution_count": 6, @@ -752,113 +719,103 @@ " <int64>\n", " \n", " \n", - " 10\n", - " m\n", - " 125\n", + " 18\n", + " x\n", + " 126\n", " \n", " \n", - " 20\n", - " y\n", - " 125\n", + " 0\n", + " a\n", + " 113\n", " \n", " \n", - " 14\n", - " r\n", - " 119\n", + " 1\n", + " b\n", + " 110\n", " \n", " \n", - " 21\n", - " z\n", - " 99\n", + " 10\n", + " m\n", + " 101\n", " \n", " \n", " 7\n", - " i\n", - " 91\n", - " \n", - " \n", - " 15\n", - " s\n", - " 90\n", + " j\n", + " 98\n", " \n", " \n", - " 9\n", - " k\n", - " 78\n", + " 11\n", + " n\n", + " 92\n", " \n", " \n", - " 5\n", - " g\n", - " 71\n", + " 14\n", + " r\n", + " 84\n", " \n", " \n", - " 11\n", - " o\n", - " 51\n", + " 4\n", + " e\n", + " 76\n", " \n", " \n", - " 6\n", - " h\n", - " 41\n", + " 16\n", + " t\n", + " 49\n", " \n", " \n", - " 1\n", - " c\n", - " 26\n", + " 5\n", + " f\n", + " 38\n", " \n", " \n", - " 19\n", - " w\n", - " 25\n", + " 3\n", + " d\n", + " 37\n", " \n", " \n", - " 0\n", - " a\n", - " 22\n", + " 2\n", + " c\n", + " 19\n", " \n", " \n", " 8\n", - " j\n", - " 12\n", + " k\n", + " 14\n", " \n", " \n", - " 16\n", - " t\n", - " 8\n", + " 6\n", + " h\n", + " 11\n", " \n", " \n", - " 3\n", - " e\n", - " 5\n", + " 15\n", + " s\n", + " 11\n", " \n", " \n", - " 2\n", - " d\n", - " 4\n", + " 13\n", + " p\n", + " 10\n", " \n", " \n", - " 18\n", - " v\n", - " 3\n", + " 12\n", + " o\n", + " 6\n", " \n", " \n", - " 13\n", - " q\n", + " 9\n", + " l\n", " 2\n", " \n", " \n", - " 4\n", - " f\n", - " 1\n", - " \n", - " \n", " 
17\n", " u\n", - " 1\n", + " 2\n", " \n", " \n", - " 12\n", - " p\n", + " 19\n", + " z\n", " 1\n", " \n", " \n", @@ -868,28 +825,26 @@ "text/plain": [ " f n\n", " \n", - "10 m 125\n", - "20 y 125\n", - "14 r 119\n", - "21 z 99\n", - "7 i 91\n", - "15 s 90\n", - "9 k 78\n", - "5 g 71\n", - "11 o 51\n", - "6 h 41\n", - "1 c 26\n", - "19 w 25\n", - "0 a 22\n", - "8 j 12\n", - "16 t 8\n", - "3 e 5\n", - "2 d 4\n", - "18 v 3\n", - "13 q 2\n", - "4 f 1\n", - "17 u 1\n", - "12 p 1" + "18 x 126\n", + "0 a 113\n", + "1 b 110\n", + "10 m 101\n", + "7 j 98\n", + "11 n 92\n", + "14 r 84\n", + "4 e 76\n", + "16 t 49\n", + "5 f 38\n", + "3 d 37\n", + "2 c 19\n", + "8 k 14\n", + "6 h 11\n", + "15 s 11\n", + "13 p 10\n", + "12 o 6\n", + "9 l 2\n", + "17 u 2\n", + "19 z 1" ] }, "execution_count": 7, @@ -940,134 +895,122 @@ " <float64>\n", " \n", " \n", - " 10\n", - " m\n", - " 125\n", - " 0.125\n", + " 18\n", + " x\n", + " 126\n", + " 0.126\n", " \n", " \n", - " 20\n", - " y\n", - " 125\n", - " 0.125\n", + " 0\n", + " a\n", + " 113\n", + " 0.113\n", " \n", " \n", - " 14\n", - " r\n", - " 119\n", - " 0.119\n", + " 1\n", + " b\n", + " 110\n", + " 0.110\n", " \n", " \n", - " 21\n", - " z\n", - " 99\n", - " 0.099\n", + " 10\n", + " m\n", + " 101\n", + " 0.101\n", " \n", " \n", " 7\n", - " i\n", - " 91\n", - " 0.091\n", - " \n", - " \n", - " 15\n", - " s\n", - " 90\n", - " 0.090\n", + " j\n", + " 98\n", + " 0.098\n", " \n", " \n", - " 9\n", - " k\n", - " 78\n", - " 0.078\n", + " 11\n", + " n\n", + " 92\n", + " 0.092\n", " \n", " \n", - " 5\n", - " g\n", - " 71\n", - " 0.071\n", + " 14\n", + " r\n", + " 84\n", + " 0.084\n", " \n", " \n", - " 11\n", - " o\n", - " 51\n", - " 0.051\n", + " 4\n", + " e\n", + " 76\n", + " 0.076\n", " \n", " \n", - " 6\n", - " h\n", - " 41\n", - " 0.041\n", + " 16\n", + " t\n", + " 49\n", + " 0.049\n", " \n", " \n", - " 1\n", - " c\n", - " 26\n", - " 0.026\n", + " 5\n", + " f\n", + " 38\n", + " 0.038\n", " \n", " \n", - " 19\n", - " w\n", - " 25\n", - " 
0.025\n", + " 3\n", + " d\n", + " 37\n", + " 0.037\n", " \n", " \n", - " 0\n", - " a\n", - " 22\n", - " 0.022\n", + " 2\n", + " c\n", + " 19\n", + " 0.019\n", " \n", " \n", " 8\n", - " j\n", - " 12\n", - " 0.012\n", + " k\n", + " 14\n", + " 0.014\n", " \n", " \n", - " 16\n", - " t\n", - " 8\n", - " 0.008\n", + " 6\n", + " h\n", + " 11\n", + " 0.011\n", " \n", " \n", - " 3\n", - " e\n", - " 5\n", - " 0.005\n", + " 15\n", + " s\n", + " 11\n", + " 0.011\n", " \n", " \n", - " 2\n", - " d\n", - " 4\n", - " 0.004\n", + " 13\n", + " p\n", + " 10\n", + " 0.010\n", " \n", " \n", - " 18\n", - " v\n", - " 3\n", - " 0.003\n", + " 12\n", + " o\n", + " 6\n", + " 0.006\n", " \n", " \n", - " 13\n", - " q\n", + " 9\n", + " l\n", " 2\n", " 0.002\n", " \n", " \n", - " 4\n", - " f\n", - " 1\n", - " 0.001\n", - " \n", - " \n", " 17\n", " u\n", - " 1\n", - " 0.001\n", + " 2\n", + " 0.002\n", " \n", " \n", - " 12\n", - " p\n", + " 19\n", + " z\n", " 1\n", " 0.001\n", " \n", @@ -1078,28 +1021,26 @@ "text/plain": [ " f n p\n", " \n", - "10 m 125 0.125\n", - "20 y 125 0.125\n", - "14 r 119 0.119\n", - "21 z 99 0.099\n", - "7 i 91 0.091\n", - "15 s 90 0.090\n", - "9 k 78 0.078\n", - "5 g 71 0.071\n", - "11 o 51 0.051\n", - "6 h 41 0.041\n", - "1 c 26 0.026\n", - "19 w 25 0.025\n", - "0 a 22 0.022\n", - "8 j 12 0.012\n", - "16 t 8 0.008\n", - "3 e 5 0.005\n", - "2 d 4 0.004\n", - "18 v 3 0.003\n", - "13 q 2 0.002\n", - "4 f 1 0.001\n", - "17 u 1 0.001\n", - "12 p 1 0.001" + "18 x 126 0.126\n", + "0 a 113 0.113\n", + "1 b 110 0.110\n", + "10 m 101 0.101\n", + "7 j 98 0.098\n", + "11 n 92 0.092\n", + "14 r 84 0.084\n", + "4 e 76 0.076\n", + "16 t 49 0.049\n", + "5 f 38 0.038\n", + "3 d 37 0.037\n", + "2 c 19 0.019\n", + "8 k 14 0.014\n", + "6 h 11 0.011\n", + "15 s 11 0.011\n", + "13 p 10 0.010\n", + "12 o 6 0.006\n", + "9 l 2 0.002\n", + "17 u 2 0.002\n", + "19 z 1 0.001" ] }, "execution_count": 8, @@ -1268,9 +1209,9 @@ { "data": { "text/plain": [ - "['g', 'i', 'f', 'k', 'd', ..., 'o', 'j', 
'e', 'm', 'n']\n", - "Length: 13\n", - "Categories (13, object): ['d', 'e', 'f', 'g', ..., 'm', 'n', 'o', 'p']" + "['l', 'm', 'h', 'u', 'k', ..., 'n', 'd', 'q', 'p', 'e']\n", + "Length: 15\n", + "Categories (15, object): ['d', 'e', 'f', 'g', ..., 'o', 'p', 'q', 'u']" ] }, "execution_count": 12, @@ -1292,9 +1233,9 @@ { "data": { "text/plain": [ - "['d', 'e', 'f', 'g', 'h', ..., 'l', 'm', 'n', 'o', 'p']\n", - "Length: 13\n", - "Categories (13, object): ['d', 'e', 'f', 'g', ..., 'm', 'n', 'o', 'p']" + "['d', 'e', 'f', 'g', 'h', ..., 'n', 'o', 'p', 'q', 'u']\n", + "Length: 15\n", + "Categories (15, object): ['d', 'e', 'f', 'g', ..., 'o', 'p', 'q', 'u']" ] }, "execution_count": 13, @@ -1315,7 +1256,7 @@ }, { "cell_type": "code", - "execution_count": 18, + "execution_count": 14, "metadata": {}, "outputs": [ { @@ -1325,7 +1266,7 @@ "Categories (3, object): ['c', 'b', 'a']" ] }, - "execution_count": 18, + "execution_count": 14, "metadata": {}, "output_type": "execute_result" } diff --git a/docs/notebooks/full_seq.ipynb b/docs/notebooks/full_seq.ipynb index 5441c317..c9cd29b7 100644 --- a/docs/notebooks/full_seq.ipynb +++ b/docs/notebooks/full_seq.ipynb @@ -13,26 +13,10 @@ } }, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[2022-03-06 01:55:17][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 01:55:17][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 01:55:17][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 01:55:17][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 01:55:17][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 01:55:17][datar][WARNING] Builtin name \"all\" has been overriden by datar.\n", - "[2022-03-06 01:55:17][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-06 01:55:17][datar][WARNING] Builtin name \"re\" has 
been overriden by datar.\n", - "[2022-03-06 01:55:17][datar][WARNING] Builtin name \"filter\" has been overriden by datar.\n", - "[2022-03-06 01:55:17][datar][WARNING] Builtin name \"slice\" has been overriden by datar.\n" - ] - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -44,7 +28,7 @@ { "data": { "text/markdown": [ - "### # full_seq " + "###
★ full_seq
" ], "text/plain": [ "" @@ -78,10 +62,10 @@ ], "source": [ "# https://tidyr.tidyverse.org/reference/full_seq.html\n", + "%run nb_helpers.py\n", "\n", "from datar.all import *\n", "\n", - "%run nb_helpers.py\n", "nb_header(full_seq)" ] }, diff --git a/docs/notebooks/group_by.ipynb b/docs/notebooks/group_by.ipynb index bd79c355..55211cd9 100644 --- a/docs/notebooks/group_by.ipynb +++ b/docs/notebooks/group_by.ipynb @@ -12,26 +12,10 @@ } }, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[2022-03-06 01:54:51][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 01:54:51][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 01:54:51][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 01:54:51][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 01:54:51][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 01:54:51][datar][WARNING] Builtin name \"all\" has been overriden by datar.\n", - "[2022-03-06 01:54:51][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-06 01:54:51][datar][WARNING] Builtin name \"re\" has been overriden by datar.\n", - "[2022-03-06 01:54:51][datar][WARNING] Builtin name \"filter\" has been overriden by datar.\n", - "[2022-03-06 01:54:51][datar][WARNING] Builtin name \"slice\" has been overriden by datar.\n" - ] - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -43,7 +27,7 @@ { "data": { "text/markdown": [ - "### # group_by " + "###
★ group_by
" ], "text/plain": [ "" @@ -91,7 +75,7 @@ { "data": { "text/markdown": [ - "### # ungroup " + "###
★ ungroup
" ], "text/plain": [ "" @@ -124,10 +108,11 @@ ], "source": [ "# https://dplyr.tidyverse.org/reference/group_by.html\n", + "%run nb_helpers.py\n", + "\n", "from datar.datasets import mtcars\n", "from datar.all import *\n", "\n", - "%run nb_helpers.py\n", "nb_header(group_by, ungroup)" ] }, @@ -1077,7 +1062,7 @@ "name": "stderr", "output_type": "stream", "text": [ - "[2022-03-06 01:55:14][datar][ INFO] `summarise()` has grouped output by ['vs'] (override with `_groups` argument)\n" + "[2022-03-18 17:45:11][datar][ INFO] `summarise()` has grouped output by ['vs'] (override with `_groups` argument)\n" ] }, { diff --git a/docs/notebooks/group_map.ipynb b/docs/notebooks/group_map.ipynb index 6a619752..9bb3cea5 100644 --- a/docs/notebooks/group_map.ipynb +++ b/docs/notebooks/group_map.ipynb @@ -13,26 +13,10 @@ } }, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[2022-03-06 01:54:27][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 01:54:27][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 01:54:27][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 01:54:27][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 01:54:27][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 01:54:27][datar][WARNING] Builtin name \"all\" has been overriden by datar.\n", - "[2022-03-06 01:54:27][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-06 01:54:27][datar][WARNING] Builtin name \"re\" has been overriden by datar.\n", - "[2022-03-06 01:54:27][datar][WARNING] Builtin name \"filter\" has been overriden by datar.\n", - "[2022-03-06 01:54:27][datar][WARNING] Builtin name \"slice\" has been overriden by datar.\n" - ] - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -44,7 +28,7 @@ { "data": { "text/markdown": [ - "### # group_map " + "###
★ group_map
" ], "text/plain": [ "" @@ -68,11 +52,11 @@ ], "source": [ "# https://dplyr.tidyverse.org/reference/group_map.html\n", + "%run nb_helpers.py\n", "\n", "from datar.datasets import mtcars, iris\n", "from datar.all import *\n", "\n", - "%run nb_helpers.py\n", "nb_header(group_map)" ] }, diff --git a/docs/notebooks/group_split.ipynb b/docs/notebooks/group_split.ipynb index 80366be3..98a717e9 100644 --- a/docs/notebooks/group_split.ipynb +++ b/docs/notebooks/group_split.ipynb @@ -13,26 +13,10 @@ } }, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[2022-03-06 01:54:16][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 01:54:16][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 01:54:16][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 01:54:16][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 01:54:16][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 01:54:16][datar][WARNING] Builtin name \"all\" has been overriden by datar.\n", - "[2022-03-06 01:54:16][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-06 01:54:16][datar][WARNING] Builtin name \"re\" has been overriden by datar.\n", - "[2022-03-06 01:54:16][datar][WARNING] Builtin name \"filter\" has been overriden by datar.\n", - "[2022-03-06 01:54:16][datar][WARNING] Builtin name \"slice\" has been overriden by datar.\n" - ] - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -44,7 +28,7 @@ { "data": { "text/markdown": [ - "### # group_split " + "###
★ group_split
" ], "text/plain": [ "" @@ -68,11 +52,11 @@ ], "source": [ "# https://dplyr.tidyverse.org/reference/group_split.html\n", + "%run nb_helpers.py\n", "\n", "from datar.datasets import iris\n", "from datar.all import *\n", "\n", - "%run nb_helpers.py\n", "nb_header(group_split)" ] }, @@ -776,7 +760,7 @@ }, { "cell_type": "code", - "execution_count": 8, + "execution_count": 10, "id": "65de8d54", "metadata": { "execution": { @@ -790,21 +774,22 @@ { "data": { "text/plain": [ - "" + "" ] }, - "execution_count": 8, + "execution_count": 10, "metadata": {}, "output_type": "execute_result" } ], "source": [ - "iris >> group_by(f.Species) >> group_keys() >> rowwise() >> group_split()" + "out = iris >> group_by(f.Species) >> group_keys() >> rowwise() >> group_split()\n", + "out" ] }, { "cell_type": "code", - "execution_count": 9, + "execution_count": 11, "id": "264e6811", "metadata": { "execution": { @@ -829,13 +814,13 @@ " 0 virginica]" ] }, - "execution_count": 9, + "execution_count": 11, "metadata": {}, "output_type": "execute_result" } ], "source": [ - "list(_)" + "list(out)" ] }, { diff --git a/docs/notebooks/group_trim.ipynb b/docs/notebooks/group_trim.ipynb index b6549e92..bc4b7545 100644 --- a/docs/notebooks/group_trim.ipynb +++ b/docs/notebooks/group_trim.ipynb @@ -13,26 +13,10 @@ } }, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[2022-03-06 02:01:31][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 02:01:31][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 02:01:31][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 02:01:32][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 02:01:32][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 02:01:32][datar][WARNING] Builtin name \"all\" has been overriden by datar.\n", - "[2022-03-06 02:01:32][datar][WARNING] Builtin 
name \"any\" has been overriden by datar.\n", - "[2022-03-06 02:01:32][datar][WARNING] Builtin name \"re\" has been overriden by datar.\n", - "[2022-03-06 02:01:32][datar][WARNING] Builtin name \"filter\" has been overriden by datar.\n", - "[2022-03-06 02:01:32][datar][WARNING] Builtin name \"slice\" has been overriden by datar.\n" - ] - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -44,7 +28,7 @@ { "data": { "text/markdown": [ - "### # group_trim " + "###
★ group_trim
" ], "text/plain": [ "" @@ -68,16 +52,16 @@ ], "source": [ "# https://dplyr.tidyverse.org/reference/group_trim.html\n", + "%run nb_helpers.py\n", "\n", "from datar.all import *\n", "\n", - "%run nb_helpers.py\n", "nb_header(group_trim)" ] }, { "cell_type": "code", - "execution_count": 9, + "execution_count": 2, "id": "d4c86c45", "metadata": { "execution": { @@ -146,7 +130,7 @@ "2 c []" ] }, - "execution_count": 9, + "execution_count": 2, "metadata": {}, "output_type": "execute_result" } @@ -158,7 +142,7 @@ }, { "cell_type": "code", - "execution_count": 10, + "execution_count": 3, "id": "a11f49fc", "metadata": { "execution": { @@ -221,7 +205,7 @@ "1 b [1]" ] }, - "execution_count": 10, + "execution_count": 3, "metadata": {}, "output_type": "execute_result" } diff --git a/docs/notebooks/lead-lag.ipynb b/docs/notebooks/lead-lag.ipynb index c82c8fa5..5a0f3d29 100644 --- a/docs/notebooks/lead-lag.ipynb +++ b/docs/notebooks/lead-lag.ipynb @@ -13,26 +13,10 @@ } }, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[2022-03-06 16:46:16][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 16:46:16][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 16:46:16][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 16:46:16][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 16:46:16][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 16:46:16][datar][WARNING] Builtin name \"all\" has been overriden by datar.\n", - "[2022-03-06 16:46:16][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-06 16:46:16][datar][WARNING] Builtin name \"re\" has been overriden by datar.\n", - "[2022-03-06 16:46:16][datar][WARNING] Builtin name \"filter\" has been overriden by datar.\n", - "[2022-03-06 16:46:16][datar][WARNING] Builtin name \"slice\" has been overriden by 
datar.\n" - ] - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -44,7 +28,7 @@ { "data": { "text/markdown": [ - "### # lead " + "###
★ lead
" ], "text/plain": [ "" @@ -79,7 +63,7 @@ { "data": { "text/markdown": [ - "### # lag " + "###
★ lag
" ], "text/plain": [ "" @@ -105,11 +89,10 @@ ], "source": [ "# https://dplyr.tidyverse.org/reference/lead-lag.html\n", + "%run nb_helpers.py\n", "\n", - "from datar import f\n", "from datar.all import *\n", "\n", - "%run nb_helpers.py\n", "nb_header(lead, lag, book='lead-lag')" ] }, @@ -129,12 +112,7 @@ { "data": { "text/plain": [ - "0 NaN\n", - "1 1.0\n", - "2 2.0\n", - "3 3.0\n", - "4 4.0\n", - "dtype: float64" + "array([nan, 1., 2., 3., 4.])" ] }, "execution_count": 2, @@ -164,12 +142,7 @@ { "data": { "text/plain": [ - "0 2.0\n", - "1 3.0\n", - "2 4.0\n", - "3 5.0\n", - "4 NaN\n", - "dtype: float64" + "array([ 2., 3., 4., 5., nan])" ] }, "execution_count": 3, @@ -296,12 +269,7 @@ { "data": { "text/plain": [ - "0 NaN\n", - "1 1.0\n", - "2 2.0\n", - "3 3.0\n", - "4 4.0\n", - "dtype: float64" + "array([nan, 1., 2., 3., 4.])" ] }, "execution_count": 5, @@ -329,12 +297,7 @@ { "data": { "text/plain": [ - "0 NaN\n", - "1 NaN\n", - "2 1.0\n", - "3 2.0\n", - "4 3.0\n", - "dtype: float64" + "array([nan, nan, 1., 2., 3.])" ] }, "execution_count": 6, @@ -362,12 +325,7 @@ { "data": { "text/plain": [ - "0 2.0\n", - "1 3.0\n", - "2 4.0\n", - "3 5.0\n", - "4 NaN\n", - "dtype: float64" + "array([ 2., 3., 4., 5., nan])" ] }, "execution_count": 7, @@ -395,12 +353,7 @@ { "data": { "text/plain": [ - "0 3.0\n", - "1 4.0\n", - "2 5.0\n", - "3 NaN\n", - "4 NaN\n", - "dtype: float64" + "array([ 3., 4., 5., nan, nan])" ] }, "execution_count": 8, @@ -428,12 +381,7 @@ { "data": { "text/plain": [ - "0 0\n", - "1 1\n", - "2 2\n", - "3 3\n", - "4 4\n", - "dtype: int64" + "array([0, 1, 2, 3, 4])" ] }, "execution_count": 9, @@ -461,12 +409,7 @@ { "data": { "text/plain": [ - "0 2\n", - "1 3\n", - "2 4\n", - "3 5\n", - "4 6\n", - "dtype: int64" + "array([2, 3, 4, 5, 6])" ] }, "execution_count": 10, @@ -528,19 +471,19 @@ " 0\n", " 2000\n", " 0\n", - " 4.0\n", + " 1.0\n", " \n", " \n", " 1\n", " 2001\n", " 1\n", - " 0.0\n", + " 4.0\n", " \n", " \n", " 2\n", " 2002\n", " 4\n", - " NaN\n", + " 
16.0\n", " \n", " \n", " 3\n", @@ -552,13 +495,13 @@ " 4\n", " 2004\n", " 16\n", - " 1.0\n", + " NaN\n", " \n", " \n", " 5\n", " 2005\n", " 25\n", - " 16.0\n", + " 0.0\n", " \n", " \n", "\n", @@ -567,12 +510,12 @@ "text/plain": [ " year value previous_year_value\n", " \n", - "0 2000 0 4.0\n", - "1 2001 1 0.0\n", - "2 2002 4 NaN\n", + "0 2000 0 1.0\n", + "1 2001 1 4.0\n", + "2 2002 4 16.0\n", "3 2003 9 25.0\n", - "4 2004 16 1.0\n", - "5 2005 25 16.0" + "4 2004 16 NaN\n", + "5 2005 25 0.0" ] }, "execution_count": 11, @@ -640,37 +583,37 @@ " 0\n", " 2000\n", " 0\n", - " 1.0\n", + " NaN\n", " \n", " \n", " 1\n", " 2001\n", " 1\n", - " NaN\n", + " 0.0\n", " \n", " \n", " 2\n", " 2002\n", " 4\n", - " 0.0\n", + " 1.0\n", " \n", " \n", " 3\n", " 2003\n", " 9\n", - " 9.0\n", + " 4.0\n", " \n", " \n", " 4\n", " 2004\n", " 16\n", - " 16.0\n", + " 9.0\n", " \n", " \n", " 5\n", " 2005\n", " 25\n", - " 4.0\n", + " 16.0\n", " \n", " \n", "\n", @@ -679,12 +622,12 @@ "text/plain": [ " year value previous_year_value\n", " \n", - "0 2000 0 1.0\n", - "1 2001 1 NaN\n", - "2 2002 4 0.0\n", - "3 2003 9 9.0\n", - "4 2004 16 16.0\n", - "5 2005 25 4.0" + "0 2000 0 NaN\n", + "1 2001 1 0.0\n", + "2 2002 4 1.0\n", + "3 2003 9 4.0\n", + "4 2004 16 9.0\n", + "5 2005 25 16.0" ] }, "execution_count": 12, diff --git a/docs/notebooks/mutate-joins.ipynb b/docs/notebooks/mutate-joins.ipynb index 9f07f956..389be7e1 100644 --- a/docs/notebooks/mutate-joins.ipynb +++ b/docs/notebooks/mutate-joins.ipynb @@ -13,26 +13,10 @@ } }, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[2022-03-06 01:43:32][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 01:43:32][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 01:43:32][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 01:43:32][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 
01:43:32][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 01:43:32][datar][WARNING] Builtin name \"all\" has been overriden by datar.\n", - "[2022-03-06 01:43:32][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-06 01:43:32][datar][WARNING] Builtin name \"re\" has been overriden by datar.\n", - "[2022-03-06 01:43:32][datar][WARNING] Builtin name \"filter\" has been overriden by datar.\n", - "[2022-03-06 01:43:32][datar][WARNING] Builtin name \"slice\" has been overriden by datar.\n" - ] - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -44,7 +28,7 @@ { "data": { "text/markdown": [ - "### # inner_join " + "###
★ inner_join
" ], "text/plain": [ "" @@ -88,7 +72,7 @@ { "data": { "text/markdown": [ - "### # left_join " + "###
★ left_join
" ], "text/plain": [ "" @@ -115,7 +99,7 @@ { "data": { "text/markdown": [ - "### # right_join " + "###
★ right_join
" ], "text/plain": [ "" @@ -146,7 +130,7 @@ { "data": { "text/markdown": [ - "### # full_join " + "###
★ full_join
" ], "text/plain": [ "" @@ -173,10 +157,11 @@ ], "source": [ "# https://dplyr.tidyverse.org/reference/mutate-joins.html\n", + "%run nb_helpers.py\n", + "\n", "from datar.datasets import band_members, band_instruments, band_instruments2\n", "from datar.all import *\n", "\n", - "%run nb_helpers.py\n", "nb_header(inner_join, left_join, right_join, full_join, book='mutate-joins')" ] }, diff --git a/docs/notebooks/mutate.ipynb b/docs/notebooks/mutate.ipynb index efe21dd5..15efc420 100644 --- a/docs/notebooks/mutate.ipynb +++ b/docs/notebooks/mutate.ipynb @@ -12,26 +12,10 @@ } }, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[2022-03-06 02:01:53][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 02:01:53][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 02:01:53][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 02:01:54][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 02:01:54][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 02:01:54][datar][WARNING] Builtin name \"all\" has been overriden by datar.\n", - "[2022-03-06 02:01:54][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-06 02:01:54][datar][WARNING] Builtin name \"re\" has been overriden by datar.\n", - "[2022-03-06 02:01:54][datar][WARNING] Builtin name \"filter\" has been overriden by datar.\n", - "[2022-03-06 02:01:54][datar][WARNING] Builtin name \"slice\" has been overriden by datar.\n" - ] - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -43,7 +27,7 @@ { "data": { "text/markdown": [ - "### # mutate " + "###
★ mutate
" ], "text/plain": [ "" @@ -117,7 +101,7 @@ { "data": { "text/markdown": [ - "### # transmute " + "###
★ transmute
" ], "text/plain": [ "" @@ -144,10 +128,11 @@ ], "source": [ "# https://dplyr.tidyverse.org/reference/mutate.html\n", + "%run nb_helpers.py\n", + "\n", "from datar.datasets import starwars\n", "from datar.all import *\n", "\n", - "%run nb_helpers.py\n", "nb_header(mutate, transmute)" ] }, @@ -1070,7 +1055,7 @@ }, { "cell_type": "code", - "execution_count": 11, + "execution_count": 10, "metadata": { "execution": { "iopub.execute_input": "2021-07-16T22:27:33.853847Z", @@ -1129,7 +1114,7 @@ "0 1 6 2" ] }, - "execution_count": 11, + "execution_count": 10, "metadata": {}, "output_type": "execute_result" } @@ -1141,7 +1126,7 @@ }, { "cell_type": "code", - "execution_count": 12, + "execution_count": 11, "metadata": { "execution": { "iopub.execute_input": "2021-07-16T22:27:33.903931Z", @@ -1206,7 +1191,7 @@ "0 1 2 a b 3" ] }, - "execution_count": 12, + "execution_count": 11, "metadata": {}, "output_type": "execute_result" } @@ -1218,7 +1203,7 @@ }, { "cell_type": "code", - "execution_count": 13, + "execution_count": 12, "metadata": { "execution": { "iopub.execute_input": "2021-07-16T22:27:33.959501Z", @@ -1277,7 +1262,7 @@ "0 1 2 3" ] }, - "execution_count": 13, + "execution_count": 12, "metadata": {}, "output_type": "execute_result" } @@ -1288,7 +1273,7 @@ }, { "cell_type": "code", - "execution_count": 14, + "execution_count": 13, "metadata": { "execution": { "iopub.execute_input": "2021-07-16T22:27:34.079819Z", @@ -1347,7 +1332,7 @@ "0 a b 3" ] }, - "execution_count": 14, + "execution_count": 13, "metadata": {}, "output_type": "execute_result" } @@ -1358,7 +1343,7 @@ }, { "cell_type": "code", - "execution_count": 15, + "execution_count": 14, "metadata": { "execution": { "iopub.execute_input": "2021-07-16T22:27:34.156265Z", @@ -1411,7 +1396,7 @@ "0 3" ] }, - "execution_count": 15, + "execution_count": 14, "metadata": {}, "output_type": "execute_result" } @@ -1422,7 +1407,7 @@ }, { "cell_type": "code", - "execution_count": 16, + "execution_count": 15, "metadata": { 
"execution": { "iopub.execute_input": "2021-07-16T22:27:34.225635Z", @@ -1567,7 +1552,7 @@ "[87 rows x 4 columns]" ] }, - "execution_count": 16, + "execution_count": 15, "metadata": {}, "output_type": "execute_result" } @@ -1580,7 +1565,7 @@ }, { "cell_type": "code", - "execution_count": 17, + "execution_count": 16, "metadata": { "execution": { "iopub.execute_input": "2021-07-16T22:27:34.326340Z", @@ -1725,7 +1710,7 @@ "[87 rows x 4 columns]" ] }, - "execution_count": 17, + "execution_count": 16, "metadata": {}, "output_type": "execute_result" } @@ -1740,7 +1725,7 @@ }, { "cell_type": "code", - "execution_count": 18, + "execution_count": 17, "metadata": { "execution": { "iopub.execute_input": "2021-07-16T22:27:34.629345Z", @@ -2003,7 +1988,7 @@ "[87 rows x 12 columns]" ] }, - "execution_count": 18, + "execution_count": 17, "metadata": {}, "output_type": "execute_result" } diff --git a/docs/notebooks/n_distinct.ipynb b/docs/notebooks/n_distinct.ipynb index d606dac2..fd1fc6e8 100644 --- a/docs/notebooks/n_distinct.ipynb +++ b/docs/notebooks/n_distinct.ipynb @@ -16,7 +16,7 @@ { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -28,7 +28,7 @@ { "data": { "text/markdown": [ - "### # sample " + "###
★ sample
" ], "text/plain": [ "" @@ -69,7 +69,7 @@ { "data": { "text/markdown": [ - "### # n_distinct " + "###
★ n_distinct
" ], "text/plain": [ "" @@ -93,10 +93,10 @@ ], "source": [ "# https://dplyr.tidyverse.org/reference/n_distinct.html\n", + "%run nb_helpers.py\n", "\n", "from datar.all import sample, n_distinct\n", "\n", - "%run nb_helpers.py\n", "nb_header(sample, n_distinct, book='n_distinct')" ] }, diff --git a/docs/notebooks/na_if.ipynb b/docs/notebooks/na_if.ipynb index 7369927e..ec9c436b 100644 --- a/docs/notebooks/na_if.ipynb +++ b/docs/notebooks/na_if.ipynb @@ -13,26 +13,10 @@ } }, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[2022-03-06 02:17:42][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 02:17:42][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 02:17:42][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 02:17:42][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 02:17:42][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 02:17:42][datar][WARNING] Builtin name \"all\" has been overriden by datar.\n", - "[2022-03-06 02:17:42][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-06 02:17:42][datar][WARNING] Builtin name \"re\" has been overriden by datar.\n", - "[2022-03-06 02:17:42][datar][WARNING] Builtin name \"filter\" has been overriden by datar.\n", - "[2022-03-06 02:17:42][datar][WARNING] Builtin name \"slice\" has been overriden by datar.\n" - ] - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -44,7 +28,7 @@ { "data": { "text/markdown": [ - "### # na_if " + "###
★ na_if
" ], "text/plain": [ "" @@ -75,10 +59,11 @@ ], "source": [ "# https://dplyr.tidyverse.org/reference/na_if.html\n", + "%run nb_helpers.py\n", + "\n", "from datar.datasets import starwars\n", "from datar.all import *\n", "\n", - "%run nb_helpers.py\n", "nb_header(na_if)" ] }, @@ -98,12 +83,7 @@ { "data": { "text/plain": [ - "0 0.0\n", - "1 1.0\n", - "2 NaN\n", - "3 3.0\n", - "4 4.0\n", - "Name: x, dtype: float64" + "array([ 0., 1., nan, 3., 4.])" ] }, "execution_count": 2, diff --git a/docs/notebooks/nb_helpers.py b/docs/notebooks/nb_helpers.py index 3420582a..534c1ae8 100644 --- a/docs/notebooks/nb_helpers.py +++ b/docs/notebooks/nb_helpers.py @@ -4,38 +4,58 @@ from IPython.display import display, Markdown, HTML from IPython.core.interactiveshell import InteractiveShell import pardoc -from varname.helpers import debug +from varname.helpers import debug # noqa +from datar import options + +_ = options(warn_builtin_names=False) InteractiveShell.ast_node_interactivity = "all" BINDER_URL = ( - 'https://mybinder.org/v2/gh/pwwang/datar/' - '93d069f3ca36711fc811c61dcf60e9fc3d1460a5?filepath=docs%2Fnotebooks%2F' + "https://mybinder.org/v2/gh/pwwang/datar/" + "dev?filepath=docs%2Fnotebooks%2F" ) + def nb_header(*funcs, book=None): """Print the header of a notebooks, mostly the docs""" if book is None: book = funcs[0].__name__ - display(HTML( - '
Try this notebook ' - f'on ' - 'binder.
' - )) + display( + HTML( + '
' + 'Try this notebook on ' + f'' + "binder.
" + ) + ) for func in funcs: try: + parsed = pardoc.google_parser.parse(func.__doc__) + try: + del parsed["Examples"] + except KeyError: + pass + except Exception: + formatted = func.__doc__ + else: formatted = pardoc.google_parser.format( - func.__doc__, - to='markdown', + parsed, + to="markdown", heading=5, - indent_base='  ' + indent_base="  ", ) - except: - formatted = func.__doc__ - display(Markdown(f'{"#"*3} # {func.__name__} ')) + + display(Markdown( + f'{"#"*3} ' + '
' + f'★ {func.__name__}' + '
') + ) display(Markdown(formatted)) + @contextmanager def try_catch(): """Catch the error and print it out""" diff --git a/docs/notebooks/near.ipynb b/docs/notebooks/near.ipynb index 4bfb36f5..69196782 100644 --- a/docs/notebooks/near.ipynb +++ b/docs/notebooks/near.ipynb @@ -13,26 +13,10 @@ } }, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[2022-03-06 02:18:19][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 02:18:19][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 02:18:19][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 02:18:19][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 02:18:19][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 02:18:19][datar][WARNING] Builtin name \"all\" has been overriden by datar.\n", - "[2022-03-06 02:18:19][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-06 02:18:19][datar][WARNING] Builtin name \"re\" has been overriden by datar.\n", - "[2022-03-06 02:18:19][datar][WARNING] Builtin name \"filter\" has been overriden by datar.\n", - "[2022-03-06 02:18:19][datar][WARNING] Builtin name \"slice\" has been overriden by datar.\n" - ] - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -44,7 +28,7 @@ { "data": { "text/markdown": [ - "### # near " + "###
★ near
" ], "text/plain": [ "" @@ -80,10 +64,10 @@ ], "source": [ "# https://dplyr.tidyverse.org/reference/near.html\n", + "%run nb_helpers.py\n", "\n", "from datar.all import *\n", "\n", - "%run nb_helpers.py\n", "nb_header(near)" ] }, @@ -103,8 +87,7 @@ { "data": { "text/plain": [ - "0 False\n", - "Name: x, dtype: bool" + "array([False])" ] }, "execution_count": 2, diff --git a/docs/notebooks/nest-join.ipynb b/docs/notebooks/nest-join.ipynb index 54329d16..c59cb87d 100644 --- a/docs/notebooks/nest-join.ipynb +++ b/docs/notebooks/nest-join.ipynb @@ -13,26 +13,10 @@ } }, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[2022-03-06 02:19:33][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 02:19:33][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 02:19:33][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 02:19:33][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 02:19:33][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 02:19:33][datar][WARNING] Builtin name \"all\" has been overriden by datar.\n", - "[2022-03-06 02:19:33][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-06 02:19:33][datar][WARNING] Builtin name \"re\" has been overriden by datar.\n", - "[2022-03-06 02:19:33][datar][WARNING] Builtin name \"filter\" has been overriden by datar.\n", - "[2022-03-06 02:19:33][datar][WARNING] Builtin name \"slice\" has been overriden by datar.\n" - ] - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -44,7 +28,7 @@ { "data": { "text/markdown": [ - "### # nest_join " + "###
★ nest_join
" ], "text/plain": [ "" @@ -72,11 +56,11 @@ ], "source": [ "# https://dplyr.tidyverse.org/reference/nest_join.html\n", + "%run nb_helpers.py\n", "\n", "from datar.datasets import band_members, band_instruments\n", "from datar.all import *\n", "\n", - "%run nb_helpers.py\n", "nb_header(nest_join, book='nest-join')" ] }, @@ -168,7 +152,7 @@ }, { "cell_type": "code", - "execution_count": 4, + "execution_count": 3, "id": "french-egyptian", "metadata": { "execution": { @@ -190,7 +174,7 @@ " 0 guitar]" ] }, - "execution_count": 4, + "execution_count": 3, "metadata": {}, "output_type": "execute_result" } diff --git a/docs/notebooks/nest.ipynb b/docs/notebooks/nest.ipynb index ecb9da7b..4348be36 100644 --- a/docs/notebooks/nest.ipynb +++ b/docs/notebooks/nest.ipynb @@ -12,26 +12,10 @@ } }, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[2022-03-06 02:23:01][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 02:23:01][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 02:23:01][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 02:23:01][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 02:23:01][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 02:23:01][datar][WARNING] Builtin name \"all\" has been overriden by datar.\n", - "[2022-03-06 02:23:01][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-06 02:23:01][datar][WARNING] Builtin name \"re\" has been overriden by datar.\n", - "[2022-03-06 02:23:01][datar][WARNING] Builtin name \"filter\" has been overriden by datar.\n", - "[2022-03-06 02:23:01][datar][WARNING] Builtin name \"slice\" has been overriden by datar.\n" - ] - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -43,7 +27,7 @@ { "data": { "text/markdown": [ - "### # nest " + "###
★ nest
" ], "text/plain": [ "" @@ -80,7 +64,7 @@ { "data": { "text/markdown": [ - "### # unnest " + "###
★ unnest
" ], "text/plain": [ "" @@ -141,10 +125,10 @@ } ], "source": [ + "%run nb_helpers.py\n", "from datar.datasets import iris, fish_encounters, mtcars\n", "from datar.all import *\n", "\n", - "%run nb_helpers.py\n", "nb_header(nest, unnest)" ] }, @@ -393,7 +377,7 @@ }, { "cell_type": "code", - "execution_count": 5, + "execution_count": 6, "metadata": { "execution": { "iopub.execute_input": "2021-07-16T22:28:27.142333Z", @@ -403,68 +387,6 @@ } }, "outputs": [ - { - "data": { - "text/html": [ - "
\n", - "\n", - "\n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - "
Speciesdata
<object><object>
0setosa<DF 50x4>
1versicolor<DF 50x4>
2virginica<DF 50x4>
\n", - "
\n" - ], - "text/plain": [ - " Species data\n", - " \n", - "0 setosa \n", - "1 versicolor \n", - "2 virginica " - ] - }, - "execution_count": 5, - "metadata": {}, - "output_type": "execute_result" - }, { "data": { "text/html": [ @@ -909,19 +831,19 @@ "49 5.0 3.3 1.4 0.2" ] }, - "execution_count": 5, + "execution_count": 6, "metadata": {}, "output_type": "execute_result" } ], "source": [ - "iris >> nest(data=~f.Species)\n", - "_.data[0]" + "out = iris >> nest(data=~f.Species)\n", + "out.data[0]" ] }, { "cell_type": "code", - "execution_count": 6, + "execution_count": 7, "metadata": { "execution": { "iopub.execute_input": "2021-07-16T22:28:27.186712Z", @@ -989,7 +911,7 @@ "2 virginica " ] }, - "execution_count": 6, + "execution_count": 7, "metadata": {}, "output_type": "execute_result" } @@ -1001,7 +923,7 @@ }, { "cell_type": "code", - "execution_count": 7, + "execution_count": 8, "metadata": { "execution": { "iopub.execute_input": "2021-07-16T22:28:27.207533Z", @@ -1074,7 +996,7 @@ "2 virginica " ] }, - "execution_count": 7, + "execution_count": 8, "metadata": {}, "output_type": "execute_result" } @@ -1085,7 +1007,7 @@ }, { "cell_type": "code", - "execution_count": 8, + "execution_count": 9, "metadata": { "execution": { "iopub.execute_input": "2021-07-16T22:28:27.265853Z", @@ -1158,7 +1080,7 @@ "2 virginica " ] }, - "execution_count": 8, + "execution_count": 9, "metadata": {}, "output_type": "execute_result" } @@ -1169,7 +1091,7 @@ }, { "cell_type": "code", - "execution_count": 9, + "execution_count": 10, "metadata": { "execution": { "iopub.execute_input": "2021-07-16T22:28:27.333173Z", @@ -1335,7 +1257,7 @@ "[TibbleGrouped: fish (n=19)]" ] }, - "execution_count": 9, + "execution_count": 10, "metadata": {}, "output_type": "execute_result" } @@ -1346,7 +1268,7 @@ }, { "cell_type": "code", - "execution_count": 15, + "execution_count": 11, "metadata": { "execution": { "iopub.execute_input": "2021-07-16T22:28:27.401063Z", @@ -1421,7 +1343,7 @@ "[TibbleGrouped: cyl 
(n=3)]" ] }, - "execution_count": 15, + "execution_count": 11, "metadata": {}, "output_type": "execute_result" } @@ -1441,7 +1363,7 @@ }, { "cell_type": "code", - "execution_count": 19, + "execution_count": 12, "metadata": { "execution": { "iopub.execute_input": "2021-07-16T22:28:27.451681Z", @@ -1521,7 +1443,7 @@ "3 3 3 2" ] }, - "execution_count": 19, + "execution_count": 12, "metadata": {}, "output_type": "execute_result" } @@ -1540,7 +1462,7 @@ }, { "cell_type": "code", - "execution_count": 20, + "execution_count": 13, "metadata": { "execution": { "iopub.execute_input": "2021-07-16T22:28:27.535876Z", @@ -1627,7 +1549,7 @@ "4 3 3.0 2.0" ] }, - "execution_count": 20, + "execution_count": 13, "metadata": {}, "output_type": "execute_result" } @@ -1638,7 +1560,7 @@ }, { "cell_type": "code", - "execution_count": 21, + "execution_count": 14, "metadata": { "execution": { "iopub.execute_input": "2021-07-16T22:28:27.550880Z", @@ -1711,7 +1633,7 @@ "2 c 3 22" ] }, - "execution_count": 21, + "execution_count": 14, "metadata": {}, "output_type": "execute_result" } @@ -1727,7 +1649,7 @@ }, { "cell_type": "code", - "execution_count": 22, + "execution_count": 15, "metadata": { "execution": { "iopub.execute_input": "2021-07-16T22:28:27.614822Z", @@ -1814,7 +1736,7 @@ "4 c 3 22" ] }, - "execution_count": 22, + "execution_count": 15, "metadata": {}, "output_type": "execute_result" } diff --git a/docs/notebooks/nth.ipynb b/docs/notebooks/nth.ipynb index 08406e32..fddcf97b 100644 --- a/docs/notebooks/nth.ipynb +++ b/docs/notebooks/nth.ipynb @@ -16,7 +16,7 @@ { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -28,7 +28,7 @@ { "data": { "text/markdown": [ - "### # nth " + "###
★ nth
" ], "text/plain": [ "" @@ -64,7 +64,7 @@ { "data": { "text/markdown": [ - "### # first " + "###
★ first
" ], "text/plain": [ "" @@ -88,7 +88,7 @@ { "data": { "text/markdown": [ - "### # last " + "###
★ last
" ], "text/plain": [ "" @@ -112,10 +112,10 @@ ], "source": [ "# https://dplyr.tidyverse.org/reference/nth.html\n", + "%run nb_helpers.py\n", "\n", "from datar.all import nth, first, last\n", "\n", - "%run nb_helpers.py\n", "nb_header(nth, first, last)" ] }, @@ -348,7 +348,7 @@ }, { "cell_type": "code", - "execution_count": 11, + "execution_count": 10, "id": "advanced-stations", "metadata": { "execution": { @@ -363,7 +363,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "[ValueError] 'NoneType' object has no attribute 'iloc' (registered function: nth) (registered function: first)\n" + "[ValueError] 'NoneType' object has no attribute 'iloc' (registered function: first)\n" ] } ], diff --git a/docs/notebooks/pack.ipynb b/docs/notebooks/pack.ipynb index 92a8c9b3..07205e2b 100644 --- a/docs/notebooks/pack.ipynb +++ b/docs/notebooks/pack.ipynb @@ -12,26 +12,10 @@ } }, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[2022-03-06 02:20:43][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 02:20:43][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 02:20:43][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 02:20:43][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 02:20:43][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 02:20:43][datar][WARNING] Builtin name \"all\" has been overriden by datar.\n", - "[2022-03-06 02:20:43][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-06 02:20:43][datar][WARNING] Builtin name \"re\" has been overriden by datar.\n", - "[2022-03-06 02:20:43][datar][WARNING] Builtin name \"filter\" has been overriden by datar.\n", - "[2022-03-06 02:20:43][datar][WARNING] Builtin name \"slice\" has been overriden by datar.\n" - ] - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -43,7 +27,7 @@ { "data": { "text/markdown": [ - "### # pack " + "###
★ pack
" ], "text/plain": [ "" @@ -77,7 +61,7 @@ { "data": { "text/markdown": [ - "### # unpack " + "###
★ unpack
" ], "text/plain": [ "" @@ -127,10 +111,11 @@ } ], "source": [ + "%run nb_helpers.py\n", + "\n", "from datar.datasets import iris\n", "from datar.all import *\n", "\n", - "%run nb_helpers.py\n", "nb_header(pack, unpack)" ] }, @@ -553,7 +538,7 @@ }, { "cell_type": "code", - "execution_count": 7, + "execution_count": 6, "metadata": { "execution": { "iopub.execute_input": "2021-07-16T22:28:11.791974Z", @@ -608,7 +593,7 @@ " 1\n", " 4\n", " a\n", - " 0.377095\n", + " 0.661364\n", " True\n", " \n", " \n", @@ -617,7 +602,7 @@ " 2\n", " 3\n", " b\n", - " 0.194955\n", + " 0.607962\n", " False\n", " \n", " \n", @@ -626,7 +611,7 @@ " 3\n", " 2\n", " c\n", - " 0.958411\n", + " 0.211850\n", " NaN\n", " \n", " \n", @@ -636,12 +621,12 @@ "text/plain": [ " x y$a y$b z$X z$Y z$Z\n", " \n", - "0 1 1 4 a 0.377095 True\n", - "1 2 2 3 b 0.194955 False\n", - "2 3 3 2 c 0.958411 NaN" + "0 1 1 4 a 0.661364 True\n", + "1 2 2 3 b 0.607962 False\n", + "2 3 3 2 c 0.211850 NaN" ] }, - "execution_count": 7, + "execution_count": 6, "metadata": {}, "output_type": "execute_result" } @@ -659,7 +644,7 @@ }, { "cell_type": "code", - "execution_count": 8, + "execution_count": 7, "metadata": { "execution": { "iopub.execute_input": "2021-07-16T22:28:11.848630Z", @@ -714,7 +699,7 @@ " 1\n", " 4\n", " a\n", - " 0.377095\n", + " 0.661364\n", " True\n", " \n", " \n", @@ -723,7 +708,7 @@ " 2\n", " 3\n", " b\n", - " 0.194955\n", + " 0.607962\n", " False\n", " \n", " \n", @@ -732,7 +717,7 @@ " 3\n", " 2\n", " c\n", - " 0.958411\n", + " 0.211850\n", " NaN\n", " \n", " \n", @@ -742,12 +727,12 @@ "text/plain": [ " x a b z$X z$Y z$Z\n", " \n", - "0 1 1 4 a 0.377095 True\n", - "1 2 2 3 b 0.194955 False\n", - "2 3 3 2 c 0.958411 NaN" + "0 1 1 4 a 0.661364 True\n", + "1 2 2 3 b 0.607962 False\n", + "2 3 3 2 c 0.211850 NaN" ] }, - "execution_count": 8, + "execution_count": 7, "metadata": {}, "output_type": "execute_result" } @@ -758,7 +743,7 @@ }, { "cell_type": "code", - "execution_count": 9, + "execution_count": 8, 
"metadata": { "execution": { "iopub.execute_input": "2021-07-16T22:28:11.916193Z", @@ -813,7 +798,7 @@ " 1\n", " 4\n", " a\n", - " 0.377095\n", + " 0.661364\n", " True\n", " \n", " \n", @@ -822,7 +807,7 @@ " 2\n", " 3\n", " b\n", - " 0.194955\n", + " 0.607962\n", " False\n", " \n", " \n", @@ -831,7 +816,7 @@ " 3\n", " 2\n", " c\n", - " 0.958411\n", + " 0.211850\n", " NaN\n", " \n", " \n", @@ -841,12 +826,12 @@ "text/plain": [ " x a b X Y Z\n", " \n", - "0 1 1 4 a 0.377095 True\n", - "1 2 2 3 b 0.194955 False\n", - "2 3 3 2 c 0.958411 NaN" + "0 1 1 4 a 0.661364 True\n", + "1 2 2 3 b 0.607962 False\n", + "2 3 3 2 c 0.211850 NaN" ] }, - "execution_count": 9, + "execution_count": 8, "metadata": {}, "output_type": "execute_result" } @@ -857,7 +842,7 @@ }, { "cell_type": "code", - "execution_count": 10, + "execution_count": 9, "metadata": { "execution": { "iopub.execute_input": "2021-07-16T22:28:11.947604Z", @@ -912,7 +897,7 @@ " 1\n", " 4\n", " a\n", - " 0.377095\n", + " 0.661364\n", " True\n", " \n", " \n", @@ -921,7 +906,7 @@ " 2\n", " 3\n", " b\n", - " 0.194955\n", + " 0.607962\n", " False\n", " \n", " \n", @@ -930,7 +915,7 @@ " 3\n", " 2\n", " c\n", - " 0.958411\n", + " 0.211850\n", " NaN\n", " \n", " \n", @@ -940,12 +925,12 @@ "text/plain": [ " x y_a y_b z_X z_Y z_Z\n", " \n", - "0 1 1 4 a 0.377095 True\n", - "1 2 2 3 b 0.194955 False\n", - "2 3 3 2 c 0.958411 NaN" + "0 1 1 4 a 0.661364 True\n", + "1 2 2 3 b 0.607962 False\n", + "2 3 3 2 c 0.211850 NaN" ] }, - "execution_count": 10, + "execution_count": 9, "metadata": {}, "output_type": "execute_result" } @@ -956,7 +941,7 @@ }, { "cell_type": "code", - "execution_count": 11, + "execution_count": 10, "metadata": { "execution": { "iopub.execute_input": "2021-07-16T22:28:11.965059Z", @@ -1011,7 +996,7 @@ " 1\n", " 4\n", " a\n", - " 0.377095\n", + " 0.661364\n", " True\n", " \n", " \n", @@ -1020,7 +1005,7 @@ " 2\n", " 3\n", " b\n", - " 0.194955\n", + " 0.607962\n", " False\n", " \n", " \n", @@ -1029,7 +1014,7 @@ " 
3\n", " 2\n", " c\n", - " 0.958411\n", + " 0.211850\n", " NaN\n", " \n", " \n", @@ -1039,12 +1024,12 @@ "text/plain": [ " x a b X Y Z\n", " \n", - "0 1 1 4 a 0.377095 True\n", - "1 2 2 3 b 0.194955 False\n", - "2 3 3 2 c 0.958411 NaN" + "0 1 1 4 a 0.661364 True\n", + "1 2 2 3 b 0.607962 False\n", + "2 3 3 2 c 0.211850 NaN" ] }, - "execution_count": 11, + "execution_count": 10, "metadata": {}, "output_type": "execute_result" } @@ -1057,7 +1042,7 @@ }, { "cell_type": "code", - "execution_count": 12, + "execution_count": 11, "metadata": { "execution": { "iopub.execute_input": "2021-07-16T22:28:11.981674Z", @@ -1112,7 +1097,7 @@ " 1\n", " 4\n", " a\n", - " 0.377095\n", + " 0.661364\n", " True\n", " \n", " \n", @@ -1121,7 +1106,7 @@ " 2\n", " 3\n", " b\n", - " 0.194955\n", + " 0.607962\n", " False\n", " \n", " \n", @@ -1130,7 +1115,7 @@ " 3\n", " 2\n", " c\n", - " 0.958411\n", + " 0.211850\n", " NaN\n", " \n", " \n", @@ -1140,12 +1125,12 @@ "text/plain": [ " x a b X Y Z\n", " \n", - "0 1 1 4 a 0.377095 True\n", - "1 2 2 3 b 0.194955 False\n", - "2 3 3 2 c 0.958411 NaN" + "0 1 1 4 a 0.661364 True\n", + "1 2 2 3 b 0.607962 False\n", + "2 3 3 2 c 0.211850 NaN" ] }, - "execution_count": 12, + "execution_count": 11, "metadata": {}, "output_type": "execute_result" } diff --git a/docs/notebooks/pivot_longer.ipynb b/docs/notebooks/pivot_longer.ipynb index 3db49483..ad4896dd 100644 --- a/docs/notebooks/pivot_longer.ipynb +++ b/docs/notebooks/pivot_longer.ipynb @@ -13,26 +13,10 @@ } }, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[2022-03-06 02:20:51][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 02:20:51][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 02:20:51][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 02:20:51][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 02:20:51][datar][WARNING] 
Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 02:20:51][datar][WARNING] Builtin name \"all\" has been overriden by datar.\n", - "[2022-03-06 02:20:51][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-06 02:20:51][datar][WARNING] Builtin name \"re\" has been overriden by datar.\n", - "[2022-03-06 02:20:51][datar][WARNING] Builtin name \"filter\" has been overriden by datar.\n", - "[2022-03-06 02:20:51][datar][WARNING] Builtin name \"slice\" has been overriden by datar.\n" - ] - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -44,7 +28,7 @@ { "data": { "text/markdown": [ - "### # pivot_longer " + "###
★ pivot_longer
" ], "text/plain": [ "" @@ -154,11 +138,11 @@ ], "source": [ "# https://tidyr.tidyverse.org/reference/pivot_longer.html\n", + "%run nb_helpers.py\n", "\n", "from datar.datasets import relig_income, billboard, who, anscombe\n", "from datar.all import *\n", "\n", - "%run nb_helpers.py\n", "nb_header(pivot_longer)" ] }, diff --git a/docs/notebooks/pivot_wider.ipynb b/docs/notebooks/pivot_wider.ipynb index 819bfecf..1e41b10e 100644 --- a/docs/notebooks/pivot_wider.ipynb +++ b/docs/notebooks/pivot_wider.ipynb @@ -13,26 +13,10 @@ } }, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[2022-03-06 02:21:03][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 02:21:03][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 02:21:03][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 02:21:03][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 02:21:03][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 02:21:03][datar][WARNING] Builtin name \"all\" has been overriden by datar.\n", - "[2022-03-06 02:21:03][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-06 02:21:03][datar][WARNING] Builtin name \"re\" has been overriden by datar.\n", - "[2022-03-06 02:21:03][datar][WARNING] Builtin name \"filter\" has been overriden by datar.\n", - "[2022-03-06 02:21:03][datar][WARNING] Builtin name \"slice\" has been overriden by datar.\n" - ] - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -44,7 +28,7 @@ { "data": { "text/markdown": [ - "### # pivot_wider " + "###
★ pivot_wider
" ], "text/plain": [ "" @@ -103,11 +87,11 @@ ], "source": [ "# https://tidyr.tidyverse.org/reference/pivot_wider.html\n", + "%run nb_helpers.py\n", "\n", "from datar.datasets import fish_encounters, us_rent_income, warpbreaks \n", "from datar.all import *\n", "\n", - "%run nb_helpers.py\n", "nb_header(pivot_wider)" ] }, diff --git a/docs/notebooks/pull.ipynb b/docs/notebooks/pull.ipynb index 0f0bc210..e3af6251 100644 --- a/docs/notebooks/pull.ipynb +++ b/docs/notebooks/pull.ipynb @@ -13,26 +13,10 @@ } }, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[2022-03-06 02:28:49][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 02:28:49][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 02:28:49][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 02:28:49][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 02:28:49][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 02:28:49][datar][WARNING] Builtin name \"all\" has been overriden by datar.\n", - "[2022-03-06 02:28:49][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-06 02:28:49][datar][WARNING] Builtin name \"re\" has been overriden by datar.\n", - "[2022-03-06 02:28:49][datar][WARNING] Builtin name \"filter\" has been overriden by datar.\n", - "[2022-03-06 02:28:49][datar][WARNING] Builtin name \"slice\" has been overriden by datar.\n" - ] - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -44,7 +28,7 @@ { "data": { "text/markdown": [ - "### # pull " + "###
★ pull
" ], "text/plain": [ "" @@ -106,11 +90,11 @@ ], "source": [ "# https://dplyr.tidyverse.org/reference/pull.html\n", + "%run nb_helpers.py\n", "\n", "from datar.datasets import starwars, mtcars\n", "from datar.all import *\n", "\n", - "%run nb_helpers.py\n", "nb_header(pull)" ] }, @@ -295,7 +279,7 @@ }, { "cell_type": "code", - "execution_count": 6, + "execution_count": 5, "id": "suspended-cooler", "metadata": { "execution": { @@ -344,7 +328,7 @@ "Name: cyl, dtype: int64" ] }, - "execution_count": 6, + "execution_count": 5, "metadata": {}, "output_type": "execute_result" } @@ -355,7 +339,7 @@ }, { "cell_type": "code", - "execution_count": 7, + "execution_count": 6, "id": "iraqi-shaft", "metadata": { "execution": { @@ -382,7 +366,7 @@ "Name: z, dtype: int64" ] }, - "execution_count": 7, + "execution_count": 6, "metadata": {}, "output_type": "execute_result" } @@ -394,7 +378,7 @@ }, { "cell_type": "code", - "execution_count": 8, + "execution_count": 7, "id": "danish-assignment", "metadata": { "execution": { @@ -497,7 +481,7 @@ " 'Padmé Amidala': 165.0}" ] }, - "execution_count": 8, + "execution_count": 7, "metadata": {}, "output_type": "execute_result" } diff --git a/docs/notebooks/ranking.ipynb b/docs/notebooks/ranking.ipynb index f4a0e0d8..37335637 100644 --- a/docs/notebooks/ranking.ipynb +++ b/docs/notebooks/ranking.ipynb @@ -13,26 +13,10 @@ } }, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[2022-03-06 02:28:54][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 02:28:54][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 02:28:54][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 02:28:54][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 02:28:54][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 02:28:54][datar][WARNING] Builtin name \"all\" has been 
overriden by datar.\n", - "[2022-03-06 02:28:54][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-06 02:28:54][datar][WARNING] Builtin name \"re\" has been overriden by datar.\n", - "[2022-03-06 02:28:54][datar][WARNING] Builtin name \"filter\" has been overriden by datar.\n", - "[2022-03-06 02:28:54][datar][WARNING] Builtin name \"slice\" has been overriden by datar.\n" - ] - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -44,7 +28,7 @@ { "data": { "text/markdown": [ - "### # row_number " + "###
★ row_number
" ], "text/plain": [ "" @@ -77,7 +61,7 @@ { "data": { "text/markdown": [ - "### # min_rank " + "###
★ min_rank
" ], "text/plain": [ "" @@ -101,7 +85,7 @@ { "data": { "text/markdown": [ - "### # dense_rank " + "###
★ dense_rank
" ], "text/plain": [ "" @@ -125,7 +109,7 @@ { "data": { "text/markdown": [ - "### # percent_rank " + "###
★ percent_rank
" ], "text/plain": [ "" @@ -149,7 +133,7 @@ { "data": { "text/markdown": [ - "### # cume_dist " + "###
★ cume_dist
" ], "text/plain": [ "" @@ -173,7 +157,7 @@ { "data": { "text/markdown": [ - "### # ntile " + "###
★ ntile
" ], "text/plain": [ "" @@ -188,13 +172,13 @@ "##### A rough rank, which breaks the input vector into `n` buckets.\n", "\n", "##### Note:\n", - "  The output tiles are 0-based. \n", + "  The output tiles are 1-based. \n", "  The result is slightly different from dplyr's ntile. \n", "  >>> ntile(c(1,2,NA,1,0,NA), 2) # dplyr \n", "  >>> # 1 2 NA 2 1 NA \n", "  >>> ntile([1,2,NA,1,0,NA], n=2) # datar \n", - "  >>> # [0, 1, NA, 0, 0, NA] \n", - "  >>> # Categories (2, int64): [0 < 1] \n" + "  >>> # [1, 2, NA, 1, 1, NA] \n", + "  >>> # Categories (2, int64): [1 < 2] \n" ], "text/plain": [ "" @@ -206,13 +190,13 @@ ], "source": [ "# https://dplyr.tidyverse.org/reference/ranking.html\n", + "%run nb_helpers.py\n", + "\n", "import numpy\n", - "from pandas.core.series import Series\n", "\n", "from datar.datasets import mtcars\n", "from datar.all import *\n", "\n", - "%run nb_helpers.py\n", "nb_header(row_number, min_rank, dense_rank, percent_rank, cume_dist, ntile)" ] }, @@ -278,7 +262,7 @@ " 4.0\n", " 1.00\n", " 1.0\n", - " 1\n", + " 2\n", " \n", " \n", " 1\n", @@ -288,7 +272,7 @@ " 1.0\n", " 0.00\n", " 0.2\n", - " 0\n", + " 1\n", " \n", " \n", " 2\n", @@ -298,7 +282,7 @@ " 3.0\n", " 0.75\n", " 0.8\n", - " 0\n", + " 1\n", " \n", " \n", " 3\n", @@ -308,7 +292,7 @@ " 2.0\n", " 0.25\n", " 0.6\n", - " 0\n", + " 1\n", " \n", " \n", " 4\n", @@ -318,7 +302,7 @@ " 2.0\n", " 0.25\n", " 0.6\n", - " 0\n", + " 1\n", " \n", " \n", " 5\n", @@ -346,11 +330,11 @@ "\n", " ntile \n", " \n", - "0 1 \n", - "1 0 \n", - "2 0 \n", - "3 0 \n", - "4 0 \n", + "0 2 \n", + "1 1 \n", + "2 1 \n", + "3 1 \n", + "4 1 \n", "5 NaN " ] }, @@ -418,42 +402,42 @@ " \n", " 0\n", " 0\n", - " 0\n", + " 1\n", " \n", " \n", " 1\n", " 1\n", - " 0\n", + " 1\n", " \n", " \n", " 2\n", " 2\n", - " 0\n", + " 1\n", " \n", " \n", " 3\n", " 3\n", - " 1\n", + " 2\n", " \n", " \n", " 4\n", " 4\n", - " 1\n", + " 2\n", " \n", " \n", " 5\n", " 5\n", - " 2\n", + " 3\n", " \n", " \n", " 6\n", " 6\n", - " 2\n", + " 3\n", " \n", " 
\n", " 7\n", " 7\n", - " 2\n", + " 3\n", " \n", " \n", "\n", @@ -462,14 +446,14 @@ "text/plain": [ " x ntile\n", " \n", - "0 0 0\n", - "1 1 0\n", - "2 2 0\n", - "3 3 1\n", - "4 4 1\n", - "5 5 2\n", - "6 6 2\n", - "7 7 2" + "0 0 1\n", + "1 1 1\n", + "2 2 1\n", + "3 3 2\n", + "4 4 2\n", + "5 5 3\n", + "6 6 3\n", + "7 7 3" ] }, "execution_count": 3, diff --git a/docs/notebooks/recode.ipynb b/docs/notebooks/recode.ipynb index 917300e3..22025927 100644 --- a/docs/notebooks/recode.ipynb +++ b/docs/notebooks/recode.ipynb @@ -13,26 +13,10 @@ } }, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[2022-03-06 02:29:14][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 02:29:15][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 02:29:15][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 02:29:15][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 02:29:15][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 02:29:15][datar][WARNING] Builtin name \"all\" has been overriden by datar.\n", - "[2022-03-06 02:29:15][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-06 02:29:15][datar][WARNING] Builtin name \"re\" has been overriden by datar.\n", - "[2022-03-06 02:29:15][datar][WARNING] Builtin name \"filter\" has been overriden by datar.\n", - "[2022-03-06 02:29:15][datar][WARNING] Builtin name \"slice\" has been overriden by datar.\n" - ] - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -44,7 +28,7 @@ { "data": { "text/markdown": [ - "### # recode " + "###
★ recode
" ], "text/plain": [ "" @@ -84,10 +68,10 @@ ], "source": [ "# https://dplyr.tidyverse.org/reference/recode.html\n", + "%run nb_helpers.py\n", "\n", "from datar.all import *\n", "\n", - "%run nb_helpers.py\n", "nb_header(recode)" ] }, @@ -107,8 +91,8 @@ { "data": { "text/plain": [ - "array(['b', 'c', 'b', 'Apple', 'Apple', 'Apple', 'b', 'b', 'c', 'Apple'],\n", - " dtype='Try this notebook on binder." + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -43,7 +27,7 @@ { "data": { "text/markdown": [ - "### # relocate " + "###
★ relocate
" ], "text/plain": [ "" @@ -88,9 +72,9 @@ ], "source": [ "# https://dplyr.tidyverse.org/reference/relocate.html\n", + "%run nb_helpers.py\n", "from datar.all import *\n", "\n", - "%run nb_helpers.py\n", "nb_header(relocate)" ] }, diff --git a/docs/notebooks/rename.ipynb b/docs/notebooks/rename.ipynb index 315a1d39..908a829d 100644 --- a/docs/notebooks/rename.ipynb +++ b/docs/notebooks/rename.ipynb @@ -13,26 +13,10 @@ } }, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[2022-03-06 02:31:02][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 02:31:02][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 02:31:02][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 02:31:02][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 02:31:02][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 02:31:02][datar][WARNING] Builtin name \"all\" has been overriden by datar.\n", - "[2022-03-06 02:31:02][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-06 02:31:02][datar][WARNING] Builtin name \"re\" has been overriden by datar.\n", - "[2022-03-06 02:31:02][datar][WARNING] Builtin name \"filter\" has been overriden by datar.\n", - "[2022-03-06 02:31:02][datar][WARNING] Builtin name \"slice\" has been overriden by datar.\n" - ] - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -44,7 +28,7 @@ { "data": { "text/markdown": [ - "### # rename " + "###
★ rename
" ], "text/plain": [ "" @@ -76,7 +60,7 @@ { "data": { "text/markdown": [ - "### # rename_with " + "###
★ rename_with
" ], "text/plain": [ "" @@ -113,11 +97,11 @@ ], "source": [ "# https://dplyr.tidyverse.org/reference/rename.html\n", + "%run nb_helpers.py\n", "\n", "from datar.datasets import iris\n", "from datar.all import *\n", "\n", - "%run nb_helpers.py\n", "nb_header(rename, rename_with)" ] }, @@ -803,7 +787,7 @@ }, { "cell_type": "code", - "execution_count": 7, + "execution_count": 6, "id": "f9cee963", "metadata": { "execution": { @@ -962,7 +946,7 @@ "[150 rows x 5 columns]" ] }, - "execution_count": 7, + "execution_count": 6, "metadata": {}, "output_type": "execute_result" } diff --git a/docs/notebooks/replace_na.ipynb b/docs/notebooks/replace_na.ipynb index b2d6b233..50f84752 100644 --- a/docs/notebooks/replace_na.ipynb +++ b/docs/notebooks/replace_na.ipynb @@ -13,26 +13,10 @@ } }, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[2022-03-06 02:31:08][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 02:31:08][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 02:31:08][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 02:31:08][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 02:31:08][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 02:31:08][datar][WARNING] Builtin name \"all\" has been overriden by datar.\n", - "[2022-03-06 02:31:08][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-06 02:31:08][datar][WARNING] Builtin name \"re\" has been overriden by datar.\n", - "[2022-03-06 02:31:08][datar][WARNING] Builtin name \"filter\" has been overriden by datar.\n", - "[2022-03-06 02:31:08][datar][WARNING] Builtin name \"slice\" has been overriden by datar.\n" - ] - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -44,7 +28,7 @@ { "data": { "text/markdown": [ - "### # replace_na " + "###
★ replace_na
" ], "text/plain": [ "" @@ -84,10 +68,10 @@ ], "source": [ "# https://tidyr.tidyverse.org/reference/replace_na.html\n", + "%run nb_helpers.py\n", "\n", "from datar.all import *\n", "\n", - "%run nb_helpers.py\n", "nb_header(replace_na)" ] }, diff --git a/docs/notebooks/rownames.ipynb b/docs/notebooks/rownames.ipynb index f19bc781..cae3c315 100644 --- a/docs/notebooks/rownames.ipynb +++ b/docs/notebooks/rownames.ipynb @@ -2,7 +2,7 @@ "cells": [ { "cell_type": "code", - "execution_count": 2, + "execution_count": 1, "metadata": { "execution": { "iopub.execute_input": "2021-07-16T22:27:24.723831Z", @@ -15,7 +15,7 @@ { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -27,7 +27,7 @@ { "data": { "text/markdown": [ - "### # has_rownames " + "###
★ has_rownames
" ], "text/plain": [ "" @@ -59,7 +59,7 @@ { "data": { "text/markdown": [ - "### # remove_rownames " + "###
★ remove_rownames
" ], "text/plain": [ "" @@ -91,7 +91,7 @@ { "data": { "text/markdown": [ - "### # rownames_to_column " + "###
★ rownames_to_column
" ], "text/plain": [ "" @@ -125,7 +125,7 @@ { "data": { "text/markdown": [ - "### # rowid_to_column " + "###
★ rowid_to_column
" ], "text/plain": [ "" @@ -156,7 +156,7 @@ { "data": { "text/markdown": [ - "### # column_to_rownames " + "###
★ column_to_rownames
" ], "text/plain": [ "" @@ -189,18 +189,18 @@ ], "source": [ "# https://tibble.tidyverse.org/reference/add_row.html\n", + "%run nb_helpers.py\n", "\n", "from datar.tibble import *\n", "from datar.base import head\n", "from datar.datasets import mtcars, iris\n", "\n", - "%run nb_helpers.py\n", "nb_header(has_rownames, remove_rownames, rownames_to_column, rowid_to_column, column_to_rownames, book='rownames')" ] }, { "cell_type": "code", - "execution_count": 3, + "execution_count": 2, "metadata": { "execution": { "iopub.execute_input": "2021-07-16T22:27:27.100163Z", @@ -216,7 +216,7 @@ "True" ] }, - "execution_count": 3, + "execution_count": 2, "metadata": {}, "output_type": "execute_result" } @@ -227,7 +227,7 @@ }, { "cell_type": "code", - "execution_count": 4, + "execution_count": 3, "metadata": { "execution": { "iopub.execute_input": "2021-07-16T22:27:27.111548Z", @@ -243,7 +243,7 @@ "False" ] }, - "execution_count": 4, + "execution_count": 3, "metadata": {}, "output_type": "execute_result" } @@ -254,7 +254,7 @@ }, { "cell_type": "code", - "execution_count": 5, + "execution_count": 4, "metadata": { "execution": { "iopub.execute_input": "2021-07-16T22:27:27.125381Z", @@ -270,7 +270,7 @@ "False" ] }, - "execution_count": 5, + "execution_count": 4, "metadata": {}, "output_type": "execute_result" } @@ -281,7 +281,7 @@ }, { "cell_type": "code", - "execution_count": 6, + "execution_count": 5, "metadata": { "execution": { "iopub.execute_input": "2021-07-16T22:27:27.135636Z", @@ -898,7 +898,7 @@ "31 2.780 18.60 1 1 4 2 " ] }, - "execution_count": 6, + "execution_count": 5, "metadata": {}, "output_type": "execute_result" } @@ -910,7 +910,7 @@ }, { "cell_type": "code", - "execution_count": 7, + "execution_count": 6, "metadata": { "execution": { "iopub.execute_input": "2021-07-16T22:27:27.372381Z", @@ -1077,7 +1077,7 @@ "Valiant 20.22 1 0 3 1 " ] }, - "execution_count": 7, + "execution_count": 6, "metadata": {}, "output_type": "execute_result" } @@ -1088,7 +1088,7 @@ }, { 
"cell_type": "code", - "execution_count": 8, + "execution_count": 7, "metadata": { "execution": { "iopub.execute_input": "2021-07-16T22:27:27.415514Z", @@ -1206,7 +1206,7 @@ "5 5.4 5 3.9 1.7 0.4 setosa" ] }, - "execution_count": 8, + "execution_count": 7, "metadata": {}, "output_type": "execute_result" } diff --git a/docs/notebooks/rows.ipynb b/docs/notebooks/rows.ipynb index 1c40ef36..7bb71c90 100644 --- a/docs/notebooks/rows.ipynb +++ b/docs/notebooks/rows.ipynb @@ -12,26 +12,10 @@ } }, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[2022-03-06 02:31:19][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 02:31:19][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 02:31:19][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 02:31:19][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 02:31:19][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 02:31:19][datar][WARNING] Builtin name \"all\" has been overriden by datar.\n", - "[2022-03-06 02:31:19][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-06 02:31:19][datar][WARNING] Builtin name \"re\" has been overriden by datar.\n", - "[2022-03-06 02:31:19][datar][WARNING] Builtin name \"filter\" has been overriden by datar.\n", - "[2022-03-06 02:31:19][datar][WARNING] Builtin name \"slice\" has been overriden by datar.\n" - ] - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -43,7 +27,7 @@ { "data": { "text/markdown": [ - "### # rows_insert " + "###
★ rows_insert
" ], "text/plain": [ "" @@ -90,7 +74,7 @@ { "data": { "text/markdown": [ - "### # rows_update " + "###
★ rows_update
" ], "text/plain": [ "" @@ -136,7 +120,7 @@ { "data": { "text/markdown": [ - "### # rows_patch " + "###
★ rows_patch
" ], "text/plain": [ "" @@ -182,7 +166,7 @@ { "data": { "text/markdown": [ - "### # rows_upsert " + "###
★ rows_upsert
" ], "text/plain": [ "" @@ -231,7 +215,7 @@ { "data": { "text/markdown": [ - "### # rows_delete " + "###
★ rows_delete
" ], "text/plain": [ "" @@ -276,9 +260,9 @@ } ], "source": [ + "%run nb_helpers.py\n", "from datar.all import *\n", "\n", - "%run nb_helpers.py\n", "nb_header(\n", " rows_insert, \n", " rows_update, \n", @@ -390,7 +374,7 @@ "name": "stderr", "output_type": "stream", "text": [ - "[2022-03-06 02:31:21][datar][ INFO] Matching, by='a'\n" + "[2022-03-18 17:35:21][datar][ INFO] Matching, by='a'\n" ] }, { @@ -488,7 +472,7 @@ "name": "stderr", "output_type": "stream", "text": [ - "[2022-03-06 02:31:21][datar][ INFO] Matching, by='a'\n" + "[2022-03-18 17:35:22][datar][ INFO] Matching, by='a'\n" ] }, { @@ -520,7 +504,7 @@ "name": "stderr", "output_type": "stream", "text": [ - "[2022-03-06 02:31:21][datar][ INFO] Matching, by='a'\n" + "[2022-03-18 17:35:22][datar][ INFO] Matching, by='a'\n" ] }, { @@ -695,7 +679,7 @@ "name": "stderr", "output_type": "stream", "text": [ - "[2022-03-06 02:31:21][datar][ INFO] Matching, by='a'\n" + "[2022-03-18 17:35:23][datar][ INFO] Matching, by='a'\n" ] }, { @@ -786,7 +770,7 @@ "name": "stderr", "output_type": "stream", "text": [ - "[2022-03-06 02:31:21][datar][ INFO] Matching, by='a'\n" + "[2022-03-18 17:35:24][datar][ INFO] Matching, by='a'\n" ] }, { @@ -884,7 +868,7 @@ "name": "stderr", "output_type": "stream", "text": [ - "[2022-03-06 02:31:22][datar][ INFO] Matching, by='a'\n" + "[2022-03-18 17:35:25][datar][ INFO] Matching, by='a'\n" ] }, { @@ -961,8 +945,8 @@ "name": "stderr", "output_type": "stream", "text": [ - "[2022-03-06 02:31:22][datar][ INFO] Matching, by='a'\n", - "[2022-03-06 02:31:22][datar][ INFO] Ignoring extra columns: ['b']\n" + "[2022-03-18 17:35:25][datar][ INFO] Matching, by='a'\n", + "[2022-03-18 17:35:25][datar][ INFO] Ignoring extra columns: ['b']\n" ] }, { diff --git a/docs/notebooks/rowwise.ipynb b/docs/notebooks/rowwise.ipynb index ddb0e5d6..932ed163 100644 --- a/docs/notebooks/rowwise.ipynb +++ b/docs/notebooks/rowwise.ipynb @@ -12,26 +12,10 @@ } }, "outputs": [ - { - "name": "stderr", - "output_type": "stream", 
- "text": [ - "[2022-03-06 02:33:14][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 02:33:14][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 02:33:14][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 02:33:14][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 02:33:14][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 02:33:14][datar][WARNING] Builtin name \"all\" has been overriden by datar.\n", - "[2022-03-06 02:33:14][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-06 02:33:14][datar][WARNING] Builtin name \"re\" has been overriden by datar.\n", - "[2022-03-06 02:33:14][datar][WARNING] Builtin name \"filter\" has been overriden by datar.\n", - "[2022-03-06 02:33:14][datar][WARNING] Builtin name \"slice\" has been overriden by datar.\n" - ] - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -43,7 +27,7 @@ { "data": { "text/markdown": [ - "### # rowwise " + "###
★ rowwise
" ], "text/plain": [ "" @@ -78,11 +62,10 @@ ], "source": [ "# https://dplyr.tidyverse.org/reference/rowwise.html\n", + "%run nb_helpers.py\n", "\n", - "from datar.datasets import iris\n", "from datar.all import *\n", "\n", - "%run nb_helpers.py\n", "nb_header(rowwise)" ] }, @@ -135,45 +118,45 @@ " \n", " \n", " 0\n", - " 0.903370\n", - " 0.381683\n", - " 0.289784\n", - " 0.524946\n", + " 0.598889\n", + " 0.750540\n", + " 0.165758\n", + " 0.505062\n", " \n", " \n", " 1\n", - " 0.862827\n", - " 0.432840\n", - " 0.152457\n", - " 0.482708\n", + " 0.639200\n", + " 0.945952\n", + " 0.339303\n", + " 0.641485\n", " \n", " \n", " 2\n", - " 0.329482\n", - " 0.993187\n", - " 0.022119\n", - " 0.448263\n", + " 0.415240\n", + " 0.725756\n", + " 0.184642\n", + " 0.441879\n", " \n", " \n", " 3\n", - " 0.329133\n", - " 0.365489\n", - " 0.841347\n", - " 0.511990\n", + " 0.375989\n", + " 0.432068\n", + " 0.113932\n", + " 0.307329\n", " \n", " \n", " 4\n", - " 0.376668\n", - " 0.604747\n", - " 0.967709\n", - " 0.649708\n", + " 0.361752\n", + " 0.253792\n", + " 0.621856\n", + " 0.412466\n", " \n", " \n", " 5\n", - " 0.808531\n", - " 0.968855\n", - " 0.165438\n", - " 0.647608\n", + " 0.260691\n", + " 0.200419\n", + " 0.391062\n", + " 0.284058\n", " \n", " \n", "\n", @@ -183,12 +166,12 @@ "text/plain": [ " x y z m\n", " \n", - "0 0.903370 0.381683 0.289784 0.524946\n", - "1 0.862827 0.432840 0.152457 0.482708\n", - "2 0.329482 0.993187 0.022119 0.448263\n", - "3 0.329133 0.365489 0.841347 0.511990\n", - "4 0.376668 0.604747 0.967709 0.649708\n", - "5 0.808531 0.968855 0.165438 0.647608\n", + "0 0.598889 0.750540 0.165758 0.505062\n", + "1 0.639200 0.945952 0.339303 0.641485\n", + "2 0.415240 0.725756 0.184642 0.441879\n", + "3 0.375989 0.432068 0.113932 0.307329\n", + "4 0.361752 0.253792 0.621856 0.412466\n", + "5 0.260691 0.200419 0.391062 0.284058\n", "[TibbleRowwise: (n=6)]" ] }, @@ -205,7 +188,7 @@ }, { "cell_type": "code", - "execution_count": 8, + "execution_count": 3, "metadata": 
{ "execution": { "iopub.execute_input": "2021-07-16T22:28:10.067015Z", @@ -252,45 +235,45 @@ " \n", " \n", " 0\n", - " 0.903370\n", - " 0.381683\n", - " 0.289784\n", - " 0.524946\n", + " 0.598889\n", + " 0.750540\n", + " 0.165758\n", + " 0.505062\n", " \n", " \n", " 1\n", - " 0.862827\n", - " 0.432840\n", - " 0.152457\n", - " 0.482708\n", + " 0.639200\n", + " 0.945952\n", + " 0.339303\n", + " 0.641485\n", " \n", " \n", " 2\n", - " 0.329482\n", - " 0.993187\n", - " 0.022119\n", - " 0.448263\n", + " 0.415240\n", + " 0.725756\n", + " 0.184642\n", + " 0.441879\n", " \n", " \n", " 3\n", - " 0.329133\n", - " 0.365489\n", - " 0.841347\n", - " 0.511990\n", + " 0.375989\n", + " 0.432068\n", + " 0.113932\n", + " 0.307329\n", " \n", " \n", " 4\n", - " 0.376668\n", - " 0.604747\n", - " 0.967709\n", - " 0.649708\n", + " 0.361752\n", + " 0.253792\n", + " 0.621856\n", + " 0.412466\n", " \n", " \n", " 5\n", - " 0.808531\n", - " 0.968855\n", - " 0.165438\n", - " 0.647608\n", + " 0.260691\n", + " 0.200419\n", + " 0.391062\n", + " 0.284058\n", " \n", " \n", "\n", @@ -300,16 +283,16 @@ "text/plain": [ " x y z m\n", " \n", - "0 0.903370 0.381683 0.289784 0.524946\n", - "1 0.862827 0.432840 0.152457 0.482708\n", - "2 0.329482 0.993187 0.022119 0.448263\n", - "3 0.329133 0.365489 0.841347 0.511990\n", - "4 0.376668 0.604747 0.967709 0.649708\n", - "5 0.808531 0.968855 0.165438 0.647608\n", + "0 0.598889 0.750540 0.165758 0.505062\n", + "1 0.639200 0.945952 0.339303 0.641485\n", + "2 0.415240 0.725756 0.184642 0.441879\n", + "3 0.375989 0.432068 0.113932 0.307329\n", + "4 0.361752 0.253792 0.621856 0.412466\n", + "5 0.260691 0.200419 0.391062 0.284058\n", "[TibbleRowwise: (n=6)]" ] }, - "execution_count": 8, + "execution_count": 3, "metadata": {}, "output_type": "execute_result" } @@ -320,7 +303,7 @@ }, { "cell_type": "code", - "execution_count": 9, + "execution_count": 4, "metadata": { "execution": { "iopub.execute_input": "2021-07-16T22:28:10.157870Z", @@ -367,45 +350,45 @@ " \n", " 
\n", " 0\n", - " 0.903370\n", - " 0.381683\n", - " 0.289784\n", - " 0.289784\n", + " 0.598889\n", + " 0.750540\n", + " 0.165758\n", + " 0.165758\n", " \n", " \n", " 1\n", - " 0.862827\n", - " 0.432840\n", - " 0.152457\n", - " 0.152457\n", + " 0.639200\n", + " 0.945952\n", + " 0.339303\n", + " 0.339303\n", " \n", " \n", " 2\n", - " 0.329482\n", - " 0.993187\n", - " 0.022119\n", - " 0.022119\n", + " 0.415240\n", + " 0.725756\n", + " 0.184642\n", + " 0.184642\n", " \n", " \n", " 3\n", - " 0.329133\n", - " 0.365489\n", - " 0.841347\n", - " 0.329133\n", + " 0.375989\n", + " 0.432068\n", + " 0.113932\n", + " 0.113932\n", " \n", " \n", " 4\n", - " 0.376668\n", - " 0.604747\n", - " 0.967709\n", - " 0.376668\n", + " 0.361752\n", + " 0.253792\n", + " 0.621856\n", + " 0.253792\n", " \n", " \n", " 5\n", - " 0.808531\n", - " 0.968855\n", - " 0.165438\n", - " 0.165438\n", + " 0.260691\n", + " 0.200419\n", + " 0.391062\n", + " 0.200419\n", " \n", " \n", "\n", @@ -415,16 +398,16 @@ "text/plain": [ " x y z m\n", " \n", - "0 0.903370 0.381683 0.289784 0.289784\n", - "1 0.862827 0.432840 0.152457 0.152457\n", - "2 0.329482 0.993187 0.022119 0.022119\n", - "3 0.329133 0.365489 0.841347 0.329133\n", - "4 0.376668 0.604747 0.967709 0.376668\n", - "5 0.808531 0.968855 0.165438 0.165438\n", + "0 0.598889 0.750540 0.165758 0.165758\n", + "1 0.639200 0.945952 0.339303 0.339303\n", + "2 0.415240 0.725756 0.184642 0.184642\n", + "3 0.375989 0.432068 0.113932 0.113932\n", + "4 0.361752 0.253792 0.621856 0.253792\n", + "5 0.260691 0.200419 0.391062 0.200419\n", "[TibbleRowwise: (n=6)]" ] }, - "execution_count": 9, + "execution_count": 4, "metadata": {}, "output_type": "execute_result" } @@ -435,7 +418,7 @@ }, { "cell_type": "code", - "execution_count": 13, + "execution_count": 5, "metadata": { "execution": { "iopub.execute_input": "2021-07-16T22:28:10.231704Z", @@ -482,45 +465,45 @@ " \n", " \n", " 0\n", - " 0.903370\n", - " 0.381683\n", - " 0.289784\n", - " 0.289784\n", + " 0.598889\n", + " 
0.750540\n", + " 0.165758\n", + " 0.165758\n", " \n", " \n", " 1\n", - " 0.862827\n", - " 0.432840\n", - " 0.152457\n", - " 0.152457\n", + " 0.639200\n", + " 0.945952\n", + " 0.339303\n", + " 0.339303\n", " \n", " \n", " 2\n", - " 0.329482\n", - " 0.993187\n", - " 0.022119\n", - " 0.022119\n", + " 0.415240\n", + " 0.725756\n", + " 0.184642\n", + " 0.184642\n", " \n", " \n", " 3\n", - " 0.329133\n", - " 0.365489\n", - " 0.841347\n", - " 0.329133\n", + " 0.375989\n", + " 0.432068\n", + " 0.113932\n", + " 0.113932\n", " \n", " \n", " 4\n", - " 0.376668\n", - " 0.604747\n", - " 0.967709\n", - " 0.376668\n", + " 0.361752\n", + " 0.253792\n", + " 0.621856\n", + " 0.253792\n", " \n", " \n", " 5\n", - " 0.808531\n", - " 0.968855\n", - " 0.165438\n", - " 0.165438\n", + " 0.260691\n", + " 0.200419\n", + " 0.391062\n", + " 0.200419\n", " \n", " \n", "\n", @@ -530,16 +513,16 @@ "text/plain": [ " x y z m\n", " \n", - "0 0.903370 0.381683 0.289784 0.289784\n", - "1 0.862827 0.432840 0.152457 0.152457\n", - "2 0.329482 0.993187 0.022119 0.022119\n", - "3 0.329133 0.365489 0.841347 0.329133\n", - "4 0.376668 0.604747 0.967709 0.376668\n", - "5 0.808531 0.968855 0.165438 0.165438\n", + "0 0.598889 0.750540 0.165758 0.165758\n", + "1 0.639200 0.945952 0.339303 0.339303\n", + "2 0.415240 0.725756 0.184642 0.184642\n", + "3 0.375989 0.432068 0.113932 0.113932\n", + "4 0.361752 0.253792 0.621856 0.253792\n", + "5 0.260691 0.200419 0.391062 0.200419\n", "[TibbleRowwise: (n=6)]" ] }, - "execution_count": 13, + "execution_count": 5, "metadata": {}, "output_type": "execute_result" } @@ -550,7 +533,7 @@ }, { "cell_type": "code", - "execution_count": 14, + "execution_count": 6, "metadata": { "execution": { "iopub.execute_input": "2021-07-16T22:28:10.245426Z", @@ -597,45 +580,45 @@ " \n", " \n", " 0\n", - " 0.903370\n", - " 0.381683\n", - " 0.289784\n", - " 0.289784\n", + " 0.598889\n", + " 0.750540\n", + " 0.165758\n", + " 0.165758\n", " \n", " \n", " 1\n", - " 0.862827\n", - " 0.432840\n", 
- " 0.152457\n", - " 0.152457\n", + " 0.639200\n", + " 0.945952\n", + " 0.339303\n", + " 0.339303\n", " \n", " \n", " 2\n", - " 0.329482\n", - " 0.993187\n", - " 0.022119\n", - " 0.022119\n", + " 0.415240\n", + " 0.725756\n", + " 0.184642\n", + " 0.184642\n", " \n", " \n", " 3\n", - " 0.329133\n", - " 0.365489\n", - " 0.841347\n", - " 0.329133\n", + " 0.375989\n", + " 0.432068\n", + " 0.113932\n", + " 0.113932\n", " \n", " \n", " 4\n", - " 0.376668\n", - " 0.604747\n", - " 0.967709\n", - " 0.376668\n", + " 0.361752\n", + " 0.253792\n", + " 0.621856\n", + " 0.253792\n", " \n", " \n", " 5\n", - " 0.808531\n", - " 0.968855\n", - " 0.165438\n", - " 0.165438\n", + " 0.260691\n", + " 0.200419\n", + " 0.391062\n", + " 0.200419\n", " \n", " \n", "\n", @@ -644,15 +627,15 @@ "text/plain": [ " x y z m\n", " \n", - "0 0.903370 0.381683 0.289784 0.289784\n", - "1 0.862827 0.432840 0.152457 0.152457\n", - "2 0.329482 0.993187 0.022119 0.022119\n", - "3 0.329133 0.365489 0.841347 0.329133\n", - "4 0.376668 0.604747 0.967709 0.376668\n", - "5 0.808531 0.968855 0.165438 0.165438" + "0 0.598889 0.750540 0.165758 0.165758\n", + "1 0.639200 0.945952 0.339303 0.339303\n", + "2 0.415240 0.725756 0.184642 0.184642\n", + "3 0.375989 0.432068 0.113932 0.113932\n", + "4 0.361752 0.253792 0.621856 0.253792\n", + "5 0.260691 0.200419 0.391062 0.200419" ] }, - "execution_count": 14, + "execution_count": 6, "metadata": {}, "output_type": "execute_result" } @@ -663,7 +646,7 @@ }, { "cell_type": "code", - "execution_count": 16, + "execution_count": 7, "metadata": { "execution": { "iopub.execute_input": "2021-07-16T22:28:10.296858Z", @@ -716,7 +699,7 @@ " 1\n", " 1\n", " 1\n", - " [-0.49710972258374775]\n", + " [-0.7634531680295189]\n", " \n", " \n", " 1\n", @@ -724,7 +707,7 @@ " 2\n", " 2\n", " 4\n", - " [-5.952767882433143, 1.3006955205328627]\n", + " [1.3116228201838442, -2.3156113026975653]\n", " \n", " \n", " 2\n", @@ -732,7 +715,7 @@ " 3\n", " 1\n", " 2\n", - " [-0.034757059529934686, 
1.211681840606102, 0.4...\n", + " [1.47493909065586, -1.074116930262953, -1.0587...\n", " \n", " \n", "\n", @@ -748,13 +731,13 @@ "\n", " z \n", " \n", - "0 [-0.49710972258374775] \n", - "1 [-5.952767882433143, 1.3006955205328627] \n", - "2 [-0.034757059529934686, 1.211681840606102, 0.4... \n", + "0 [-0.7634531680295189] \n", + "1 [1.3116228201838442, -2.3156113026975653] \n", + "2 [1.47493909065586, -1.074116930262953, -1.0587... \n", "[TibbleRowwise: sim (n=3)]" ] }, - "execution_count": 16, + "execution_count": 7, "metadata": {}, "output_type": "execute_result" } diff --git a/docs/notebooks/select.ipynb b/docs/notebooks/select.ipynb index 742bbbaa..830a73c7 100644 --- a/docs/notebooks/select.ipynb +++ b/docs/notebooks/select.ipynb @@ -12,26 +12,10 @@ } }, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[2022-03-06 02:33:21][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 02:33:21][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 02:33:21][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 02:33:21][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 02:33:21][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 02:33:21][datar][WARNING] Builtin name \"all\" has been overriden by datar.\n", - "[2022-03-06 02:33:21][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-06 02:33:21][datar][WARNING] Builtin name \"re\" has been overriden by datar.\n", - "[2022-03-06 02:33:21][datar][WARNING] Builtin name \"filter\" has been overriden by datar.\n", - "[2022-03-06 02:33:21][datar][WARNING] Builtin name \"slice\" has been overriden by datar.\n" - ] - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -43,7 +27,7 @@ { "data": { "text/markdown": [ - "### # select " + "###
★ select
" ], "text/plain": [ "" @@ -83,10 +67,11 @@ ], "source": [ "# https://dplyr.tidyverse.org/reference/select.html\n", + "%run nb_helpers.py\n", + "\n", "from datar.datasets import starwars, iris\n", "from datar.all import *\n", "\n", - "%run nb_helpers.py\n", "nb_header(select)" ] }, @@ -1979,7 +1964,7 @@ }, { "cell_type": "code", - "execution_count": 16, + "execution_count": 15, "metadata": { "execution": { "iopub.execute_input": "2021-07-16T22:27:15.890597Z", @@ -2124,7 +2109,7 @@ "[150 rows x 4 columns]" ] }, - "execution_count": 16, + "execution_count": 15, "metadata": {}, "output_type": "execute_result" } diff --git a/docs/notebooks/separate.ipynb b/docs/notebooks/separate.ipynb index ea1226d5..cf2593cc 100644 --- a/docs/notebooks/separate.ipynb +++ b/docs/notebooks/separate.ipynb @@ -13,26 +13,10 @@ } }, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[2022-03-06 02:33:28][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 02:33:28][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 02:33:28][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 02:33:28][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 02:33:28][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 02:33:28][datar][WARNING] Builtin name \"all\" has been overriden by datar.\n", - "[2022-03-06 02:33:28][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-06 02:33:28][datar][WARNING] Builtin name \"re\" has been overriden by datar.\n", - "[2022-03-06 02:33:28][datar][WARNING] Builtin name \"filter\" has been overriden by datar.\n", - "[2022-03-06 02:33:28][datar][WARNING] Builtin name \"slice\" has been overriden by datar.\n" - ] - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -44,7 +28,7 @@ { "data": { "text/markdown": [ - "### # separate " + "###
★ separate
" ], "text/plain": [ "" @@ -109,7 +93,7 @@ { "data": { "text/markdown": [ - "### # separate_rows " + "###
★ separate_rows
" ], "text/plain": [ "" @@ -143,10 +127,10 @@ ], "source": [ "# https://tidyr.tidyverse.org/reference/separate.html\n", + "%run nb_helpers.py\n", "\n", "from datar.all import *\n", "\n", - "%run nb_helpers.py\n", "nb_header(separate, separate_rows)" ] }, @@ -334,8 +318,8 @@ "name": "stderr", "output_type": "stream", "text": [ - "[2022-03-06 02:33:30][datar][WARNING] Expected 2 pieces. Additional pieces discarded in 1 rows ['x y z'].\n", - "[2022-03-06 02:33:30][datar][WARNING] Expected 2 pieces. Missing pieces filled with `NA` in 1 rows ['x'].\n" + "[2022-03-18 17:04:11][datar][WARNING] Expected 2 pieces. Additional pieces discarded in 1 rows ['x y z'].\n", + "[2022-03-18 17:04:11][datar][WARNING] Expected 2 pieces. Missing pieces filled with `NA` in 1 rows ['x'].\n" ] }, { @@ -601,7 +585,7 @@ "name": "stderr", "output_type": "stream", "text": [ - "[2022-03-06 02:33:33][datar][WARNING] Expected 3 pieces. Missing pieces filled with `NA` in 2 rows ['x', 'x y'].\n" + "[2022-03-18 17:04:14][datar][WARNING] Expected 3 pieces. Missing pieces filled with `NA` in 2 rows ['x', 'x y'].\n" ] }, { @@ -862,7 +846,7 @@ "name": "stderr", "output_type": "stream", "text": [ - "[2022-03-06 02:33:37][datar][WARNING] Expected 2 pieces. Missing pieces filled with `NA` in 1 rows ['z'].\n" + "[2022-03-18 17:04:16][datar][WARNING] Expected 2 pieces. Missing pieces filled with `NA` in 1 rows ['z'].\n" ] }, { @@ -947,7 +931,7 @@ }, { "cell_type": "code", - "execution_count": 11, + "execution_count": 12, "id": "f1a9ec03", "metadata": { "execution": { @@ -962,83 +946,9 @@ "name": "stderr", "output_type": "stream", "text": [ - "[2022-03-06 02:33:38][datar][WARNING] Expected 2 pieces. Missing pieces filled with `NA` in 1 rows ['z'].\n" + "[2022-03-18 17:04:58][datar][WARNING] Expected 2 pieces. Missing pieces filled with `NA` in 1 rows ['z'].\n" ] }, - { - "data": { - "text/html": [ - "
\n", - "\n", - "\n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - "
keyvalue
<object><float64>
0x1.0
1x2.0
2y4.0
3zNaN
4NaNNaN
\n", - "
\n" - ], - "text/plain": [ - " key value\n", - " \n", - "0 x 1.0\n", - "1 x 2.0\n", - "2 y 4.0\n", - "3 z NaN\n", - "4 NaN NaN" - ] - }, - "execution_count": 11, - "metadata": {}, - "output_type": "execute_result" - }, { "data": { "text/plain": [ @@ -1047,19 +957,19 @@ "dtype: object" ] }, - "execution_count": 11, + "execution_count": 12, "metadata": {}, "output_type": "execute_result" } ], "source": [ - "df >> separate(f.x, c(\"key\",\"value\"), \":\", convert={'value': float}) \n", - "_.dtypes" + "out = df >> separate(f.x, c(\"key\",\"value\"), \":\", convert={'value': float}) \n", + "out.dtypes" ] }, { "cell_type": "code", - "execution_count": 12, + "execution_count": 13, "id": "c7af94b8", "metadata": { "execution": { @@ -1080,7 +990,7 @@ }, { "cell_type": "code", - "execution_count": 13, + "execution_count": 14, "id": "47243faf", "metadata": { "execution": { @@ -1175,7 +1085,7 @@ "5 3 h 6" ] }, - "execution_count": 13, + "execution_count": 14, "metadata": {}, "output_type": "execute_result" } diff --git a/docs/notebooks/setops.ipynb b/docs/notebooks/setops.ipynb index 43f2cd8e..281a2be4 100644 --- a/docs/notebooks/setops.ipynb +++ b/docs/notebooks/setops.ipynb @@ -13,26 +13,10 @@ } }, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[2022-03-06 02:33:42][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 02:33:42][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 02:33:42][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 02:33:42][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 02:33:42][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 02:33:42][datar][WARNING] Builtin name \"all\" has been overriden by datar.\n", - "[2022-03-06 02:33:42][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-06 02:33:42][datar][WARNING] Builtin 
name \"re\" has been overriden by datar.\n", - "[2022-03-06 02:33:42][datar][WARNING] Builtin name \"filter\" has been overriden by datar.\n", - "[2022-03-06 02:33:42][datar][WARNING] Builtin name \"slice\" has been overriden by datar.\n" - ] - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -44,7 +28,7 @@ { "data": { "text/markdown": [ - "### # intersect " + "###
★ intersect
" ], "text/plain": [ "" @@ -68,7 +52,7 @@ { "data": { "text/markdown": [ - "### # union " + "###
★ union
" ], "text/plain": [ "" @@ -92,7 +76,7 @@ { "data": { "text/markdown": [ - "### # setdiff " + "###
★ setdiff
" ], "text/plain": [ "" @@ -116,7 +100,7 @@ { "data": { "text/markdown": [ - "### # union_all " + "###
★ union_all
" ], "text/plain": [ "" @@ -147,7 +131,7 @@ { "data": { "text/markdown": [ - "### # setequal " + "###
★ setequal
" ], "text/plain": [ "" @@ -171,11 +155,11 @@ ], "source": [ "# https://dplyr.tidyverse.org/reference/setops.html\n", + "%run nb_helpers.py\n", "\n", "from datar.datasets import mtcars\n", "from datar.all import *\n", "\n", - "%run nb_helpers.py\n", "nb_header(intersect, union, setdiff, union_all, setequal, book='setops')" ] }, diff --git a/docs/notebooks/slice.ipynb b/docs/notebooks/slice.ipynb index b95a440d..ed17539d 100644 --- a/docs/notebooks/slice.ipynb +++ b/docs/notebooks/slice.ipynb @@ -13,26 +13,10 @@ } }, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[2022-03-06 02:11:36][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 02:11:36][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 02:11:36][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 02:11:36][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 02:11:36][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 02:11:36][datar][WARNING] Builtin name \"all\" has been overriden by datar.\n", - "[2022-03-06 02:11:36][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-06 02:11:36][datar][WARNING] Builtin name \"re\" has been overriden by datar.\n", - "[2022-03-06 02:11:36][datar][WARNING] Builtin name \"filter\" has been overriden by datar.\n", - "[2022-03-06 02:11:36][datar][WARNING] Builtin name \"slice\" has been overriden by datar.\n" - ] - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -44,7 +28,7 @@ { "data": { "text/markdown": [ - "### # slice " + "###
★ slice
" ], "text/plain": [ "" @@ -94,7 +78,7 @@ { "data": { "text/markdown": [ - "### # slice_head " + "###
★ slice_head
" ], "text/plain": [ "" @@ -132,7 +116,7 @@ { "data": { "text/markdown": [ - "### # slice_max " + "###
★ slice_max
" ], "text/plain": [ "" @@ -159,7 +143,7 @@ { "data": { "text/markdown": [ - "### # slice_min " + "###
★ slice_min
" ], "text/plain": [ "" @@ -198,7 +182,7 @@ { "data": { "text/markdown": [ - "### # slice_sample " + "###
★ slice_sample
" ], "text/plain": [ "" @@ -225,7 +209,7 @@ { "data": { "text/markdown": [ - "### # slice_tail " + "###
★ slice_tail
" ], "text/plain": [ "" @@ -252,11 +236,11 @@ ], "source": [ "# https://dplyr.tidyverse.org/reference/slice.html\n", + "%run nb_helpers.py\n", "\n", "from datar.datasets import mtcars\n", "from datar.all import *\n", "\n", - "%run nb_helpers.py\n", "nb_header(slice, slice_head, slice_max, slice_min, slice_sample, slice_tail)" ] }, @@ -361,7 +345,7 @@ }, { "cell_type": "code", - "execution_count": 29, + "execution_count": 3, "id": "93030877", "metadata": { "execution": { @@ -449,7 +433,7 @@ "Volvo 142E 1 1 4 2 " ] }, - "execution_count": 29, + "execution_count": 3, "metadata": {}, "output_type": "execute_result" } @@ -3084,18 +3068,18 @@ " <int64>\n", " \n", " \n", - " Valiant\n", - " 18.1\n", - " 6\n", - " 225.0\n", - " 105\n", + " Dodge Challenger\n", + " 15.5\n", + " 8\n", + " 318.0\n", + " 150\n", " 2.76\n", - " 3.460\n", - " 20.22\n", - " 1\n", + " 3.52\n", + " 16.87\n", + " 0\n", " 0\n", " 3\n", - " 1\n", + " 2\n", " \n", " \n", " Ford Pantera L\n", @@ -3104,7 +3088,7 @@ " 351.0\n", " 264\n", " 4.22\n", - " 3.170\n", + " 3.17\n", " 14.50\n", " 0\n", " 1\n", @@ -3112,67 +3096,67 @@ " 4\n", " \n", " \n", - " Porsche 914-2\n", - " 26.0\n", - " 4\n", - " 120.3\n", - " 91\n", - " 4.43\n", - " 2.140\n", - " 16.70\n", - " 0\n", - " 1\n", - " 5\n", - " 2\n", - " \n", - " \n", - " Toyota Corolla\n", - " 33.9\n", + " Fiat 128\n", + " 32.4\n", " 4\n", - " 71.1\n", - " 65\n", - " 4.22\n", - " 1.835\n", - " 19.90\n", + " 78.7\n", + " 66\n", + " 4.08\n", + " 2.20\n", + " 19.47\n", " 1\n", " 1\n", " 4\n", " 1\n", " \n", " \n", - " Merc 280C\n", - " 17.8\n", - " 6\n", - " 167.6\n", - " 123\n", - " 3.92\n", - " 3.440\n", - " 18.90\n", + " Maserati Bora\n", + " 15.0\n", + " 8\n", + " 301.0\n", + " 335\n", + " 3.54\n", + " 3.57\n", + " 14.60\n", + " 0\n", " 1\n", + " 5\n", + " 8\n", + " \n", + " \n", + " Merc 450SL\n", + " 17.3\n", + " 8\n", + " 275.8\n", + " 180\n", + " 3.07\n", + " 3.73\n", + " 17.60\n", " 0\n", - " 4\n", - " 4\n", + " 0\n", + " 3\n", + " 3\n", " \n", " \n", 
"\n", "\n" ], "text/plain": [ - " mpg cyl disp hp drat wt \\\n", - " \n", - "Valiant 18.1 6 225.0 105 2.76 3.460 \n", - "Ford Pantera L 15.8 8 351.0 264 4.22 3.170 \n", - "Porsche 914-2 26.0 4 120.3 91 4.43 2.140 \n", - "Toyota Corolla 33.9 4 71.1 65 4.22 1.835 \n", - "Merc 280C 17.8 6 167.6 123 3.92 3.440 \n", + " mpg cyl disp hp drat wt \\\n", + " \n", + "Dodge Challenger 15.5 8 318.0 150 2.76 3.52 \n", + "Ford Pantera L 15.8 8 351.0 264 4.22 3.17 \n", + "Fiat 128 32.4 4 78.7 66 4.08 2.20 \n", + "Maserati Bora 15.0 8 301.0 335 3.54 3.57 \n", + "Merc 450SL 17.3 8 275.8 180 3.07 3.73 \n", "\n", - " qsec vs am gear carb \n", - " \n", - "Valiant 20.22 1 0 3 1 \n", - "Ford Pantera L 14.50 0 1 5 4 \n", - "Porsche 914-2 16.70 0 1 5 2 \n", - "Toyota Corolla 19.90 1 1 4 1 \n", - "Merc 280C 18.90 1 0 4 4 " + " qsec vs am gear carb \n", + " \n", + "Dodge Challenger 16.87 0 0 3 2 \n", + "Ford Pantera L 14.50 0 1 5 4 \n", + "Fiat 128 19.47 1 1 4 1 \n", + "Maserati Bora 14.60 0 1 5 8 \n", + "Merc 450SL 17.60 0 0 3 3 " ] }, "execution_count": 15, @@ -3736,95 +3720,95 @@ " <int64>\n", " \n", " \n", - " Pontiac Firebird\n", - " 19.2\n", + " Merc 450SE\n", + " 16.4\n", " 8\n", - " 400.0\n", - " 175\n", - " 3.08\n", - " 3.845\n", - " 17.05\n", + " 275.8\n", + " 180\n", + " 3.07\n", + " 4.070\n", + " 17.40\n", " 0\n", " 0\n", " 3\n", - " 2\n", + " 3\n", " \n", " \n", - " Merc 240D\n", - " 24.4\n", - " 4\n", - " 146.7\n", - " 62\n", - " 3.69\n", - " 3.190\n", - " 20.00\n", + " Merc 280C\n", + " 17.8\n", + " 6\n", + " 167.6\n", + " 123\n", + " 3.92\n", + " 3.440\n", + " 18.90\n", " 1\n", " 0\n", " 4\n", - " 2\n", - " \n", - " \n", - " Cadillac Fleetwood\n", - " 10.4\n", - " 8\n", - " 472.0\n", - " 205\n", - " 2.93\n", - " 5.250\n", - " 17.98\n", - " 0\n", - " 0\n", - " 3\n", " 4\n", " \n", " \n", - " Ferrari Dino\n", - " 19.7\n", - " 6\n", - " 145.0\n", - " 175\n", - " 3.62\n", - " 2.770\n", - " 15.50\n", - " 0\n", + " Lotus Europa\n", + " 30.4\n", + " 4\n", + " 95.1\n", + " 113\n", + 
" 3.77\n", + " 1.513\n", + " 16.90\n", + " 1\n", " 1\n", " 5\n", - " 6\n", + " 2\n", " \n", " \n", - " Mazda RX4 Wag\n", + " Mazda RX4\n", " 21.0\n", " 6\n", " 160.0\n", " 110\n", " 3.90\n", - " 2.875\n", - " 17.02\n", + " 2.620\n", + " 16.46\n", " 0\n", " 1\n", " 4\n", " 4\n", " \n", + " \n", + " Camaro Z28\n", + " 13.3\n", + " 8\n", + " 350.0\n", + " 245\n", + " 3.73\n", + " 3.840\n", + " 15.41\n", + " 0\n", + " 0\n", + " 3\n", + " 4\n", + " \n", " \n", "\n", "\n" ], "text/plain": [ - " mpg cyl disp hp drat wt \\\n", - " \n", - "Pontiac Firebird 19.2 8 400.0 175 3.08 3.845 \n", - "Merc 240D 24.4 4 146.7 62 3.69 3.190 \n", - "Cadillac Fleetwood 10.4 8 472.0 205 2.93 5.250 \n", - "Ferrari Dino 19.7 6 145.0 175 3.62 2.770 \n", - "Mazda RX4 Wag 21.0 6 160.0 110 3.90 2.875 \n", + " mpg cyl disp hp drat wt \\\n", + " \n", + "Merc 450SE 16.4 8 275.8 180 3.07 4.070 \n", + "Merc 280C 17.8 6 167.6 123 3.92 3.440 \n", + "Lotus Europa 30.4 4 95.1 113 3.77 1.513 \n", + "Mazda RX4 21.0 6 160.0 110 3.90 2.620 \n", + "Camaro Z28 13.3 8 350.0 245 3.73 3.840 \n", "\n", - " qsec vs am gear carb \n", - " \n", - "Pontiac Firebird 17.05 0 0 3 2 \n", - "Merc 240D 20.00 1 0 4 2 \n", - "Cadillac Fleetwood 17.98 0 0 3 4 \n", - "Ferrari Dino 15.50 0 1 5 6 \n", - "Mazda RX4 Wag 17.02 0 1 4 4 " + " qsec vs am gear carb \n", + " \n", + "Merc 450SE 17.40 0 0 3 3 \n", + "Merc 280C 18.90 1 0 4 4 \n", + "Lotus Europa 16.90 1 1 5 2 \n", + "Mazda RX4 16.46 0 1 4 4 \n", + "Camaro Z28 15.41 0 0 3 4 " ] }, "execution_count": 19, @@ -3883,27 +3867,27 @@ " \n", " 0\n", " a\n", - " 0.809743\n", + " 0.739922\n", " \n", " \n", " 1\n", " b\n", - " 0.110534\n", + " 0.033397\n", " \n", " \n", " 2\n", " b\n", - " 0.363136\n", + " 0.851489\n", " \n", " \n", " 3\n", " c\n", - " 0.857736\n", + " 0.886006\n", " \n", " \n", " 4\n", " c\n", - " 0.187621\n", + " 0.068798\n", " \n", " \n", "\n", @@ -3913,11 +3897,11 @@ "text/plain": [ " group x\n", " \n", - "0 a 0.809743\n", - "1 b 0.110534\n", - "2 b 0.363136\n", - 
"3 c 0.857736\n", - "4 c 0.187621\n", + "0 a 0.739922\n", + "1 b 0.033397\n", + "2 b 0.851489\n", + "3 c 0.886006\n", + "4 c 0.068798\n", "[TibbleGrouped: group (n=3)]" ] }, @@ -3981,17 +3965,17 @@ " \n", " 0\n", " b\n", - " 0.110534\n", + " 0.033397\n", " \n", " \n", " 1\n", " c\n", - " 0.857736\n", + " 0.886006\n", " \n", " \n", " 2\n", " c\n", - " 0.187621\n", + " 0.068798\n", " \n", " \n", "\n", @@ -4001,9 +3985,9 @@ "text/plain": [ " group x\n", " \n", - "0 b 0.110534\n", - "1 c 0.857736\n", - "2 c 0.187621\n", + "0 b 0.033397\n", + "1 c 0.886006\n", + "2 c 0.068798\n", "[TibbleGrouped: group (n=2)]" ] }, @@ -5372,32 +5356,32 @@ " \n", " 0\n", " a\n", - " 0.024847\n", + " 0.137090\n", " \n", " \n", " 1\n", " a\n", - " 0.389788\n", + " 0.160933\n", " \n", " \n", " 2\n", " b\n", - " 0.001498\n", + " 0.066202\n", " \n", " \n", " 3\n", " b\n", - " 0.016201\n", + " 0.138360\n", " \n", " \n", " 4\n", " c\n", - " 0.004985\n", + " 0.043403\n", " \n", " \n", " 5\n", " c\n", - " 0.052600\n", + " 0.068841\n", " \n", " \n", "\n", @@ -5407,12 +5391,12 @@ "text/plain": [ " group x\n", " \n", - "0 a 0.024847\n", - "1 a 0.389788\n", - "2 b 0.001498\n", - "3 b 0.016201\n", - "4 c 0.004985\n", - "5 c 0.052600\n", + "0 a 0.137090\n", + "1 a 0.160933\n", + "2 b 0.066202\n", + "3 b 0.138360\n", + "4 c 0.043403\n", + "5 c 0.068841\n", "[TibbleGrouped: group (n=3)]" ] }, @@ -5476,32 +5460,32 @@ " \n", " 0\n", " a\n", - " 0.979691\n", + " 0.983779\n", " \n", " \n", " 1\n", " a\n", - " 0.969839\n", + " 0.872443\n", " \n", " \n", " 2\n", " b\n", - " 0.967242\n", + " 0.987097\n", " \n", " \n", " 3\n", " b\n", - " 0.906166\n", + " 0.936791\n", " \n", " \n", " 4\n", " c\n", - " 0.995052\n", + " 0.984012\n", " \n", " \n", " 5\n", " c\n", - " 0.994709\n", + " 0.932186\n", " \n", " \n", "\n", @@ -5511,12 +5495,12 @@ "text/plain": [ " group x\n", " \n", - "0 a 0.979691\n", - "1 a 0.969839\n", - "2 b 0.967242\n", - "3 b 0.906166\n", - "4 c 0.995052\n", - "5 c 0.994709\n", + "0 a 0.983779\n", + 
"1 a 0.872443\n", + "2 b 0.987097\n", + "3 b 0.936791\n", + "4 c 0.984012\n", + "5 c 0.932186\n", "[TibbleGrouped: group (n=3)]" ] }, @@ -5576,32 +5560,32 @@ " \n", " 0\n", " a\n", - " 0.903480\n", + " 0.461532\n", " \n", " \n", " 1\n", " a\n", - " 0.969839\n", + " 0.137090\n", " \n", " \n", " 2\n", " b\n", - " 0.464387\n", + " 0.987097\n", " \n", " \n", " 3\n", " b\n", - " 0.122231\n", + " 0.816681\n", " \n", " \n", " 4\n", " c\n", - " 0.804479\n", + " 0.390507\n", " \n", " \n", " 5\n", " c\n", - " 0.994709\n", + " 0.677276\n", " \n", " \n", "\n", @@ -5611,12 +5595,12 @@ "text/plain": [ " group x\n", " \n", - "0 a 0.903480\n", - "1 a 0.969839\n", - "2 b 0.464387\n", - "3 b 0.122231\n", - "4 c 0.804479\n", - "5 c 0.994709\n", + "0 a 0.461532\n", + "1 a 0.137090\n", + "2 b 0.987097\n", + "3 b 0.816681\n", + "4 c 0.390507\n", + "5 c 0.677276\n", "[TibbleGrouped: group (n=3)]" ] }, diff --git a/docs/notebooks/summarise.ipynb b/docs/notebooks/summarise.ipynb index 3452397d..ed1a0263 100644 --- a/docs/notebooks/summarise.ipynb +++ b/docs/notebooks/summarise.ipynb @@ -13,26 +13,10 @@ } }, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[2022-03-06 18:08:44][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 18:08:44][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 18:08:44][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 18:08:44][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 18:08:44][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 18:08:44][datar][WARNING] Builtin name \"all\" has been overriden by datar.\n", - "[2022-03-06 18:08:44][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-06 18:08:44][datar][WARNING] Builtin name \"re\" has been overriden by datar.\n", - "[2022-03-06 18:08:44][datar][WARNING] Builtin name 
\"filter\" has been overriden by datar.\n", - "[2022-03-06 18:08:44][datar][WARNING] Builtin name \"slice\" has been overriden by datar.\n" - ] - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -44,7 +28,7 @@ { "data": { "text/markdown": [ - "### # summarise " + "###
★ summarise
" ], "text/plain": [ "" @@ -64,30 +48,6 @@ "\n", "Aliases - `summarize` \n", "\n", - "##### Examples:\n", - "  >>> df = tibble(x=[1,2,3,4]) \n", - "  >>> df >> summarise(y=sum(f.x), z=f.y*2) \n", - "  >>> # y z \n", - "  >>> # 0 10 20 \n", - "  >>> df >> summarise(y=sum(f.x), z=f.x+f.y) # fail \n", - "\n", - "  But they should not be mixed in later argument. For example: \n", - "  >>> df = tibble(x=[1,2,3,4], g=list('aabb')) >> group_by(f.g) \n", - "  >>> df >> summarise(n=n() + f.x) \n", - "  >>> # as expected: \n", - "  >>> g n \n", - "  >>> # 0 a 3 \n", - "  >>> # 1 a 4 \n", - "  >>> # 2 b 5 \n", - "  >>> # 3 b 6 \n", - "  >>> # [Groups: ['g'] (n=2)] \n", - "  >>> # However: \n", - "  >>> df >> summarise(y=1, n=n() + f.y) \n", - "  >>> # n() will be recycling output instead of input \n", - "  >>> # g y n \n", - "  >>> # 0 a 1 2 \n", - "  >>> # 1 b 1 2 \n", - "\n", "##### Args:\n", "  `_groups`: Grouping structure of the result. \n", "    - \"drop_last\": dropping the last level of grouping.\n", @@ -115,11 +75,11 @@ ], "source": [ "# https://dplyr.tidyverse.org/reference/summarise.html\n", + "%run nb_helpers.py\n", "\n", "from datar.datasets import mtcars, starwars\n", "from datar.all import *\n", "\n", - "%run nb_helpers.py\n", "nb_header(summarise)" ] }, @@ -295,7 +255,7 @@ "name": "stderr", "output_type": "stream", "text": [ - "[2022-03-06 18:08:47][datar][ INFO] `summarise()` has grouped output by ['cyl'] (override with `_groups` argument)\n" + "[2022-03-18 17:33:44][datar][ INFO] `summarise()` has grouped output by ['cyl'] (override with `_groups` argument)\n" ] }, { @@ -508,7 +468,7 @@ }, { "cell_type": "code", - "execution_count": 8, + "execution_count": 6, "id": "e5098761", "metadata": { "execution": { @@ -523,7 +483,7 @@ "name": "stderr", "output_type": "stream", "text": [ - "[2022-03-06 18:10:24][datar][ INFO] `summarise()` has grouped output by ['cyl'] (override with `_groups` argument)\n" + "[2022-03-18 17:33:45][datar][ INFO] `summarise()` has 
grouped output by ['cyl'] (override with `_groups` argument)\n" ] }, { @@ -532,7 +492,7 @@ "['cyl']" ] }, - "execution_count": 8, + "execution_count": 6, "metadata": {}, "output_type": "execute_result" } @@ -546,7 +506,7 @@ }, { "cell_type": "code", - "execution_count": 9, + "execution_count": 7, "id": "01a62149", "metadata": { "execution": { @@ -620,7 +580,7 @@ "2 8 353.100000 NaN" ] }, - "execution_count": 9, + "execution_count": 7, "metadata": {}, "output_type": "execute_result" } @@ -634,7 +594,7 @@ }, { "cell_type": "code", - "execution_count": 10, + "execution_count": 8, "id": "d2f97ff6", "metadata": { "execution": { @@ -703,7 +663,7 @@ "2 8 706.200000" ] }, - "execution_count": 10, + "execution_count": 8, "metadata": {}, "output_type": "execute_result" } @@ -717,7 +677,7 @@ }, { "cell_type": "code", - "execution_count": 11, + "execution_count": 9, "id": "f4bd8382", "metadata": { "execution": { @@ -771,7 +731,7 @@ "0 97.311864" ] }, - "execution_count": 11, + "execution_count": 9, "metadata": {}, "output_type": "execute_result" } diff --git a/docs/notebooks/tibble.ipynb b/docs/notebooks/tibble.ipynb index 66e47da5..b34e2b7d 100644 --- a/docs/notebooks/tibble.ipynb +++ b/docs/notebooks/tibble.ipynb @@ -2,7 +2,7 @@ "cells": [ { "cell_type": "code", - "execution_count": 3, + "execution_count": 1, "id": "8b02806d", "metadata": { "execution": { @@ -16,7 +16,7 @@ { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -28,7 +28,7 @@ { "data": { "text/markdown": [ - "### # tibble " + "###
★ tibble
" ], "text/plain": [ "" @@ -77,7 +77,7 @@ { "data": { "text/markdown": [ - "### # tibble_row " + "###
★ tibble_row
" ], "text/plain": [ "" @@ -120,7 +120,7 @@ { "data": { "text/markdown": [ - "### # tribble " + "###
★ tribble
" ], "text/plain": [ "" @@ -142,14 +142,6 @@ "\n", "  `_dtypes`: The dtypes for each columns to convert to. \n", "\n", - "##### Examples:\n", - "  >>> tribble( \n", - "  >>> f.colA, f.colB, \n", - "  >>> \"a\", 1, \n", - "  >>> \"b\", 2, \n", - "  >>> \"c\", 3, \n", - "  >>> ) \n", - "\n", "##### Returns:\n", "  A dataframe \n" ], @@ -164,18 +156,18 @@ "source": [ "# https://tibble.tidyverse.org/reference/tibble.html\n", "# https://tibble.tidyverse.org/reference/tribble.html\n", + "%run nb_helpers.py\n", "\n", "from datar import f\n", "from datar.tibble import tibble, tibble_row, tribble\n", "from datar.base import diag, runif\n", "\n", - "%run nb_helpers.py\n", "nb_header(tibble, tibble_row, tribble)" ] }, { "cell_type": "code", - "execution_count": 5, + "execution_count": 2, "id": "a786d6b2", "metadata": { "execution": { @@ -256,7 +248,7 @@ "4 4 8" ] }, - "execution_count": 5, + "execution_count": 2, "metadata": {}, "output_type": "execute_result" } @@ -268,7 +260,7 @@ }, { "cell_type": "code", - "execution_count": 6, + "execution_count": 3, "id": "875fe6f2", "metadata": { "execution": { @@ -356,7 +348,7 @@ "4 4 8 1" ] }, - "execution_count": 6, + "execution_count": 3, "metadata": {}, "output_type": "execute_result" } @@ -367,7 +359,7 @@ }, { "cell_type": "code", - "execution_count": 7, + "execution_count": 4, "id": "fc39e6d2", "metadata": { "execution": { @@ -411,53 +403,53 @@ " \n", " \n", " 0\n", - " 0.829673\n", - " 1.659347\n", + " 0.723690\n", + " 1.447381\n", " \n", " \n", " 1\n", - " 0.682616\n", - " 1.365232\n", + " 0.800989\n", + " 1.601979\n", " \n", " \n", " 2\n", - " 0.594559\n", - " 1.189117\n", + " 0.163617\n", + " 0.327234\n", " \n", " \n", " 3\n", - " 0.245247\n", - " 0.490494\n", + " 0.220090\n", + " 0.440180\n", " \n", " \n", " 4\n", - " 0.393295\n", - " 0.786590\n", + " 0.402084\n", + " 0.804168\n", " \n", " \n", " 5\n", - " 0.736311\n", - " 1.472622\n", + " 0.320978\n", + " 0.641955\n", " \n", " \n", " 6\n", - " 0.159279\n", - " 0.318559\n", 
+ " 0.350461\n", + " 0.700921\n", " \n", " \n", " 7\n", - " 0.459043\n", - " 0.918085\n", + " 0.391470\n", + " 0.782941\n", " \n", " \n", " 8\n", - " 0.237187\n", - " 0.474374\n", + " 0.483530\n", + " 0.967060\n", " \n", " \n", " 9\n", - " 0.768807\n", - " 1.537615\n", + " 0.690136\n", + " 1.380271\n", " \n", " \n", "\n", @@ -466,19 +458,19 @@ "text/plain": [ " x y\n", " \n", - "0 0.829673 1.659347\n", - "1 0.682616 1.365232\n", - "2 0.594559 1.189117\n", - "3 0.245247 0.490494\n", - "4 0.393295 0.786590\n", - "5 0.736311 1.472622\n", - "6 0.159279 0.318559\n", - "7 0.459043 0.918085\n", - "8 0.237187 0.474374\n", - "9 0.768807 1.537615" + "0 0.723690 1.447381\n", + "1 0.800989 1.601979\n", + "2 0.163617 0.327234\n", + "3 0.220090 0.440180\n", + "4 0.402084 0.804168\n", + "5 0.320978 0.641955\n", + "6 0.350461 0.700921\n", + "7 0.391470 0.782941\n", + "8 0.483530 0.967060\n", + "9 0.690136 1.380271" ] }, - "execution_count": 7, + "execution_count": 4, "metadata": {}, "output_type": "execute_result" } @@ -489,7 +481,7 @@ }, { "cell_type": "code", - "execution_count": 8, + "execution_count": 5, "id": "dada58f8", "metadata": { "execution": { @@ -516,7 +508,7 @@ }, { "cell_type": "code", - "execution_count": 9, + "execution_count": 6, "id": "8a22cb4b", "metadata": { "execution": { @@ -531,9 +523,9 @@ "name": "stderr", "output_type": "stream", "text": [ - "[2022-03-06 02:37:22][datar][WARNING] New names:\n", - "[2022-03-06 02:37:22][datar][WARNING] * '1' -> '1__0'\n", - "[2022-03-06 02:37:22][datar][WARNING] * '1' -> '1__1'\n" + "[2022-03-18 17:33:27][datar][WARNING] New names:\n", + "[2022-03-18 17:33:27][datar][WARNING] * '1' -> '1__0'\n", + "[2022-03-18 17:33:27][datar][WARNING] * '1' -> '1__1'\n" ] }, { @@ -582,7 +574,7 @@ "0 1 1" ] }, - "execution_count": 9, + "execution_count": 6, "metadata": {}, "output_type": "execute_result" } @@ -593,7 +585,7 @@ }, { "cell_type": "code", - "execution_count": 10, + "execution_count": 7, "id": "4e811ce7", "metadata": { 
"execution": { @@ -608,9 +600,9 @@ "name": "stderr", "output_type": "stream", "text": [ - "[2022-03-06 02:37:23][datar][WARNING] New names:\n", - "[2022-03-06 02:37:23][datar][WARNING] * '1' -> '1__0'\n", - "[2022-03-06 02:37:23][datar][WARNING] * '1' -> '1__1'\n" + "[2022-03-18 17:33:27][datar][WARNING] New names:\n", + "[2022-03-18 17:33:27][datar][WARNING] * '1' -> '1__0'\n", + "[2022-03-18 17:33:27][datar][WARNING] * '1' -> '1__1'\n" ] }, { @@ -662,7 +654,7 @@ "0 1 1 True" ] }, - "execution_count": 10, + "execution_count": 7, "metadata": {}, "output_type": "execute_result" } @@ -674,7 +666,7 @@ }, { "cell_type": "code", - "execution_count": 11, + "execution_count": 8, "id": "6007cacc", "metadata": { "execution": { @@ -731,7 +723,7 @@ "0 1 1" ] }, - "execution_count": 11, + "execution_count": 8, "metadata": {}, "output_type": "execute_result" } @@ -742,7 +734,7 @@ }, { "cell_type": "code", - "execution_count": 12, + "execution_count": 9, "id": "aadc8985", "metadata": { "execution": { @@ -757,9 +749,9 @@ "name": "stderr", "output_type": "stream", "text": [ - "[2022-03-06 02:37:25][datar][WARNING] New names:\n", - "[2022-03-06 02:37:25][datar][WARNING] * '1' -> '_1'\n", - "[2022-03-06 02:37:25][datar][WARNING] * '2' -> '_2'\n" + "[2022-03-18 17:33:28][datar][WARNING] New names:\n", + "[2022-03-18 17:33:28][datar][WARNING] * '1' -> '_1'\n", + "[2022-03-18 17:33:28][datar][WARNING] * '2' -> '_2'\n" ] }, { @@ -808,7 +800,7 @@ "0 1 2" ] }, - "execution_count": 12, + "execution_count": 9, "metadata": {}, "output_type": "execute_result" } @@ -820,7 +812,7 @@ }, { "cell_type": "code", - "execution_count": 13, + "execution_count": 10, "id": "7a863e15", "metadata": { "execution": { @@ -877,7 +869,7 @@ "0 1 1" ] }, - "execution_count": 13, + "execution_count": 10, "metadata": {}, "output_type": "execute_result" } @@ -901,7 +893,7 @@ }, { "cell_type": "code", - "execution_count": 14, + "execution_count": 11, "id": "c76a319b", "metadata": { "execution": { @@ -958,7 +950,7 @@ 
"0 2 3" ] }, - "execution_count": 14, + "execution_count": 11, "metadata": {}, "output_type": "execute_result" } @@ -976,7 +968,7 @@ }, { "cell_type": "code", - "execution_count": 15, + "execution_count": 12, "id": "20cff9a2", "metadata": { "execution": { @@ -1033,7 +1025,7 @@ "0 1 1" ] }, - "execution_count": 15, + "execution_count": 12, "metadata": {}, "output_type": "execute_result" } @@ -1044,7 +1036,7 @@ }, { "cell_type": "code", - "execution_count": 16, + "execution_count": 13, "id": "7e006c14", "metadata": { "execution": { @@ -1123,7 +1115,7 @@ "2 6 9 2 6" ] }, - "execution_count": 16, + "execution_count": 13, "metadata": {}, "output_type": "execute_result" } @@ -1141,7 +1133,7 @@ }, { "cell_type": "code", - "execution_count": 17, + "execution_count": 14, "id": "2d9a00e0", "metadata": { "execution": { @@ -1246,7 +1238,7 @@ "3 3 0 0 0 1 0 0" ] }, - "execution_count": 17, + "execution_count": 14, "metadata": {}, "output_type": "execute_result" } @@ -1263,7 +1255,7 @@ }, { "cell_type": "code", - "execution_count": 18, + "execution_count": 15, "id": "bdef0cd4", "metadata": { "execution": { @@ -1289,7 +1281,7 @@ }, { "cell_type": "code", - "execution_count": 19, + "execution_count": 16, "id": "0b39dd2f", "metadata": { "execution": { @@ -1343,7 +1335,7 @@ "0 3" ] }, - "execution_count": 19, + "execution_count": 16, "metadata": {}, "output_type": "execute_result" } @@ -1354,7 +1346,7 @@ }, { "cell_type": "code", - "execution_count": 20, + "execution_count": 17, "id": "e066dd0e", "metadata": { "execution": { @@ -1411,7 +1403,7 @@ "0 1 1" ] }, - "execution_count": 20, + "execution_count": 17, "metadata": {}, "output_type": "execute_result" } @@ -1423,7 +1415,7 @@ }, { "cell_type": "code", - "execution_count": 21, + "execution_count": 18, "id": "065802b4", "metadata": { "execution": { @@ -1480,7 +1472,7 @@ "0 1 3" ] }, - "execution_count": 21, + "execution_count": 18, "metadata": {}, "output_type": "execute_result" } @@ -1491,7 +1483,7 @@ }, { "cell_type": "code", - 
"execution_count": 22, + "execution_count": 19, "id": "948a38e3", "metadata": { "execution": { @@ -1560,7 +1552,7 @@ "2 c 3" ] }, - "execution_count": 22, + "execution_count": 19, "metadata": {}, "output_type": "execute_result" } @@ -1576,7 +1568,7 @@ }, { "cell_type": "code", - "execution_count": 23, + "execution_count": 20, "id": "3730b8a8", "metadata": { "execution": { @@ -1639,7 +1631,7 @@ "1 b [4, 5, 6]" ] }, - "execution_count": 23, + "execution_count": 20, "metadata": {}, "output_type": "execute_result" } @@ -1654,7 +1646,7 @@ }, { "cell_type": "code", - "execution_count": 24, + "execution_count": 21, "id": "057cd848", "metadata": { "execution": { @@ -1711,7 +1703,7 @@ "0 1 [2, 3]" ] }, - "execution_count": 24, + "execution_count": 21, "metadata": {}, "output_type": "execute_result" } diff --git a/docs/notebooks/uncount.ipynb b/docs/notebooks/uncount.ipynb index f9536e42..5ce95e2e 100644 --- a/docs/notebooks/uncount.ipynb +++ b/docs/notebooks/uncount.ipynb @@ -13,26 +13,10 @@ } }, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[2022-03-06 02:36:03][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 02:36:03][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 02:36:03][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 02:36:03][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 02:36:03][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 02:36:03][datar][WARNING] Builtin name \"all\" has been overriden by datar.\n", - "[2022-03-06 02:36:03][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-06 02:36:03][datar][WARNING] Builtin name \"re\" has been overriden by datar.\n", - "[2022-03-06 02:36:03][datar][WARNING] Builtin name \"filter\" has been overriden by datar.\n", - "[2022-03-06 02:36:03][datar][WARNING] Builtin name 
\"slice\" has been overriden by datar.\n" - ] - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -44,7 +28,7 @@ { "data": { "text/markdown": [ - "### # uncount " + "###
★ uncount
" ], "text/plain": [ "" @@ -80,10 +64,10 @@ ], "source": [ "# https://tidyr.tidyverse.org/reference/uncount.html\n", + "%run nb_helpers.py\n", "\n", "from datar.all import *\n", "\n", - "%run nb_helpers.py\n", "nb_header(uncount)" ] }, diff --git a/docs/notebooks/unite.ipynb b/docs/notebooks/unite.ipynb index d9fd40bd..c7db4242 100644 --- a/docs/notebooks/unite.ipynb +++ b/docs/notebooks/unite.ipynb @@ -13,26 +13,10 @@ } }, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[2022-03-06 18:12:37][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 18:12:37][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 18:12:37][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 18:12:37][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 18:12:37][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 18:12:37][datar][WARNING] Builtin name \"all\" has been overriden by datar.\n", - "[2022-03-06 18:12:37][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-06 18:12:37][datar][WARNING] Builtin name \"re\" has been overriden by datar.\n", - "[2022-03-06 18:12:37][datar][WARNING] Builtin name \"filter\" has been overriden by datar.\n", - "[2022-03-06 18:12:37][datar][WARNING] Builtin name \"slice\" has been overriden by datar.\n" - ] - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -44,7 +28,7 @@ { "data": { "text/markdown": [ - "### # unite " + "###
★ unite
" ], "text/plain": [ "" @@ -80,10 +64,10 @@ ], "source": [ "# https://tidyr.tidyverse.org/reference/unite.html\n", + "%run nb_helpers.py\n", "\n", "from datar.all import *\n", "\n", - "%run nb_helpers.py\n", "nb_header(unite)\n" ] }, @@ -375,7 +359,7 @@ "name": "stderr", "output_type": "stream", "text": [ - "[2022-03-06 18:12:40][datar][WARNING] Expected 2 pieces. Missing pieces filled with `NA` in 3 rows ['a', 'b', ''].\n" + "[2022-03-18 17:32:56][datar][WARNING] Expected 2 pieces. Missing pieces filled with `NA` in 3 rows ['a', 'b', ''].\n" ] }, { diff --git a/docs/notebooks/with_groups.ipynb b/docs/notebooks/with_groups.ipynb index 2bdeafb2..4db92ef0 100644 --- a/docs/notebooks/with_groups.ipynb +++ b/docs/notebooks/with_groups.ipynb @@ -13,26 +13,10 @@ } }, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[2022-03-06 18:19:37][datar][WARNING] Builtin name \"min\" has been overriden by datar.\n", - "[2022-03-06 18:19:37][datar][WARNING] Builtin name \"max\" has been overriden by datar.\n", - "[2022-03-06 18:19:37][datar][WARNING] Builtin name \"sum\" has been overriden by datar.\n", - "[2022-03-06 18:19:37][datar][WARNING] Builtin name \"abs\" has been overriden by datar.\n", - "[2022-03-06 18:19:37][datar][WARNING] Builtin name \"round\" has been overriden by datar.\n", - "[2022-03-06 18:19:37][datar][WARNING] Builtin name \"all\" has been overriden by datar.\n", - "[2022-03-06 18:19:37][datar][WARNING] Builtin name \"any\" has been overriden by datar.\n", - "[2022-03-06 18:19:37][datar][WARNING] Builtin name \"re\" has been overriden by datar.\n", - "[2022-03-06 18:19:37][datar][WARNING] Builtin name \"filter\" has been overriden by datar.\n", - "[2022-03-06 18:19:37][datar][WARNING] Builtin name \"slice\" has been overriden by datar.\n" - ] - }, { "data": { "text/html": [ - "
Try this notebook on binder.
" + "
Try this notebook on binder.
" ], "text/plain": [ "" @@ -44,7 +28,7 @@ { "data": { "text/markdown": [ - "### # with_groups " + "###
★ with_groups
" ], "text/plain": [ "" @@ -78,10 +62,10 @@ ], "source": [ "# https://dplyr.tidyverse.org/reference/with_groups.html\n", + "%run nb_helpers.py\n", "\n", "from datar.all import *\n", "\n", - "%run nb_helpers.py\n", "nb_header(with_groups)" ] }, @@ -134,32 +118,32 @@ " \n", " 0\n", " 1\n", - " 0.787068\n", - " 0.869330\n", + " 0.821443\n", + " 0.493316\n", " \n", " \n", " 1\n", " 1\n", - " 0.951592\n", - " 0.869330\n", + " 0.165189\n", + " 0.493316\n", " \n", " \n", " 2\n", " 2\n", - " 0.993726\n", - " 0.618664\n", + " 0.264447\n", + " 0.539342\n", " \n", " \n", " 3\n", " 2\n", - " 0.243601\n", - " 0.618664\n", + " 0.814237\n", + " 0.539342\n", " \n", " \n", " 4\n", " 3\n", - " 0.035540\n", - " 0.035540\n", + " 0.488513\n", + " 0.488513\n", " \n", " \n", "\n", @@ -169,11 +153,11 @@ "text/plain": [ " g x x_mean\n", " \n", - "0 1 0.787068 0.869330\n", - "1 1 0.951592 0.869330\n", - "2 2 0.993726 0.618664\n", - "3 2 0.243601 0.618664\n", - "4 3 0.035540 0.035540\n", + "0 1 0.821443 0.493316\n", + "1 1 0.165189 0.493316\n", + "2 2 0.264447 0.539342\n", + "3 2 0.814237 0.539342\n", + "4 3 0.488513 0.488513\n", "[TibbleGrouped: g (n=3)]" ] }, @@ -236,32 +220,32 @@ " \n", " 0\n", " 1\n", - " 0.787068\n", - " 0.787068\n", + " 0.821443\n", + " 0.821443\n", " \n", " \n", " 1\n", " 1\n", - " 0.951592\n", - " 0.787068\n", + " 0.165189\n", + " 0.821443\n", " \n", " \n", " 2\n", " 2\n", - " 0.993726\n", - " 0.787068\n", + " 0.264447\n", + " 0.264447\n", " \n", " \n", " 3\n", " 2\n", - " 0.243601\n", - " 0.787068\n", + " 0.814237\n", + " 0.264447\n", " \n", " \n", " 4\n", " 3\n", - " 0.035540\n", - " 0.787068\n", + " 0.488513\n", + " 0.488513\n", " \n", " \n", "\n", @@ -271,11 +255,11 @@ "text/plain": [ " g x x1\n", " \n", - "0 1 0.787068 0.787068\n", - "1 1 0.951592 0.787068\n", - "2 2 0.993726 0.787068\n", - "3 2 0.243601 0.787068\n", - "4 3 0.035540 0.787068\n", + "0 1 0.821443 0.821443\n", + "1 1 0.165189 0.821443\n", + "2 2 0.264447 0.264447\n", + "3 2 0.814237 0.264447\n", + 
"4 3 0.488513 0.488513\n", "[TibbleGrouped: g (n=3)]" ] }, @@ -338,32 +322,32 @@ " \n", " 0\n", " 1\n", - " 0.787068\n", - " 0.602306\n", + " 0.821443\n", + " 0.510766\n", " \n", " \n", " 1\n", " 1\n", - " 0.951592\n", - " 0.602306\n", + " 0.165189\n", + " 0.510766\n", " \n", " \n", " 2\n", " 2\n", - " 0.993726\n", - " 0.602306\n", + " 0.264447\n", + " 0.510766\n", " \n", " \n", " 3\n", " 2\n", - " 0.243601\n", - " 0.602306\n", + " 0.814237\n", + " 0.510766\n", " \n", " \n", " 4\n", " 3\n", - " 0.035540\n", - " 0.602306\n", + " 0.488513\n", + " 0.510766\n", " \n", " \n", "\n", @@ -372,11 +356,11 @@ "text/plain": [ " g x x_mean\n", " \n", - "0 1 0.787068 0.602306\n", - "1 1 0.951592 0.602306\n", - "2 2 0.993726 0.602306\n", - "3 2 0.243601 0.602306\n", - "4 3 0.035540 0.602306" + "0 1 0.821443 0.510766\n", + "1 1 0.165189 0.510766\n", + "2 2 0.264447 0.510766\n", + "3 2 0.814237 0.510766\n", + "4 3 0.488513 0.510766" ] }, "execution_count": 4, @@ -434,23 +418,23 @@ " \n", " \n", " 0\n", - " 0.787068\n", + " 0.821443\n", " \n", " \n", " 1\n", - " 0.951592\n", + " 0.165189\n", " \n", " \n", " 2\n", - " 0.993726\n", + " 0.264447\n", " \n", " \n", " 3\n", - " 0.243601\n", + " 0.814237\n", " \n", " \n", " 4\n", - " 0.035540\n", + " 0.488513\n", " \n", " \n", "\n", @@ -459,11 +443,11 @@ "text/plain": [ " x\n", " \n", - "0 0.787068\n", - "1 0.951592\n", - "2 0.993726\n", - "3 0.243601\n", - "4 0.035540" + "0 0.821443\n", + "1 0.165189\n", + "2 0.264447\n", + "3 0.814237\n", + "4 0.488513" ] }, "execution_count": 5, diff --git a/docs/reference-maps/base.md b/docs/reference-maps/base.md index 764e69bc..6ebf5f8b 100644 --- a/docs/reference-maps/base.md +++ b/docs/reference-maps/base.md @@ -82,60 +82,60 @@ See [here](../stats) for APIs ported from `r-stats` and [here](../utils) for API |API|Description|Notebook example| |---|---|---:| -|[`bessel_i`][22]|Bessel Functions of integer and fractional order of first kind|[:material-notebook:][4]| -|[`bessel_k`][24]|Bessel Functions 
of integer and fractional order of second kind|[:material-notebook:][4]| -|[`bessel_j`][23]|Modified Bessel functions of first kind|[:material-notebook:][4]| -|[`bessel_y`][25]|Modified Bessel functions of third kind|[:material-notebook:][4]| +|[`bessel_i()`][22]|Bessel Functions of integer and fractional order of first kind|[:material-notebook:][4]| +|[`bessel_k()`][24]|Bessel Functions of integer and fractional order of second kind|[:material-notebook:][4]| +|[`bessel_j()`][23]|Modified Bessel functions of first kind|[:material-notebook:][4]| +|[`bessel_y()`][25]|Modified Bessel functions of third kind|[:material-notebook:][4]| ### Casting values between types |API|Description|Notebook example| |---|---|---:| -|[`as_integer`][26] [`as_int`][]|Cast data to integer|[:material-notebook:][4]| -|[`as_double`][27]|Cast data to double (`numpy.float64`)|[:material-notebook:][4]| -|[`as_float`][28]|Cast data to float (`numpy.float_`)|[:material-notebook:][4]| -|[`as_numeric`][29]|Cast data to numeric|[:material-notebook:][4]| +|[`as_integer()`][26] [`as_int`][26]|Cast data to integer|[:material-notebook:][4]| +|[`as_double()`][27]|Cast data to double (`numpy.float64`)|[:material-notebook:][4]| +|[`as_float()`][28]|Cast data to float (`numpy.float_`)|[:material-notebook:][4]| +|[`as_numeric()`][29]|Cast data to numeric|[:material-notebook:][4]| ### Complex numbers |API|Description|Notebook example| |---|---|---:| -|[`re`][30]|Get the real part of a complex number|[:material-notebook:][4]| -|[`mod`][31]|Get the modulus of a complex number|[:material-notebook:][4]| -|[`im`][32]|Get the imaginary part of a complex number|[:material-notebook:][4]| -|[`arg`][33]|Get the argument of a complex number|[:material-notebook:][4]| -|[`conj`][34]|Get the complex conjugate of a complex number|[:material-notebook:][4]| -|[`is_complex`][35]|Test if data is complex number|[:material-notebook:][4]| -|[`as_complex`][36]|Cast data to a complex number|[:material-notebook:][4]| 
+|[`re()`][30]|Get the real part of a complex number|[:material-notebook:][4]| +|[`mod()`][31]|Get the modulus of a complex number|[:material-notebook:][4]| +|[`im()`][32]|Get the imaginary part of a complex number|[:material-notebook:][4]| +|[`arg()`][33]|Get the argument of a complex number|[:material-notebook:][4]| +|[`conj()`][34]|Get the complex conjugate of a complex number|[:material-notebook:][4]| +|[`is_complex()`][35]|Test if data is complex number|[:material-notebook:][4]| +|[`as_complex()`][36]|Cast data to a complex number|[:material-notebook:][4]| ### Cumulativate functions |API|Description|Notebook example| |---|---|---:| -|[`cumsum`][37]|Cummulative sum|[:material-notebook:][4]| -|[`cumprod`][38]|Cummulative product|[:material-notebook:][4]| -|[`cummin`][39]|Cummulative min|[:material-notebook:][4]| -|[`cummax`][40]|Cummulative max|[:material-notebook:][4]| +|[`cumsum()`][37]|Cumulative sum|[:material-notebook:][4]| +|[`cumprod()`][38]|Cumulative product|[:material-notebook:][4]| +|[`cummin()`][39]|Cumulative min|[:material-notebook:][4]| +|[`cummax()`][40]|Cumulative max|[:material-notebook:][4]| ### Date functions |API|Description|Notebook example| |---|---|---:| -|[`as_date`][41]|Cast data to date|[:material-notebook:][4]| -|[**`as_pd_date`**][150]|Alias of `pandas.to_datetime()`|| +|[`as_date()`][41]|Cast data to date|[:material-notebook:][4]| +|[**`as_pd_date()`**][150]|Alias of `pandas.to_datetime()`|| ### Factor data |API|Description|Notebook example| |---|---|---:| -|[`factor`][42]|Construct factor|[:material-notebook:][4]| -|[`droplevels`][43]|Drop unused levels|[:material-notebook:][4]| -|[`levels`][44]|Get levels of factors|[:material-notebook:][4]| -|[`is_factor`][45] [`is_categorical`][45]|Test if data is factor|[:material-notebook:][4]| -|[`as_factor`][46] [`as_categorical`][46]|Cast data to factor|[:material-notebook:][4]| -|[`is_ordered`][140]|Check if a factor is ordered|| -|[`nlevels`][141]|Get number of levels of a factor||
-|[`ordered`][142]|Create an ordered factor|| +|[`factor()`][42]|Construct factor|[:material-notebook:][4]| +|[`droplevels()`][43]|Drop unused levels|[:material-notebook:][4]| +|[`levels()`][44]|Get levels of factors|[:material-notebook:][4]| +|[`is_factor()`][45] [`is_categorical`][45]|Test if data is factor|[:material-notebook:][4]| +|[`as_factor()`][46] [`as_categorical`][46]|Cast data to factor|[:material-notebook:][4]| +|[`is_ordered()`][140]|Check if a factor is ordered|| +|[`nlevels()`][141]|Get number of levels of a factor|| +|[`ordered()`][142]|Create an ordered factor|| ### Logical/Boolean values @@ -143,10 +143,10 @@ See [here](../stats) for APIs ported from `r-stats` and [here](../utils) for API |---|---|---:| |`TRUE`|Logical true|[:material-notebook:][4]| |`FALSE`|Logical false|[:material-notebook:][4]| -|[`is_true`][47]|Test if data is scalar true (R's `isTRUE`)|[:material-notebook:][4]| -|[`is_false`][48]|Test if data is scalar false (R's `FALSE`)|[:material-notebook:][4]| -|[`is_logical`][49] [`is_bool`][49]|Test if data is logical/boolean|[:material-notebook:][4]| -|[`as_logical`][50] [`as_bool`][50]|Cast data to logical/boolean|[:material-notebook:][4]| +|[`is_true()`][47]|Test if data is scalar true (R's `isTRUE`)|[:material-notebook:][4]| +|[`is_false()`][48]|Test if data is scalar false (R's `FALSE`)|[:material-notebook:][4]| +|[`is_logical()`][49] [`is_bool()`][49]|Test if data is logical/boolean|[:material-notebook:][4]| +|[`as_logical()`][50] [`as_bool()`][50]|Cast data to logical/boolean|[:material-notebook:][4]| ### NA (missing values) @@ -157,122 +157,122 @@ See [here](../stats) for APIs ported from `r-stats` and [here](../utils) for API |`NaN`|Missing value, same as `NA`|[:material-notebook:][4]| |[`is_na()`][51]|Test if data is NA|[:material-notebook:][4]| |[`any_na()`][52]|Test if any element is NA|[:material-notebook:][4]| -|[`is_finite`][126]|Test if x is finite|| -|[`is_infinite`][127]|Test if x is infinite|| -|[`is_nan`][128]|Test 
if x is nan|| +|[`is_finite()`][126]|Test if x is finite|| +|[`is_infinite()`][127]|Test if x is infinite|| +|[`is_nan()`][128]|Test if x is nan|| ### NULL |API|Description|Notebook example| |---|---|---:| |`NULL`|NULL value|[:material-notebook:][4]| -|[`is_null`][53]|Test if data is null|[:material-notebook:][4]| -|[`as_null`][54]|Cast anything to NULL|[:material-notebook:][4]| +|[`is_null()`][53]|Test if data is null|[:material-notebook:][4]| +|[`as_null()`][54]|Cast anything to NULL|[:material-notebook:][4]| ### Random |API|Description|Notebook example| |---|---|---:| -|[`set_seed`][55]|Set the randomization seed|[:material-notebook:][4]| +|[`set_seed()`][55]|Set the randomization seed|[:material-notebook:][4]| ### Functions to create and manipulate sequences |API|Description|Notebook example| |---|---|---:| -|[`c`][56]|Collection of data|[:material-notebook:][4]| -|[`seq`][57]|Generate sequence|[:material-notebook:][4]| -|[`seq_len`][58]|Generate sequence with length|[:material-notebook:][4]| -|[`seq_along`][59]|Generate sequence along with another sequence|[:material-notebook:][4]| -|[`rev`][60]|Reverse a sequence|[:material-notebook:][4]| -|[`rep`][61]|Generate sequence with repeats|[:material-notebook:][4]| -|[`lengths`][62]|Get the length of elements in the sequence|[:material-notebook:][4]| -|[`unique`][63]|Get the unique elements|[:material-notebook:][4]| -|[`sample`][64]|Sample the elements from sequence|[:material-notebook:][4]| -|[`length`][65]|Get the length of data|[:material-notebook:][4]| -|[`match`][129]|match returns a vector of the positions of (first) matches of its first argument in its second.|| -|[`rank`][143]|Returns the sample ranks of the values in a vector.|[:material-notebook:][163]| -|[`order`][144]|Returns a permutation which rearranges its first argument into ascending or descending order|| -|[`sort`][145]|Sorting or Ordering Vectors|| +|[`c()`][56]|Collection of data|[:material-notebook:][4]| +|[`seq()`][57]|Generate 
sequence|[:material-notebook:][4]| +|[`seq_len()`][58]|Generate sequence with length|[:material-notebook:][4]| +|[`seq_along()`][59]|Generate sequence along with another sequence|[:material-notebook:][4]| +|[`rev()`][60]|Reverse a sequence|[:material-notebook:][4]| +|[`rep()`][61]|Generate sequence with repeats|[:material-notebook:][4]| +|[`lengths()`][62]|Get the length of elements in the sequence|[:material-notebook:][4]| +|[`unique()`][63]|Get the unique elements|[:material-notebook:][4]| +|[`sample()`][64]|Sample the elements from sequence|[:material-notebook:][4]| +|[`length()`][65]|Get the length of data|[:material-notebook:][4]| +|[`match()`][129]|match returns a vector of the positions of (first) matches of its first argument in its second.|| +|[`rank()`][143]|Returns the sample ranks of the values in a vector.|[:material-notebook:][163]| +|[`order()`][144]|Returns a permutation which rearranges its first argument into ascending or descending order|| +|[`sort()`][145]|Sorting or Ordering Vectors|| ### Special functions |API|Description|Notebook example| |---|---|---:| -|[`beta`][66]|Beta function|[:material-notebook:][4]| -|[`lbeta`][67]|Natural logarithm of beta function|[:material-notebook:][4]| -|[`gamma`][68]|Gamma function|[:material-notebook:][4]| -|[`lgamma`][69]|Natural logarithm of gamma function|[:material-notebook:][4]| -|[`digamma`][70]|the first derivatives of the logarithm of the gamma function.|[:material-notebook:][4]| -|[`trigamma`][71]|the second derivatives of the logarithm of the gamma function.|[:material-notebook:][4]| -|[`psigamma`][72]|polygamma funnction|[:material-notebook:][4]| -|[`choose`][73]|binomial coefficients|[:material-notebook:][4]| -|[`lchoose`][74]|the logarithms of binomial coefficients.|[:material-notebook:][4]| -|[`factorial`][75]|factorial|[:material-notebook:][4]| -|[`lfactorial`][76]|Natural logarithm of factorial|[:material-notebook:][4]| +|[`beta()`][66]|Beta function|[:material-notebook:][4]| 
+|[`lbeta()`][67]|Natural logarithm of beta function|[:material-notebook:][4]| +|[`gamma()`][68]|Gamma function|[:material-notebook:][4]| +|[`lgamma()`][69]|Natural logarithm of gamma function|[:material-notebook:][4]| +|[`digamma()`][70]|the first derivatives of the logarithm of the gamma function.|[:material-notebook:][4]| +|[`trigamma()`][71]|the second derivatives of the logarithm of the gamma function.|[:material-notebook:][4]| +|[`psigamma()`][72]|polygamma function|[:material-notebook:][4]| +|[`choose()`][73]|binomial coefficients|[:material-notebook:][4]| +|[`lchoose()`][74]|the logarithms of binomial coefficients.|[:material-notebook:][4]| +|[`factorial()`][75]|factorial|[:material-notebook:][4]| +|[`lfactorial()`][76]|Natural logarithm of factorial|[:material-notebook:][4]| ### String functions |API|Description|Notebook example| |---|---|---:| -|[`is_character`][77] [`is_str`][77] [`is_string`][77]|Test if data is string|[:material-notebook:][4]| -|[`as_character`][78] [`as_str`][78] [`as_string`][78]|Cast data to string|[:material-notebook:][4]| -|[`grep`][79]|Test if pattern in string|[:material-notebook:][4]| -|[`grepl`][80]|Logical version of `grep`|[:material-notebook:][4]| -|[`sub`][81]|Replace substrings in strings|[:material-notebook:][4]| -|[`gsub`][82]|Replace all matched substring in strings|[:material-notebook:][4]| -|[`nchar`][83]|Get length of string|[:material-notebook:][4]| -|[`nzhcar`][84]|Test if string is not empty|[:material-notebook:][4]| -|[`paste`][85]|Concatenate strings|[:material-notebook:][4]| -|[`paste0`][86]|Concatenate strings with `sep=''`|[:material-notebook:][4]| -|[`sprintf`][87]|C-style string formatting|[:material-notebook:][4]| -|[`substr`][88]|Get substring|[:material-notebook:][4]| -|[`substring`][89]|Get substring with a start only|[:material-notebook:][4]| -|[`strsplit`][90]|Split strings with delimiter|[:material-notebook:][4]| -|[`startswith`][130]|Test if strings start with given prefix||
-|[`endswith`][131]|Test if strings end with given suffix|| -|[`strtoi`][132]|Convert strings to integers|| -|[`chartr`][133]|Replace characters in strings|| -|[`tolower`][134]|Transform strings to lower case|| -|[`toupper`][135]|Transform strings to upper case|| -|[`trimws`][149]|Remove leading and/or trailing whitespace from character strings.|| +|[`is_character()`][77] [`is_str`][77] [`is_string`][77]|Test if data is string|[:material-notebook:][4]| +|[`as_character()`][78] [`as_str`][78] [`as_string`][78]|Cast data to string|[:material-notebook:][4]| +|[`grep()`][79]|Test if pattern in string|[:material-notebook:][4]| +|[`grepl()`][80]|Logical version of `grep`|[:material-notebook:][4]| +|[`sub()`][81]|Replace substrings in strings|[:material-notebook:][4]| +|[`gsub()`][82]|Replace all matched substrings in strings|[:material-notebook:][4]| +|[`nchar()`][83]|Get length of string|[:material-notebook:][4]| +|[`nzchar()`][84]|Test if string is not empty|[:material-notebook:][4]| +|[`paste()`][85]|Concatenate strings|[:material-notebook:][4]| +|[`paste0()`][86]|Concatenate strings with `sep=''`|[:material-notebook:][4]| +|[`sprintf()`][87]|C-style string formatting|[:material-notebook:][4]| +|[`substr()`][88]|Get substring|[:material-notebook:][4]| +|[`substring()`][89]|Get substring with a start only|[:material-notebook:][4]| +|[`strsplit()`][90]|Split strings with delimiter|[:material-notebook:][4]| +|[`startswith()`][130]|Test if strings start with given prefix|| +|[`endswith()`][131]|Test if strings end with given suffix|| +|[`strtoi()`][132]|Convert strings to integers|| +|[`chartr()`][133]|Replace characters in strings|| +|[`tolower()`][134]|Transform strings to lower case|| +|[`toupper()`][135]|Transform strings to upper case|| +|[`trimws()`][149]|Remove leading and/or trailing whitespace from character strings.|| ### Table |API|Description|Notebook example| |---|---|---:| -|[`table`][91]|Cross Tabulation and Table Creation|[:material-notebook:][4]|
-|[`tabulate`][146]|Takes the integer-valued vector `bin` and counts the number of times each integer occurs in it.|| +|[`table()`][91]|Cross Tabulation and Table Creation|[:material-notebook:][4]| +|[`tabulate()`][146]|Takes the integer-valued vector `bin` and counts the number of times each integer occurs in it.|| ### Testing value types |API|Description|Notebook example| |---|---|---:| -|[`is_double`][92] [`is_float`][92]|Test if data is double or float (`numpy.float_`)|[:material-notebook:][4]| -|[`is_integer`][93] [`is_int`][93]|Test if data is integer|[:material-notebook:][4]| -|[`is_numeric`][94]|Test if data is numeric|[:material-notebook:][4]| -|[`is_atomic`][95]|Test is data is atomic|[:material-notebook:][4]| -|[`is_element, `is_in`][96]|Test if value is an element of an array (R's `%in`)|[:material-notebook:][4]| +|[`is_double()`][92] [`is_float()`][92]|Test if data is double or float (`numpy.float_`)|[:material-notebook:][4]| +|[`is_integer()`][93] [`is_int()`][93]|Test if data is integer|[:material-notebook:][4]| +|[`is_numeric()`][94]|Test if data is numeric|[:material-notebook:][4]| +|[`is_atomic()`][95]|Test if data is atomic|[:material-notebook:][4]| +|[`is_element()`, `is_in()`][96]|Test if value is an element of an array (R's `%in%`)|[:material-notebook:][4]| ### Trigonometric and hyper bolic functions |API|Description|Notebook example| |---|---|---:| -|[`cos`][97]|cosine|[:material-notebook:][4]| -|[`sin`][98]|sine|[:material-notebook:][4]| -|[`tan`][99]|tangent|[:material-notebook:][4]| -|[`acos`][100]|Arc-cosine|[:material-notebook:][4]| -|[`asin`][101]|Arc-sine|[:material-notebook:][4]| -|[`atan`][102]|Arc-tangent|[:material-notebook:][4]| -|[`atan2`][103]|`atan(y/x)`|[:material-notebook:][4]| -|[`cospi`][104]|`cos(pi*x)`|[:material-notebook:][4]| -|[`sinpi`][105]|`sin(pi*x)`|[:material-notebook:][4]| -|[`tanpi`][106]|`tan(pi*x)`|[:material-notebook:][4]| -|[`cosh`][107]|Hyperbolic cosine|[:material-notebook:][4]| -|[`sinh`][108]|Hyperbolic
sine|[:material-notebook:][4]| -|[`tanh`][109]|Hyperbolic tangent|[:material-notebook:][4]| -|[`acosh`][110]|Hyperbolic cosine|[:material-notebook:][4]| -|[`asinh`][111]|Hyperbolic sine|[:material-notebook:][4]| -|[`atanh`][112]|Hyperbolic tangent|[:material-notebook:][4]| +|[`cos()`][97]|cosine|[:material-notebook:][4]| +|[`sin()`][98]|sine|[:material-notebook:][4]| +|[`tan()`][99]|tangent|[:material-notebook:][4]| +|[`acos()`][100]|Arc-cosine|[:material-notebook:][4]| +|[`asin()`][101]|Arc-sine|[:material-notebook:][4]| +|[`atan()`][102]|Arc-tangent|[:material-notebook:][4]| +|[`atan2()`][103]|`atan(y/x)`|[:material-notebook:][4]| +|[`cospi()`][104]|`cos(pi*x)`|[:material-notebook:][4]| +|[`sinpi()`][105]|`sin(pi*x)`|[:material-notebook:][4]| +|[`tanpi()`][106]|`tan(pi*x)`|[:material-notebook:][4]| +|[`cosh()`][107]|Hyperbolic cosine|[:material-notebook:][4]| +|[`sinh()`][108]|Hyperbolic sine|[:material-notebook:][4]| +|[`tanh()`][109]|Hyperbolic tangent|[:material-notebook:][4]| +|[`acosh()`][110]|Hyperbolic cosine|[:material-notebook:][4]| +|[`asinh()`][111]|Hyperbolic sine|[:material-notebook:][4]| +|[`atanh()`][112]|Hyperbolic tangent|[:material-notebook:][4]| ### Which @@ -285,18 +285,18 @@ See [here](../stats) for APIs ported from `r-stats` and [here](../utils) for API |API|Description|Notebook example| |---|---|---:| -|[`cut`][113]|Convert Numeric to Factor|[:material-notebook:][163]| -|[`diff`][164]|Returns suitably lagged and iterated differences.|[:material-notebook:][163]| -|[`identity`][114]|Identity Function|[:material-notebook:][163]| -|[`expandgrid`][115]|Create a Data Frame from All Combinations of Factor Variables|[:material-notebook:][163]| -|[`outer`][165]|Compute the outer product of two vectors.|[:material-notebook:][163]| -|[`max_col`][136]|Find the maximum position for each row of a matrix|| -|[`append`][147]|Add elements to a vector.|| -|[`complete_cases`][137]|Get a bool array indicating whether the values of rows are complete in a data 
frame.|| -|[`proportions`][147], [`prop_table`][147]|Returns conditional proportions given `margins`|| -|[`make_names`][137]|Make names available as columns and can be accessed by `df.`|[:material-notebook:][163]| -|[`make_unique`][138]|Make the names unique, alias of `make_names(names, unique=True)`|[:material-notebook:][163]| -|[**`data_context`**][116]|Mimic R's `with`|[:material-notebook:][163]| +|[`cut()`][113]|Convert Numeric to Factor|[:material-notebook:][163]| +|[`diff()`][164]|Returns suitably lagged and iterated differences.|[:material-notebook:][163]| +|[`identity()`][114]|Identity Function|[:material-notebook:][163]| +|[`expandgrid()`][115]|Create a Data Frame from All Combinations of Factor Variables|[:material-notebook:][163]| +|[`outer()`][165]|Compute the outer product of two vectors.|[:material-notebook:][163]| +|[`max_col()`][136]|Find the maximum position for each row of a matrix|| +|[`append()`][147]|Add elements to a vector.|| +|[`complete_cases()`][137]|Get a bool array indicating whether the values of rows are complete in a data frame.|| +|[`proportions()`][147], [`prop_table`][147]|Returns conditional proportions given `margins`|| +|[`make_names()`][137]|Make names available as columns and can be accessed by `df.`|[:material-notebook:][163]| +|[`make_unique()`][138]|Make the names unique, alias of `make_names(names, unique=True)`|[:material-notebook:][163]| +|[**`data_context()`**][116]|Mimic R's `with`|[:material-notebook:][163]| [1]: ../../api/datar.base.which/#datar.dplyr.which.which diff --git a/docs/reference-maps/datar.md b/docs/reference-maps/datar.md index d9d2d9ff..aecd6c57 100644 --- a/docs/reference-maps/datar.md +++ b/docs/reference-maps/datar.md @@ -28,11 +28,12 @@ |[**`flatten()`**][2]|Flatten values of data frames|[:material-notebook:][1]| ### Functions + |[**`itemgetter()`**][3]|Turn `a[f.x]` to a valid verb argument with `itemgetter(a, f.x)`|[:material-notebook:][1]| |[**`attrgetter()`**][4]|`f.x.` but works with 
`SeriesGroupBy` object|[:material-notebook:][1]| -|[**`pd_str()`**][4]|`f.x.str` but works with `SeriesGroupBy` object|[:material-notebook:][1]| -|[**`pd_cat()`**][4]|`f.x.cat` but works with `SeriesGroupBy` object|[:material-notebook:][1]| -|[**`pd_dt()`**][4]|`f.x.dt` but works with `SeriesGroupBy` object|[:material-notebook:][1]| +|[**`pd_str()`**][4]|`str` accessor but works with `SeriesGroupBy` object|[:material-notebook:][1]| +|[**`pd_cat()`**][4]|`cat` accessor but works with `SeriesGroupBy` object|[:material-notebook:][1]| +|[**`pd_dt()`**][4]|`dt` accessor but works with `SeriesGroupBy` object|[:material-notebook:][1]| [1]: ../../notebooks/datar diff --git a/docs/reference-maps/tibble.md b/docs/reference-maps/tibble.md index af1b7a3f..99054023 100644 --- a/docs/reference-maps/tibble.md +++ b/docs/reference-maps/tibble.md @@ -38,14 +38,13 @@ Reference map of `r-tidyverse-tibble` can be found [here][1]. |`tbl_df-class`||| |`print()` `format()`||| |[`tribble()`][3]|Row-wise tibble creation|[:material-notebook:][2]| -|[**`zibble()`**][19]|Zip version of tibble, where names specify together and so do values.|| ### Coercion |API|Description|Notebook example| |---|---|---:| |`is_tibble()`||| -|`as_tibble`||| +|[`as_tibble()`][19]|Convert data frames into datar's tibbles|| |`new_tibble()` `validate_tibble()`||| |[`enframe()`][4] [`deframe()`][14]|Converting iterables to data frames, and vice versa| [:material-notebook:][5]| @@ -85,4 +84,4 @@ Reference map of `r-tidyverse-tibble` can be found [here][1]. 
[16]: ../../api/datar.tibble.verbs/#datar.tibble.verbs.rownames_to_column [17]: ../../api/datar.tibble.verbs/#datar.tibble.verbs.rowid_to_column [18]: ../../api/datar.tibble.tibble/#datar.tibble.tibble.tibble_row -[19]: ../../api/datar.tibble.tibble/#datar.tibble.tibble.zibble +[19]: ../../api/datar.tibble.tibble/#datar.tibble.tibble.as_tibble diff --git a/docs/reference-maps/tidyr.md b/docs/reference-maps/tidyr.md index 8cab8911..459105f8 100644 --- a/docs/reference-maps/tidyr.md +++ b/docs/reference-maps/tidyr.md @@ -47,10 +47,8 @@ Reference map of `r-tidyverse-tidyr` can be found [here][1]. |---|---|---:| |[`extract()`][22]|Extract a character column into multiple columns using regular expression groups|[:material-notebook:][23]| |[`separate()`][30]|Separate a character column into multiple columns with a regular expression or numeric locations|[:material-notebook:][31]| -|[`separate_rows()`][34]| -Separate a collapsed column into multiple rows|[:material-notebook:][35]| -|[`unite()`][36]| -Unite multiple columns into one by pasting strings together|[:material-notebook:][37]| +|[`separate_rows()`][34]|Separate a collapsed column into multiple rows|[:material-notebook:][35]| +|[`unite()`][36]|Unite multiple columns into one by pasting strings together|[:material-notebook:][37]| ### Missing values diff --git a/docs/style.css b/docs/style.css index 099b7766..52f5ad23 100644 --- a/docs/style.css +++ b/docs/style.css @@ -1,6 +1,7 @@ .md-main__inner.md-grid { max-width: 80%; + margin-left: 32px; } .md-typeset .admonition, .md-typeset details { @@ -23,11 +24,11 @@ line-height: 1; } .mkapi-node { - background-color: #f0f6fa; - border-top: 3px solid #559bc9; + background-color: #f4faff; + border-top: 3px solid #151922; } .mkapi-node .mkapi-object-container { - background-color: #b4d4e9; + background-color: #d1d4d6; padding: .12em .4em; } .mkapi-node .mkapi-object-container .mkapi-object.code { @@ -79,7 +80,7 @@ padding-right: 2px; } .mkapi-node .mkapi-code * { - 
font-size: .65rem; + font-size: .6rem; } .mkapi-node a.mkapi-docs-link { font-size: .6rem; @@ -120,3 +121,8 @@ .mkapi-object-body.module.top * { font-size: .75rem !important; } + +.mkapi-section-body.examples pre code { + font-size: .65rem !important; + overflow: auto; +} diff --git a/environment.yml b/environment.yml new file mode 100644 index 00000000..4892c88c --- /dev/null +++ b/environment.yml @@ -0,0 +1,9 @@ +name: datar +channels: +- conda-forge +dependencies: +- python=3.9 +- pip: + - pdtypes + - datar + - -r docs/requirements.txt diff --git a/mkdocs.yml b/mkdocs.yml index ecf9b04b..b034bf85 100644 --- a/mkdocs.yml +++ b/mkdocs.yml @@ -9,9 +9,22 @@ theme: palette: primary: black name: 'material' - # font: - # text: 'Ubuntu' - # code: 'Ubuntu Mono' + font: + text: + - FreightSans + - "Helvetica Neue" + - Helvetica + - Arial + - sans-serif + code: + - IBMPlexMono + - SFMono-Regular + - Menlo + - Monaco + - Consolas + - "Liberation Mono" + - "Courier New" + - monospace features: - navigation.top markdown_extensions: diff --git a/poetry.lock b/poetry.lock new file mode 100644 index 00000000..135f0792 --- /dev/null +++ b/poetry.lock @@ -0,0 +1,670 @@ +[[package]] +name = "asttokens" +version = "2.0.5" +description = "Annotate AST trees with source code positions" +category = "main" +optional = false +python-versions = "*" + +[package.dependencies] +six = "*" + +[package.extras] +test = ["astroid", "pytest"] + +[[package]] +name = "atomicwrites" +version = "1.4.0" +description = "Atomic file writes." 
+category = "dev" +optional = false +python-versions = ">=2.7, !=3.0.*, !=3.1.*, !=3.2.*, !=3.3.*" + +[[package]] +name = "attrs" +version = "21.4.0" +description = "Classes Without Boilerplate" +category = "dev" +optional = false +python-versions = ">=2.7, !=3.0.*, !=3.1.*, !=3.2.*, !=3.3.*, !=3.4.*" + +[package.extras] +dev = ["coverage[toml] (>=5.0.2)", "hypothesis", "pympler", "pytest (>=4.3.0)", "six", "mypy", "pytest-mypy-plugins", "zope.interface", "furo", "sphinx", "sphinx-notfound-page", "pre-commit", "cloudpickle"] +docs = ["furo", "sphinx", "zope.interface", "sphinx-notfound-page"] +tests = ["coverage[toml] (>=5.0.2)", "hypothesis", "pympler", "pytest (>=4.3.0)", "six", "mypy", "pytest-mypy-plugins", "zope.interface", "cloudpickle"] +tests_no_zope = ["coverage[toml] (>=5.0.2)", "hypothesis", "pympler", "pytest (>=4.3.0)", "six", "mypy", "pytest-mypy-plugins", "cloudpickle"] + +[[package]] +name = "colorama" +version = "0.4.4" +description = "Cross-platform colored terminal text." +category = "dev" +optional = false +python-versions = ">=2.7, !=3.0.*, !=3.1.*, !=3.2.*, !=3.3.*, !=3.4.*" + +[[package]] +name = "coverage" +version = "6.3.2" +description = "Code coverage measurement for Python" +category = "dev" +optional = false +python-versions = ">=3.7" + +[package.dependencies] +tomli = {version = "*", optional = true, markers = "extra == \"toml\""} + +[package.extras] +toml = ["tomli"] + +[[package]] +name = "diot" +version = "0.1.5" +description = "Python dictionary with dot notation." 
+category = "main" +optional = false +python-versions = ">=3.6,<4.0" + +[package.dependencies] +inflection = "<1.0.0" + +[[package]] +name = "execnet" +version = "1.9.0" +description = "execnet: rapid multi-Python deployment" +category = "dev" +optional = false +python-versions = ">=2.7, !=3.0.*, !=3.1.*, !=3.2.*, !=3.3.*, !=3.4.*" + +[package.extras] +testing = ["pre-commit"] + +[[package]] +name = "executing" +version = "0.8.3" +description = "Get the currently executing AST node of a frame, and other information" +category = "main" +optional = false +python-versions = "*" + +[[package]] +name = "importlib-metadata" +version = "4.11.2" +description = "Read metadata from Python packages" +category = "main" +optional = false +python-versions = ">=3.7" + +[package.dependencies] +typing-extensions = {version = ">=3.6.4", markers = "python_version < \"3.8\""} +zipp = ">=0.5" + +[package.extras] +docs = ["sphinx", "jaraco.packaging (>=9)", "rst.linker (>=1.9)"] +perf = ["ipython"] +testing = ["pytest (>=6)", "pytest-checkdocs (>=2.4)", "pytest-flake8", "pytest-cov", "pytest-enabler (>=1.0.1)", "packaging", "pyfakefs", "flufl.flake8", "pytest-perf (>=0.9.2)", "pytest-black (>=0.3.7)", "pytest-mypy (>=0.9.1)", "importlib-resources (>=1.3)"] + +[[package]] +name = "inflection" +version = "0.5.1" +description = "A port of Ruby on Rails inflector to Python" +category = "main" +optional = false +python-versions = ">=3.5" + +[[package]] +name = "iniconfig" +version = "1.1.1" +description = "iniconfig: brain-dead simple config-ini parsing" +category = "dev" +optional = false +python-versions = "*" + +[[package]] +name = "numpy" +version = "1.21.1" +description = "NumPy is the fundamental package for array computing with Python." 
+category = "main" +optional = false +python-versions = ">=3.7" + +[[package]] +name = "packaging" +version = "21.3" +description = "Core utilities for Python packages" +category = "dev" +optional = false +python-versions = ">=3.6" + +[package.dependencies] +pyparsing = ">=2.0.2,<3.0.5 || >3.0.5" + +[[package]] +name = "pandas" +version = "1.3.5" +description = "Powerful data structures for data analysis, time series, and statistics" +category = "main" +optional = false +python-versions = ">=3.7.1" + +[package.dependencies] +numpy = [ + {version = ">=1.17.3", markers = "platform_machine != \"aarch64\" and platform_machine != \"arm64\" and python_version < \"3.10\""}, + {version = ">=1.19.2", markers = "platform_machine == \"aarch64\" and python_version < \"3.10\""}, + {version = ">=1.20.0", markers = "platform_machine == \"arm64\" and python_version < \"3.10\""}, + {version = ">=1.21.0", markers = "python_version >= \"3.10\""}, +] +python-dateutil = ">=2.7.3" +pytz = ">=2017.3" + +[package.extras] +test = ["hypothesis (>=3.58)", "pytest (>=6.0)", "pytest-xdist"] + +[[package]] +name = "pdtypes" +version = "0.0.4" +description = "Show data types for pandas data frames in terminal and notebooks" +category = "main" +optional = true +python-versions = ">=3.7.1,<4.0.0" + +[package.dependencies] +pandas = ">=1.2,<2.0" + +[[package]] +name = "pipda" +version = "0.5.7" +description = "A framework for data piping in python" +category = "main" +optional = false +python-versions = ">=3.7,<4.0" + +[package.dependencies] +diot = "*" +executing = "*" +pure_eval = "<1.0.0" +varname = "*" + +[[package]] +name = "pluggy" +version = "1.0.0" +description = "plugin and hook calling mechanisms for python" +category = "dev" +optional = false +python-versions = ">=3.6" + +[package.dependencies] +importlib-metadata = {version = ">=0.12", markers = "python_version < \"3.8\""} + +[package.extras] +dev = ["pre-commit", "tox"] +testing = ["pytest", "pytest-benchmark"] + +[[package]] +name = 
"pure-eval" +version = "0.2.2" +description = "Safely evaluate AST nodes without side effects" +category = "main" +optional = false +python-versions = "*" + +[package.extras] +tests = ["pytest"] + +[[package]] +name = "py" +version = "1.11.0" +description = "library with cross-python path, ini-parsing, io, code, log facilities" +category = "dev" +optional = false +python-versions = ">=2.7, !=3.0.*, !=3.1.*, !=3.2.*, !=3.3.*, !=3.4.*" + +[[package]] +name = "pyparsing" +version = "3.0.7" +description = "Python parsing module" +category = "dev" +optional = false +python-versions = ">=3.6" + +[package.extras] +diagrams = ["jinja2", "railroad-diagrams"] + +[[package]] +name = "pytest" +version = "7.0.1" +description = "pytest: simple powerful testing with Python" +category = "dev" +optional = false +python-versions = ">=3.6" + +[package.dependencies] +atomicwrites = {version = ">=1.0", markers = "sys_platform == \"win32\""} +attrs = ">=19.2.0" +colorama = {version = "*", markers = "sys_platform == \"win32\""} +importlib-metadata = {version = ">=0.12", markers = "python_version < \"3.8\""} +iniconfig = "*" +packaging = "*" +pluggy = ">=0.12,<2.0" +py = ">=1.8.2" +tomli = ">=1.0.0" + +[package.extras] +testing = ["argcomplete", "hypothesis (>=3.56)", "mock", "nose", "pygments (>=2.7.2)", "requests", "xmlschema"] + +[[package]] +name = "pytest-cov" +version = "3.0.0" +description = "Pytest plugin for measuring coverage." 
+category = "dev" +optional = false +python-versions = ">=3.6" + +[package.dependencies] +coverage = {version = ">=5.2.1", extras = ["toml"]} +pytest = ">=4.6" + +[package.extras] +testing = ["fields", "hunter", "process-tests", "six", "pytest-xdist", "virtualenv"] + +[[package]] +name = "pytest-forked" +version = "1.4.0" +description = "run tests in isolated forked subprocesses" +category = "dev" +optional = false +python-versions = ">=3.6" + +[package.dependencies] +py = "*" +pytest = ">=3.10" + +[[package]] +name = "pytest-xdist" +version = "2.5.0" +description = "pytest xdist plugin for distributed testing and loop-on-failing modes" +category = "dev" +optional = false +python-versions = ">=3.6" + +[package.dependencies] +execnet = ">=1.1" +pytest = ">=6.2.0" +pytest-forked = "*" + +[package.extras] +psutil = ["psutil (>=3.0)"] +setproctitle = ["setproctitle"] +testing = ["filelock"] + +[[package]] +name = "python-dateutil" +version = "2.8.2" +description = "Extensions to the standard Python datetime module" +category = "main" +optional = false +python-versions = "!=3.0.*,!=3.1.*,!=3.2.*,>=2.7" + +[package.dependencies] +six = ">=1.5" + +[[package]] +name = "python-slugify" +version = "6.1.1" +description = "A Python slugify application that also handles Unicode" +category = "main" +optional = true +python-versions = ">=2.7, !=3.0.*, !=3.1.*, !=3.2.*, !=3.3.*, !=3.4.*, !=3.5.*" + +[package.dependencies] +text-unidecode = ">=1.3" + +[package.extras] +unidecode = ["Unidecode (>=1.1.1)"] + +[[package]] +name = "pytz" +version = "2021.3" +description = "World timezone definitions, modern and historical" +category = "main" +optional = false +python-versions = "*" + +[[package]] +name = "scipy" +version = "1.6.1" +description = "SciPy: Scientific Library for Python" +category = "main" +optional = true +python-versions = ">=3.7" + +[package.dependencies] +numpy = ">=1.16.5" + +[[package]] +name = "six" +version = "1.16.0" +description = "Python 2 and 3 compatibility 
utilities" +category = "main" +optional = false +python-versions = ">=2.7, !=3.0.*, !=3.1.*, !=3.2.*" + +[[package]] +name = "text-unidecode" +version = "1.3" +description = "The most basic Text::Unidecode port" +category = "main" +optional = true +python-versions = "*" + +[[package]] +name = "toml" +version = "0.10.2" +description = "Python Library for Tom's Obvious, Minimal Language" +category = "main" +optional = false +python-versions = ">=2.6, !=3.0.*, !=3.1.*, !=3.2.*" + +[[package]] +name = "tomli" +version = "2.0.1" +description = "A lil' TOML parser" +category = "dev" +optional = false +python-versions = ">=3.7" + +[[package]] +name = "typing-extensions" +version = "4.1.1" +description = "Backported and Experimental Type Hints for Python 3.6+" +category = "main" +optional = false +python-versions = ">=3.6" + +[[package]] +name = "varname" +version = "0.8.2" +description = "Dark magics about variable names in python." +category = "main" +optional = false +python-versions = ">=3.6,<4.0" + +[package.dependencies] +asttokens = ">=2.0.0,<3.0.0" +executing = "*" +pure_eval = "<1.0.0" + +[[package]] +name = "wcwidth" +version = "0.2.5" +description = "Measures the displayed width of unicode strings in a terminal" +category = "main" +optional = true +python-versions = "*" + +[[package]] +name = "zipp" +version = "3.7.0" +description = "Backport of pathlib-compatible object wrapper for zip files" +category = "main" +optional = false +python-versions = ">=3.7" + +[package.extras] +docs = ["sphinx", "jaraco.packaging (>=8.2)", "rst.linker (>=1.9)"] +testing = ["pytest (>=6)", "pytest-checkdocs (>=2.4)", "pytest-flake8", "pytest-cov", "pytest-enabler (>=1.0.1)", "jaraco.itertools", "func-timeout", "pytest-black (>=0.3.7)", "pytest-mypy"] + +[metadata] +lock-version = "1.1" +python-versions = "^3.7.1" # align with pandas +content-hash = "5ba5c8a1a5f0b37b41aae63d8c8e6e03830927b22d1e7d318f9b210432e5b449" + +[metadata.files] +asttokens = [ + {file = 
"asttokens-2.0.5-py2.py3-none-any.whl", hash = "sha256:0844691e88552595a6f4a4281a9f7f79b8dd45ca4ccea82e5e05b4bbdb76705c"}, + {file = "asttokens-2.0.5.tar.gz", hash = "sha256:9a54c114f02c7a9480d56550932546a3f1fe71d8a02f1bc7ccd0ee3ee35cf4d5"}, +] +atomicwrites = [ + {file = "atomicwrites-1.4.0-py2.py3-none-any.whl", hash = "sha256:6d1784dea7c0c8d4a5172b6c620f40b6e4cbfdf96d783691f2e1302a7b88e197"}, + {file = "atomicwrites-1.4.0.tar.gz", hash = "sha256:ae70396ad1a434f9c7046fd2dd196fc04b12f9e91ffb859164193be8b6168a7a"}, +] +attrs = [ + {file = "attrs-21.4.0-py2.py3-none-any.whl", hash = "sha256:2d27e3784d7a565d36ab851fe94887c5eccd6a463168875832a1be79c82828b4"}, + {file = "attrs-21.4.0.tar.gz", hash = "sha256:626ba8234211db98e869df76230a137c4c40a12d72445c45d5f5b716f076e2fd"}, +] +colorama = [ + {file = "colorama-0.4.4-py2.py3-none-any.whl", hash = "sha256:9f47eda37229f68eee03b24b9748937c7dc3868f906e8ba69fbcbdd3bc5dc3e2"}, + {file = "colorama-0.4.4.tar.gz", hash = "sha256:5941b2b48a20143d2267e95b1c2a7603ce057ee39fd88e7329b0c292aa16869b"}, +] +coverage = [ + {file = "coverage-6.3.2-cp310-cp310-macosx_10_9_x86_64.whl", hash = "sha256:9b27d894748475fa858f9597c0ee1d4829f44683f3813633aaf94b19cb5453cf"}, + {file = "coverage-6.3.2-cp310-cp310-macosx_11_0_arm64.whl", hash = "sha256:37d1141ad6b2466a7b53a22e08fe76994c2d35a5b6b469590424a9953155afac"}, + {file = "coverage-6.3.2-cp310-cp310-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:f9987b0354b06d4df0f4d3e0ec1ae76d7ce7cbca9a2f98c25041eb79eec766f1"}, + {file = "coverage-6.3.2-cp310-cp310-manylinux_2_5_i686.manylinux1_i686.manylinux_2_17_i686.manylinux2014_i686.whl", hash = "sha256:26e2deacd414fc2f97dd9f7676ee3eaecd299ca751412d89f40bc01557a6b1b4"}, + {file = "coverage-6.3.2-cp310-cp310-manylinux_2_5_x86_64.manylinux1_x86_64.manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:4dd8bafa458b5c7d061540f1ee9f18025a68e2d8471b3e858a9dad47c8d41903"}, + {file = 
"coverage-6.3.2-cp310-cp310-musllinux_1_1_aarch64.whl", hash = "sha256:46191097ebc381fbf89bdce207a6c107ac4ec0890d8d20f3360345ff5976155c"}, + {file = "coverage-6.3.2-cp310-cp310-musllinux_1_1_i686.whl", hash = "sha256:6f89d05e028d274ce4fa1a86887b071ae1755082ef94a6740238cd7a8178804f"}, + {file = "coverage-6.3.2-cp310-cp310-musllinux_1_1_x86_64.whl", hash = "sha256:58303469e9a272b4abdb9e302a780072c0633cdcc0165db7eec0f9e32f901e05"}, + {file = "coverage-6.3.2-cp310-cp310-win32.whl", hash = "sha256:2fea046bfb455510e05be95e879f0e768d45c10c11509e20e06d8fcaa31d9e39"}, + {file = "coverage-6.3.2-cp310-cp310-win_amd64.whl", hash = "sha256:a2a8b8bcc399edb4347a5ca8b9b87e7524c0967b335fbb08a83c8421489ddee1"}, + {file = "coverage-6.3.2-cp37-cp37m-macosx_10_9_x86_64.whl", hash = "sha256:f1555ea6d6da108e1999b2463ea1003fe03f29213e459145e70edbaf3e004aaa"}, + {file = "coverage-6.3.2-cp37-cp37m-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:e5f4e1edcf57ce94e5475fe09e5afa3e3145081318e5fd1a43a6b4539a97e518"}, + {file = "coverage-6.3.2-cp37-cp37m-manylinux_2_5_i686.manylinux1_i686.manylinux_2_17_i686.manylinux2014_i686.whl", hash = "sha256:7a15dc0a14008f1da3d1ebd44bdda3e357dbabdf5a0b5034d38fcde0b5c234b7"}, + {file = "coverage-6.3.2-cp37-cp37m-manylinux_2_5_x86_64.manylinux1_x86_64.manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:21b7745788866028adeb1e0eca3bf1101109e2dc58456cb49d2d9b99a8c516e6"}, + {file = "coverage-6.3.2-cp37-cp37m-musllinux_1_1_aarch64.whl", hash = "sha256:8ce257cac556cb03be4a248d92ed36904a59a4a5ff55a994e92214cde15c5bad"}, + {file = "coverage-6.3.2-cp37-cp37m-musllinux_1_1_i686.whl", hash = "sha256:b0be84e5a6209858a1d3e8d1806c46214e867ce1b0fd32e4ea03f4bd8b2e3359"}, + {file = "coverage-6.3.2-cp37-cp37m-musllinux_1_1_x86_64.whl", hash = "sha256:acf53bc2cf7282ab9b8ba346746afe703474004d9e566ad164c91a7a59f188a4"}, + {file = "coverage-6.3.2-cp37-cp37m-win32.whl", hash = "sha256:8bdde1177f2311ee552f47ae6e5aa7750c0e3291ca6b75f71f7ffe1f1dab3dca"}, 
+ {file = "coverage-6.3.2-cp37-cp37m-win_amd64.whl", hash = "sha256:b31651d018b23ec463e95cf10070d0b2c548aa950a03d0b559eaa11c7e5a6fa3"}, + {file = "coverage-6.3.2-cp38-cp38-macosx_10_9_x86_64.whl", hash = "sha256:07e6db90cd9686c767dcc593dff16c8c09f9814f5e9c51034066cad3373b914d"}, + {file = "coverage-6.3.2-cp38-cp38-macosx_11_0_arm64.whl", hash = "sha256:2c6dbb42f3ad25760010c45191e9757e7dce981cbfb90e42feef301d71540059"}, + {file = "coverage-6.3.2-cp38-cp38-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:c76aeef1b95aff3905fb2ae2d96e319caca5b76fa41d3470b19d4e4a3a313512"}, + {file = "coverage-6.3.2-cp38-cp38-manylinux_2_5_i686.manylinux1_i686.manylinux_2_17_i686.manylinux2014_i686.whl", hash = "sha256:8cf5cfcb1521dc3255d845d9dca3ff204b3229401994ef8d1984b32746bb45ca"}, + {file = "coverage-6.3.2-cp38-cp38-manylinux_2_5_x86_64.manylinux1_x86_64.manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:8fbbdc8d55990eac1b0919ca69eb5a988a802b854488c34b8f37f3e2025fa90d"}, + {file = "coverage-6.3.2-cp38-cp38-musllinux_1_1_aarch64.whl", hash = "sha256:ec6bc7fe73a938933d4178c9b23c4e0568e43e220aef9472c4f6044bfc6dd0f0"}, + {file = "coverage-6.3.2-cp38-cp38-musllinux_1_1_i686.whl", hash = "sha256:9baff2a45ae1f17c8078452e9e5962e518eab705e50a0aa8083733ea7d45f3a6"}, + {file = "coverage-6.3.2-cp38-cp38-musllinux_1_1_x86_64.whl", hash = "sha256:fd9e830e9d8d89b20ab1e5af09b32d33e1a08ef4c4e14411e559556fd788e6b2"}, + {file = "coverage-6.3.2-cp38-cp38-win32.whl", hash = "sha256:f7331dbf301b7289013175087636bbaf5b2405e57259dd2c42fdcc9fcc47325e"}, + {file = "coverage-6.3.2-cp38-cp38-win_amd64.whl", hash = "sha256:68353fe7cdf91f109fc7d474461b46e7f1f14e533e911a2a2cbb8b0fc8613cf1"}, + {file = "coverage-6.3.2-cp39-cp39-macosx_10_9_x86_64.whl", hash = "sha256:b78e5afb39941572209f71866aa0b206c12f0109835aa0d601e41552f9b3e620"}, + {file = "coverage-6.3.2-cp39-cp39-macosx_11_0_arm64.whl", hash = "sha256:4e21876082ed887baed0146fe222f861b5815455ada3b33b890f4105d806128d"}, + {file = 
"coverage-6.3.2-cp39-cp39-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:34626a7eee2a3da12af0507780bb51eb52dca0e1751fd1471d0810539cefb536"}, + {file = "coverage-6.3.2-cp39-cp39-manylinux_2_5_i686.manylinux1_i686.manylinux_2_17_i686.manylinux2014_i686.whl", hash = "sha256:1ebf730d2381158ecf3dfd4453fbca0613e16eaa547b4170e2450c9707665ce7"}, + {file = "coverage-6.3.2-cp39-cp39-manylinux_2_5_x86_64.manylinux1_x86_64.manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:dd6fe30bd519694b356cbfcaca9bd5c1737cddd20778c6a581ae20dc8c04def2"}, + {file = "coverage-6.3.2-cp39-cp39-musllinux_1_1_aarch64.whl", hash = "sha256:96f8a1cb43ca1422f36492bebe63312d396491a9165ed3b9231e778d43a7fca4"}, + {file = "coverage-6.3.2-cp39-cp39-musllinux_1_1_i686.whl", hash = "sha256:dd035edafefee4d573140a76fdc785dc38829fe5a455c4bb12bac8c20cfc3d69"}, + {file = "coverage-6.3.2-cp39-cp39-musllinux_1_1_x86_64.whl", hash = "sha256:5ca5aeb4344b30d0bec47481536b8ba1181d50dbe783b0e4ad03c95dc1296684"}, + {file = "coverage-6.3.2-cp39-cp39-win32.whl", hash = "sha256:f5fa5803f47e095d7ad8443d28b01d48c0359484fec1b9d8606d0e3282084bc4"}, + {file = "coverage-6.3.2-cp39-cp39-win_amd64.whl", hash = "sha256:9548f10d8be799551eb3a9c74bbf2b4934ddb330e08a73320123c07f95cc2d92"}, + {file = "coverage-6.3.2-pp36.pp37.pp38-none-any.whl", hash = "sha256:18d520c6860515a771708937d2f78f63cc47ab3b80cb78e86573b0a760161faf"}, + {file = "coverage-6.3.2.tar.gz", hash = "sha256:03e2a7826086b91ef345ff18742ee9fc47a6839ccd517061ef8fa1976e652ce9"}, +] +diot = [ + {file = "diot-0.1.5-py3-none-any.whl", hash = "sha256:f5e90a405064c09873130240b0c3a2ba9a480e754611a74f93599f84ec0a28b9"}, + {file = "diot-0.1.5.tar.gz", hash = "sha256:a8adc50e2d8e2a1d03ed017ecae98eb09a7ebb3bd0a5fbd44cbfb222e5a71bb4"}, +] +execnet = [ + {file = "execnet-1.9.0-py2.py3-none-any.whl", hash = "sha256:a295f7cc774947aac58dde7fdc85f4aa00c42adf5d8f5468fc630c1acf30a142"}, + {file = "execnet-1.9.0.tar.gz", hash = 
"sha256:8f694f3ba9cc92cab508b152dcfe322153975c29bda272e2fd7f3f00f36e47c5"}, +] +executing = [ + {file = "executing-0.8.3-py2.py3-none-any.whl", hash = "sha256:d1eef132db1b83649a3905ca6dd8897f71ac6f8cac79a7e58a1a09cf137546c9"}, + {file = "executing-0.8.3.tar.gz", hash = "sha256:c6554e21c6b060590a6d3be4b82fb78f8f0194d809de5ea7df1c093763311501"}, +] +importlib-metadata = [ + {file = "importlib_metadata-4.11.2-py3-none-any.whl", hash = "sha256:d16e8c1deb60de41b8e8ed21c1a7b947b0bc62fab7e1d470bcdf331cea2e6735"}, + {file = "importlib_metadata-4.11.2.tar.gz", hash = "sha256:b36ffa925fe3139b2f6ff11d6925ffd4fa7bc47870165e3ac260ac7b4f91e6ac"}, +] +inflection = [ + {file = "inflection-0.5.1-py2.py3-none-any.whl", hash = "sha256:f38b2b640938a4f35ade69ac3d053042959b62a0f1076a5bbaa1b9526605a8a2"}, + {file = "inflection-0.5.1.tar.gz", hash = "sha256:1a29730d366e996aaacffb2f1f1cb9593dc38e2ddd30c91250c6dde09ea9b417"}, +] +iniconfig = [ + {file = "iniconfig-1.1.1-py2.py3-none-any.whl", hash = "sha256:011e24c64b7f47f6ebd835bb12a743f2fbe9a26d4cecaa7f53bc4f35ee9da8b3"}, + {file = "iniconfig-1.1.1.tar.gz", hash = "sha256:bc3af051d7d14b2ee5ef9969666def0cd1a000e121eaea580d4a313df4b37f32"}, +] +numpy = [ + {file = "numpy-1.21.1-cp37-cp37m-macosx_10_9_x86_64.whl", hash = "sha256:38e8648f9449a549a7dfe8d8755a5979b45b3538520d1e735637ef28e8c2dc50"}, + {file = "numpy-1.21.1-cp37-cp37m-manylinux_2_12_i686.manylinux2010_i686.whl", hash = "sha256:fd7d7409fa643a91d0a05c7554dd68aa9c9bb16e186f6ccfe40d6e003156e33a"}, + {file = "numpy-1.21.1-cp37-cp37m-manylinux_2_12_x86_64.manylinux2010_x86_64.whl", hash = "sha256:a75b4498b1e93d8b700282dc8e655b8bd559c0904b3910b144646dbbbc03e062"}, + {file = "numpy-1.21.1-cp37-cp37m-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:1412aa0aec3e00bc23fbb8664d76552b4efde98fb71f60737c83efbac24112f1"}, + {file = "numpy-1.21.1-cp37-cp37m-manylinux_2_5_i686.manylinux1_i686.whl", hash = "sha256:e46ceaff65609b5399163de5893d8f2a82d3c77d5e56d976c8b5fb01faa6b671"}, 
+ {file = "numpy-1.21.1-cp37-cp37m-manylinux_2_5_x86_64.manylinux1_x86_64.whl", hash = "sha256:c6a2324085dd52f96498419ba95b5777e40b6bcbc20088fddb9e8cbb58885e8e"}, + {file = "numpy-1.21.1-cp37-cp37m-win32.whl", hash = "sha256:73101b2a1fef16602696d133db402a7e7586654682244344b8329cdcbbb82172"}, + {file = "numpy-1.21.1-cp37-cp37m-win_amd64.whl", hash = "sha256:7a708a79c9a9d26904d1cca8d383bf869edf6f8e7650d85dbc77b041e8c5a0f8"}, + {file = "numpy-1.21.1-cp38-cp38-macosx_10_9_universal2.whl", hash = "sha256:95b995d0c413f5d0428b3f880e8fe1660ff9396dcd1f9eedbc311f37b5652e16"}, + {file = "numpy-1.21.1-cp38-cp38-macosx_10_9_x86_64.whl", hash = "sha256:635e6bd31c9fb3d475c8f44a089569070d10a9ef18ed13738b03049280281267"}, + {file = "numpy-1.21.1-cp38-cp38-macosx_11_0_arm64.whl", hash = "sha256:4a3d5fb89bfe21be2ef47c0614b9c9c707b7362386c9a3ff1feae63e0267ccb6"}, + {file = "numpy-1.21.1-cp38-cp38-manylinux_2_12_i686.manylinux2010_i686.whl", hash = "sha256:8a326af80e86d0e9ce92bcc1e65c8ff88297de4fa14ee936cb2293d414c9ec63"}, + {file = "numpy-1.21.1-cp38-cp38-manylinux_2_12_x86_64.manylinux2010_x86_64.whl", hash = "sha256:791492091744b0fe390a6ce85cc1bf5149968ac7d5f0477288f78c89b385d9af"}, + {file = "numpy-1.21.1-cp38-cp38-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:0318c465786c1f63ac05d7c4dbcecd4d2d7e13f0959b01b534ea1e92202235c5"}, + {file = "numpy-1.21.1-cp38-cp38-manylinux_2_5_i686.manylinux1_i686.whl", hash = "sha256:9a513bd9c1551894ee3d31369f9b07460ef223694098cf27d399513415855b68"}, + {file = "numpy-1.21.1-cp38-cp38-manylinux_2_5_x86_64.manylinux1_x86_64.whl", hash = "sha256:91c6f5fc58df1e0a3cc0c3a717bb3308ff850abdaa6d2d802573ee2b11f674a8"}, + {file = "numpy-1.21.1-cp38-cp38-win32.whl", hash = "sha256:978010b68e17150db8765355d1ccdd450f9fc916824e8c4e35ee620590e234cd"}, + {file = "numpy-1.21.1-cp38-cp38-win_amd64.whl", hash = "sha256:9749a40a5b22333467f02fe11edc98f022133ee1bfa8ab99bda5e5437b831214"}, + {file = "numpy-1.21.1-cp39-cp39-macosx_10_9_universal2.whl", 
hash = "sha256:d7a4aeac3b94af92a9373d6e77b37691b86411f9745190d2c351f410ab3a791f"}, + {file = "numpy-1.21.1-cp39-cp39-macosx_10_9_x86_64.whl", hash = "sha256:d9e7912a56108aba9b31df688a4c4f5cb0d9d3787386b87d504762b6754fbb1b"}, + {file = "numpy-1.21.1-cp39-cp39-macosx_11_0_arm64.whl", hash = "sha256:25b40b98ebdd272bc3020935427a4530b7d60dfbe1ab9381a39147834e985eac"}, + {file = "numpy-1.21.1-cp39-cp39-manylinux_2_12_i686.manylinux2010_i686.whl", hash = "sha256:8a92c5aea763d14ba9d6475803fc7904bda7decc2a0a68153f587ad82941fec1"}, + {file = "numpy-1.21.1-cp39-cp39-manylinux_2_12_x86_64.manylinux2010_x86_64.whl", hash = "sha256:05a0f648eb28bae4bcb204e6fd14603de2908de982e761a2fc78efe0f19e96e1"}, + {file = "numpy-1.21.1-cp39-cp39-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:f01f28075a92eede918b965e86e8f0ba7b7797a95aa8d35e1cc8821f5fc3ad6a"}, + {file = "numpy-1.21.1-cp39-cp39-win32.whl", hash = "sha256:88c0b89ad1cc24a5efbb99ff9ab5db0f9a86e9cc50240177a571fbe9c2860ac2"}, + {file = "numpy-1.21.1-cp39-cp39-win_amd64.whl", hash = "sha256:01721eefe70544d548425a07c80be8377096a54118070b8a62476866d5208e33"}, + {file = "numpy-1.21.1-pp37-pypy37_pp73-manylinux_2_12_x86_64.manylinux2010_x86_64.whl", hash = "sha256:2d4d1de6e6fb3d28781c73fbde702ac97f03d79e4ffd6598b880b2d95d62ead4"}, + {file = "numpy-1.21.1.zip", hash = "sha256:dff4af63638afcc57a3dfb9e4b26d434a7a602d225b42d746ea7fe2edf1342fd"}, +] +packaging = [ + {file = "packaging-21.3-py3-none-any.whl", hash = "sha256:ef103e05f519cdc783ae24ea4e2e0f508a9c99b2d4969652eed6a2e1ea5bd522"}, + {file = "packaging-21.3.tar.gz", hash = "sha256:dd47c42927d89ab911e606518907cc2d3a1f38bbd026385970643f9c5b8ecfeb"}, +] +pandas = [ + {file = "pandas-1.3.5-cp310-cp310-macosx_10_9_universal2.whl", hash = "sha256:62d5b5ce965bae78f12c1c0df0d387899dd4211ec0bdc52822373f13a3a022b9"}, + {file = "pandas-1.3.5-cp310-cp310-macosx_10_9_x86_64.whl", hash = "sha256:adfeb11be2d54f275142c8ba9bf67acee771b7186a5745249c7d5a06c670136b"}, + {file = 
"pandas-1.3.5-cp310-cp310-macosx_11_0_arm64.whl", hash = "sha256:60a8c055d58873ad81cae290d974d13dd479b82cbb975c3e1fa2cf1920715296"}, + {file = "pandas-1.3.5-cp310-cp310-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:fd541ab09e1f80a2a1760032d665f6e032d8e44055d602d65eeea6e6e85498cb"}, + {file = "pandas-1.3.5-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:2651d75b9a167cc8cc572cf787ab512d16e316ae00ba81874b560586fa1325e0"}, + {file = "pandas-1.3.5-cp310-cp310-win_amd64.whl", hash = "sha256:aaf183a615ad790801fa3cf2fa450e5b6d23a54684fe386f7e3208f8b9bfbef6"}, + {file = "pandas-1.3.5-cp37-cp37m-macosx_10_9_x86_64.whl", hash = "sha256:344295811e67f8200de2390093aeb3c8309f5648951b684d8db7eee7d1c81fb7"}, + {file = "pandas-1.3.5-cp37-cp37m-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:552020bf83b7f9033b57cbae65589c01e7ef1544416122da0c79140c93288f56"}, + {file = "pandas-1.3.5-cp37-cp37m-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:5cce0c6bbeb266b0e39e35176ee615ce3585233092f685b6a82362523e59e5b4"}, + {file = "pandas-1.3.5-cp37-cp37m-manylinux_2_5_i686.manylinux1_i686.manylinux_2_17_i686.manylinux2014_i686.whl", hash = "sha256:7d28a3c65463fd0d0ba8bbb7696b23073efee0510783340a44b08f5e96ffce0c"}, + {file = "pandas-1.3.5-cp37-cp37m-win32.whl", hash = "sha256:a62949c626dd0ef7de11de34b44c6475db76995c2064e2d99c6498c3dba7fe58"}, + {file = "pandas-1.3.5-cp37-cp37m-win_amd64.whl", hash = "sha256:8025750767e138320b15ca16d70d5cdc1886e8f9cc56652d89735c016cd8aea6"}, + {file = "pandas-1.3.5-cp38-cp38-macosx_10_9_x86_64.whl", hash = "sha256:fe95bae4e2d579812865db2212bb733144e34d0c6785c0685329e5b60fcb85dd"}, + {file = "pandas-1.3.5-cp38-cp38-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:5f261553a1e9c65b7a310302b9dbac31cf0049a51695c14ebe04e4bfd4a96f02"}, + {file = "pandas-1.3.5-cp38-cp38-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = 
"sha256:8b6dbec5f3e6d5dc80dcfee250e0a2a652b3f28663492f7dab9a24416a48ac39"}, + {file = "pandas-1.3.5-cp38-cp38-manylinux_2_5_i686.manylinux1_i686.manylinux_2_17_i686.manylinux2014_i686.whl", hash = "sha256:d3bc49af96cd6285030a64779de5b3688633a07eb75c124b0747134a63f4c05f"}, + {file = "pandas-1.3.5-cp38-cp38-win32.whl", hash = "sha256:b6b87b2fb39e6383ca28e2829cddef1d9fc9e27e55ad91ca9c435572cdba51bf"}, + {file = "pandas-1.3.5-cp38-cp38-win_amd64.whl", hash = "sha256:a395692046fd8ce1edb4c6295c35184ae0c2bbe787ecbe384251da609e27edcb"}, + {file = "pandas-1.3.5-cp39-cp39-macosx_10_9_x86_64.whl", hash = "sha256:bd971a3f08b745a75a86c00b97f3007c2ea175951286cdda6abe543e687e5f2f"}, + {file = "pandas-1.3.5-cp39-cp39-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:37f06b59e5bc05711a518aa10beaec10942188dccb48918bb5ae602ccbc9f1a0"}, + {file = "pandas-1.3.5-cp39-cp39-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:2c21778a688d3712d35710501f8001cdbf96eb70a7c587a3d5613573299fdca6"}, + {file = "pandas-1.3.5-cp39-cp39-manylinux_2_5_i686.manylinux1_i686.manylinux_2_17_i686.manylinux2014_i686.whl", hash = "sha256:3345343206546545bc26a05b4602b6a24385b5ec7c75cb6059599e3d56831da2"}, + {file = "pandas-1.3.5-cp39-cp39-win32.whl", hash = "sha256:c69406a2808ba6cf580c2255bcf260b3f214d2664a3a4197d0e640f573b46fd3"}, + {file = "pandas-1.3.5-cp39-cp39-win_amd64.whl", hash = "sha256:32e1a26d5ade11b547721a72f9bfc4bd113396947606e00d5b4a5b79b3dcb006"}, + {file = "pandas-1.3.5.tar.gz", hash = "sha256:1e4285f5de1012de20ca46b188ccf33521bff61ba5c5ebd78b4fb28e5416a9f1"}, +] +pdtypes = [ + {file = "pdtypes-0.0.4-py3-none-any.whl", hash = "sha256:a51ecf8485dff142b1864e132928547350d789b735bfb7e8d87aa90cf464ec88"}, + {file = "pdtypes-0.0.4.tar.gz", hash = "sha256:4f76fac05a785d558b809aa59d2ec13ee22e105267f2bde025007242fe8f4983"}, +] +pipda = [ + {file = "pipda-0.5.7-py3-none-any.whl", hash = "sha256:36b629bd95c92395b0592239c835e92f4dda215a87d7c3300fd5530d52002244"}, + {file = 
"pipda-0.5.7.tar.gz", hash = "sha256:81d2c6e4939d334105f69a810f75b9e6bf725ddda545ba0756dd1dc2a0085bfd"}, +] +pluggy = [ + {file = "pluggy-1.0.0-py2.py3-none-any.whl", hash = "sha256:74134bbf457f031a36d68416e1509f34bd5ccc019f0bcc952c7b909d06b37bd3"}, + {file = "pluggy-1.0.0.tar.gz", hash = "sha256:4224373bacce55f955a878bf9cfa763c1e360858e330072059e10bad68531159"}, +] +pure-eval = [ + {file = "pure_eval-0.2.2-py3-none-any.whl", hash = "sha256:01eaab343580944bc56080ebe0a674b39ec44a945e6d09ba7db3cb8cec289350"}, + {file = "pure_eval-0.2.2.tar.gz", hash = "sha256:2b45320af6dfaa1750f543d714b6d1c520a1688dec6fd24d339063ce0aaa9ac3"}, +] +py = [ + {file = "py-1.11.0-py2.py3-none-any.whl", hash = "sha256:607c53218732647dff4acdfcd50cb62615cedf612e72d1724fb1a0cc6405b378"}, + {file = "py-1.11.0.tar.gz", hash = "sha256:51c75c4126074b472f746a24399ad32f6053d1b34b68d2fa41e558e6f4a98719"}, +] +pyparsing = [ + {file = "pyparsing-3.0.7-py3-none-any.whl", hash = "sha256:a6c06a88f252e6c322f65faf8f418b16213b51bdfaece0524c1c1bc30c63c484"}, + {file = "pyparsing-3.0.7.tar.gz", hash = "sha256:18ee9022775d270c55187733956460083db60b37d0d0fb357445f3094eed3eea"}, +] +pytest = [ + {file = "pytest-7.0.1-py3-none-any.whl", hash = "sha256:9ce3ff477af913ecf6321fe337b93a2c0dcf2a0a1439c43f5452112c1e4280db"}, + {file = "pytest-7.0.1.tar.gz", hash = "sha256:e30905a0c131d3d94b89624a1cc5afec3e0ba2fbdb151867d8e0ebd49850f171"}, +] +pytest-cov = [ + {file = "pytest-cov-3.0.0.tar.gz", hash = "sha256:e7f0f5b1617d2210a2cabc266dfe2f4c75a8d32fb89eafb7ad9d06f6d076d470"}, + {file = "pytest_cov-3.0.0-py3-none-any.whl", hash = "sha256:578d5d15ac4a25e5f961c938b85a05b09fdaae9deef3bb6de9a6e766622ca7a6"}, +] +pytest-forked = [ + {file = "pytest-forked-1.4.0.tar.gz", hash = "sha256:8b67587c8f98cbbadfdd804539ed5455b6ed03802203485dd2f53c1422d7440e"}, + {file = "pytest_forked-1.4.0-py3-none-any.whl", hash = "sha256:bbbb6717efc886b9d64537b41fb1497cfaf3c9601276be8da2cccfea5a3c8ad8"}, +] +pytest-xdist = [ + {file = 
"pytest-xdist-2.5.0.tar.gz", hash = "sha256:4580deca3ff04ddb2ac53eba39d76cb5dd5edeac050cb6fbc768b0dd712b4edf"}, + {file = "pytest_xdist-2.5.0-py3-none-any.whl", hash = "sha256:6fe5c74fec98906deb8f2d2b616b5c782022744978e7bd4695d39c8f42d0ce65"}, +] +python-dateutil = [ + {file = "python-dateutil-2.8.2.tar.gz", hash = "sha256:0123cacc1627ae19ddf3c27a5de5bd67ee4586fbdd6440d9748f8abb483d3e86"}, + {file = "python_dateutil-2.8.2-py2.py3-none-any.whl", hash = "sha256:961d03dc3453ebbc59dbdea9e4e11c5651520a876d0f4db161e8674aae935da9"}, +] +python-slugify = [ + {file = "python-slugify-6.1.1.tar.gz", hash = "sha256:00003397f4e31414e922ce567b3a4da28cf1436a53d332c9aeeb51c7d8c469fd"}, + {file = "python_slugify-6.1.1-py2.py3-none-any.whl", hash = "sha256:8c0016b2d74503eb64761821612d58fcfc729493634b1eb0575d8f5b4aa1fbcf"}, +] +pytz = [ + {file = "pytz-2021.3-py2.py3-none-any.whl", hash = "sha256:3672058bc3453457b622aab7a1c3bfd5ab0bdae451512f6cf25f64ed37f5b87c"}, + {file = "pytz-2021.3.tar.gz", hash = "sha256:acad2d8b20a1af07d4e4c9d2e9285c5ed9104354062f275f3fcd88dcef4f1326"}, +] +scipy = [ + {file = "scipy-1.6.1-cp37-cp37m-macosx_10_9_x86_64.whl", hash = "sha256:a15a1f3fc0abff33e792d6049161b7795909b40b97c6cc2934ed54384017ab76"}, + {file = "scipy-1.6.1-cp37-cp37m-manylinux1_i686.whl", hash = "sha256:e79570979ccdc3d165456dd62041d9556fb9733b86b4b6d818af7a0afc15f092"}, + {file = "scipy-1.6.1-cp37-cp37m-manylinux1_x86_64.whl", hash = "sha256:a423533c55fec61456dedee7b6ee7dce0bb6bfa395424ea374d25afa262be261"}, + {file = "scipy-1.6.1-cp37-cp37m-manylinux2014_aarch64.whl", hash = "sha256:33d6b7df40d197bdd3049d64e8e680227151673465e5d85723b3b8f6b15a6ced"}, + {file = "scipy-1.6.1-cp37-cp37m-win32.whl", hash = "sha256:6725e3fbb47da428794f243864f2297462e9ee448297c93ed1dcbc44335feb78"}, + {file = "scipy-1.6.1-cp37-cp37m-win_amd64.whl", hash = "sha256:5fa9c6530b1661f1370bcd332a1e62ca7881785cc0f80c0d559b636567fab63c"}, + {file = "scipy-1.6.1-cp38-cp38-macosx_10_9_x86_64.whl", hash = 
"sha256:bd50daf727f7c195e26f27467c85ce653d41df4358a25b32434a50d8870fc519"}, + {file = "scipy-1.6.1-cp38-cp38-manylinux1_i686.whl", hash = "sha256:f46dd15335e8a320b0fb4685f58b7471702234cba8bb3442b69a3e1dc329c345"}, + {file = "scipy-1.6.1-cp38-cp38-manylinux1_x86_64.whl", hash = "sha256:0e5b0ccf63155d90da576edd2768b66fb276446c371b73841e3503be1d63fb5d"}, + {file = "scipy-1.6.1-cp38-cp38-manylinux2014_aarch64.whl", hash = "sha256:2481efbb3740977e3c831edfd0bd9867be26387cacf24eb5e366a6a374d3d00d"}, + {file = "scipy-1.6.1-cp38-cp38-win32.whl", hash = "sha256:68cb4c424112cd4be886b4d979c5497fba190714085f46b8ae67a5e4416c32b4"}, + {file = "scipy-1.6.1-cp38-cp38-win_amd64.whl", hash = "sha256:5f331eeed0297232d2e6eea51b54e8278ed8bb10b099f69c44e2558c090d06bf"}, + {file = "scipy-1.6.1-cp39-cp39-macosx_10_9_x86_64.whl", hash = "sha256:0c8a51d33556bf70367452d4d601d1742c0e806cd0194785914daf19775f0e67"}, + {file = "scipy-1.6.1-cp39-cp39-manylinux1_i686.whl", hash = "sha256:83bf7c16245c15bc58ee76c5418e46ea1811edcc2e2b03041b804e46084ab627"}, + {file = "scipy-1.6.1-cp39-cp39-manylinux1_x86_64.whl", hash = "sha256:794e768cc5f779736593046c9714e0f3a5940bc6dcc1dba885ad64cbfb28e9f0"}, + {file = "scipy-1.6.1-cp39-cp39-manylinux2014_aarch64.whl", hash = "sha256:5da5471aed911fe7e52b86bf9ea32fb55ae93e2f0fac66c32e58897cfb02fa07"}, + {file = "scipy-1.6.1-cp39-cp39-win32.whl", hash = "sha256:8e403a337749ed40af60e537cc4d4c03febddcc56cd26e774c9b1b600a70d3e4"}, + {file = "scipy-1.6.1-cp39-cp39-win_amd64.whl", hash = "sha256:a5193a098ae9f29af283dcf0041f762601faf2e595c0db1da929875b7570353f"}, + {file = "scipy-1.6.1.tar.gz", hash = "sha256:c4fceb864890b6168e79b0e714c585dbe2fd4222768ee90bc1aa0f8218691b11"}, +] +six = [ + {file = "six-1.16.0-py2.py3-none-any.whl", hash = "sha256:8abb2f1d86890a2dfb989f9a77cfcfd3e47c2a354b01111771326f8aa26e0254"}, + {file = "six-1.16.0.tar.gz", hash = "sha256:1e61c37477a1626458e36f7b1d82aa5c9b094fa4802892072e49de9c60c4c926"}, +] +text-unidecode = [ + {file = 
"text-unidecode-1.3.tar.gz", hash = "sha256:bad6603bb14d279193107714b288be206cac565dfa49aa5b105294dd5c4aab93"}, + {file = "text_unidecode-1.3-py2.py3-none-any.whl", hash = "sha256:1311f10e8b895935241623731c2ba64f4c455287888b18189350b67134a822e8"}, +] +toml = [ + {file = "toml-0.10.2-py2.py3-none-any.whl", hash = "sha256:806143ae5bfb6a3c6e736a764057db0e6a0e05e338b5630894a5f779cabb4f9b"}, + {file = "toml-0.10.2.tar.gz", hash = "sha256:b3bda1d108d5dd99f4a20d24d9c348e91c4db7ab1b749200bded2f839ccbe68f"}, +] +tomli = [ + {file = "tomli-2.0.1-py3-none-any.whl", hash = "sha256:939de3e7a6161af0c887ef91b7d41a53e7c5a1ca976325f429cb46ea9bc30ecc"}, + {file = "tomli-2.0.1.tar.gz", hash = "sha256:de526c12914f0c550d15924c62d72abc48d6fe7364aa87328337a31007fe8a4f"}, +] +typing-extensions = [ + {file = "typing_extensions-4.1.1-py3-none-any.whl", hash = "sha256:21c85e0fe4b9a155d0799430b0ad741cdce7e359660ccbd8b530613e8df88ce2"}, + {file = "typing_extensions-4.1.1.tar.gz", hash = "sha256:1a9462dcc3347a79b1f1c0271fbe79e844580bb598bafa1ed208b94da3cdcd42"}, +] +varname = [ + {file = "varname-0.8.2-py3-none-any.whl", hash = "sha256:db4d82106a512e67104cdf6fecc0081bf318f810215610e3c9def6551c9e74ef"}, + {file = "varname-0.8.2.tar.gz", hash = "sha256:2df1fdd8945e57e67193c09998f5c9eeeb2d8c1f30f561ce71b94480a846e5d9"}, +] +wcwidth = [ + {file = "wcwidth-0.2.5-py2.py3-none-any.whl", hash = "sha256:beb4802a9cebb9144e99086eff703a642a13d6a0052920003a230f3294bbe784"}, + {file = "wcwidth-0.2.5.tar.gz", hash = "sha256:c4d647b99872929fdb7bdcaa4fbe7f01413ed3d98077df798530e5b04f116c83"}, +] +zipp = [ + {file = "zipp-3.7.0-py3-none-any.whl", hash = "sha256:b47250dd24f92b7dd6a0a8fc5244da14608f3ca90a5efcd37a3b1642fac9a375"}, + {file = "zipp-3.7.0.tar.gz", hash = "sha256:9f50f446828eb9d45b267433fd3e9da8d801f614129124863f9c51ebceafb87d"}, +] diff --git a/pyproject.toml b/pyproject.toml index f23b9a54..e36b6f14 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -1,6 +1,6 @@ [tool.poetry] name = "datar" -version 
= "0.6.3" +version = "0.6.4" description = "Port of dplyr and other related R packages in python, using pipda." authors = ["pwwang "] readme = "README.md" diff --git a/tests/__init__.py b/tests/__init__.py index 810a6be1..1d7d33ac 100644 --- a/tests/__init__.py +++ b/tests/__init__.py @@ -1,6 +1,6 @@ import sys -from pipda import options +from datar import options from datar.base import set_seed -options.warn_astnode_failure = False +options(warn_astnode_failure=False, warn_builtin_names=False) set_seed(8888) diff --git a/tests/dplyr/test_funs.py b/tests/dplyr/test_funs.py index 899295c9..e032cf0a 100644 --- a/tests/dplyr/test_funs.py +++ b/tests/dplyr/test_funs.py @@ -91,8 +91,11 @@ def test_lead_lag_return_x_if_n_eqs_0(): def test_lead_lag_return_all_nas_if_n_eqs_lenx(): - assert lead([1, 2], 2).fillna(0).tolist() == [0.0, 0.0] - assert lag([1, 2], 2).fillna(0).tolist() == [0.0, 0.0] + out = lead([1, 2], 2) + assert_iterable_equal(out, [NA, NA]) + + out = lag([1, 2], 2) + assert_iterable_equal(out, [NA, NA]) def test_cumany_cumall_handle_nas_consistently():