From 62e248e4e9c420a126c4084a328bfb8bf046dc85 Mon Sep 17 00:00:00 2001 From: "Igoshev, Iaroslav" Date: Fri, 2 Feb 2024 19:22:30 +0000 Subject: [PATCH] FEAT-#6908: Remove the warning regarding engine initialization Signed-off-by: Igoshev, Iaroslav --- docs/getting_started/quickstart.rst | 1 + docs/getting_started/troubleshooting.rst | 5 +- .../using_modin/using_modin_locally.rst | 49 - docs/usage_guide/advanced_usage/index.rst | 15 + .../advanced_usage/modin_engines.rst | 76 + .../advanced_usage/modin_xgboost.rst | 2 + docs/usage_guide/benchmarking.rst | 2 + examples/jupyter/integrations/NLTK.ipynb | 1186 +-------------- examples/jupyter/integrations/altair.ipynb | 147 +- .../jupyter/integrations/huggingface.ipynb | 363 +---- .../jupyter/integrations/matplotlib.ipynb | 191 +-- examples/jupyter/integrations/plotly.ipynb | 703 +-------- examples/jupyter/integrations/sklearn.ipynb | 1331 +---------------- .../jupyter/integrations/statsmodels.ipynb | 469 +----- .../jupyter/integrations/tensorflow.ipynb | 579 +------ examples/jupyter/integrations/xgboost.ipynb | 66 +- examples/quickstart.ipynb | 1 + modin/core/execution/dask/common/utils.py | 9 - modin/core/execution/ray/common/utils.py | 9 - modin/core/execution/unidist/common/utils.py | 9 - 20 files changed, 372 insertions(+), 4841 deletions(-) create mode 100644 docs/usage_guide/advanced_usage/modin_engines.rst diff --git a/docs/getting_started/quickstart.rst b/docs/getting_started/quickstart.rst index dc6661bc7ab..c91693bade6 100644 --- a/docs/getting_started/quickstart.rst +++ b/docs/getting_started/quickstart.rst @@ -61,6 +61,7 @@ For the purpose of demonstration, we will load in modin as ``pd`` and pandas as ############################################# import time import ray + # Look at the Ray documentation with respect to the Ray configuration suited to you most. 
ray.init() ############################################# diff --git a/docs/getting_started/troubleshooting.rst b/docs/getting_started/troubleshooting.rst index 85d3b7f4ad0..75f4fc17b6f 100644 --- a/docs/getting_started/troubleshooting.rst +++ b/docs/getting_started/troubleshooting.rst @@ -215,6 +215,7 @@ once Python interpreter is started in them so that to avoid a race condition in import modin.pandas as pd import modin.config as cfg + # Look at the Ray documentation with respect to the Ray configuration suited to you most. ray.init(runtime_env={'env_vars': {'__MODIN_AUTOIMPORT_PANDAS__': '1'}}) pandas_df = pandas.DataFrame( @@ -357,7 +358,9 @@ or cfg.Engine.put("dask") if __name__ == "__main__": - client = Client() # Explicit Dask Client creation. + # Explicit Dask Client creation. + # Look at the Dask Distributed documentation with respect to the Client configuration suited to you most. + client = Client() df = pd.DataFrame([0, 1, 2, 3]) print(df) diff --git a/docs/getting_started/using_modin/using_modin_locally.rst b/docs/getting_started/using_modin/using_modin_locally.rst index d69cf7a6b1e..4d68ef6d8b2 100644 --- a/docs/getting_started/using_modin/using_modin_locally.rst +++ b/docs/getting_started/using_modin/using_modin_locally.rst @@ -23,55 +23,6 @@ just like you would pandas, since the API is identical to pandas. **That's it. You're ready to use Modin on your previous pandas workflows!** -Optional Configurations ------------------------ - -When using Modin locally on a single machine or laptop (without a cluster), Modin will -automatically create and manage a local Dask or Ray cluster for the executing your -code. So when you run an operation for the first time with Modin, you will see a -message like this, indicating that a Modin has automatically initialized a local -cluster for you: - -.. code-block:: python - - df = pd.DataFrame({'col1': [1, 2], 'col2': [3, 4]}) - -.. code-block:: text - - UserWarning: Ray execution environment not yet initialized. 
Initializing... - To remove this warning, run the following python code before doing dataframe operations: - - import ray - ray.init() - - If you prefer to use Dask over Ray as your execution backend, you can use the - following code to modify the default configuration: - -.. code-block:: python - - import modin - modin.config.Engine.put("Dask") - -.. code-block:: python - - df = pd.DataFrame({'col1': [1, 2], 'col2': [3, 4]}) - - -.. code-block:: text - - UserWarning: Dask execution environment not yet initialized. Initializing... - To remove this warning, run the following python code before doing dataframe operations: - - from distributed import Client - - client = Client() - -Finally, if you already have an Ray or Dask engine initialized, Modin will -automatically attach to whichever engine is available. If you are interested in using -Modin with HDK engine, please refer to :doc:`these instructions `. -For additional information on other settings you can configure, see -:doc:`Modin's config ` page for more details. - Advanced: Configuring the resources Modin uses ---------------------------------------------- diff --git a/docs/usage_guide/advanced_usage/index.rst b/docs/usage_guide/advanced_usage/index.rst index 7263036d5d0..35c910acb01 100644 --- a/docs/usage_guide/advanced_usage/index.rst +++ b/docs/usage_guide/advanced_usage/index.rst @@ -12,6 +12,7 @@ Advanced Usage modin_xgboost modin_logging batch + modin_engines .. meta:: :description lang=en: @@ -22,6 +23,16 @@ integrated toolkit for data scientists. We are actively developing data science such as DataFrame spreadsheet integration, DataFrame algebra, progress bars, SQL queries on DataFrames, and more. Join us on `Slack`_ and `Discourse`_ for the latest updates! +Modin engines +------------- + +Modin supports a series of execution engines such as Ray_, Dask_, `MPI through unidist`_, `HDK`_, +each of which might be a more beneficial choice for a specific scenario. 
When doing the first operation +with Modin it automatically initializes one of the engines to further perform distributed/parallel computation. +If you are familiar with a concrete execution engine, it is possible to initialize the engine on your own and +Modin will automatically attach to it. Refer to :doc:`Modin engines </usage_guide/advanced_usage/modin_engines>` page +for more details. + Experimental APIs ----------------- @@ -118,3 +129,7 @@ downloaded as an artifact from the GitHub Actions tab for further inspection. Se .. _`tqdm`: https://github.com/tqdm/tqdm .. _`distributed XGBoost`: https://medium.com/intel-analytics-software/distributed-xgboost-with-modin-on-ray-fc17edef7720 .. _`fuzzydata`: https://github.com/suhailrehman/fuzzydata +.. _Ray: https://github.com/ray-project/ray +.. _Dask: https://github.com/dask/distributed +.. _`MPI through unidist`: https://github.com/modin-project/unidist +.. _HDK: https://github.com/intel-ai/hdk diff --git a/docs/usage_guide/advanced_usage/modin_engines.rst b/docs/usage_guide/advanced_usage/modin_engines.rst new file mode 100644 index 00000000000..d925d4e7e89 --- /dev/null +++ b/docs/usage_guide/advanced_usage/modin_engines.rst @@ -0,0 +1,76 @@ +Modin engines +============= + +As a rule, you don't have to worry about initialization of an execution engine as +Modin itself automatically initializes one when performing the first operation. +Also, Modin has a broad range of :doc:`configuration settings </flow/modin/config>`, which +you can use to configure an execution engine. If there is a reason to initialize an execution engine +on your own and you are sure what to do, Modin will automatically attach to whichever engine is available. +Below, you can find some examples on how to initialize a specific execution engine on your own. + +Ray +--- + +You can initialize Ray engine with a specific number of CPUs (worker processes) to perform computation. + +..
code-block:: python + + import ray + import modin.config as modin_cfg + + ray.init(num_cpus=<N>) + modin_cfg.Engine.put("ray") # Modin will use Ray engine + modin_cfg.CpuCount.put(<N>) + +To get more details on all possible parameters for initialization refer to `Ray documentation`_. + +Dask +---- + +You can initialize Dask engine with a specific number of worker processes and threads per worker to perform computation. + +.. code-block:: python + + from distributed import Client + import modin.config as modin_cfg + + client = Client(n_workers=<N1>, threads_per_worker=<N2>) + modin_cfg.Engine.put("dask") # Modin will use Dask engine + modin_cfg.CpuCount.put(<N1>) + +To get more details on all possible parameters for initialization refer to `Dask Distributed documentation`_. + +MPI through unidist +------------------- + +You can initialize the MPI through unidist engine with a specific number of CPUs (worker processes) to perform computation. + +.. code-block:: python + + import unidist + import unidist.config as unidist_cfg + import modin.config as modin_cfg + + unidist_cfg.Backend.put("mpi") + unidist_cfg.CpuCount.put(<N>) + unidist.init() + + modin_cfg.Engine.put("unidist") # Modin will use MPI through unidist engine + modin_cfg.CpuCount.put(<N>) + +To get more details on all possible parameters for initialization refer to `unidist documentation`_. + +HDK +--- + +For now it is not possible to initialize HDK beforehand. Modin itself initializes it with the required configuration. + +.. code-block:: python + + import modin.config as modin_cfg + + modin_cfg.StorageFormat.put("hdk") # Modin will use HDK engine + +.. _`Ray documentation`: https://docs.ray.io/en/latest +.. _Dask Distributed documentation: https://distributed.dask.org/en/latest +..
_`unidist documentation`: https://unidist.readthedocs.io/en/latest diff --git a/docs/usage_guide/advanced_usage/modin_xgboost.rst b/docs/usage_guide/advanced_usage/modin_xgboost.rst index e77a464a528..af62158e437 100644 --- a/docs/usage_guide/advanced_usage/modin_xgboost.rst +++ b/docs/usage_guide/advanced_usage/modin_xgboost.rst @@ -55,6 +55,7 @@ To start the Ray runtime on a single node: .. code-block:: python import ray + # Look at the Ray documentation with respect to the Ray configuration suited to you most. ray.init() If you already had the Ray cluster you can connect to it by next way: @@ -78,6 +79,7 @@ All processing will be in a `single node` mode. from sklearn import datasets import ray + # Look at the Ray documentation with respect to the Ray configuration suited to you most. ray.init() # Start the Ray runtime for single-node import modin.pandas as pd diff --git a/docs/usage_guide/benchmarking.rst b/docs/usage_guide/benchmarking.rst index 551c9950ae7..f26a9dac3ec 100644 --- a/docs/usage_guide/benchmarking.rst +++ b/docs/usage_guide/benchmarking.rst @@ -35,6 +35,7 @@ Consider the following ipython script: import time import ray + # Look at the Ray documentation with respect to the Ray configuration suited to you most. ray.init() df = pd.DataFrame(list(range(MinPartitionSize.get() * 2))) %time result = df.map(lambda x: time.sleep(0.1) or x) @@ -146,6 +147,7 @@ That will typically block on any asynchronous computation: time.sleep(10) return x + 1 + # Look at the Ray documentation with respect to the Ray configuration suited to you most. 
ray.init() df1 = pd.DataFrame(list(range(10_000)), columns=['A']) result = df1.map(slow_add_one) diff --git a/examples/jupyter/integrations/NLTK.ipynb b/examples/jupyter/integrations/NLTK.ipynb index 0b9a945de38..504d56bcae9 100644 --- a/examples/jupyter/integrations/NLTK.ipynb +++ b/examples/jupyter/integrations/NLTK.ipynb @@ -16,7 +16,7 @@ }, { "cell_type": "code", - "execution_count": 1, + "execution_count": null, "metadata": {}, "outputs": [], "source": [ @@ -29,96 +29,9 @@ }, { "cell_type": "code", - "execution_count": 2, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "UserWarning: Ray execution environment not yet initialized. Initializing...\n", - "To remove this warning, run the following python code before doing dataframe operations:\n", - "\n", - " import ray\n", - " ray.init(runtime_env={'env_vars': {'__MODIN_AUTOIMPORT_PANDAS__': '1'}})\n", - "\n", - "2023-04-05 18:22:43,278\tINFO worker.py:1553 -- Started a local Ray instance.\n" - ] - }, - { - "data": { - "text/html": [ - "
\n", - "\n", - "\n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - "
Unnamed: 0created_atidauthor_idtext
002022-05-16T21:24:35.000Z1526312680226799618813286It’s despicable, it’s dangerous — and it needs...
112022-05-16T21:24:34.000Z1526312678951641088813286We need to repudiate in the strongest terms th...
222022-05-16T21:24:34.000Z1526312677521428480813286This weekend’s shootings in Buffalo offer a tr...
\n", - "
" - ], - "text/plain": [ - " Unnamed: 0 created_at id author_id \\\n", - "0 0 2022-05-16T21:24:35.000Z 1526312680226799618 813286 \n", - "1 1 2022-05-16T21:24:34.000Z 1526312678951641088 813286 \n", - "2 2 2022-05-16T21:24:34.000Z 1526312677521428480 813286 \n", - "\n", - " text \n", - "0 It’s despicable, it’s dangerous — and it needs... \n", - "1 We need to repudiate in the strongest terms th... \n", - "2 This weekend’s shootings in Buffalo offer a tr... " - ] - }, - "execution_count": 2, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "# Import some Tweets from Barack Obama \n", "modin_df = pd.read_csv(\"https://raw.githubusercontent.com/kirenz/twitter-tweepy/main/tweets-obama.csv\")\n", @@ -127,83 +40,9 @@ }, { "cell_type": "code", - "execution_count": 3, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/html": [ - "
\n", - "\n", - "\n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - "
Unnamed: 0created_atidauthor_idtext
002022-05-16T21:24:35.000Z1526312680226799618813286it’s despicable, it’s dangerous — and it needs...
112022-05-16T21:24:34.000Z1526312678951641088813286we need to repudiate in the strongest terms th...
222022-05-16T21:24:34.000Z1526312677521428480813286this weekend’s shootings in buffalo offer a tr...
\n", - "
" - ], - "text/plain": [ - " Unnamed: 0 created_at id author_id \\\n", - "0 0 2022-05-16T21:24:35.000Z 1526312680226799618 813286 \n", - "1 1 2022-05-16T21:24:34.000Z 1526312678951641088 813286 \n", - "2 2 2022-05-16T21:24:34.000Z 1526312677521428480 813286 \n", - "\n", - " text \n", - "0 it’s despicable, it’s dangerous — and it needs... \n", - "1 we need to repudiate in the strongest terms th... \n", - "2 this weekend’s shootings in buffalo offer a tr... " - ] - }, - "execution_count": 3, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "modin_df['text'] = modin_df['text'].astype(str).str.lower()\n", "modin_df.head(3)" @@ -211,92 +50,9 @@ }, { "cell_type": "code", - "execution_count": 4, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/html": [ - "
\n", - "\n", - "\n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - "
Unnamed: 0created_atidauthor_idtexttext_token
002022-05-16T21:24:35.000Z1526312680226799618813286it’s despicable, it’s dangerous — and it needs...[it, s, despicable, it, s, dangerous, and, it,...
112022-05-16T21:24:34.000Z1526312678951641088813286we need to repudiate in the strongest terms th...[we, need, to, repudiate, in, the, strongest, ...
222022-05-16T21:24:34.000Z1526312677521428480813286this weekend’s shootings in buffalo offer a tr...[this, weekend, s, shootings, in, buffalo, off...
\n", - "
" - ], - "text/plain": [ - " Unnamed: 0 created_at id author_id \\\n", - "0 0 2022-05-16T21:24:35.000Z 1526312680226799618 813286 \n", - "1 1 2022-05-16T21:24:34.000Z 1526312678951641088 813286 \n", - "2 2 2022-05-16T21:24:34.000Z 1526312677521428480 813286 \n", - "\n", - " text \\\n", - "0 it’s despicable, it’s dangerous — and it needs... \n", - "1 we need to repudiate in the strongest terms th... \n", - "2 this weekend’s shootings in buffalo offer a tr... \n", - "\n", - " text_token \n", - "0 [it, s, despicable, it, s, dangerous, and, it,... \n", - "1 [we, need, to, repudiate, in, the, strongest, ... \n", - "2 [this, weekend, s, shootings, in, buffalo, off... " - ] - }, - "execution_count": 4, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "regexp = RegexpTokenizer('\\w+')\n", "\n", @@ -306,36 +62,16 @@ }, { "cell_type": "code", - "execution_count": 5, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[nltk_data] Downloading package stopwords to\n", - "[nltk_data] /Users/labanyamukhopadhyay/nltk_data...\n", - "[nltk_data] Package stopwords is already up-to-date!\n" - ] - }, - { - "data": { - "text/plain": [ - "True" - ] - }, - "execution_count": 5, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "nltk.download('stopwords')" ] }, { "cell_type": "code", - "execution_count": 6, + "execution_count": null, "metadata": {}, "outputs": [], "source": [ @@ -349,92 +85,9 @@ }, { "cell_type": "code", - "execution_count": 7, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/html": [ - "
\n", - "\n", - "\n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - "
Unnamed: 0created_atidauthor_idtexttext_token
002022-05-16T21:24:35.000Z1526312680226799618813286it’s despicable, it’s dangerous — and it needs...[despicable, dangerous, needs, stop, co, 0ch2z...
112022-05-16T21:24:34.000Z1526312678951641088813286we need to repudiate in the strongest terms th...[need, repudiate, strongest, terms, politician...
222022-05-16T21:24:34.000Z1526312677521428480813286this weekend’s shootings in buffalo offer a tr...[weekend, shootings, buffalo, offer, tragic, r...
\n", - "
" - ], - "text/plain": [ - " Unnamed: 0 created_at id author_id \\\n", - "0 0 2022-05-16T21:24:35.000Z 1526312680226799618 813286 \n", - "1 1 2022-05-16T21:24:34.000Z 1526312678951641088 813286 \n", - "2 2 2022-05-16T21:24:34.000Z 1526312677521428480 813286 \n", - "\n", - " text \\\n", - "0 it’s despicable, it’s dangerous — and it needs... \n", - "1 we need to repudiate in the strongest terms th... \n", - "2 this weekend’s shootings in buffalo offer a tr... \n", - "\n", - " text_token \n", - "0 [despicable, dangerous, needs, stop, co, 0ch2z... \n", - "1 [need, repudiate, strongest, terms, politician... \n", - "2 [weekend, shootings, buffalo, offer, tragic, r... " - ] - }, - "execution_count": 7, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "# Remove stopwords\n", "modin_df['text_token'] = modin_df['text_token'].apply(lambda x: [item for item in x if item not in stopwords])\n", @@ -443,98 +96,9 @@ }, { "cell_type": "code", - "execution_count": 8, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/html": [ - "
\n", - "\n", - "\n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - "
texttext_tokentext_string
0it’s despicable, it’s dangerous — and it needs...[despicable, dangerous, needs, stop, co, 0ch2z...despicable dangerous needs stop 0ch2zosmhb
1we need to repudiate in the strongest terms th...[need, repudiate, strongest, terms, politician...need repudiate strongest terms politicians med...
2this weekend’s shootings in buffalo offer a tr...[weekend, shootings, buffalo, offer, tragic, r...weekend shootings buffalo offer tragic reminde...
3i’m proud to announce the voyager scholarship ...[proud, announce, voyager, scholarship, friend...proud announce voyager scholarship friend bche...
4across the country, americans are standing up ...[across, country, americans, standing, abortio...across country americans standing abortion rig...
\n", - "
" - ], - "text/plain": [ - " text \\\n", - "0 it’s despicable, it’s dangerous — and it needs... \n", - "1 we need to repudiate in the strongest terms th... \n", - "2 this weekend’s shootings in buffalo offer a tr... \n", - "3 i’m proud to announce the voyager scholarship ... \n", - "4 across the country, americans are standing up ... \n", - "\n", - " text_token \\\n", - "0 [despicable, dangerous, needs, stop, co, 0ch2z... \n", - "1 [need, repudiate, strongest, terms, politician... \n", - "2 [weekend, shootings, buffalo, offer, tragic, r... \n", - "3 [proud, announce, voyager, scholarship, friend... \n", - "4 [across, country, americans, standing, abortio... \n", - "\n", - " text_string \n", - "0 despicable dangerous needs stop 0ch2zosmhb \n", - "1 need repudiate strongest terms politicians med... \n", - "2 weekend shootings buffalo offer tragic reminde... \n", - "3 proud announce voyager scholarship friend bche... \n", - "4 across country americans standing abortion rig... " - ] - }, - "execution_count": 8, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "modin_df['text_string'] = modin_df['text_token'].apply(lambda x: ' '.join([item for item in x if len(item)>2]))\n", "modin_df[['text', 'text_token', 'text_string']].head()" @@ -542,36 +106,16 @@ }, { "cell_type": "code", - "execution_count": 9, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[nltk_data] Downloading package punkt to\n", - "[nltk_data] /Users/labanyamukhopadhyay/nltk_data...\n", - "[nltk_data] Package punkt is already up-to-date!\n" - ] - }, - { - "data": { - "text/plain": [ - "True" - ] - }, - "execution_count": 9, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "nltk.download('punkt')" ] }, { "cell_type": "code", - "execution_count": 10, + "execution_count": null, "metadata": {}, "outputs": [], "source": [ @@ -581,20 +125,9 @@ }, { 
"cell_type": "code", - "execution_count": 11, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "FreqDist({'need': 2, 'americans': 2, 'proud': 2, 'despicable': 1, 'dangerous': 1, 'needs': 1, 'stop': 1, '0ch2zosmhb': 1, 'repudiate': 1, 'strongest': 1, ...})" - ] - }, - "execution_count": 11, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "from nltk.probability import FreqDist\n", "\n", @@ -604,111 +137,9 @@ }, { "cell_type": "code", - "execution_count": 12, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/html": [ - "
\n", - "\n", - "\n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - "
texttext_tokentext_stringtext_string_fdist
0it’s despicable, it’s dangerous — and it needs...[despicable, dangerous, needs, stop, co, 0ch2z...despicable dangerous needs stop 0ch2zosmhbdespicable dangerous needs stop 0ch2zosmhb
1we need to repudiate in the strongest terms th...[need, repudiate, strongest, terms, politician...need repudiate strongest terms politicians med...need repudiate strongest terms politicians med...
2this weekend’s shootings in buffalo offer a tr...[weekend, shootings, buffalo, offer, tragic, r...weekend shootings buffalo offer tragic reminde...weekend shootings buffalo offer tragic reminde...
3i’m proud to announce the voyager scholarship ...[proud, announce, voyager, scholarship, friend...proud announce voyager scholarship friend bche...proud announce voyager scholarship friend bche...
4across the country, americans are standing up ...[across, country, americans, standing, abortio...across country americans standing abortion rig...across country americans standing abortion rig...
\n", - "
" - ], - "text/plain": [ - " text \\\n", - "0 it’s despicable, it’s dangerous — and it needs... \n", - "1 we need to repudiate in the strongest terms th... \n", - "2 this weekend’s shootings in buffalo offer a tr... \n", - "3 i’m proud to announce the voyager scholarship ... \n", - "4 across the country, americans are standing up ... \n", - "\n", - " text_token \\\n", - "0 [despicable, dangerous, needs, stop, co, 0ch2z... \n", - "1 [need, repudiate, strongest, terms, politician... \n", - "2 [weekend, shootings, buffalo, offer, tragic, r... \n", - "3 [proud, announce, voyager, scholarship, friend... \n", - "4 [across, country, americans, standing, abortio... \n", - "\n", - " text_string \\\n", - "0 despicable dangerous needs stop 0ch2zosmhb \n", - "1 need repudiate strongest terms politicians med... \n", - "2 weekend shootings buffalo offer tragic reminde... \n", - "3 proud announce voyager scholarship friend bche... \n", - "4 across country americans standing abortion rig... \n", - "\n", - " text_string_fdist \n", - "0 despicable dangerous needs stop 0ch2zosmhb \n", - "1 need repudiate strongest terms politicians med... \n", - "2 weekend shootings buffalo offer tragic reminde... \n", - "3 proud announce voyager scholarship friend bche... \n", - "4 across country americans standing abortion rig... 
" - ] - }, - "execution_count": 12, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "modin_df['text_string_fdist'] = modin_df['text_token'].apply(lambda x: ' '.join([item for item in x if fdist[item] >= 1 ]))\n", "modin_df[['text', 'text_token', 'text_string', 'text_string_fdist']].head()" @@ -716,32 +147,9 @@ }, { "cell_type": "code", - "execution_count": 13, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "[nltk_data] Downloading package wordnet to\n", - "[nltk_data] /Users/labanyamukhopadhyay/nltk_data...\n", - "[nltk_data] Package wordnet is already up-to-date!\n", - "[nltk_data] Downloading package omw-1.4 to\n", - "[nltk_data] /Users/labanyamukhopadhyay/nltk_data...\n", - "[nltk_data] Package omw-1.4 is already up-to-date!\n" - ] - }, - { - "data": { - "text/plain": [ - "True" - ] - }, - "execution_count": 13, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "#lemmatization\n", "nltk.download('wordnet')\n", @@ -750,7 +158,7 @@ }, { "cell_type": "code", - "execution_count": 14, + "execution_count": null, "metadata": {}, "outputs": [], "source": [ @@ -763,7 +171,7 @@ }, { "cell_type": "code", - "execution_count": 15, + "execution_count": null, "metadata": {}, "outputs": [], "source": [ @@ -773,21 +181,9 @@ }, { "cell_type": "code", - "execution_count": 16, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "True 5\n", - "Name: is_equal, dtype: int64" - ] - }, - "execution_count": 16, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "# show level count\n", "modin_df.is_equal.value_counts()" @@ -795,7 +191,7 @@ }, { "cell_type": "code", - "execution_count": 17, + "execution_count": null, "metadata": {}, "outputs": [], "source": [ @@ -804,22 +200,9 @@ }, { "cell_type": "code", - "execution_count": 18, + "execution_count": 
null, "metadata": {}, - "outputs": [ - { - "data": { - "image/png": "", - "text/plain": [ - "
" - ] - }, - "metadata": { - "needs_background": "light" - }, - "output_type": "display_data" - } - ], + "outputs": [], "source": [ "%matplotlib inline\n", "import matplotlib.pyplot as plt\n", @@ -844,7 +227,7 @@ }, { "cell_type": "code", - "execution_count": 19, + "execution_count": null, "metadata": {}, "outputs": [], "source": [ @@ -854,83 +237,9 @@ }, { "cell_type": "code", - "execution_count": 20, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/html": [ - "
\n", - "\n", - "\n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - "
Unnamed: 0created_atidauthor_idtext
002022-05-16T21:24:35.000Z1526312680226799618813286it’s despicable, it’s dangerous — and it needs...
112022-05-16T21:24:34.000Z1526312678951641088813286we need to repudiate in the strongest terms th...
222022-05-16T21:24:34.000Z1526312677521428480813286this weekend’s shootings in buffalo offer a tr...
\n", - "
" - ], - "text/plain": [ - " Unnamed: 0 created_at id author_id \\\n", - "0 0 2022-05-16T21:24:35.000Z 1526312680226799618 813286 \n", - "1 1 2022-05-16T21:24:34.000Z 1526312678951641088 813286 \n", - "2 2 2022-05-16T21:24:34.000Z 1526312677521428480 813286 \n", - "\n", - " text \n", - "0 it’s despicable, it’s dangerous — and it needs... \n", - "1 we need to repudiate in the strongest terms th... \n", - "2 this weekend’s shootings in buffalo offer a tr... " - ] - }, - "execution_count": 20, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "pandas_df['text'] = pandas_df['text'].astype(str).str.lower()\n", "pandas_df.head(3)" @@ -938,92 +247,9 @@ }, { "cell_type": "code", - "execution_count": 21, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/html": [ - "
\n", - "\n", - "\n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - "
Unnamed: 0created_atidauthor_idtexttext_token
002022-05-16T21:24:35.000Z1526312680226799618813286it’s despicable, it’s dangerous — and it needs...[it, s, despicable, it, s, dangerous, and, it,...
112022-05-16T21:24:34.000Z1526312678951641088813286we need to repudiate in the strongest terms th...[we, need, to, repudiate, in, the, strongest, ...
222022-05-16T21:24:34.000Z1526312677521428480813286this weekend’s shootings in buffalo offer a tr...[this, weekend, s, shootings, in, buffalo, off...
\n", - "
" - ], - "text/plain": [ - " Unnamed: 0 created_at id author_id \\\n", - "0 0 2022-05-16T21:24:35.000Z 1526312680226799618 813286 \n", - "1 1 2022-05-16T21:24:34.000Z 1526312678951641088 813286 \n", - "2 2 2022-05-16T21:24:34.000Z 1526312677521428480 813286 \n", - "\n", - " text \\\n", - "0 it’s despicable, it’s dangerous — and it needs... \n", - "1 we need to repudiate in the strongest terms th... \n", - "2 this weekend’s shootings in buffalo offer a tr... \n", - "\n", - " text_token \n", - "0 [it, s, despicable, it, s, dangerous, and, it,... \n", - "1 [we, need, to, repudiate, in, the, strongest, ... \n", - "2 [this, weekend, s, shootings, in, buffalo, off... " - ] - }, - "execution_count": 21, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "regexp = RegexpTokenizer('\\w+')\n", "\n", @@ -1033,92 +259,9 @@ }, { "cell_type": "code", - "execution_count": 22, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/html": [ - "
\n", - "\n", - "\n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - "
Unnamed: 0created_atidauthor_idtexttext_token
002022-05-16T21:24:35.000Z1526312680226799618813286it’s despicable, it’s dangerous — and it needs...[despicable, dangerous, needs, stop, co, 0ch2z...
112022-05-16T21:24:34.000Z1526312678951641088813286we need to repudiate in the strongest terms th...[need, repudiate, strongest, terms, politician...
222022-05-16T21:24:34.000Z1526312677521428480813286this weekend’s shootings in buffalo offer a tr...[weekend, shootings, buffalo, offer, tragic, r...
\n", - "
" - ], - "text/plain": [ - " Unnamed: 0 created_at id author_id \\\n", - "0 0 2022-05-16T21:24:35.000Z 1526312680226799618 813286 \n", - "1 1 2022-05-16T21:24:34.000Z 1526312678951641088 813286 \n", - "2 2 2022-05-16T21:24:34.000Z 1526312677521428480 813286 \n", - "\n", - " text \\\n", - "0 it’s despicable, it’s dangerous — and it needs... \n", - "1 we need to repudiate in the strongest terms th... \n", - "2 this weekend’s shootings in buffalo offer a tr... \n", - "\n", - " text_token \n", - "0 [despicable, dangerous, needs, stop, co, 0ch2z... \n", - "1 [need, repudiate, strongest, terms, politician... \n", - "2 [weekend, shootings, buffalo, offer, tragic, r... " - ] - }, - "execution_count": 22, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "# Remove stopwords\n", "pandas_df['text_token'] = pandas_df['text_token'].apply(lambda x: [item for item in x if item not in stopwords])\n", @@ -1127,98 +270,9 @@ }, { "cell_type": "code", - "execution_count": 23, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/html": [ - "
\n", - "\n", - "\n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - "
texttext_tokentext_string
0it’s despicable, it’s dangerous — and it needs...[despicable, dangerous, needs, stop, co, 0ch2z...despicable dangerous needs stop 0ch2zosmhb
1we need to repudiate in the strongest terms th...[need, repudiate, strongest, terms, politician...need repudiate strongest terms politicians med...
2this weekend’s shootings in buffalo offer a tr...[weekend, shootings, buffalo, offer, tragic, r...weekend shootings buffalo offer tragic reminde...
3i’m proud to announce the voyager scholarship ...[proud, announce, voyager, scholarship, friend...proud announce voyager scholarship friend bche...
4across the country, americans are standing up ...[across, country, americans, standing, abortio...across country americans standing abortion rig...
\n", - "
" - ], - "text/plain": [ - " text \\\n", - "0 it’s despicable, it’s dangerous — and it needs... \n", - "1 we need to repudiate in the strongest terms th... \n", - "2 this weekend’s shootings in buffalo offer a tr... \n", - "3 i’m proud to announce the voyager scholarship ... \n", - "4 across the country, americans are standing up ... \n", - "\n", - " text_token \\\n", - "0 [despicable, dangerous, needs, stop, co, 0ch2z... \n", - "1 [need, repudiate, strongest, terms, politician... \n", - "2 [weekend, shootings, buffalo, offer, tragic, r... \n", - "3 [proud, announce, voyager, scholarship, friend... \n", - "4 [across, country, americans, standing, abortio... \n", - "\n", - " text_string \n", - "0 despicable dangerous needs stop 0ch2zosmhb \n", - "1 need repudiate strongest terms politicians med... \n", - "2 weekend shootings buffalo offer tragic reminde... \n", - "3 proud announce voyager scholarship friend bche... \n", - "4 across country americans standing abortion rig... " - ] - }, - "execution_count": 23, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "pandas_df['text_string'] = pandas_df['text_token'].apply(lambda x: ' '.join([item for item in x if len(item)>2]))\n", "pandas_df[['text', 'text_token', 'text_string']].head()" @@ -1226,7 +280,7 @@ }, { "cell_type": "code", - "execution_count": 24, + "execution_count": null, "metadata": {}, "outputs": [], "source": [ @@ -1236,20 +290,9 @@ }, { "cell_type": "code", - "execution_count": 25, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "FreqDist({'need': 2, 'americans': 2, 'proud': 2, 'despicable': 1, 'dangerous': 1, 'needs': 1, 'stop': 1, '0ch2zosmhb': 1, 'repudiate': 1, 'strongest': 1, ...})" - ] - }, - "execution_count": 25, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "from nltk.probability import FreqDist\n", "\n", @@ -1259,111 +302,9 @@ }, { "cell_type": "code", - 
"execution_count": 26, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/html": [ - "
\n", - "\n", - "\n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - "
texttext_tokentext_stringtext_string_fdist
0it’s despicable, it’s dangerous — and it needs...[despicable, dangerous, needs, stop, co, 0ch2z...despicable dangerous needs stop 0ch2zosmhbdespicable dangerous needs stop 0ch2zosmhb
1we need to repudiate in the strongest terms th...[need, repudiate, strongest, terms, politician...need repudiate strongest terms politicians med...need repudiate strongest terms politicians med...
2this weekend’s shootings in buffalo offer a tr...[weekend, shootings, buffalo, offer, tragic, r...weekend shootings buffalo offer tragic reminde...weekend shootings buffalo offer tragic reminde...
3i’m proud to announce the voyager scholarship ...[proud, announce, voyager, scholarship, friend...proud announce voyager scholarship friend bche...proud announce voyager scholarship friend bche...
4across the country, americans are standing up ...[across, country, americans, standing, abortio...across country americans standing abortion rig...across country americans standing abortion rig...
\n", - "
" - ], - "text/plain": [ - " text \\\n", - "0 it’s despicable, it’s dangerous — and it needs... \n", - "1 we need to repudiate in the strongest terms th... \n", - "2 this weekend’s shootings in buffalo offer a tr... \n", - "3 i’m proud to announce the voyager scholarship ... \n", - "4 across the country, americans are standing up ... \n", - "\n", - " text_token \\\n", - "0 [despicable, dangerous, needs, stop, co, 0ch2z... \n", - "1 [need, repudiate, strongest, terms, politician... \n", - "2 [weekend, shootings, buffalo, offer, tragic, r... \n", - "3 [proud, announce, voyager, scholarship, friend... \n", - "4 [across, country, americans, standing, abortio... \n", - "\n", - " text_string \\\n", - "0 despicable dangerous needs stop 0ch2zosmhb \n", - "1 need repudiate strongest terms politicians med... \n", - "2 weekend shootings buffalo offer tragic reminde... \n", - "3 proud announce voyager scholarship friend bche... \n", - "4 across country americans standing abortion rig... \n", - "\n", - " text_string_fdist \n", - "0 despicable dangerous needs stop 0ch2zosmhb \n", - "1 need repudiate strongest terms politicians med... \n", - "2 weekend shootings buffalo offer tragic reminde... \n", - "3 proud announce voyager scholarship friend bche... \n", - "4 across country americans standing abortion rig... 
" - ] - }, - "execution_count": 26, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "pandas_df['text_string_fdist'] = pandas_df['text_token'].apply(lambda x: ' '.join([item for item in x if fdist[item] >= 1 ]))\n", "pandas_df[['text', 'text_token', 'text_string', 'text_string_fdist']].head()" @@ -1371,7 +312,7 @@ }, { "cell_type": "code", - "execution_count": 27, + "execution_count": null, "metadata": {}, "outputs": [], "source": [ @@ -1384,7 +325,7 @@ }, { "cell_type": "code", - "execution_count": 28, + "execution_count": null, "metadata": {}, "outputs": [], "source": [ @@ -1394,21 +335,9 @@ }, { "cell_type": "code", - "execution_count": 29, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "True 5\n", - "Name: is_equal, dtype: int64" - ] - }, - "execution_count": 29, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "# show level count\n", "pandas_df.is_equal.value_counts()" @@ -1416,7 +345,7 @@ }, { "cell_type": "code", - "execution_count": 30, + "execution_count": null, "metadata": {}, "outputs": [], "source": [ @@ -1425,22 +354,9 @@ }, { "cell_type": "code", - "execution_count": 31, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "image/png": "", - "text/plain": [ - "
" - ] - }, - "metadata": { - "needs_background": "light" - }, - "output_type": "display_data" - } - ], + "outputs": [], "source": [ "%matplotlib inline\n", "import matplotlib.pyplot as plt\n", diff --git a/examples/jupyter/integrations/altair.ipynb b/examples/jupyter/integrations/altair.ipynb index 406aaed007b..8502334bb75 100644 --- a/examples/jupyter/integrations/altair.ipynb +++ b/examples/jupyter/integrations/altair.ipynb @@ -10,7 +10,7 @@ }, { "cell_type": "code", - "execution_count": 1, + "execution_count": null, "metadata": {}, "outputs": [], "source": [ @@ -20,24 +20,9 @@ }, { "cell_type": "code", - "execution_count": 2, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "UserWarning: Ray execution environment not yet initialized. Initializing...\n", - "To remove this warning, run the following python code before doing dataframe operations:\n", - "\n", - " import ray\n", - " ray.init(runtime_env={'env_vars': {'__MODIN_AUTOIMPORT_PANDAS__': '1'}})\n", - "\n", - "2023-04-06 12:15:19,701\tINFO worker.py:1553 -- Started a local Ray instance.\n", - "UserWarning: Distributing object. 
This may take some time.\n" - ] - } - ], + "outputs": [], "source": [ "from vega_datasets import data\n", "pandas_cars = data.cars()\n", @@ -46,50 +31,9 @@ }, { "cell_type": "code", - "execution_count": 3, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "UserWarning: data of type not recognized\n", - "UserWarning: `DataFrame.to_dict` is not currently supported by PandasOnRay, defaulting to pandas implementation.\n", - "Please refer to https://modin.readthedocs.io/en/stable/supported_apis/defaulting_to_pandas.html for explanation.\n" - ] - }, - { - "ename": "ValueError", - "evalue": "Origin encoding field is specified without a type; the type cannot be automatically inferred because the data is not specified as a pandas.DataFrame.", - "output_type": "error", - "traceback": [ - "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m", - "\u001b[0;31mValueError\u001b[0m Traceback (most recent call last)", - "\u001b[0;32m~/.local/lib/python3.9/site-packages/altair/vegalite/v4/api.py\u001b[0m in \u001b[0;36mto_dict\u001b[0;34m(self, *args, **kwargs)\u001b[0m\n\u001b[1;32m 2018\u001b[0m \u001b[0mcopy\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mdata\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mcore\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mInlineData\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mvalues\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;34m{\u001b[0m\u001b[0;34m}\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 2019\u001b[0m \u001b[0;32mreturn\u001b[0m \u001b[0msuper\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mChart\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mcopy\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mto_dict\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m*\u001b[0m\u001b[0margs\u001b[0m\u001b[0;34m,\u001b[0m 
\u001b[0;34m**\u001b[0m\u001b[0mkwargs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m-> 2020\u001b[0;31m \u001b[0;32mreturn\u001b[0m \u001b[0msuper\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mto_dict\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m*\u001b[0m\u001b[0margs\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0mkwargs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 2021\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 2022\u001b[0m \u001b[0;32mdef\u001b[0m \u001b[0madd_selection\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m*\u001b[0m\u001b[0mselections\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", - "\u001b[0;32m~/.local/lib/python3.9/site-packages/altair/vegalite/v4/api.py\u001b[0m in \u001b[0;36mto_dict\u001b[0;34m(self, *args, **kwargs)\u001b[0m\n\u001b[1;32m 382\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 383\u001b[0m \u001b[0;32mtry\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 384\u001b[0;31m \u001b[0mdct\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0msuper\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mTopLevelMixin\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mcopy\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mto_dict\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m*\u001b[0m\u001b[0margs\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0mkwargs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 385\u001b[0m \u001b[0;32mexcept\u001b[0m \u001b[0mjsonschema\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mValidationError\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 386\u001b[0m \u001b[0mdct\u001b[0m \u001b[0;34m=\u001b[0m 
\u001b[0;32mNone\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", - "\u001b[0;32m~/.local/lib/python3.9/site-packages/altair/utils/schemapi.py\u001b[0m in \u001b[0;36mto_dict\u001b[0;34m(self, validate, ignore, context)\u001b[0m\n\u001b[1;32m 324\u001b[0m \u001b[0mresult\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0m_todict\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_args\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;36m0\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mvalidate\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0msub_validate\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mcontext\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mcontext\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 325\u001b[0m \u001b[0;32melif\u001b[0m \u001b[0;32mnot\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_args\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 326\u001b[0;31m result = _todict(\n\u001b[0m\u001b[1;32m 327\u001b[0m \u001b[0;34m{\u001b[0m\u001b[0mk\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mv\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0mk\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mv\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_kwds\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mitems\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0mk\u001b[0m \u001b[0;32mnot\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mignore\u001b[0m\u001b[0;34m}\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 328\u001b[0m \u001b[0mvalidate\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0msub_validate\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", - "\u001b[0;32m~/.local/lib/python3.9/site-packages/altair/utils/schemapi.py\u001b[0m in \u001b[0;36m_todict\u001b[0;34m(obj, validate, context)\u001b[0m\n\u001b[1;32m 
58\u001b[0m \u001b[0;32mreturn\u001b[0m \u001b[0;34m[\u001b[0m\u001b[0m_todict\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mv\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mvalidate\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mcontext\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0mv\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mobj\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 59\u001b[0m \u001b[0;32melif\u001b[0m \u001b[0misinstance\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mobj\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mdict\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 60\u001b[0;31m return {\n\u001b[0m\u001b[1;32m 61\u001b[0m \u001b[0mk\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0m_todict\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mv\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mvalidate\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mcontext\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 62\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0mk\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mv\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mobj\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mitems\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", - "\u001b[0;32m~/.local/lib/python3.9/site-packages/altair/utils/schemapi.py\u001b[0m in \u001b[0;36m\u001b[0;34m(.0)\u001b[0m\n\u001b[1;32m 59\u001b[0m \u001b[0;32melif\u001b[0m \u001b[0misinstance\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mobj\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mdict\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 60\u001b[0m return {\n\u001b[0;32m---> 61\u001b[0;31m \u001b[0mk\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0m_todict\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mv\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mvalidate\u001b[0m\u001b[0;34m,\u001b[0m 
\u001b[0mcontext\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 62\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0mk\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mv\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mobj\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mitems\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 63\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0mv\u001b[0m \u001b[0;32mis\u001b[0m \u001b[0;32mnot\u001b[0m \u001b[0mUndefined\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", - "\u001b[0;32m~/.local/lib/python3.9/site-packages/altair/utils/schemapi.py\u001b[0m in \u001b[0;36m_todict\u001b[0;34m(obj, validate, context)\u001b[0m\n\u001b[1;32m 54\u001b[0m \u001b[0;34m\"\"\"Convert an object to a dict representation.\"\"\"\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 55\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0misinstance\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mobj\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mSchemaBase\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 56\u001b[0;31m \u001b[0;32mreturn\u001b[0m \u001b[0mobj\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mto_dict\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mvalidate\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mvalidate\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mcontext\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mcontext\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 57\u001b[0m \u001b[0;32melif\u001b[0m \u001b[0misinstance\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mobj\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m(\u001b[0m\u001b[0mlist\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mtuple\u001b[0m\u001b[0;34m,\u001b[0m 
\u001b[0mnp\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mndarray\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 58\u001b[0m \u001b[0;32mreturn\u001b[0m \u001b[0;34m[\u001b[0m\u001b[0m_todict\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mv\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mvalidate\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mcontext\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0mv\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mobj\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", - "\u001b[0;32m~/.local/lib/python3.9/site-packages/altair/utils/schemapi.py\u001b[0m in \u001b[0;36mto_dict\u001b[0;34m(self, validate, ignore, context)\u001b[0m\n\u001b[1;32m 324\u001b[0m \u001b[0mresult\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0m_todict\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_args\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;36m0\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mvalidate\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0msub_validate\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mcontext\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mcontext\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 325\u001b[0m \u001b[0;32melif\u001b[0m \u001b[0;32mnot\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_args\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 326\u001b[0;31m result = _todict(\n\u001b[0m\u001b[1;32m 327\u001b[0m \u001b[0;34m{\u001b[0m\u001b[0mk\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mv\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0mk\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mv\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_kwds\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mitems\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;32mif\u001b[0m 
\u001b[0mk\u001b[0m \u001b[0;32mnot\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mignore\u001b[0m\u001b[0;34m}\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 328\u001b[0m \u001b[0mvalidate\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0msub_validate\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", - "\u001b[0;32m~/.local/lib/python3.9/site-packages/altair/utils/schemapi.py\u001b[0m in \u001b[0;36m_todict\u001b[0;34m(obj, validate, context)\u001b[0m\n\u001b[1;32m 58\u001b[0m \u001b[0;32mreturn\u001b[0m \u001b[0;34m[\u001b[0m\u001b[0m_todict\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mv\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mvalidate\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mcontext\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0mv\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mobj\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 59\u001b[0m \u001b[0;32melif\u001b[0m \u001b[0misinstance\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mobj\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mdict\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 60\u001b[0;31m return {\n\u001b[0m\u001b[1;32m 61\u001b[0m \u001b[0mk\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0m_todict\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mv\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mvalidate\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mcontext\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 62\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0mk\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mv\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mobj\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mitems\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", - "\u001b[0;32m~/.local/lib/python3.9/site-packages/altair/utils/schemapi.py\u001b[0m in 
\u001b[0;36m\u001b[0;34m(.0)\u001b[0m\n\u001b[1;32m 59\u001b[0m \u001b[0;32melif\u001b[0m \u001b[0misinstance\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mobj\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mdict\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 60\u001b[0m return {\n\u001b[0;32m---> 61\u001b[0;31m \u001b[0mk\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0m_todict\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mv\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mvalidate\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mcontext\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 62\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0mk\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mv\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mobj\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mitems\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 63\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0mv\u001b[0m \u001b[0;32mis\u001b[0m \u001b[0;32mnot\u001b[0m \u001b[0mUndefined\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", - "\u001b[0;32m~/.local/lib/python3.9/site-packages/altair/utils/schemapi.py\u001b[0m in \u001b[0;36m_todict\u001b[0;34m(obj, validate, context)\u001b[0m\n\u001b[1;32m 54\u001b[0m \u001b[0;34m\"\"\"Convert an object to a dict representation.\"\"\"\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 55\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0misinstance\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mobj\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mSchemaBase\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 56\u001b[0;31m \u001b[0;32mreturn\u001b[0m \u001b[0mobj\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mto_dict\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mvalidate\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mvalidate\u001b[0m\u001b[0;34m,\u001b[0m 
\u001b[0mcontext\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mcontext\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 57\u001b[0m \u001b[0;32melif\u001b[0m \u001b[0misinstance\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mobj\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m(\u001b[0m\u001b[0mlist\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mtuple\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mnp\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mndarray\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 58\u001b[0m \u001b[0;32mreturn\u001b[0m \u001b[0;34m[\u001b[0m\u001b[0m_todict\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mv\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mvalidate\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mcontext\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0mv\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mobj\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", - "\u001b[0;32m~/.local/lib/python3.9/site-packages/altair/vegalite/v4/schema/channels.py\u001b[0m in \u001b[0;36mto_dict\u001b[0;34m(self, validate, ignore, context)\u001b[0m\n\u001b[1;32m 42\u001b[0m \"match any column in the data.\".format(shorthand))\n\u001b[1;32m 43\u001b[0m \u001b[0;32melse\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 44\u001b[0;31m raise ValueError(\"{} encoding field is specified without a type; \"\n\u001b[0m\u001b[1;32m 45\u001b[0m \u001b[0;34m\"the type cannot be automatically inferred because \"\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 46\u001b[0m \u001b[0;34m\"the data is not specified as a pandas.DataFrame.\"\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", - "\u001b[0;31mValueError\u001b[0m: Origin encoding field is specified without a type; the type cannot be automatically inferred because the data is not specified as a 
pandas.DataFrame." - ] - }, - { - "data": { - "text/plain": [ - "alt.Chart(...)" - ] - }, - "execution_count": 3, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "# Create a visualization with Modin df\n", "alt.Chart(modin_cars).mark_point().encode(\n", @@ -101,84 +45,9 @@ }, { "cell_type": "code", - "execution_count": 4, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "FutureWarning: iteritems is deprecated and will be removed in a future version. Use .items instead.\n" - ] - }, - { - "data": { - "text/html": [ - "\n", - "
\n", - "" - ], - "text/plain": [ - "alt.Chart(...)" - ] - }, - "execution_count": 4, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "# Create a visualization with pandas df\n", "alt.Chart(pandas_cars).mark_point().encode(\n", @@ -208,7 +77,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.9.7" + "version": "3.9.18" }, "orig_nbformat": 4 }, diff --git a/examples/jupyter/integrations/huggingface.ipynb b/examples/jupyter/integrations/huggingface.ipynb index 69370054deb..ebb011c699b 100644 --- a/examples/jupyter/integrations/huggingface.ipynb +++ b/examples/jupyter/integrations/huggingface.ipynb @@ -10,7 +10,7 @@ }, { "cell_type": "code", - "execution_count": 1, + "execution_count": null, "metadata": {}, "outputs": [], "source": [ @@ -20,7 +20,7 @@ }, { "cell_type": "code", - "execution_count": 2, + "execution_count": null, "metadata": {}, "outputs": [], "source": [ @@ -31,20 +31,9 @@ }, { "cell_type": "code", - "execution_count": 3, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "('imdb.csv', )" - ] - }, - "execution_count": 3, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "import urllib.request\n", "url_path = \"https://modin-datasets.intel.com/testing/IMDB_Dataset.csv\"\n", @@ -53,31 +42,9 @@ }, { "cell_type": "code", - "execution_count": 4, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "UserWarning: Ray execution environment not yet initialized. 
Initializing...\n", - "To remove this warning, run the following python code before doing dataframe operations:\n", - "\n", - " import ray\n", - " ray.init(runtime_env={'env_vars': {'__MODIN_AUTOIMPORT_PANDAS__': '1'}})\n", - "\n", - "2023-04-11 10:27:18,363\tINFO worker.py:1553 -- Started a local Ray instance.\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "CPU times: user 575 ms, sys: 261 ms, total: 836 ms\n", - "Wall time: 8.58 s\n" - ] - } - ], + "outputs": [], "source": [ "%%time\n", "modin_df = pd.read_csv(\"imdb.csv\")" @@ -85,159 +52,34 @@ }, { "cell_type": "code", - "execution_count": 5, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/html": [ - "
\n", - "\n", - "\n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - "
reviewsentiment
0One of the other reviewers has mentioned that ...positive
1A wonderful little production. <br /><br />The...positive
2I thought this was a wonderful way to spend ti...positive
3Basically there's a family where a little boy ...negative
4Petter Mattei's \"Love in the Time of Money\" is...positive
\n", - "
" - ], - "text/plain": [ - " review sentiment\n", - "0 One of the other reviewers has mentioned that ... positive\n", - "1 A wonderful little production.

The... positive\n", - "2 I thought this was a wonderful way to spend ti... positive\n", - "3 Basically there's a family where a little boy ... negative\n", - "4 Petter Mattei's \"Love in the Time of Money\" is... positive" - ] - }, - "execution_count": 5, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "modin_df.head()" ] }, { "cell_type": "code", - "execution_count": 6, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "modin.pandas.dataframe.DataFrame" - ] - }, - "execution_count": 6, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "type(modin_df)" ] }, { "cell_type": "code", - "execution_count": 7, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/html": [ - "
\n", - "\n", - "\n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - "
reviewsentiment
30204Jack Lemmon was one of our great actors. His p...negative
\n", - "
" - ], - "text/plain": [ - " review sentiment\n", - "30204 Jack Lemmon was one of our great actors. His p... negative" - ] - }, - "execution_count": 7, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "modin_df.sample()" ] }, { "cell_type": "code", - "execution_count": 8, + "execution_count": null, "metadata": {}, "outputs": [], "source": [ @@ -246,22 +88,9 @@ }, { "cell_type": "code", - "execution_count": 9, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "2023-04-11 10:27:24.824712: I tensorflow/core/platform/cpu_feature_guard.cc:151] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA\n", - "To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags.\n", - "All model checkpoint layers were used when initializing TFBertForSequenceClassification.\n", - "\n", - "Some layers of TFBertForSequenceClassification were not initialized from the model checkpoint at bert-base-uncased and are newly initialized: ['classifier']\n", - "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n" - ] - } - ], + "outputs": [], "source": [ "# Loading the BERT Classifier and Tokenizer along with Input module\n", "from transformers import InputExample, InputFeatures\n", @@ -272,38 +101,16 @@ }, { "cell_type": "code", - "execution_count": 10, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Model: \"tf_bert_for_sequence_classification\"\n", - "_________________________________________________________________\n", - " Layer (type) Output Shape Param # \n", - "=================================================================\n", - " bert (TFBertMainLayer) multiple 109482240 \n", - " \n", - " dropout_37 
(Dropout) multiple 0 \n", - " \n", - " classifier (Dense) multiple 1538 \n", - " \n", - "=================================================================\n", - "Total params: 109,483,778\n", - "Trainable params: 109,483,778\n", - "Non-trainable params: 0\n", - "_________________________________________________________________\n" - ] - } - ], + "outputs": [], "source": [ "model.summary()" ] }, { "cell_type": "code", - "execution_count": 11, + "execution_count": null, "metadata": {}, "outputs": [], "source": [ @@ -322,18 +129,9 @@ }, { "cell_type": "code", - "execution_count": 12, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "['in', 'this', 'ka', '##ggle', 'notebook', ',', 'i', 'will', 'do', 'sentiment', 'analysis', 'using', 'bert', 'with', 'hugging', '##face']\n", - "[1999, 2023, 10556, 24679, 14960, 1010, 1045, 2097, 2079, 15792, 4106, 2478, 14324, 2007, 17662, 12172]\n" - ] - } - ], + "outputs": [], "source": [ "# But first see BERT tokenizer exmaples and other required stuff!\n", "\n", @@ -346,27 +144,16 @@ }, { "cell_type": "code", - "execution_count": 13, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "modin.pandas.dataframe.DataFrame" - ] - }, - "execution_count": 13, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "type(train)" ] }, { "cell_type": "code", - "execution_count": 14, + "execution_count": null, "metadata": {}, "outputs": [], "source": [ @@ -386,7 +173,7 @@ }, { "cell_type": "code", - "execution_count": 15, + "execution_count": null, "metadata": {}, "outputs": [], "source": [ @@ -438,49 +225,18 @@ }, { "cell_type": "code", - "execution_count": 16, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "0 InputExample(guid=None, text_a=\"One of the oth...\n", - "1 InputExample(guid=None, text_a='A wonderful li...\n", - "2 InputExample(guid=None, 
text_a='I thought this...\n", - "3 InputExample(guid=None, text_a=\"Basically ther...\n", - "4 InputExample(guid=None, text_a='Petter Mattei\\...\n", - " ... \n", - "44995 InputExample(guid=None, text_a=\"I watched this...\n", - "44996 InputExample(guid=None, text_a=\"I am a sucker ...\n", - "44997 InputExample(guid=None, text_a=\"I am a college...\n", - "44998 InputExample(guid=None, text_a=\"huge Ramones f...\n", - "44999 InputExample(guid=None, text_a='I rented this ...\n", - "Length: 45000, dtype: object" - ] - }, - "execution_count": 16, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "train_InputExamples" ] }, { "cell_type": "code", - "execution_count": 17, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - " 0%| | 0/45000 [00:00\u001b[0;34m\u001b[0m\n\u001b[0;32m----> 1\u001b[0;31m \u001b[0mmodel\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mfit\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mtrain_data\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mepochs\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;36m2\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mvalidation_data\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mvalidation_data\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m", - "\u001b[0;32m~/opt/anaconda3/lib/python3.9/site-packages/keras/utils/traceback_utils.py\u001b[0m in \u001b[0;36merror_handler\u001b[0;34m(*args, **kwargs)\u001b[0m\n\u001b[1;32m 62\u001b[0m \u001b[0mfiltered_tb\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 63\u001b[0m \u001b[0;32mtry\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 64\u001b[0;31m \u001b[0;32mreturn\u001b[0m \u001b[0mfn\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m*\u001b[0m\u001b[0margs\u001b[0m\u001b[0;34m,\u001b[0m 
\u001b[0;34m**\u001b[0m\u001b[0mkwargs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 65\u001b[0m \u001b[0;32mexcept\u001b[0m \u001b[0mException\u001b[0m \u001b[0;32mas\u001b[0m \u001b[0me\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0;31m# pylint: disable=broad-except\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 66\u001b[0m \u001b[0mfiltered_tb\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0m_process_traceback_frames\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0me\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m__traceback__\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", - "\u001b[0;32m~/opt/anaconda3/lib/python3.9/site-packages/keras/engine/training.py\u001b[0m in \u001b[0;36mfit\u001b[0;34m(self, x, y, batch_size, epochs, verbose, callbacks, validation_split, validation_data, shuffle, class_weight, sample_weight, initial_epoch, steps_per_epoch, validation_steps, validation_batch_size, validation_freq, max_queue_size, workers, use_multiprocessing)\u001b[0m\n\u001b[1;32m 1382\u001b[0m _r=1):\n\u001b[1;32m 1383\u001b[0m \u001b[0mcallbacks\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mon_train_batch_begin\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mstep\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m-> 1384\u001b[0;31m \u001b[0mtmp_logs\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mtrain_function\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0miterator\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 1385\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0mdata_handler\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mshould_sync\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 1386\u001b[0m 
\u001b[0mcontext\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0masync_wait\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", - "\u001b[0;32m~/opt/anaconda3/lib/python3.9/site-packages/tensorflow/python/util/traceback_utils.py\u001b[0m in \u001b[0;36merror_handler\u001b[0;34m(*args, **kwargs)\u001b[0m\n\u001b[1;32m 148\u001b[0m \u001b[0mfiltered_tb\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 149\u001b[0m \u001b[0;32mtry\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 150\u001b[0;31m \u001b[0;32mreturn\u001b[0m \u001b[0mfn\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m*\u001b[0m\u001b[0margs\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0mkwargs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 151\u001b[0m \u001b[0;32mexcept\u001b[0m \u001b[0mException\u001b[0m \u001b[0;32mas\u001b[0m \u001b[0me\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 152\u001b[0m \u001b[0mfiltered_tb\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0m_process_traceback_frames\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0me\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m__traceback__\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", - "\u001b[0;32m~/opt/anaconda3/lib/python3.9/site-packages/tensorflow/python/eager/def_function.py\u001b[0m in \u001b[0;36m__call__\u001b[0;34m(self, *args, **kwds)\u001b[0m\n\u001b[1;32m 913\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 914\u001b[0m \u001b[0;32mwith\u001b[0m \u001b[0mOptionalXlaContext\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_jit_compile\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 915\u001b[0;31m \u001b[0mresult\u001b[0m 
\u001b[0;34m=\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_call\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m*\u001b[0m\u001b[0margs\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0mkwds\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 916\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 917\u001b[0m \u001b[0mnew_tracing_count\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mexperimental_get_tracing_count\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", - "\u001b[0;32m~/opt/anaconda3/lib/python3.9/site-packages/tensorflow/python/eager/def_function.py\u001b[0m in \u001b[0;36m_call\u001b[0;34m(self, *args, **kwds)\u001b[0m\n\u001b[1;32m 945\u001b[0m \u001b[0;31m# In this case we have created variables on the first call, so we run the\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 946\u001b[0m \u001b[0;31m# defunned version which is guaranteed to never create variables.\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 947\u001b[0;31m \u001b[0;32mreturn\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_stateless_fn\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m*\u001b[0m\u001b[0margs\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0mkwds\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;31m# pylint: disable=not-callable\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 948\u001b[0m \u001b[0;32melif\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_stateful_fn\u001b[0m \u001b[0;32mis\u001b[0m \u001b[0;32mnot\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 949\u001b[0m \u001b[0;31m# Release the lock early so that multiple threads can perform the 
call\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", - "\u001b[0;32m~/opt/anaconda3/lib/python3.9/site-packages/tensorflow/python/eager/function.py\u001b[0m in \u001b[0;36m__call__\u001b[0;34m(self, *args, **kwargs)\u001b[0m\n\u001b[1;32m 2954\u001b[0m (graph_function,\n\u001b[1;32m 2955\u001b[0m filtered_flat_args) = self._maybe_define_function(args, kwargs)\n\u001b[0;32m-> 2956\u001b[0;31m return graph_function._call_flat(\n\u001b[0m\u001b[1;32m 2957\u001b[0m filtered_flat_args, captured_inputs=graph_function.captured_inputs) # pylint: disable=protected-access\n\u001b[1;32m 2958\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n", - "\u001b[0;32m~/opt/anaconda3/lib/python3.9/site-packages/tensorflow/python/eager/function.py\u001b[0m in \u001b[0;36m_call_flat\u001b[0;34m(self, args, captured_inputs, cancellation_manager)\u001b[0m\n\u001b[1;32m 1851\u001b[0m and executing_eagerly):\n\u001b[1;32m 1852\u001b[0m \u001b[0;31m# No tape is watching; skip to running the function.\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m-> 1853\u001b[0;31m return self._build_call_outputs(self._inference_function.call(\n\u001b[0m\u001b[1;32m 1854\u001b[0m ctx, args, cancellation_manager=cancellation_manager))\n\u001b[1;32m 1855\u001b[0m forward_backward = self._select_forward_and_backward_functions(\n", - "\u001b[0;32m~/opt/anaconda3/lib/python3.9/site-packages/tensorflow/python/eager/function.py\u001b[0m in \u001b[0;36mcall\u001b[0;34m(self, ctx, args, cancellation_manager)\u001b[0m\n\u001b[1;32m 497\u001b[0m \u001b[0;32mwith\u001b[0m \u001b[0m_InterpolateFunctionError\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 498\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0mcancellation_manager\u001b[0m \u001b[0;32mis\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 
499\u001b[0;31m outputs = execute.execute(\n\u001b[0m\u001b[1;32m 500\u001b[0m \u001b[0mstr\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0msignature\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mname\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 501\u001b[0m \u001b[0mnum_outputs\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_num_outputs\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", - "\u001b[0;32m~/opt/anaconda3/lib/python3.9/site-packages/tensorflow/python/eager/execute.py\u001b[0m in \u001b[0;36mquick_execute\u001b[0;34m(op_name, num_outputs, inputs, attrs, ctx, name)\u001b[0m\n\u001b[1;32m 52\u001b[0m \u001b[0;32mtry\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 53\u001b[0m \u001b[0mctx\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mensure_initialized\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 54\u001b[0;31m tensors = pywrap_tfe.TFE_Py_Execute(ctx._handle, device_name, op_name,\n\u001b[0m\u001b[1;32m 55\u001b[0m inputs, attrs, num_outputs)\n\u001b[1;32m 56\u001b[0m \u001b[0;32mexcept\u001b[0m \u001b[0mcore\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_NotOkStatusException\u001b[0m \u001b[0;32mas\u001b[0m \u001b[0me\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", - "\u001b[0;31mKeyboardInterrupt\u001b[0m: " - ] - } - ], + "outputs": [], "source": [ "model.fit(train_data, epochs=2, validation_data=validation_data)" ] }, { "cell_type": "code", - "execution_count": 21, + "execution_count": null, "metadata": {}, "outputs": [], "source": [ @@ -566,18 +284,9 @@ }, { "cell_type": "code", - "execution_count": 22, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "worst movie 
of my life, will never watch movies from this series : Negative\n", - "Wow, blew my mind, what a movie by Marvel, animation and story is amazing : Positive\n" - ] - } - ], + "outputs": [], "source": [ "tf_batch = tokenizer(pred_sentences, max_length=128, padding=True, truncation=True, return_tensors='tf') # we are tokenizing before sending into our trained model\n", "tf_outputs = model(tf_batch) \n", diff --git a/examples/jupyter/integrations/matplotlib.ipynb b/examples/jupyter/integrations/matplotlib.ipynb index 4c1e53a4dbf..8c2a5dec3c7 100644 --- a/examples/jupyter/integrations/matplotlib.ipynb +++ b/examples/jupyter/integrations/matplotlib.ipynb @@ -9,7 +9,7 @@ }, { "cell_type": "code", - "execution_count": 1, + "execution_count": null, "metadata": {}, "outputs": [], "source": [ @@ -21,37 +21,9 @@ }, { "cell_type": "code", - "execution_count": 2, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "UserWarning: Ray execution environment not yet initialized. Initializing...\n", - "To remove this warning, run the following python code before doing dataframe operations:\n", - "\n", - " import ray\n", - " ray.init(runtime_env={'env_vars': {'__MODIN_AUTOIMPORT_PANDAS__': '1'}})\n", - "\n", - "2023-01-06 09:40:24,085\tINFO worker.py:1529 -- Started a local Ray instance. View the dashboard at \u001b[1m\u001b[32m127.0.0.1:8267 \u001b[39m\u001b[22m\n", - "UserWarning: Distributing object. This may take some time.\n", - "UserWarning: Distributing object. 
This may take some time.\n" - ] - }, - { - "data": { - "image/png": "iVBORw0KGgoAAAANSUhEUgAAAXwAAAD6CAYAAACiefy7AAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjQuMywgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy/MnkTPAAAACXBIWXMAAAsTAAALEwEAmpwYAAAR40lEQVR4nO3dUYxcV33H8e+/DqSSUZVSg3Fjl/XDqiJQKtDKoaUP29K0dhJhHmjl0KaGElmpYgkkqmJAon10VIkCImBZECVRUV0kaGMlhhTSjlqEQr1OIchJA6s0aRa7paEoYKcqcvn3YcYwDLObmZ07c+fe8/1IK8+99+w95z9z5zdnzo53IzORJLXfT9U9AEnSbBj4klQIA1+SCmHgS1IhDHxJKoSBL0mFqCTwI2JvRDweEasRcWTI8d+LiEd6X1+KiF+uol9J0uhi0s/hR8QW4OvAdcAacBq4KTMf7Wvzq8BjmfmdiNgH/FlmXvt85962bVsuLCxMNL5Zu3jxIlu3bq17GDNlzWWw5mY4c+bMM5n5kmHHrqjg/HuA1cx8AiAiTgD7gR8GfmZ+qa/9Q8DOUU68sLDAyspKBUOcnU6nw/Lyct3DmClrLoM1N0NEPLXesSqWdK4Gnu7bXuvtW8/bgc9W0K8kaQxVzPBjyL6h60QR8et0A//X1j1ZxCHgEMD27dvpdDoVDHF2Lly40LgxT8qay2DNzVdF4K8Bu/q2dwLnBhtFxKuBjwP7MvPb650sM48DxwGWlpayaW+nmvgWcFLWXAZrbr4qlnROA4sRsTsiXggcAE72N4iIXwA+A9ycmV+voE+1zMKR+1k4cn/dw5BabeIZfmZeiojDwAPAFuDOzDwbEbf2jh8D3g/8HPDRiAC4lJlLk/YtSRpdFUs6ZOYp4NTAvmN9t28BbqmiL0nS5vg/bSWpEAa+JBXCwJekQhj4klQIA18agR8bVRsY+JJUCANf0lzx3dT0GPiSVAgDX43hzE+ajIEvTZkvVJoXBr6k1vLF9scZ+JJUgSa8uBj4klQIA19T0YTZjlQaA19S4zih2BwDX5IKYeBLDTEvs9p5GYfGZ+BLUiEMfGkKnAVrHhn4KoYhrNIZ+JIazRfy0Rn4DePFLWmzDHxJKoSBL0mFMPAlFafUpVEDXyNd/KU8QUqpU2Uy8Dfgk19Smxj4c8IXlx/ZzH3h/acqtP06MvBVmXlcGmr7E1gaxxV1D0DNdjlMn1yudxxqvx9ea0dvqHkkzeUMvyDOdtV207rG2/LcMfAlbVpbgrAULumoNr5FH24e7xeX7qZrVo+5M3ypJv2z43mcKc/jmDQZA1+SCmHgS1IhDHxJqti8LocVG/jz+oCMow01TIP3izRcsYGv5jPYpfFUEvgRsTciHo+I1Yg4MuR4RMSHe8cfiYjXVtGvJGl0E38OPyK2AHcA1wFrwOmIOJmZj/Y12wcs9r6uBT7W+1dSDebhs/7zMIaNtPH/HlQxw98DrGbmE5n5feAEsH+gzX7gnux6CLgqInZU0LdazmUbNd08XcORmZOdIOLNwN7MvKW3fTNwbWYe7mtzH3A0M7/Y234QeHdmrmx07it3LOaOgx+caHySVJKnbr/xTGYuDTtWxQw/huwbfBUZpU23YcShiFiJiA1fDCRJ46nid+msAbv6tncC5zbRBoDMPA4cB1haWsqVCdf3+tcJ11szHKXNKO3HvT3K+Ydtj/I9Vewf9Xs7nQ7Ly8tjj61Om6nz+b53ksepyvGPO75Ra9js41zVfT2pzfQxrOZxH/OqvndUcfv6x6oI/NPAYkTsBr4JHADeMtDmJHA4Ik7Q/WHts5l5voK+59Y8hVvV2lybNE11P3cmDvzMvBQRh4EHgC3AnZl5NiJu7R0/BpwCrgdWgeeAt03ar6T2qDsIS1HJr0fOzFN0Q71/37G+2wncVkVf88Y
LVVJT+PvwC+ULVT2qut99/JqvjsfQX60gSYVwhr8J670yP3n0BjqdzmwH09e3JG3EGb4kFaL1M3xnvpLU1frAl4YpZSJQSp0aTVGBX9fFX+eTzif85jXlvmvKOFW/ogJf9TCQpPngD20lqRDO8HEGKqkMBv6M+eIiqS4GvlQRX8w17wx8qRClvyCVXj8Y+JIq0tRAbeq4N8NP6UhSIQx8SSqESzpaV0lvdaXNaNpzxBm+JBXCGf4catqsQdpI267nJtfjDF+SCuEMXz+mybMXSRtzhi9JhTDwJakQBr4kFcLAl8b05NEbuGvv1rqHIY3NwJekQvgpHUk/NG+f0pq38TSdM3xJKoQzfGkCzkDVJAb+AJ/AKs0sr3mfX/Uy8BvAJ4mkKhj4Uss4QdB6/KGtJBXCwJekQhj4klQIA1+SCmHgS1IhDHxJKoSBL0mFmOhz+BHxYuCvgQXgSeB3M/M7A212AfcALwN+ABzPzA9N0q9UJT+3rlJMOsM/AjyYmYvAg73tQZeAd2XmK4DXAbdFxDUT9itJGtOkgb8fuLt3+27gTYMNMvN8Zj7cu/094DHg6gn7lSSNadLA356Z56Eb7MBLN2ocEQvAa4AvT9ivJGlMz7uGHxFfoLv+Puh943QUES8CPg28MzO/u0G7Q8Ch3uaFiHh8nH7mwDbgmboHMWPWXAZrboaXr3cgMnPTZ+2F8XJmno+IHUAnM39xSLsXAPcBD2TmBzbdYQNExEpmLtU9jlmy5jJYc/NNuqRzEjjYu30QuHewQUQE8AngsbaHvSTNs0kD/yhwXUR8A7iut01E/HxEnOq1eT1wM/AbEfGV3tf1E/YrSRrTRJ/Dz8xvA28Ysv8ccH3v9heBmKSfhjle9wBqYM1lsOaGm2gNX5LUHP5qBUkqhIEvSYUw8CWpEAa+JBXCwJekQhj4klQIA1+SCmHgS1IhDHxJKoSBL0mFMPAlqRAGviQVwsCXpEIY+JJUiIl+H/60bdu2LRcWFuoexlguXrzI1q1b6x7GTFlzGay5Gc6cOfNMZr5k2LFKAj8i7gRuBL6Vma8acjyAD9H9oyjPAW/NzIef77wLCwusrKxUMcSZ6XQ6LC8v1z2MmbLmMlhzM0TEU+sdq2pJ5y5g7wbH9wGLva9DwMcq6leSNKJKAj8z/xH47w2a7Afuya6HgKsiYkcVfUuSRjOrNfyrgaf7ttd6+84PNoyIQ3TfBbB9+3Y6nc4sxleZCxcuNG7Mkyqt5rd+7iIAd9GpdyAzVtrjDO2reVaBP+yPmA/9Y7qZeZzeHw5eWlrKpq2fNXHNb1LF1fy5+wHKqpkCH2faV/OsPpa5Buzq294JnJtR35IkZhf4J4E/iK7XAc9m5k8s50iSpqeqj2X+FbAMbIuINeBPgRcAZOYx4BTdj2Su0v1Y5tuq6FeSNLpKAj8zb3qe4wncVkVfkqTN8VcrSFIhDHxJKoSBL0mFMPAlqRAGviQVwsCXpEIY+JJUCANfkgph4EtSIQx8SSqEgS9JhTDwJakQBr4kFcLAl6RCGPiSVAgDX5IKYeBLUiEMfEkqhIEvSYUw8CWpEAa+JBXCwJekQhj4klQIA1+SCmHgS1IhDHxJKoSBL0mFMPAlqRCVBH5E7I2IxyNiNSKODDm+HBHPRsRXel/vr6JfSdLorpj0BBGxBbgDuA5YA05HxMnMfHSg6T9l5o2T9idJ2pwqZvh7gNXMfCIzvw+cAPZXcF5JUoWqCPyrgaf7ttd6+wb9SkR8NSI+GxGvrKBfSdIYJl7SAWLIvhzYfhh4eWZeiIjrgb8FFoeeLOIQcAhg+/btdDqdCoY4OxcuXGjcmCdVYs1AcTWX+Di3reYqAn8N2NW3vRM4198gM7/bd/tURHw0IrZl5jODJ8vM48BxgKWlpVxeXq5giLPT6XRo2pgnVVzNn7sfoKyaKfBxpn01V7GkcxpYjIjdEfFC4ABwsr9BRLwsIqJ3e0+v329X0LckaUQTz/Az81JEHAYeALY
Ad2bm2Yi4tXf8GPBm4I8i4hLwP8CBzBxc9pEkTVEVSzpk5ing1MC+Y323PwJ8pIq+JEmb4/+0laRCGPiSVAgDX5IKYeBLUiEMfEkqhIEvSYUw8CWpEAa+JBXCwJekQhj4klQIA1+SCmHgS1IhDHxJKoSBL0mFMPAlqRAGviQVwsCXpEIY+JqKhSP3s3Dk/rqHoTH5uLWbgS9JhTDwJakQBr4kFcLAl6RCtD7wR/khVOk/qCq9fk1X6dfXPGVQ6wO/KqVftJJ+UtNywcDX2Jp2kY+jqtq8jzSPDHwVb9oBZkBqXhj4NZpFEDhj1TQ16fryGi448J3VSRrU9lyoJPAjYm9EPB4RqxFxZMjxiIgP944/EhGvraJfVa/uC3JQleMZ91zz1n7a56nSPI5JFQR+RGwB7gD2AdcAN0XENQPN9gGLva9DwMcm7bdOk1zM8/QRrao1ddwaromP56hjnvZzeF5dUcE59gCrmfkEQEScAPYDj/a12Q/ck5kJPBQRV0XEjsw8X0H/lbr8QD559IbNf+/ybPstxeB9VNp91l9vabVvls/nHxfdDJ7gBBFvBvZm5i297ZuBazPzcF+b+4CjmfnF3vaDwLszc2Wjc1+5YzF3HPzgROOTpJI8dfuNZzJzadixKtbwY8i+wVeRUdp0G0YcioiViNjwxUCSNJ4qlnTWgF192zuBc5toA0BmHgeOAywtLeXKJG/FBr533LdZo7QfbNPpdFheXp6o3436GKW2SdqMO+5J2qw3ns3cX+Oea9Jr4fLjXNU1Ne/3xTTazPJa3shG3z/O4zyNa2Ez4vb1j1UR+KeBxYjYDXwTOAC8ZaDNSeBwb33/WuDZeVy/34x5W6ObR+vdR953s+XjsHltuY8mDvzMvBQRh4EHgC3AnZl5NiJu7R0/BpwCrgdWgeeAt03a70bm7cGZxXj6+5i3+kcx6ZinHWZNPX/Tr4VZP3fmwTTHU8UMn8w8RTfU+/cd67udwG1V9FWiebsgpXni82N0xf5PW0kqTSUzfKlKJS5j9Cu9fk2Pgb8BnziSRtWEvHBJRxN58ugN3LV3a93D0JT5OLeDM/yCNGEGonJ4Pc5eUYHvBabL6roWvAZ1WR3XQlGB3wYGhuTzYLNcw5ekQhj4klQIl3S0Lt82axxeL/PPwC+UT07VweuuXi7pSFIhDHxJKoSBL0mFMPAlqRAT/xHzaYqI/wKeqnscY9oGPFP3IGbMmstgzc3w8sx8ybADcx34TRQRK+v9xfi2suYyWHPzuaQjSYUw8CWpEAZ+9Y7XPYAaWHMZrLnhXMOXpEI4w5ekQhj4FYuIP46IjIhtffveExGrEfF4RPx2neOrUkT8eUT8a0Q8EhF/ExFX9R1ra817ezWtRsSRusczDRGxKyL+ISIei4izEfGO3v4XR8TnI+IbvX9/tu6xVi0itkTEv0TEfb3tVtVs4FcoInYB1wH/3rfvGuAA8EpgL/DRiNhSzwgr93ngVZn5auDrwHugvTX3argD2AdcA9zUq7VtLgHvysxXAK8DbuvVeQR4MDMXgQd7223zDuCxvu1W1WzgV+svgD8B+n8wsh84kZn/m5n/BqwCe+oYXNUy8+8y81Jv8yFgZ+92W2veA6xm5hOZ+X3gBN1aWyUzz2fmw73b36MbgFfTrfXuXrO7gTfVMsApiYidwA3Ax/t2t6pmA78iEfFG4JuZ+dWBQ1cDT/dtr/X2tc0fAp/t3W5rzW2ta10RsQC8BvgysD0zz0P3RQF4aY1Dm4YP0p2w/aBvX6tq9vfhjyEivgC8bMih9wHvBX5r2LcN2deYj0ZtVHNm3ttr8z66ywCfvPxtQ9o3puYNtLWuoSLiRcCngXdm5ncjhpXfDhFxI/CtzDwTEcs1D2dqDPwxZOZvDtsfEb8E7Aa+2ntS7AQejog9dGeBu/qa7wTOTXmolVmv5ssi4iBwI/CG/NFnfBtd8wbaWtdPiIgX0A37T2bmZ3q7/zMidmTm+YjYAXyrvhFW7vX
AGyPieuCngZ+JiL+kZTW7pFOBzPxaZr40Mxcyc4FuMLw2M/8DOAkciIgrI2I3sAj8c43DrUxE7AXeDbwxM5/rO9TWmk8DixGxOyJeSPcH0ydrHlPlojtr+QTwWGZ+oO/QSeBg7/ZB4N5Zj21aMvM9mbmz9/w9APx9Zv4+LavZGf6UZebZiPgU8CjdZY/bMvP/ah5WVT4CXAl8vvfO5qHMvLWtNWfmpYg4DDwAbAHuzMyzNQ9rGl4P3Ax8LSK+0tv3XuAo8KmIeDvdT6L9Tj3Dm6lW1ez/tJWkQrikI0mFMPAlqRAGviQVwsCXpEIY+JJUCANfkgph4EtSIQx8SSrE/wMpeUs5Gu1M/QAAAABJRU5ErkJggg==", - "text/plain": [ - "
" - ] - }, - "metadata": { - "needs_background": "light" - }, - "output_type": "display_data" - } - ], + "outputs": [], "source": [ "# Create a visualization with Modin df\n", "# Example modified from https://matplotlib.org/3.1.1/gallery/lines_bars_and_markers/xcorr_acorr_demo.html#sphx-glr-gallery-lines-bars-and-markers-xcorr-acorr-demo-py\n", @@ -74,22 +46,9 @@ }, { "cell_type": "code", - "execution_count": 3, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "image/png": "iVBORw0KGgoAAAANSUhEUgAAAXwAAAD6CAYAAACiefy7AAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjQuMywgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy/MnkTPAAAACXBIWXMAAAsTAAALEwEAmpwYAAAR40lEQVR4nO3dUYxcV33H8e+/DqSSUZVSg3Fjl/XDqiJQKtDKoaUP29K0dhJhHmjl0KaGElmpYgkkqmJAon10VIkCImBZECVRUV0kaGMlhhTSjlqEQr1OIchJA6s0aRa7paEoYKcqcvn3YcYwDLObmZ07c+fe8/1IK8+99+w95z9z5zdnzo53IzORJLXfT9U9AEnSbBj4klQIA1+SCmHgS1IhDHxJKoSBL0mFqCTwI2JvRDweEasRcWTI8d+LiEd6X1+KiF+uol9J0uhi0s/hR8QW4OvAdcAacBq4KTMf7Wvzq8BjmfmdiNgH/FlmXvt85962bVsuLCxMNL5Zu3jxIlu3bq17GDNlzWWw5mY4c+bMM5n5kmHHrqjg/HuA1cx8AiAiTgD7gR8GfmZ+qa/9Q8DOUU68sLDAyspKBUOcnU6nw/Lyct3DmClrLoM1N0NEPLXesSqWdK4Gnu7bXuvtW8/bgc9W0K8kaQxVzPBjyL6h60QR8et0A//X1j1ZxCHgEMD27dvpdDoVDHF2Lly40LgxT8qay2DNzVdF4K8Bu/q2dwLnBhtFxKuBjwP7MvPb650sM48DxwGWlpayaW+nmvgWcFLWXAZrbr4qlnROA4sRsTsiXggcAE72N4iIXwA+A9ycmV+voE+1zMKR+1k4cn/dw5BabeIZfmZeiojDwAPAFuDOzDwbEbf2jh8D3g/8HPDRiAC4lJlLk/YtSRpdFUs6ZOYp4NTAvmN9t28BbqmiL0nS5vg/bSWpEAa+JBXCwJekQhj4klQIA18agR8bVRsY+JJUCANf0lzx3dT0GPiSVAgDX43hzE+ajIEvTZkvVJoXBr6k1vLF9scZ+JJUgSa8uBj4klQIA19T0YTZjlQaA19S4zih2BwDX5IKYeBLDTEvs9p5GYfGZ+BLUiEMfGkKnAVrHhn4KoYhrNIZ+JIazRfy0Rn4DePFLWmzDHxJKoSBL0mFMPAlFafUpVEDXyNd/KU8QUqpU2Uy8Dfgk19Smxj4c8IXlx/ZzH3h/acqtP06MvBVmXlcGmr7E1gaxxV1D0DNdjlMn1yudxxqvx9ea0dvqHkkzeUMvyDOdtV207rG2/LcMfAlbVpbgrAULumoNr5FH24e7xeX7qZrVo+5M3ypJv2z43mcKc/jmDQZA1+SCmHgS1IhDHxJqti8LocVG/jz+oCMow01TIP3izRcsYGv5jPYpfFUEvgRsTciHo+I1Yg4MuR4RMSHe8cfiYjXVtGvJGl0E38OPyK2AHcA1wFrwOmIOJmZj/Y12wcs9r6uBT7W+1dSDebhs/7zMIaNtPH/HlQxw98DrGbmE5n5fe
AEsH+gzX7gnux6CLgqInZU0LdazmUbNd08XcORmZOdIOLNwN7MvKW3fTNwbWYe7mtzH3A0M7/Y234QeHdmrmx07it3LOaOgx+caHySVJKnbr/xTGYuDTtWxQw/huwbfBUZpU23YcShiFiJiA1fDCRJ46nid+msAbv6tncC5zbRBoDMPA4cB1haWsqVCdf3+tcJ11szHKXNKO3HvT3K+Ydtj/I9Vewf9Xs7nQ7Ly8tjj61Om6nz+b53ksepyvGPO75Ra9js41zVfT2pzfQxrOZxH/OqvndUcfv6x6oI/NPAYkTsBr4JHADeMtDmJHA4Ik7Q/WHts5l5voK+59Y8hVvV2lybNE11P3cmDvzMvBQRh4EHgC3AnZl5NiJu7R0/BpwCrgdWgeeAt03ar6T2qDsIS1HJr0fOzFN0Q71/37G+2wncVkVf88YLVVJT+PvwC+ULVT2qut99/JqvjsfQX60gSYVwhr8J670yP3n0BjqdzmwH09e3JG3EGb4kFaL1M3xnvpLU1frAl4YpZSJQSp0aTVGBX9fFX+eTzif85jXlvmvKOFW/ogJf9TCQpPngD20lqRDO8HEGKqkMBv6M+eIiqS4GvlQRX8w17wx8qRClvyCVXj8Y+JIq0tRAbeq4N8NP6UhSIQx8SSqESzpaV0lvdaXNaNpzxBm+JBXCGf4catqsQdpI267nJtfjDF+SCuEMXz+mybMXSRtzhi9JhTDwJakQBr4kFcLAl8b05NEbuGvv1rqHIY3NwJekQvgpHUk/NG+f0pq38TSdM3xJKoQzfGkCzkDVJAb+AJ/AKs0sr3mfX/Uy8BvAJ4mkKhj4Uss4QdB6/KGtJBXCwJekQhj4klQIA1+SCmHgS1IhDHxJKoSBL0mFmOhz+BHxYuCvgQXgSeB3M/M7A212AfcALwN+ABzPzA9N0q9UJT+3rlJMOsM/AjyYmYvAg73tQZeAd2XmK4DXAbdFxDUT9itJGtOkgb8fuLt3+27gTYMNMvN8Zj7cu/094DHg6gn7lSSNadLA356Z56Eb7MBLN2ocEQvAa4AvT9ivJGlMz7uGHxFfoLv+Puh943QUES8CPg28MzO/u0G7Q8Ch3uaFiHh8nH7mwDbgmboHMWPWXAZrboaXr3cgMnPTZ+2F8XJmno+IHUAnM39xSLsXAPcBD2TmBzbdYQNExEpmLtU9jlmy5jJYc/NNuqRzEjjYu30QuHewQUQE8AngsbaHvSTNs0kD/yhwXUR8A7iut01E/HxEnOq1eT1wM/AbEfGV3tf1E/YrSRrTRJ/Dz8xvA28Ysv8ccH3v9heBmKSfhjle9wBqYM1lsOaGm2gNX5LUHP5qBUkqhIEvSYUw8CWpEAa+JBXCwJekQhj4klQIA1+SCmHgS1IhDHxJKoSBL0mFMPAlqRAGviQVwsCXpEIY+JJUiIl+H/60bdu2LRcWFuoexlguXrzI1q1b6x7GTFlzGay5Gc6cOfNMZr5k2LFKAj8i7gRuBL6Vma8acjyAD9H9oyjPAW/NzIef77wLCwusrKxUMcSZ6XQ6LC8v1z2MmbLmMlhzM0TEU+sdq2pJ5y5g7wbH9wGLva9DwMcq6leSNKJKAj8z/xH47w2a7Afuya6HgKsiYkcVfUuSRjOrNfyrgaf7ttd6+84PNoyIQ3TfBbB9+3Y6nc4sxleZCxcuNG7Mkyqt5rd+7iIAd9GpdyAzVtrjDO2reVaBP+yPmA/9Y7qZeZzeHw5eWlrKpq2fNXHNb1LF1fy5+wHKqpkCH2faV/OsPpa5Buzq294JnJtR35IkZhf4J4E/iK7XAc9m5k8s50iSpqeqj2X+FbAMbIuINeBPgRcAZOYx4BTdj2Su0v1Y5tuq6FeSNLpKAj8zb3qe4wncVkVfkqTN8VcrSFIhDHxJKoSBL0mFMPAlqRAGviQVwsCXpEIY+JJUCANfkgph4EtSIQx8SSqEgS9JhTDwJakQBr4kFcLAl6RCGPiSVAgDX5IKYeBLUiEMfEkqhIEvSY
Uw8CWpEAa+JBXCwJekQhj4klQIA1+SCmHgS1IhDHxJKoSBL0mFMPAlqRCVBH5E7I2IxyNiNSKODDm+HBHPRsRXel/vr6JfSdLorpj0BBGxBbgDuA5YA05HxMnMfHSg6T9l5o2T9idJ2pwqZvh7gNXMfCIzvw+cAPZXcF5JUoWqCPyrgaf7ttd6+wb9SkR8NSI+GxGvrKBfSdIYJl7SAWLIvhzYfhh4eWZeiIjrgb8FFoeeLOIQcAhg+/btdDqdCoY4OxcuXGjcmCdVYs1AcTWX+Di3reYqAn8N2NW3vRM4198gM7/bd/tURHw0IrZl5jODJ8vM48BxgKWlpVxeXq5giLPT6XRo2pgnVVzNn7sfoKyaKfBxpn01V7GkcxpYjIjdEfFC4ABwsr9BRLwsIqJ3e0+v329X0LckaUQTz/Az81JEHAYeALYAd2bm2Yi4tXf8GPBm4I8i4hLwP8CBzBxc9pEkTVEVSzpk5ing1MC+Y323PwJ8pIq+JEmb4/+0laRCGPiSVAgDX5IKYeBLUiEMfEkqhIEvSYUw8CWpEAa+JBXCwJekQhj4klQIA1+SCmHgS1IhDHxJKoSBL0mFMPAlqRAGviQVwsCXpEIY+JqKhSP3s3Dk/rqHoTH5uLWbgS9JhTDwJakQBr4kFcLAl6RCtD7wR/khVOk/qCq9fk1X6dfXPGVQ6wO/KqVftJJ+UtNywcDX2Jp2kY+jqtq8jzSPDHwVb9oBZkBqXhj4NZpFEDhj1TQ16fryGi448J3VSRrU9lyoJPAjYm9EPB4RqxFxZMjxiIgP944/EhGvraJfVa/uC3JQleMZ91zz1n7a56nSPI5JFQR+RGwB7gD2AdcAN0XENQPN9gGLva9DwMcm7bdOk1zM8/QRrao1ddwaromP56hjnvZzeF5dUcE59gCrmfkEQEScAPYDj/a12Q/ck5kJPBQRV0XEjsw8X0H/lbr8QD559IbNf+/ybPstxeB9VNp91l9vabVvls/nHxfdDJ7gBBFvBvZm5i297ZuBazPzcF+b+4CjmfnF3vaDwLszc2Wjc1+5YzF3HPzgROOTpJI8dfuNZzJzadixKtbwY8i+wVeRUdp0G0YcioiViNjwxUCSNJ4qlnTWgF192zuBc5toA0BmHgeOAywtLeXKJG/FBr533LdZo7QfbNPpdFheXp6o3436GKW2SdqMO+5J2qw3ns3cX+Oea9Jr4fLjXNU1Ne/3xTTazPJa3shG3z/O4zyNa2Ez4vb1j1UR+KeBxYjYDXwTOAC8ZaDNSeBwb33/WuDZeVy/34x5W6ObR+vdR953s+XjsHltuY8mDvzMvBQRh4EHgC3AnZl5NiJu7R0/BpwCrgdWgeeAt03a70bm7cGZxXj6+5i3+kcx6ZinHWZNPX/Tr4VZP3fmwTTHU8UMn8w8RTfU+/cd67udwG1V9FWiebsgpXni82N0xf5PW0kqTSUzfKlKJS5j9Cu9fk2Pgb8BnziSRtWEvHBJRxN58ugN3LV3a93D0JT5OLeDM/yCNGEGonJ4Pc5eUYHvBabL6roWvAZ1WR3XQlGB3wYGhuTzYLNcw5ekQhj4klQIl3S0Lt82axxeL/PPwC+UT07VweuuXi7pSFIhDHxJKoSBL0mFMPAlqRAT/xHzaYqI/wKeqnscY9oGPFP3IGbMmstgzc3w8sx8ybADcx34TRQRK+v9xfi2suYyWHPzuaQjSYUw8CWpEAZ+9Y7XPYAaWHMZrLnhXMOXpEI4w5ekQhj4FYuIP46IjIhtffveExGrEfF4RPx2neOrUkT8eUT8a0Q8EhF/ExFX9R1ra817ezWtRsSRusczDRGxKyL+ISIei4izEfGO3v4XR8TnI+IbvX9/tu6xVi0itkTEv0TEfb3tVtVs4FcoInYB1wH/3rfvGuAA8EpgL/DRiNhSzwgr93ngVZn5auDrwHugvTX3argD2AdcA9zUq7VtLgHvysxXAK8DbuvVeQR4MDMXgQd7223zDuCxvu1W1WzgV+
svgD8B+n8wsh84kZn/m5n/BqwCe+oYXNUy8+8y81Jv8yFgZ+92W2veA6xm5hOZ+X3gBN1aWyUzz2fmw73b36MbgFfTrfXuXrO7gTfVMsApiYidwA3Ax/t2t6pmA78iEfFG4JuZ+dWBQ1cDT/dtr/X2tc0fAp/t3W5rzW2ta10RsQC8BvgysD0zz0P3RQF4aY1Dm4YP0p2w/aBvX6tq9vfhjyEivgC8bMih9wHvBX5r2LcN2deYj0ZtVHNm3ttr8z66ywCfvPxtQ9o3puYNtLWuoSLiRcCngXdm5ncjhpXfDhFxI/CtzDwTEcs1D2dqDPwxZOZvDtsfEb8E7Aa+2ntS7AQejog9dGeBu/qa7wTOTXmolVmv5ssi4iBwI/CG/NFnfBtd8wbaWtdPiIgX0A37T2bmZ3q7/zMidmTm+YjYAXyrvhFW7vXAGyPieuCngZ+JiL+kZTW7pFOBzPxaZr40Mxcyc4FuMLw2M/8DOAkciIgrI2I3sAj8c43DrUxE7AXeDbwxM5/rO9TWmk8DixGxOyJeSPcH0ydrHlPlojtr+QTwWGZ+oO/QSeBg7/ZB4N5Zj21aMvM9mbmz9/w9APx9Zv4+LavZGf6UZebZiPgU8CjdZY/bMvP/ah5WVT4CXAl8vvfO5qHMvLWtNWfmpYg4DDwAbAHuzMyzNQ9rGl4P3Ax8LSK+0tv3XuAo8KmIeDvdT6L9Tj3Dm6lW1ez/tJWkQrikI0mFMPAlqRAGviQVwsCXpEIY+JJUCANfkgph4EtSIQx8SSrE/wMpeUs5Gu1M/QAAAABJRU5ErkJggg==", - "text/plain": [ - "
" - ] - }, - "metadata": { - "needs_background": "light" - }, - "output_type": "display_data" - } - ], + "outputs": [], "source": [ "# Create a visualization with pandas df\n", "# Example modified from https://matplotlib.org/3.1.1/gallery/lines_bars_and_markers/xcorr_acorr_demo.html#sphx-glr-gallery-lines-bars-and-markers-xcorr-acorr-demo-py\n", @@ -112,29 +71,9 @@ }, { "cell_type": "code", - "execution_count": 4, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "UserWarning: Distributing object. This may take some time.\n" - ] - }, - { - "data": { - "image/png": "", - "text/plain": [ - "
" - ] - }, - "metadata": { - "needs_background": "light" - }, - "output_type": "display_data" - } - ], + "outputs": [], "source": [ "# Create a visualization with Modin df\n", "# Example modified from https://matplotlib.org/stable/tutorials/introductory/pyplot.html#sphx-glr-tutorials-introductory-pyplot-py\n", @@ -158,22 +97,9 @@ }, { "cell_type": "code", - "execution_count": 5, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "image/png": "", - "text/plain": [ - "
" - ] - }, - "metadata": { - "needs_background": "light" - }, - "output_type": "display_data" - } - ], + "outputs": [], "source": [ "# Create a visualization with pandas df\n", "# Example modified from https://matplotlib.org/stable/tutorials/introductory/pyplot.html#sphx-glr-tutorials-introductory-pyplot-py\n", @@ -196,29 +122,9 @@ }, { "cell_type": "code", - "execution_count": 6, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "UserWarning: Distributing object. This may take some time.\n" - ] - }, - { - "data": { - "image/png": "iVBORw0KGgoAAAANSUhEUgAAAY8AAADYCAYAAAATZm8cAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjQuMywgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy/MnkTPAAAACXBIWXMAAAsTAAALEwEAmpwYAAAi2UlEQVR4nO3deZzV9X3v8ddbEJBtUFmEQQUFNSiuUzWJccM0McZgYhajsdQYaW1iTFtvatramubGcnuTXDGptaQxId5coyYaNSZGHcWlcWFxYREZVFAWYQAZFFdmPveP3/focZxhzsBZ5px5Px8PHue3ne/v8/v5cz7n8/v+FkUEZmZm3bFLpQMwM7Pq4+RhZmbd5uRhZmbd5uRhZmbd5uRhZmbd5uRhZmbd5uRhZhUh6VVJ++1kGz+T9D934HsnSlq1M+tu194+aXv6FKvNns7Jw6yKSTpb0rz0h2utpN9LOq7A74akCaWOsTMRMTginitV+5L+XFJr2jdbJD0h6ZM70M77EpSkFZJOyY1HxAtpe1qLEXs1cPIwq1KS/ga4ErgCGAXsA1wNTK1gWF2S1LeMq3s4IgYDw4CfADdK2qOM669ZTh5mVUhSHfAvwFcj4uaI2BoRb0fE7RHxP9IyR0t6WNLmVJX8SFK/NO+B1NST6Zf5F9L0T6Zf6Jsl/VHSoXnrPFLS45JekXSTpBvyf5FLukDSckmbJN0maUzevJD0VUlNQFPetAlpeDdJ35e0UlKLpIck7Zbm3STppTT9AUkHd3d/RUQbcC2wG/C+U2WSPiBpTtruxZI+laZPB84Bvpn20+2SriNL1Lenad+UNC5tT9/0vTmSviPpv9P+ukvS8Lz1/Vna1o2SLmtfyVQDJw+z6vRBYABwy3aWaQX+Ghielp8C/BVARByfljksnW65QdKRZH9g/wLYE/hP4DZJ/VPSuQX4GbAHcD3w6dyKJJ0M/CvweWA0sBL4Zbt4zgCOASZ1EOv3gKOAD6X2vwm0pXm/ByYCI4EFwC+2s80dSn/UvwK8SkpeefN2BW4H7krruAj4haQDI2JWWt+/pf10ekScC7wAnJ6m/Vsnqz0bOC+12Q+4JK1vElmFeA7ZvqoD6ru7TZXm5GFWnfYENkTEts4WiIj5EfFIRGyLiBVkyeCE7bR5AfCfEfFoRLRGxGzgTeDY9K8vcFWqcG4GHsv77jnAtRGxICLeBL4FfFDSuLxl/jUiNkXE6/krlbQL8GXg4ohYndb9x9QOEXFtRLySxi8HDkuVVyGOlbQZeAn4IvDpiGhpvwwwGJgREW9FxL3Ab9PyO+OnEbEsbe+NwOFp+meB2yPioYh4C/gnoOoeMljOc49mVjwbgeGS+naWQCQdAPwAaAAGkv3/Pn87be4LTJN0U
d60fsAYsj9uq+O9T1J9MW94DFlVAEBEvCppI9kv6hUdLJ9vOFkV9WwH29AH+C7wOWAE71Yjw4H2SaAjj0REVxcQjAFeTKe2clay89XAS3nDr5ElqHfWl5sREa+lfVVVXHmYVaeHgTfITgV15j+ApcDEiBgK/D2g7Sz/IvDdiBiW929gRFwPrAXqJeV/f++84TVkyQcASYPIqqPVect09ut6Q9qW/TuYdzbZBQCnkJ3eGZdbxXa2o7vWAHunCihnH96NvaO4d6ZSWAuMzY2kvp09d6K9inDyMKtC6dTLPwH/LukMSQMl7SrpVEm5c/BDgC3Aq5IOAi5s18w63tt5/GPgLyUdo8wgSadJGkKWrFqBr0nqK2kqcHTed/8fcJ6kwyX1J7sC7NF0uqyrbcl1Zv9A0hhJfSR9MLUzhOzU2Uay6umKwvdSwR4FtpJ1iu8q6UTgdN7ts2m/nzqbVqhfAadL+lDqS/o2xU2GZeHkYValIuIHwN8A/wg0k1UOXwN+kxa5hOyX+ytkieGGdk1cDsxOVxh9PiLmkfV7/Ah4GVgO/Hla11vAZ4Dzgc3Al8j6BXL9Eo3AZcCvyX5Z7w+c1Y3NuQRYCMwFNgH/i+zv08/JTiGtBpYAj3SjzYKkbfsUcCpZFXQ18GcRsTQt8hNgUtpPv0nT/hX4xzTtkm6ubzFZp/wvyfbVK8B60r6sFvLLoMxsR0h6FLgmIn5a6ViqmaTBZAl5YkQ8X+FwCubKw8wKIukESXul01bTgEOBOysdVzWSdHo61TiI7DLlhbx7YUFVcPIws0IdCDxJdpXT3wKfjYi1lQ2pak0l66hfQ3YPy1lRZaeBfNrKzMy6zZWHmZl1m5OHmZl1m5OHmZl1m5OHmZl1m5OHmZl1m5OHmZl1m5OHmZl1W80+kn348OExbty4SodhNWL+/PkbImJEudfr49iKpdjHcM0mj3HjxjFv3rxKh2E1QtLKSqzXx7EVS7GPYZ+2MjOzbnPyMDOzbnPyMNtBkq6VtF7Sorxpe0i6W1JT+tw9b963JC2X9Iykj1UmarPicPIw23E/Az7ebtqlQGNETAQa0ziSJpG9HOng9J2r0/u5zaqSk4fZDoqIB8jeepdvKjA7Dc/m3XeMTwV+GRFvphf+LOe9r3E12ylvbmvlst8s4vkNW8uyvpq92mrh6hbGXXpHpcOwKrJixmnFaGZU7h0XEbFW0sg0vZ73vkJ1VZr2PpKmA9MB9tlnn2LEZL3AjXNf5LpHVvKxg/di/PBBJV+fKw+z8lAH0zp8mU5EzIqIhohoGDGi7LeWWBV6c1srV895loZ9d+fDE/YsyzqdPMyKa52k0QDpc32avgrYO2+5sWRvkTPbaTfOW8Xalje4+JSJSB39Tik+Jw+z4roNmJaGpwG35k0/S1J/SePJXj36WAXisxrz5rZW/uO+5Ry17+4cN2F42dZbs30eZqUm6XrgRGC4pFXAPwMzgBslnQ+8AHwOICIWS7oRWAJsA74aEa0VCdxqyk3zVrGm5Q1mnHlo2aoOcPIw22ER8cVOZk3pZPnvAt8tXUTW27y1rY2r71vOkfsM4yMTy1d1gE9bmZlVrZvmv8ialje4+JQDylp1gJOHmVlVyqqOZzlin2EcX+aqA5w8zMyq0q/mr2L15te5eEr5rrDK5+RhZlZl3trWxr/ft5zD9x7GCQdU5l4gJw8zsyrz6wWp6ijjfR3tOXmYmVWRXNVx2N7DOLFCVQc4eZiZVZWbF6xi1cuv840K9XXkOHmYmVWJt1vb+NF9yzlsbB0nHljZ5545eZiZVYlc1VHJvo4cJw8zsyrwdmsbP7x3OYeOreOkA0d2/YUSc/IwM6sCtyxYnVUdFe7ryHHyMDPr4d5ubeOH9zUxub6Okw+qfNUBTh5mZj3eLY+v5sVNPafqgCIlD0l+Oq+ZWQm83drGj+5dziH1Q5nygZ5RdUCByUPSZZKWSrpb0vWSLpE0R9IVku4HLpY0RdLjkhZKulZS//TdF
ZKGp+EGSXPS8OWSrpN0r6QmSRd0EcM3U9tPSpqxc5ttZlYdfvP4al7Y9BrfmFL+J+duT5cVg6QG4EzgiLT8AmB+mj0sIk6QNABoAqZExDJJPwcuBK7sovlDgWOBQcDjku6IiPe9mlPSqcAZwDER8ZqkPTqJdTowHaDPUL/72cyq27Z0X0dPqzqgsMrjOODWiHg9Il4Bbs+bd0P6PBB4PiKWpfHZwPEFtJ1rdwNwH3B0J8udAvw0Il4DiIhNHS0UEbMioiEiGvoMrCtg9WZmPddvnljDyo2vcXEPqzqgsOSxvYi3FrDMtrz1DGg3L7oYz4+hs3lmZjVnW2sbP7y3iYPHDOWUHlZ1QGHJ4yHgdEkDJA0GTutgmaXAOEkT0vi5wP1peAVwVBo+s933pqZ29yR7F/TcTmK4C/iypIEAnZ22MjOrFbe+U3X0nCus8nWZPCJiLnAb8CRwMzAPaGm3zBvAecBNkhYCbcA1afa3gZmSHgRa2zX/GHAH8AjwnY76O1L7d6YY5kl6ArikkI0zM6tGuapj0uihfHTSqEqH06FCL7H9XkRcnn75PwB8PyJ+nL9ARDSSdarTbvqDwAGdtLssIqYXEkBEzAB8lZWZ1bzbnlzDio2v8Z/nHtUjqw4o/D6PWekX/wLg1xGxoHQhmVU3SX8tabGkRenS9gGS9kiXujelz90rHaf1TNvSM6w+MHoof9pDqw4osPKIiLOLveKIuLz9NEmTgevaTX4zIo4p9vrNSkFSPfB1YFJEvC7pRuAsYBLQGBEzJF0KXAr8XQVDtR7q9qfW8PyGrVzzpZ5bdUDhp63KIiIWAodXOg6zndQX2E3S28BAYA3wLbKLQiC7lH0OTh7WTmtb8MPG5Ry015AeXXWAn21lVlQRsRr4HvACsBZoiYi7gFERsTYtsxbo9NpLSdMlzZM0r7m5uRxhWw9x+5NreG7DVr5xykR22aXnVh3g5GFWVKkvYyowHhgDDJL0pe60kX+z64gRflJCb9HaFlx1b1OqOvaqdDhdcvIwK65TyJ620BwRb5Nd3v4hYJ2k0QDpc30FY7Qe6LdPreG55q1cPKXnVx3g5GFWbC8Ax0oaqKy3cwrwNNl9StPSMtOAWysUn/VArW3BzMYmDhw1hI8d3POrDuhhHeZm1S4iHpX0K7LL2rcBjwOzgMHAjZLOJ0swn6tclNbT5KqOq885siqqDnDyMCu6iPhn4J/bTX6TrAoxe4/WtuCqVHV8vEqqDvBpKzOzivrtU2t4tnkrX6+Svo4cJw8zswppbQt+eO9yDhg1mFMPqZ6qA5w8zMwq5o6Fa1m+/tWqqzrAycPMrCKyu8mbmDhyMJ84ZHSlw+k2Jw8zswr43cK1NFVp1QFOHmZmZdeWrrCaOHIwn5hcfVUHOHmYmZXd7xZlVcdFUybSpwqrDqjh+zwm19cxb0ZHb8w1M6ucXNUxYeRgTqvSqgNceZiZldXvF73EsnWvctHJE6q26gAnDzOzsslVHfuPGMQnDx1T6XB2ipOHmVmZ3Ln4JZ5Z9wpfr+K+jhwnDzOzMshVHfvVQNUBTh5mZmXxh8UvsfSlV/j6ydVfdYCTh5lZybWl93XsN3wQpx9W/VUHOHmYmZXcXUuyquOiKdV9hVU+Jw8zsxLKqo7lWdVRA30dOU4eZmYldNeSdTy9dgtfO3kCffvUzp/cmr3DfOHqFsZdeke3v7fCd6WbWZHk+jrGDx/Ep2qkryOndtKgmVkPc/fTqeo4qbaqDnDyMDMriYhg5j1NjNtzIFMPr62qA5w8zMxK4u4l61iydgsXnTyx5qoOcPIwKwlJwyT9StJSSU9L+qCkPSTdLakpfe5e6TitNCKyvo5arTrAycOsVGYCd0bEQcBhwNPApUBjREwEGtO41aB7nl7P4jVb+FqNVh3g5GFWdJKGAscDPwGIiLciYjMwFZidFpsNnFGJ+Ky0IoIr71nGvnsO5IwarTrAycOsFPYDmoGfSnpc0n9JGgSMioi1AOlzZ
EdfljRd0jxJ85qbm8sXtRVFY67qqMErrPLV7paZVU5f4EjgPyLiCGAr3ThFFRGzIqIhIhpGjBhRqhitBCKCKxuXsc8eA/n0EfWVDqeknDzMim8VsCoiHk3jvyJLJuskjQZIn+srFJ+VyL1L17Node3dTd6R2t46swqIiJeAFyUdmCZNAZYAtwHT0rRpwK0VCM9KJOvraGLvPXar+aoDavjxJGYVdhHwC0n9gOeA88h+rN0o6XzgBeBzFYzPiuy+Z9azcHUL/3bmoexa41UHOHmYlUREPAE0dDBrSplDsTJ4T9VxZO1XHeDTVmZmO23OM808taqFr500oVdUHeDkYWa2U3L3dYzdfTc+c+TYSodTNk4eZmY7Yc6yZp7sZVUHOHmYme2wXF9H/bDeVXWAk4eZ2Q67f1kzT764ma+dPIF+fXvXn9PetbVmZkWSX3Wc2cuqDqiS5CHpREm/rXQcZmY59y9r5okXN/PVk3pf1QFFSh6SfL+ImfUaufd11A/bjc8e1fuqDigweUi6LL3U5m5J10u6RNIcSVdIuh+4WNKU9ATRhZKuldQ/fXeFpOFpuEHSnDR8uaTrJN2bXo5zQRdhDJV0i6Qlkq6R9L7Y859G2vpaS7d2hJlZoR5o2sDjL2zmr07av1dWHVDAHeaSGoAzgSPS8guA+Wn2sIg4QdIAoAmYEhHLJP0cuBC4sovmDwWOBQYBj0u6IyLWdLLs0cAkYCVwJ/AZsgfOvSMiZgGzAPqPnhhdbZuZWXdl7yZfxpi6AXzuqL0rHU7FFJIyjwNujYjXI+IV4Pa8eTekzwOB5yNiWRqfTfYynK7k2t0A3EeWIDrzWEQ8FxGtwPUpLjOzsnqwaQMLXtjMX/XSvo6cQrZc25m3tYBltuWtZ0C7ee2rg+1VC91Z1sys6HJ9HWPqBvC5ht7Z15FTSPJ4CDhd0gBJg4HTOlhmKTBO0oQ0fi5wfxpeARyVhs9s972pqd09gROBuduJ42hJ41NfxxdSXGZmZfPQ8g3MX/kyF540gf59+1Q6nIrqMnlExFyy9xA8CdwMzANa2i3zBtkjp2+StBBoA65Js78NzJT0INDarvnHgDuAR4DvbKe/A+BhYAawCHgeuKWr2M3MiiXr62hidN0APt/Lqw4o/JHs34uIyyUNBB4Avh8RP85fICIayTrVaTf9QeCATtpdFhHTu1p5RMwB5hQYq5lZ0f338o3MW/ky35l6cK+vOqDw5DFL0iSyPovZEbGghDGZmfUoWV/HMvYaOoDP/0nvvcIqX0HJIyLOLvaKI+Ly9tMkTQauazf5zYg4ptjrNzMr1B+f3cjcFS/zL6463tGj7gyPiIXA4ZWOw8wsJ9fXsdfQAXy+wVVHTu+9SNnMrAAPP7uRx1Zs4sIT92fArq46cpw8zMw6ERFc2djEqKH9+YL7Ot7DycPMrBMPP7eRx57fxIUnuOpoz8nDrAQk9UkPCv1tGt8jPVi0KX3uXukYrWsz72li5JD+nHX0PpUOpcdx8jArjYuBp/PGLwUaI2Ii0JjGrQd7+NmNPPq8+zo64+RhVmSSxpI9xue/8iZPJXtgKOnzjDKHZd00s3EZI4f054uuOjrk5GFWfFcC3yR7TE/OqIhYC5A+R3b25fz30jQ3N5c0UOvYw89u5JHnNvGX7uvolJOHWRFJ+iSwPiLmd7lwJyJiVkQ0RETDiBEjihidFWpm4zJGDOnP2ce46uhMj7pJ0KwGfBj4lKRPkD3OZ6ik/wuskzQ6ItZKGg2sr2iU1qlHnsuqjn/65CRXHdvhysOsiCLiWxExNiLGAWcB90bEl8ieTD0tLTYNuLVCIVoXZt7T5KqjAE4eZuUxA/iopCbgo2ncephHn9vIw89tdF9HAXzayqxE8l8lEBEbgSmVjMe6NrOxieGD+3OOq44u1WzymFxfx7wZHb300Mzs/R57fhN/fHYj/3jaB1x1FMCnrczMyK6wyqqOfSsdSlVw8jCzXm/uik389/KN/OUJ+7FbP
1cdhXDyMLNeb+Y9TQwf3M9VRzc4eZhZrzZvxSYeWr6Bvzh+f1cd3eDkYWa92szGJvYc1I9zjvUVVt3h5GFmvdb8lZt4sGkDf3HCfgzsV7MXn5aEk4eZ9VpX3pNVHV861n0d3eXkYWa90vyVL/Ng0wamH++qY0c4eZhZrzSzsYk9BvXj3A+66tgRNZs8Fq5uYdyld1Q6DDPrgRa88DIPLGt21bETajZ5mJl1ZuY9qepwX8cOc/Iws17l8Rde5v5lzVzwkf0Y1N9Vx45y8jCzXmVmYxO7D9yVP3Nfx05x8jCzXuOJFzcz55lmLjjeVcfOcvIws15j5j3LUtUxrtKhVD0nDzPrFZ54cTP3PdPMVz6yH4Nddew0Jw8z6xWuamxi2MBdmfahcZUOpSY4eZhZzXvyxc3cu3Q9F7jqKBonDzOrebmqw1dYFY+Th5nVtKdWbaZx6Xq+ctx4hgzYtdLh1AwnD7Mik7S3pPskPS1psaSL0/Q9JN0tqSl97l7pWHuDqxqbqNvNfR3F5uRhVnzbgL+NiA8AxwJflTQJuBRojIiJQGMatxJauKqFe5521VEKTh5mRRYRayNiQRp+BXgaqAemArPTYrOBMyoSYC8yM1d1fHhcpUOpOU4eZiUkaRxwBPAoMCoi1kKWYICRnXxnuqR5kuY1NzeXLdZas2h1C/c8vY7zjxvPUFcdRefkYVYikgYDvwa+ERFbCv1eRMyKiIaIaBgxYkTpAqxxMxubGDqgL3/uqqMknDzMSkDSrmSJ4xcRcXOavE7S6DR/NLC+UvHVukWrW7h7yTrOP24/Vx0l4uRhVmSSBPwEeDoifpA36zZgWhqeBtxa7th6i6tcdZSck4dZ8X0YOBc4WdIT6d8ngBnARyU1AR9N41Zki9e0cNeSdXz5uPHU7eaqo1SKcp++pL4Rsa0YbZlVu4h4CFAns6eUM5be6KrGJoYM6Mt5Hx5f6VBqWkGVh6TLJC1NNzZdL+kSSXMkXSHpfuBiSVMkPS5poaRrJfVP310haXgabpA0Jw1fLuk6Sfemm6Yu2M76B0tqlLQgtT915zfdzGrNkjVb+MPidXz5w646Sq3LykNSA3Am2eWGfYEFwPw0e1hEnCBpANAETImIZZJ+DlwIXNlF84eS3UQ1CHhc0h0RsaaD5d4APh0RW1IiekTSbRER7WKdDkwH6DPUV6mY9Ta5quPLx7nqKLVCKo/jgFsj4vV0w9PtefNuSJ8HAs9HxLI0Phs4voC2c+1uAO4Dju5kOQFXSHoKuIfshqtR7RfKv8Sxz8C6AlZvZrViyZot3Ln4Jc5z1VEWhfR5dHbuFmBrActs490kNaDdvOhiPOccYARwVES8LWlFB22ZWS92VWMTQ/r35Xz3dZRFIZXHQ8Dpkgakm55O62CZpcA4SRPS+LnA/Wl4BXBUGj6z3fempnb3BE4E5nYSQx2wPiWOkwA/V9nM3vH02lR1HDeeuoGuOsqhy+QREXPJrk9/ErgZmAe0tFvmDeA84CZJC4E24Jo0+9vATEkPAq3tmn8MuAN4BPhOJ/0dAL8AGiTNI6tClna9aWbWW7jqKL9CL9X9XkRcLmkg8ADw/Yj4cf4CEdFI1qlOu+kPAgd00u6yiJje1cpTn8gHC4zVzHqRpS9t4feLXuLrJ09w1VFGhSaPWemR0gOA2bknhpqZVdpVjU0M7u8rrMqtoOQREWcXe8URcXn7aZImA9e1m/xmRBxT7PWbWXXa1tpG0/pXWbi6hadWbeZ3C1/iopMnMGxgv0qH1qv0qDfBR8RC4PBKx2FmPcO21jaWN7/KwlUtLFrdwlOrW3h67RbeeLsNgEH9+nDyQSP5ynH7VTjS3qdHJQ8z6722tbbxbPNWFq5OiWLVZpa0SxQH19dxzjH7Mrm+jslj6xi/5yB22WV7dwpYqTh5mFnZtbYFz6aKYuHq7N+SNVt4/e3sgsyB/fpwyJg6zj56XyaPHcrk+mHsN9yJoidx8jCzkmptC55rzvVRZFXF4
rxEsduufTikfihnHb03k+vrOHRsHeOHD6aPE0WP5uRhZkXT2hY8v+H9ieK1t95NFAePGcoX/uTdRLHfCCeKauTkYWY7pK0teG7D1tQ/kUsULWxNiWLArrtw8Jg6Pt+wN4ekRLG/E0XNcPIwsy61tQXPb3w3UeT6KF59M3uNT/++u3DwmKF89qixTB47jMn1dew/YhB9+/h9c7XKycPM3qOtLVixMbvqKdehvbhdopg0ZiifObL+naueJowY7ETRyzh5mPVibW3Byk2vpUSxOUsUq7fwSl6i+MDooXz6iHomj61jcn0dE0c6UZiTh1mvERGs3PjaO5fGLlzVwqI1LbzyRpYo+qVEMfWIMRxaP4xD6uuYOGowuzpRWAecPMxqUETwwjsVxbv3UryTKPrswgdGD+FTh43h0LF1HFJfxwGjhjhRWMGcPMyqXETw4qbXs8tjV29mUUoYW/ISxUEpUUyufzdR9OvrRGE7zsnDrIwkfRyYCfQB/isiZnS3jXVb3mD+ypffuTx24eoWWl5/G4Bd+4iD9hrKJ1OimOxEYSVSs8ljcn0d82Z09NJDs8qQ1Af4d+CjwCpgrqTbImJJd9r51fxV/O8/PMOufcSBew3hE5NHv5so9hpM/759ShG+2XvUbPIw64GOBpZHxHMAkn4JTAW6lTzOOKKej0wczoF7DXGisIpx8jArn3rgxbzxVcD73lUjaTowHWCfffZ5fyPDdqN+2G4lCtGsMD4RalY+HT2XI943IWJWRDRERMOIESPKEJZZ9zl5mJXPKmDvvPGxwJoKxWK2U5w8zMpnLjBR0nhJ/YCzgNsqHJPZDnGfh1mZRMQ2SV8D/kB2qe61EbG4wmGZ7RAnD7MyiojfAb+rdBxmO0sR7+uvqwmSXgGeqXQcPdRwYEOlg+iBtrdf9o2IsvdeS2oGVnYwy/8N3+V98V6d7Y+iHsO1nDzmRURDpePoibxvOlZN+6WaYi0174v3Ktf+cIe5mZl1m5OHmZl1Wy0nj1mVDqAH877pWDXtl2qKtdS8L96rLPujZvs8zMysdGq58jAzsxJx8jAzs26ryeQh6eOSnpG0XNKllY6nkiStkLRQ0hOS5qVpe0i6W1JT+ty90nGWg6RrJa2XtChvWqf7QtK30jH0jKSPlSlG37hr79MTj4uaSx55L9w5FZgEfFHSpMpGVXEnRcThedd+Xwo0RsREoDGN9wY/Az7eblqH+yIdM2cBB6fvXJ2OrZ0i6TJJS1Oiul7SJZLmSLpC0v3AxZKmSHo8Jf1rJfVP310haXgabpA0Jw1fLuk6SfemJHjBdtY/WFKjpAWp/ak7u03VStKJkn5b6Tig8sdFWv6bqe0nJXX5hssel82KoCgv3KlxU4ET0/BsYA7wd5UKplwi4gFJ49pN7mxfTAV+GRFvAs9LWk52bD28o+uX1ACcCRxB9v/eAmB+mj0sIk6QNABoAqZExDJJPwcuBK7sovlDgWOBQcDjku6IiI6e2PsG8OmI2JL+4DyS3mbY466ckdQ3IrZVOo5S6wnHhaRTgTOAYyLiNUl7dBV3zVUedPzCnfoKxdITBHCXpPnpJUMAoyJiLUD6HFmx6Cqvs31RiuPoOODWiHg9Il4Bbs+bd0P6PBB4PiKWpfHZwPEFtJ1rdwNwH1mi64iAKyQ9BdxDtk2jurkdRdETfm0DQyXdImmJpGskVeJvYk84Lk4BfhoRrwFExKauGq7FyqOgF+70Ih+OiDWSRgJ3S1pa6YCqRCmOo47azNlawDLbePcH34B289rH1lms5wAjgKMi4m1JKzpoq+R6wq/t5Giy09srgTuBzwC/2uEN2zE94bjQduZ1qBYrD79wJ0/uf5qIWA/cQvY/yzpJowHS5/rKRVhxne2LUhxHDwGnSxogaTBwWgfLLAXGSZqQxs8F7k/DK4Cj0vCZ7b43NbW7J9lpuLmdxFAHrE+J4yRg3x3akp3XE35tAzwWEc9FRCtwfYqr3HrCcXEX8GVJAyG7kKSro
GsxefiFO4mkQZKG5IaBPwUWke2PaWmxacCtlYmwR+hsX9wGnCWpv6TxwETgsZ1ZUUTMTe0+CdwMzANa2i3zBnAecJOkhUAbcE2a/W1gpqQHgdZ2zT8G3AE8AnxnO7+0fwE0KLvy7hyyP0qV0BN+bXd32ZLoCcdFRNyZYpgn6QngkkICr7l/wCeAZcCzwD9UOp4K7of90gH5JLA4ty+APcmuLGpKn3tUOtYy7Y/rgbXA22SVxfnb2xfAP6Rj6Bng1CLFMDh9DiT7I3FkEdq8HLik0vu3mzH/CdmpqgHA4LSPLyG7YKEhLTMAeAGYkMZ/Blychu/J/TcB/g8wJ29fPJG+u2f6/phOYjgReB0YT5aI/gCcWaH9UXXHRS32eRB+4Q4AkV1xdlgH0zcCU8ofUWVFxBc7mdXhvoiI7wLfLXIYs5RdBjwAmB0RC4rcflWIiLmScr+2V9LJr21JuV/bfcnOKuT/2v6JpL8HHm3XfO7X9j5svwqD7Oq5GcBk4AGyU7uVUHXHhZ9tZVaDJE0Grms3+c2IOKYS8XRE0uCIeDWdZ38AmL6zfzQlXQ68GhHfK0aMtaaYx0VNVh5mvV1ELAQOr3QcXai6X9vVrpjHhSsPM6tp1VCFVSMnDzMz67ZavFTXzMxKzMnDzMy6zcnDzMy6zcnDzMy67f8Dbh16cCaVNAcAAAAASUVORK5CYII=", - "text/plain": [ - "
" - ] - }, - "metadata": { - "needs_background": "light" - }, - "output_type": "display_data" - } - ], + "outputs": [], "source": [ "# Create a visualization with Modin df\n", "# Example modified from https://matplotlib.org/stable/tutorials/introductory/pyplot.html#sphx-glr-tutorials-introductory-pyplot-py\n", @@ -242,22 +148,9 @@ }, { "cell_type": "code", - "execution_count": 7, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "image/png": "", - "text/plain": [ - "
" - ] - }, - "metadata": { - "needs_background": "light" - }, - "output_type": "display_data" - } - ], + "outputs": [], "source": [ "# Create a visualization with pandas df\n", "# Example modified from https://matplotlib.org/stable/tutorials/introductory/pyplot.html#sphx-glr-tutorials-introductory-pyplot-py\n", @@ -279,22 +172,9 @@ }, { "cell_type": "code", - "execution_count": 8, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "image/png": "iVBORw0KGgoAAAANSUhEUgAAAVYAAADYCAYAAACwYsufAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjQuMywgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy/MnkTPAAAACXBIWXMAAAsTAAALEwEAmpwYAAAQWUlEQVR4nO3debCddX3H8ffHBJBNAbnQsGhcIoqOW+8gqKMM4FTrEtqRimu0jNgOWqxaBx3XVpR2LGNbl5IKGlvLIjASHGtlohmGCuhlsYrBhipLIJALFAFtQfDbP84TOcSb7Z7fzTmHvF8zZ86z/77Pk7mf/M7znPM8qSokSe08atgFSNIjjcEqSY0ZrJLUmMEqSY0ZrJLUmMEqSY0ZrJI2K8m9SZ404Da+lOTjs1jv8CRrBml7g+09vtufea22uSGDVdpGkrw+yVT3R702yb8ledEWrltJnjLXNW5MVe1WVT+dq+0neUuSB7tjc3eSq5O8chbb+a3wTnJ9kqPWj1fVjd3+PNii9pkYrNI2kOTdwKeBTwD7Ao8HPgcsHmJZm5Vk/jZs7tKq2g3YAzgdOCfJXtuw/WYMVmmOJXks8JfACVV1flX9oqp+VVUXVtVfdMsckuTSJHd1vdnPJNmxm3dxt6kfdD2613bTX9n17O5K8t0kz+pr83lJrkpyT5KvJjm7vyeX5G1JrktyZ5LlSfbrm1dJTkiyGljdN+0p3fDOSf42yQ1Jfp7kkiQ7d/O+muTWbvrFSZ6xtcerqn4NnAHsDPzW6YckT0+ystvva5K8upt+PPAG4H3dcbowyT/T+0/swm7a+5Is7PZnfrfeyiR/leQ/uuP1rSR797X35m5f70jyoQ17wBvbCV++fM3hC3gZ8AAwfxPL/C5wKDAfWAisAt7VN7+Ap/SNPw9YBzwfmAcsAa4HdgJ2BG4ATgR2AP4QuB/4eLfuEcDt3TZ2Av4BuHiDti4C9gJ23rB94LPASmD/ru0XADt18/4Y2L3b7qeBq/u2+6X1Ncyw/28BLumG53e13wM8FjgcWNPN2wG4DvhAt59HdMsdtLE2uuNyVN/4wm5/5nfjK4H/Bp5KL8xXAqd08w4G7gVe1LX3KeBX/dub6WWPVZp7jwNur6oHNrZAVV1RVZdV1QNVdT1wGvCSTWzzbcBpVXV5VT1YVcuA++iF8/qA/vvq9YzPB77Xt+4bgDOq6sqqug94P3BYkoV9y3yyqu6sqv/tbzTJo+iF54lVdXPX9ne77VBVZ1TVPd34R4Fndz32LXFokruAW4HXAX9QVT/fcBlgN3rBd39VfRv4erf8IL5YVf/V7e85wHO66a8BLqyqS6rqfuDD9EJ5k7bl+RNpe3UHsHeS+RsL1yRPBU4FJoFd6P1tXrGJbT4BWJLknX3TdgT2o/eHf3N1Xa7OTX3D+wFXrh+pqnuT3EGvB3r9DMv32xt4NL0e3ob7MA84GTgGmAB+3bfOhgE5k8uqanMX8/YDbqre6YL1buhqH8StfcO/pBfev2lv/Yyq+mV3rDbJHq
s09y4F/g84ehPLfB64FlhUVY+h91E3m1j+JuDkqtqj77VLVZ0JrAX2T9K//oF9w7fQC2YAkuxKr1d9c98yG+uV3d7ty5NnmPd6ehfjjqL3EX7h+iY2sR9b6xbgwK7nvN7jeaj2meoe5BZ+a4ED1o9055Ift7mVDFZpjnUfZz8MfDbJ0Ul2SbJDkpcn+Ztusd2Bu4F7kzwN+NMNNnMbD7+Q80/AnyR5fnp2TfKKJLvTC/IHgXckmZ9kMXBI37r/Crw1yXOS7ETvmwqXd6cgNrcv6y8snZpkvyTzkhzWbWd3eqcj7qDX6/7Elh+lLXY58At6F6h2SHI48CrgrG7+hsdpY9O21LnAq5K8oLuY+DG24D8Kg1XaBqrqVODdwAeBaXo9zncAX+sWeS+9Ht899ELz7A028VFgWXcl/I+qaoreedbPAP9D74LOW7q27qd3weo44C7gjfTOQ64/D7oC+BBwHr0e2ZOBY7did94L/BD4PnAn8Nf0suTL9D6W3wz8GLhsK7a5Rbp9ezXwcnq9588Bb66qa7tFTgcO7o7T17ppnwQ+2E1771a2dw3wTnrBvZbev886umO5MXn4aRhJj0RJLgf+saq+OOxaxlmS3ej9Z7Woqn62seXssUqPQElekuR3ulMBS4BnAd8cdl3jKMmrutM3u9L7utUPeegi34wMVumR6SDgB/Suxr8HeE1VrR1uSWNrMb2LZrcAi4BjazMf9T0VIEmN2WOVpMYMVklqzGCVpMYMVklqzGCVpMYMVklqzGCVpMYMVklqbCTux7r33nvXwoULh12GHiGuuOKK26tqYth1aPs1EsG6cOFCpqamhl2GHiGS3DDsGrR981SAJDW22WBNckaSdUl+1DdtryQXJVndve/ZN+/93dMff5Lk9+aqcEkaVVvSY/0SvadM9jsJWFFVi4AV3ThJDqZ3w9xndOt8rnsOjiRtNzYbrFV1Mb27hPdbDCzrhpfx0LN8FgNnVdV93U1gr+Phj4SQpEe82V682nf9vR2ram2Sfbrp+/PwxzGsYcCnJ772tEsHWV2PUGe//bBhlyBtVOuLVzM9ZGvGG74mOT7JVJKp6enpxmVI0vDMtsd6W5IFXW91Ab2Ha0Gvh9r/mN0D6N11+7dU1VJgKcDk5ORG77Ztz0TSuJltj3U5sKQbXgJc0Df92CQ7JXkivccYfG+wEiVpvGy2x5rkTOBwYO8ka4CPAKcA5yQ5DrgROAZ6j4pNcg69R98+AJxQVQ/OUe2SNJI2G6xV9bqNzDpyI8ufDJw8SFGSNM785ZUkNWawSlJjBqskNWawSlJjBqskNWawSlJjBqskNWawSlJjBqskNWawSlJjBqskNWawSlJjBqskNWawSlJjBqskNWawSlJjBqskNWawSlJjBqskNWawSlJjBqskNTZQsCb58yTXJPlRkjOTPDrJXkkuSrK6e9+zVbGSNA5mHaxJ9gf+DJisqmcC84BjgZOAFVW1CFjRjUvSdmPQUwHzgZ2TzAd2AW4BFgPLuvnLgKMHbEOSxsqsg7WqbgY+BdwIrAV+XlXfAvatqrXdMmuBfVoUKknjYpBTAXvS650+EdgP2DXJG7di/eOTTCWZmp6enm0ZkjRyBjkVcBTws6qarqpfAecDLwBuS7IAoHtfN9PKVbW0qiaranJiYmKAMiRptAwSrDcChybZJUmAI4FVwHJgSbfMEuCCwUqUpPEyf7YrVtXlSc4FrgQeAK4ClgK7AeckOY5e+B7TolBJGhezDlaAqvoI8JENJt9Hr/cqSdslf3klSY0ZrJLUmMEqSY0ZrJLUmMEqSY0ZrJLUmMEqSY0ZrJLUmMEqSY0ZrJLUmMEqSY0ZrJLUmMEqSY0ZrJLUmMEqSY0ZrJLUmMEqSY0ZrJLUmMEqSY0ZrJLUmMEqSY0NFKxJ9khybpJrk6xKcliSvZJclGR1975nq2IlaRwM2mP9O+CbVfU04NnAKuAkYEVVLQJWdOOStN2YdbAmeQzwYuB0gKq6v6
ruAhYDy7rFlgFHD1aiJI2XQXqsTwKmgS8muSrJF5LsCuxbVWsBuvd9GtQpSWNjkGCdDzwP+HxVPRf4BVvxsT/J8UmmkkxNT08PUIYkjZZBgnUNsKaqLu/Gz6UXtLclWQDQva+baeWqWlpVk1U1OTExMUAZkjRaZh2sVXUrcFOSg7pJRwI/BpYDS7ppS4ALBqpQksbM/AHXfyfwlSQ7Aj8F3kovrM9JchxwI3DMgG1I0lgZKFir6mpgcoZZRw6yXUkaZ/7ySpIaM1glqTGDVZIaM1glqTGDVZIaM1glqTGDVZIaM1glqTGDVZIaM1glqTGDVZIaM1glqTGDVZIaM1glqTGDVZIaM1glqTGDVZIaM1glqTGDVZIaM1glqTGDVZIaGzhYk8xLclWSr3fjeyW5KMnq7n3PwcuUpPHRosd6IrCqb/wkYEVVLQJWdOOStN0YKFiTHAC8AvhC3+TFwLJueBlw9CBtSNK4GbTH+mngfcCv+6btW1VrAbr3fQZsQ5LGyqyDNckrgXVVdcUs1z8+yVSSqenp6dmWIUkjZ5Ae6wuBVye5HjgLOCLJvwC3JVkA0L2vm2nlqlpaVZNVNTkxMTFAGZI0WmYdrFX1/qo6oKoWAscC366qNwLLgSXdYkuACwauUpLGyFx8j/UU4KVJVgMv7cYlabsxv8VGqmolsLIbvgM4ssV2JWkc+csrSWrMYJWkxgxWSWrMYJWkxgxWSWrMYJWkxgxWSWrMYJWkxgxWSWrMYJWkxgxWSWrMYJWkxgxWSWrMYJWkxgxWSWrMYJWkxgxWSWrMYJWkxgxWSWrMYJWkxgxWSWps1sGa5MAk30myKsk1SU7spu+V5KIkq7v3PduVK0mjb5Ae6wPAe6rq6cChwAlJDgZOAlZU1SJgRTcuSduNWQdrVa2tqiu74XuAVcD+wGJgWbfYMuDoAWuUpLHS5BxrkoXAc4HLgX2rai30whfYp0UbkjQuBg7WJLsB5wHvqqq7t2K945NMJZmanp4etAxJGhkDBWuSHeiF6leq6vxu8m1JFnTzFwDrZlq3qpZW1WRVTU5MTAxShiSNlEG+FRDgdGBVVZ3aN2s5sKQbXgJcMPvyJGn8zB9g3RcCbwJ+mOTqbtoHgFOAc5IcB9wIHDNQhZI0ZmYdrFV1CZCNzD5yttuVpHHnL68kqTGDVZIaM1glqTGDVZIaM1glqTGDVZIaM1glqTGDVZIaM1glqbFBftK6Tbz2tEuHXYJG0NlvP2zYJUgbZY9Vkhob+R6rPRNJ48YeqyQ1ZrBKUmMGqyQ1ZrBKUmMGqyQ1ZrBKUmMGqyQ1ZrBKUmMGqyQ1NmfBmuRlSX6S5LokJ81VO5I0aubkJ61J5gGfBV4KrAG+n2R5Vf14a7flTVg0E3/qrFE2Vz3WQ4DrquqnVXU/cBaweI7akqSRMlc3YdkfuKlvfA3w/NlsyJ6JpHEzVz3WzDCtHrZAcnySqSRT09PTc1SGJG17cxWsa4AD+8YPAG7pX6CqllbVZFVNTkxMzFEZkrTtzVWwfh9YlOSJSXYEjgWWz1FbkjRS5uQca1U9kOQdwL8D84AzquqauWhLkkbNnD1BoKq+AXxjrrYvSaPKX15JUmOpqs0vNddFJNPADRuZvTdw+zYsZ5R5LB6yqWPxhKryiqiGZiSCdVOSTFXV5LDrGAUei4d4LDTKPBUgSY0ZrJLU2DgE69JhFzBCPBYP8VhoZI38OVZJGjfj0GOVpLEyssGa5Iwk65L8aNi1DFuSA5N8J8mqJNckOXHYNQ1Lkkcn+V6SH3TH4mPDrkna0MieCkjyYuBe4MtV9cxh1zNMSRYAC6rqyiS7A1cAR8/mxuHjLkmAXavq3iQ7AJcAJ1bVZUMuTfqNke2xVtXFwJ3DrmMUVNXaqrqyG74HWEXvnrfbneq5txvdoXuNZu9A262RDVbNLMlC4LnA5UMuZWiSzEtyNbAOuKiqtttjodFksI6RJLsB5wHvqqq7h13PsFTVg1X1HHr3+T
0kyXZ9qkijx2AdE935xPOAr1TV+cOuZxRU1V3ASuBlw61EejiDdQx0F2xOB1ZV1anDrmeYkkwk2aMb3hk4Crh2qEVJGxjZYE1yJnApcFCSNUmOG3ZNQ/RC4E3AEUmu7l6/P+yihmQB8J0k/0nvSRUXVdXXh1yT9DAj+3UrSRpXI9tjlaRxZbBKUmMGqyQ1ZrBKUmMGqyQ1ZrBKUmMGqyQ1ZrBKUmP/D+sOcHI/NdK7AAAAAElFTkSuQmCC", - "text/plain": [ - "
" - ] - }, - "metadata": { - "needs_background": "light" - }, - "output_type": "display_data" - } - ], + "outputs": [], "source": [ "plt.figure(figsize=(9, 3))\n", "\n", @@ -306,29 +186,9 @@ }, { "cell_type": "code", - "execution_count": 9, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "UserWarning: Distributing object. This may take some time.\n" - ] - }, - { - "data": { - "image/png": "", - "text/plain": [ - "
" - ] - }, - "metadata": { - "needs_background": "light" - }, - "output_type": "display_data" - } - ], + "outputs": [], "source": [ "# Create a visualization with Modin df\n", "# Example modified from https://matplotlib.org/stable/tutorials/introductory/pyplot.html#sphx-glr-tutorials-introductory-pyplot-py\n", @@ -352,22 +212,9 @@ }, { "cell_type": "code", - "execution_count": 10, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "image/png": "", - "text/plain": [ - "
" - ] - }, - "metadata": { - "needs_background": "light" - }, - "output_type": "display_data" - } - ], + "outputs": [], "source": [ "# Create a visualization with pandas df\n", "# Example modified from https://matplotlib.org/stable/tutorials/introductory/pyplot.html#sphx-glr-tutorials-introductory-pyplot-py\n", diff --git a/examples/jupyter/integrations/plotly.ipynb b/examples/jupyter/integrations/plotly.ipynb index 6fd3b5ae185..ea37e589c29 100644 --- a/examples/jupyter/integrations/plotly.ipynb +++ b/examples/jupyter/integrations/plotly.ipynb @@ -16,7 +16,7 @@ }, { "cell_type": "code", - "execution_count": 1, + "execution_count": null, "metadata": {}, "outputs": [], "source": [ @@ -30,30 +30,9 @@ }, { "cell_type": "code", - "execution_count": 2, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "/Users/labanyamukhopadhyay/opt/anaconda3/lib/python3.9/site-packages/modin/error_message.py:108: UserWarning:\n", - "\n", - "Ray execution environment not yet initialized. Initializing...\n", - "To remove this warning, run the following python code before doing dataframe operations:\n", - "\n", - " import ray\n", - " ray.init(runtime_env={'env_vars': {'__MODIN_AUTOIMPORT_PANDAS__': '1'}})\n", - "\n", - "\n", - "2023-04-06 11:28:25,243\tINFO worker.py:1553 -- Started a local Ray instance.\n", - "/Users/labanyamukhopadhyay/opt/anaconda3/lib/python3.9/site-packages/modin/pandas/dataframe.py:170: UserWarning:\n", - "\n", - "Distributing object. 
This may take some time.\n", - "\n" - ] - } - ], + "outputs": [], "source": [ "modin_df = pd.DataFrame(dict(a=[1,3,2,4], b=[3,2,1,0]))\n", "pandas_df = pandas.DataFrame(dict(a=[1,3,2,4], b=[3,2,1,0]))" @@ -61,129 +40,9 @@ }, { "cell_type": "code", - "execution_count": 3, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/html": [ - " \n", - " " - ] - }, - "metadata": {}, - "output_type": "display_data" - }, - { - "data": { - "text/html": [ - "
" - ] - }, - "metadata": {}, - "output_type": "display_data" - } - ], + "outputs": [], "source": [ "# Create a visualization with Modin df\n", "fig2 = px.bar(modin_df)\n", @@ -193,43 +52,9 @@ }, { "cell_type": "code", - "execution_count": 4, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/html": [ - "
" - ] - }, - "metadata": {}, - "output_type": "display_data" - } - ], + "outputs": [], "source": [ "# Create a visualization with pandas df\n", "fig2 = px.bar(pandas_df)\n", @@ -238,43 +63,9 @@ }, { "cell_type": "code", - "execution_count": 5, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/html": [ - "
" - ] - }, - "metadata": {}, - "output_type": "display_data" - } - ], + "outputs": [], "source": [ "# Create a visualization with Modin df\n", "fig = px.line(modin_df)\n", @@ -283,43 +74,9 @@ }, { "cell_type": "code", - "execution_count": 6, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/html": [ - "
" - ] - }, - "metadata": {}, - "output_type": "display_data" - } - ], + "outputs": [], "source": [ "# Create a visualization with pandas df\n", "fig = px.line(pandas_df)\n", @@ -328,43 +85,9 @@ }, { "cell_type": "code", - "execution_count": 7, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/html": [ - "
" - ] - }, - "metadata": {}, - "output_type": "display_data" - } - ], + "outputs": [], "source": [ "# Create a visualization with Modin df\n", "fig = px.area(modin_df)\n", @@ -373,43 +96,9 @@ }, { "cell_type": "code", - "execution_count": 8, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/html": [ - "
" - ] - }, - "metadata": {}, - "output_type": "display_data" - } - ], + "outputs": [], "source": [ "# Create a visualization with pandas df\n", "fig = px.area(pandas_df)\n", @@ -418,43 +107,9 @@ }, { "cell_type": "code", - "execution_count": 9, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/html": [ - "
" - ] - }, - "metadata": {}, - "output_type": "display_data" - } - ], + "outputs": [], "source": [ "# Create a visualization with Modin df\n", "fig = px.area(modin_df)\n", @@ -463,43 +118,9 @@ }, { "cell_type": "code", - "execution_count": 10, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/html": [ - "
" - ] - }, - "metadata": {}, - "output_type": "display_data" - } - ], + "outputs": [], "source": [ "# Create a visualization with pandas df\n", "fig = px.area(pandas_df)\n", @@ -508,43 +129,9 @@ }, { "cell_type": "code", - "execution_count": 11, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/html": [ - "
" - ] - }, - "metadata": {}, - "output_type": "display_data" - } - ], + "outputs": [], "source": [ "# Create a visualization with Modin df\n", "fig = px.violin(modin_df)\n", @@ -553,43 +140,9 @@ }, { "cell_type": "code", - "execution_count": 12, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/html": [ - "
" - ] - }, - "metadata": {}, - "output_type": "display_data" - } - ], + "outputs": [], "source": [ "# Create a visualization with pandas df\n", "fig = px.violin(pandas_df)\n", @@ -598,43 +151,9 @@ }, { "cell_type": "code", - "execution_count": 13, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/html": [ - "
" - ] - }, - "metadata": {}, - "output_type": "display_data" - } - ], + "outputs": [], "source": [ "# Create a visualization with Modin df\n", "fig = px.box(modin_df)\n", @@ -643,43 +162,9 @@ }, { "cell_type": "code", - "execution_count": 14, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/html": [ - "
" - ] - }, - "metadata": {}, - "output_type": "display_data" - } - ], + "outputs": [], "source": [ "# Create a visualization with pandas df\n", "fig = px.box(pandas_df)\n", @@ -688,43 +173,9 @@ }, { "cell_type": "code", - "execution_count": 15, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/html": [ - "
" - ] - }, - "metadata": {}, - "output_type": "display_data" - } - ], + "outputs": [], "source": [ "# Create a visualization with Modin df\n", "fig = px.histogram(modin_df, opacity=0.5, orientation='h', nbins=5)\n", @@ -733,43 +184,9 @@ }, { "cell_type": "code", - "execution_count": 16, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/html": [ - "
" - ] - }, - "metadata": {}, - "output_type": "display_data" - } - ], + "outputs": [], "source": [ "# Create a visualization with pandas df\n", "fig = px.histogram(pandas_df, opacity=0.5, orientation='h', nbins=5)\n", @@ -778,25 +195,9 @@ }, { "cell_type": "code", - "execution_count": 19, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "ename": "ValueError", - "evalue": "Value of 'locations' is not the name of a column in 'data_frame'. Expected one of [0, 1] but received: fips", - "output_type": "error", - "traceback": [ - "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m", - "\u001b[0;31mValueError\u001b[0m Traceback (most recent call last)", - "\u001b[0;32m/var/folders/qj/jybppsbd2jl75s8y2q8s2xx80000gn/T/ipykernel_5361/4179859770.py\u001b[0m in \u001b[0;36m\u001b[0;34m\u001b[0m\n\u001b[1;32m 8\u001b[0m modin_df = pd.read_csv(\"https://raw.githubusercontent.com/plotly/datasets/master/fips-unemp-16.csv\",\n\u001b[1;32m 9\u001b[0m dtype={\"fips\": str})\n\u001b[0;32m---> 10\u001b[0;31m fig = px.choropleth(modin_df, geojson=counties, locations='fips', color='unemp',\n\u001b[0m\u001b[1;32m 11\u001b[0m \u001b[0mcolor_continuous_scale\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;34m\"Viridis\"\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 12\u001b[0m \u001b[0mrange_color\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;36m0\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;36m12\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", - "\u001b[0;32m~/opt/anaconda3/lib/python3.9/site-packages/plotly/express/_chart_types.py\u001b[0m in \u001b[0;36mchoropleth\u001b[0;34m(data_frame, lat, lon, locations, locationmode, geojson, featureidkey, color, facet_row, facet_col, facet_col_wrap, facet_row_spacing, facet_col_spacing, hover_name, hover_data, custom_data, animation_frame, animation_group, category_orders, 
labels, color_discrete_sequence, color_discrete_map, color_continuous_scale, range_color, color_continuous_midpoint, projection, scope, center, fitbounds, basemap_visible, title, template, width, height)\u001b[0m\n\u001b[1;32m 1075\u001b[0m \u001b[0mcolored\u001b[0m \u001b[0mregion\u001b[0m \u001b[0mmark\u001b[0m \u001b[0mon\u001b[0m \u001b[0ma\u001b[0m \u001b[0mmap\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 1076\u001b[0m \"\"\"\n\u001b[0;32m-> 1077\u001b[0;31m return make_figure(\n\u001b[0m\u001b[1;32m 1078\u001b[0m \u001b[0margs\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mlocals\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 1079\u001b[0m \u001b[0mconstructor\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mgo\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mChoropleth\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", - "\u001b[0;32m~/opt/anaconda3/lib/python3.9/site-packages/plotly/express/_core.py\u001b[0m in \u001b[0;36mmake_figure\u001b[0;34m(args, constructor, trace_patch, layout_patch)\u001b[0m\n\u001b[1;32m 1943\u001b[0m \u001b[0mapply_default_cascade\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0margs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 1944\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m-> 1945\u001b[0;31m \u001b[0margs\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mbuild_dataframe\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0margs\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mconstructor\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 1946\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0mconstructor\u001b[0m \u001b[0;32min\u001b[0m \u001b[0;34m[\u001b[0m\u001b[0mgo\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mTreemap\u001b[0m\u001b[0;34m,\u001b[0m 
\u001b[0mgo\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mSunburst\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mgo\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mIcicle\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;32mand\u001b[0m \u001b[0margs\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;34m\"path\"\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;32mis\u001b[0m \u001b[0;32mnot\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 1947\u001b[0m \u001b[0margs\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mprocess_dataframe_hierarchy\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0margs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", - "\u001b[0;32m~/opt/anaconda3/lib/python3.9/site-packages/plotly/express/_core.py\u001b[0m in \u001b[0;36mbuild_dataframe\u001b[0;34m(args, constructor)\u001b[0m\n\u001b[1;32m 1403\u001b[0m \u001b[0;31m# now that things have been prepped, we do the systematic rewriting of `args`\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 1404\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m-> 1405\u001b[0;31m df_output, wide_id_vars = process_args_into_dataframe(\n\u001b[0m\u001b[1;32m 1406\u001b[0m \u001b[0margs\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mwide_mode\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mvar_name\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mvalue_name\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 1407\u001b[0m )\n", - "\u001b[0;32m~/opt/anaconda3/lib/python3.9/site-packages/plotly/express/_core.py\u001b[0m in \u001b[0;36mprocess_args_into_dataframe\u001b[0;34m(args, wide_mode, var_name, value_name)\u001b[0m\n\u001b[1;32m 1205\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0margument\u001b[0m \u001b[0;34m==\u001b[0m \u001b[0;34m\"index\"\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 1206\u001b[0m \u001b[0merr_msg\u001b[0m \u001b[0;34m+=\u001b[0m \u001b[0;34m\"\\n To use the index, pass it in 
directly as `df.index`.\"\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m-> 1207\u001b[0;31m \u001b[0;32mraise\u001b[0m \u001b[0mValueError\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0merr_msg\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 1208\u001b[0m \u001b[0;32melif\u001b[0m \u001b[0mlength\u001b[0m \u001b[0;32mand\u001b[0m \u001b[0mlen\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mdf_input\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0margument\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;34m!=\u001b[0m \u001b[0mlength\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 1209\u001b[0m raise ValueError(\n", - "\u001b[0;31mValueError\u001b[0m: Value of 'locations' is not the name of a column in 'data_frame'. Expected one of [0, 1] but received: fips" - ] - } - ], + "outputs": [], "source": [ "# Create a visualization with Modin df\n", "# Example from https://plotly.com/python/mapbox-county-choropleth/#choropleth-map-using-plotlyexpress-and-carto-base-map-no-token-needed\n", @@ -819,43 +220,9 @@ }, { "cell_type": "code", - "execution_count": 20, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/html": [ - "
" - ] - }, - "metadata": {}, - "output_type": "display_data" - } - ], + "outputs": [], "source": [ "# Create a visualization with pandas df\n", "# Example from https://plotly.com/python/mapbox-county-choropleth/#choropleth-map-using-plotlyexpress-and-carto-base-map-no-token-needed\n", diff --git a/examples/jupyter/integrations/sklearn.ipynb b/examples/jupyter/integrations/sklearn.ipynb index 41b305e5c85..7088c92ebb1 100644 --- a/examples/jupyter/integrations/sklearn.ipynb +++ b/examples/jupyter/integrations/sklearn.ipynb @@ -16,7 +16,7 @@ }, { "cell_type": "code", - "execution_count": 1, + "execution_count": null, "metadata": {}, "outputs": [], "source": [ @@ -26,23 +26,9 @@ }, { "cell_type": "code", - "execution_count": 2, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "UserWarning: Ray execution environment not yet initialized. Initializing...\n", - "To remove this warning, run the following python code before doing dataframe operations:\n", - "\n", - " import ray\n", - " ray.init(runtime_env={'env_vars': {'__MODIN_AUTOIMPORT_PANDAS__': '1'}})\n", - "\n", - "2023-01-03 11:03:39,350\tINFO worker.py:1529 -- Started a local Ray instance. View the dashboard at \u001b[1m\u001b[32m127.0.0.1:8266 \u001b[39m\u001b[22m\n" - ] - } - ], + "outputs": [], "source": [ "# From https://www.ritchieng.com/pandas-scikit-learn/\n", "\n", @@ -52,159 +38,16 @@ }, { "cell_type": "code", - "execution_count": 3, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/html": [ - "
\n", - "\n", - "\n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - "
PassengerIdSurvivedPclassNameSexAgeSibSpParchTicketFareCabinEmbarked
0103Braund, Mr. Owen Harrismale22.010A/5 211717.2500NaNS
1211Cumings, Mrs. John Bradley (Florence Briggs Th...female38.010PC 1759971.2833C85C
2313Heikkinen, Miss. Lainafemale26.000STON/O2. 31012827.9250NaNS
3411Futrelle, Mrs. Jacques Heath (Lily May Peel)female35.01011380353.1000C123S
4503Allen, Mr. William Henrymale35.0003734508.0500NaNS
\n", - "
" - ], - "text/plain": [ - " PassengerId Survived Pclass \\\n", - "0 1 0 3 \n", - "1 2 1 1 \n", - "2 3 1 3 \n", - "3 4 1 1 \n", - "4 5 0 3 \n", - "\n", - " Name Sex Age SibSp \\\n", - "0 Braund, Mr. Owen Harris male 22.0 1 \n", - "1 Cumings, Mrs. John Bradley (Florence Briggs Th... female 38.0 1 \n", - "2 Heikkinen, Miss. Laina female 26.0 0 \n", - "3 Futrelle, Mrs. Jacques Heath (Lily May Peel) female 35.0 1 \n", - "4 Allen, Mr. William Henry male 35.0 0 \n", - "\n", - " Parch Ticket Fare Cabin Embarked \n", - "0 0 A/5 21171 7.2500 NaN S \n", - "1 0 PC 17599 71.2833 C85 C \n", - "2 0 STON/O2. 3101282 7.9250 NaN S \n", - "3 0 113803 53.1000 C123 S \n", - "4 0 373450 8.0500 NaN S " - ] - }, - "execution_count": 3, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "train.head()" ] }, { "cell_type": "code", - "execution_count": 4, + "execution_count": null, "metadata": {}, "outputs": [], "source": [ @@ -215,7 +58,7 @@ }, { "cell_type": "code", - "execution_count": 5, + "execution_count": null, "metadata": {}, "outputs": [], "source": [ @@ -225,7 +68,7 @@ }, { "cell_type": "code", - "execution_count": 6, + "execution_count": null, "metadata": {}, "outputs": [], "source": [ @@ -235,20 +78,9 @@ }, { "cell_type": "code", - "execution_count": 7, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "LogisticRegression()" - ] - }, - "execution_count": 7, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "# 1. import\n", "from sklearn.linear_model import LogisticRegression\n", @@ -262,7 +94,7 @@ }, { "cell_type": "code", - "execution_count": 8, + "execution_count": null, "metadata": {}, "outputs": [], "source": [ @@ -272,139 +104,9 @@ }, { "cell_type": "code", - "execution_count": 9, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/html": [ - "
\n", - "\n", - "\n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - "
PassengerIdPclassNameSexAgeSibSpParchTicketFareCabinEmbarked
08923Kelly, Mr. Jamesmale34.5003309117.8292NaNQ
18933Wilkes, Mrs. James (Ellen Needs)female47.0103632727.0000NaNS
28942Myles, Mr. Thomas Francismale62.0002402769.6875NaNQ
38953Wirz, Mr. Albertmale27.0003151548.6625NaNS
48963Hirvonen, Mrs. Alexander (Helga E Lindqvist)female22.011310129812.2875NaNS
\n", - "
" - ], - "text/plain": [ - " PassengerId Pclass Name Sex \\\n", - "0 892 3 Kelly, Mr. James male \n", - "1 893 3 Wilkes, Mrs. James (Ellen Needs) female \n", - "2 894 2 Myles, Mr. Thomas Francis male \n", - "3 895 3 Wirz, Mr. Albert male \n", - "4 896 3 Hirvonen, Mrs. Alexander (Helga E Lindqvist) female \n", - "\n", - " Age SibSp Parch Ticket Fare Cabin Embarked \n", - "0 34.5 0 0 330911 7.8292 NaN Q \n", - "1 47.0 1 0 363272 7.0000 NaN S \n", - "2 62.0 0 0 240276 9.6875 NaN Q \n", - "3 27.0 0 0 315154 8.6625 NaN S \n", - "4 22.0 1 1 3101298 12.2875 NaN S " - ] - }, - "execution_count": 9, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "# missing Survived column because we are predicting\n", "test.head()" @@ -412,7 +114,7 @@ }, { "cell_type": "code", - "execution_count": 10, + "execution_count": null, "metadata": {}, "outputs": [], "source": [ @@ -421,7 +123,7 @@ }, { "cell_type": "code", - "execution_count": 11, + "execution_count": null, "metadata": {}, "outputs": [], "source": [ @@ -431,17 +133,9 @@ }, { "cell_type": "code", - "execution_count": 12, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "UserWarning: Distributing object. 
This may take some time.\n" - ] - } - ], + "outputs": [], "source": [ "# kaggle wants 2 columns\n", "# new_pred_class\n", @@ -455,18 +149,9 @@ }, { "cell_type": "code", - "execution_count": 13, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "UserWarning: `to_pickle` is not currently supported by PandasOnRay, defaulting to pandas implementation.\n", - "Please refer to https://modin.readthedocs.io/en/stable/supported_apis/defaulting_to_pandas.html for explanation.\n" - ] - } - ], + "outputs": [], "source": [ "# save train data to disk using pickle\n", "train.to_pickle('train.pkl')" @@ -474,270 +159,9 @@ }, { "cell_type": "code", - "execution_count": 14, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "UserWarning: `read_pickle` is not currently supported by PandasOnRay, defaulting to pandas implementation.\n" - ] - }, - { - "data": { - "text/html": [ - "
\n", - "\n", - "\n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - "
PassengerIdSurvivedPclassNameSexAgeSibSpParchTicketFareCabinEmbarked
0103Braund, Mr. Owen Harrismale22.010A/5 211717.2500NaNS
1211Cumings, Mrs. John Bradley (Florence Briggs Th...female38.010PC 1759971.2833C85C
2313Heikkinen, Miss. Lainafemale26.000STON/O2. 31012827.9250NaNS
3411Futrelle, Mrs. Jacques Heath (Lily May Peel)female35.01011380353.1000C123S
4503Allen, Mr. William Henrymale35.0003734508.0500NaNS
.......................................
88688702Montvila, Rev. Juozasmale27.00021153613.0000NaNS
88788811Graham, Miss. Margaret Edithfemale19.00011205330.0000B42S
88888903Johnston, Miss. Catherine Helen \"Carrie\"femaleNaN12W./C. 660723.4500NaNS
88989011Behr, Mr. Karl Howellmale26.00011136930.0000C148C
89089103Dooley, Mr. Patrickmale32.0003703767.7500NaNQ
\n", - "

891 rows x 12 columns

\n", - "
" - ], - "text/plain": [ - " PassengerId Survived Pclass \\\n", - "0 1 0 3 \n", - "1 2 1 1 \n", - "2 3 1 3 \n", - "3 4 1 1 \n", - "4 5 0 3 \n", - ".. ... ... ... \n", - "886 887 0 2 \n", - "887 888 1 1 \n", - "888 889 0 3 \n", - "889 890 1 1 \n", - "890 891 0 3 \n", - "\n", - " Name Sex Age SibSp \\\n", - "0 Braund, Mr. Owen Harris male 22.0 1 \n", - "1 Cumings, Mrs. John Bradley (Florence Briggs Th... female 38.0 1 \n", - "2 Heikkinen, Miss. Laina female 26.0 0 \n", - "3 Futrelle, Mrs. Jacques Heath (Lily May Peel) female 35.0 1 \n", - "4 Allen, Mr. William Henry male 35.0 0 \n", - ".. ... ... ... ... \n", - "886 Montvila, Rev. Juozas male 27.0 0 \n", - "887 Graham, Miss. Margaret Edith female 19.0 0 \n", - "888 Johnston, Miss. Catherine Helen \"Carrie\" female NaN 1 \n", - "889 Behr, Mr. Karl Howell male 26.0 0 \n", - "890 Dooley, Mr. Patrick male 32.0 0 \n", - "\n", - " Parch Ticket Fare Cabin Embarked \n", - "0 0 A/5 21171 7.2500 NaN S \n", - "1 0 PC 17599 71.2833 C85 C \n", - "2 0 STON/O2. 3101282 7.9250 NaN S \n", - "3 0 113803 53.1000 C123 S \n", - "4 0 373450 8.0500 NaN S \n", - ".. ... ... ... ... ... \n", - "886 0 211536 13.0000 NaN S \n", - "887 0 112053 30.0000 B42 S \n", - "888 2 W./C. 6607 23.4500 NaN S \n", - "889 0 111369 30.0000 C148 C \n", - "890 0 370376 7.7500 NaN Q \n", - "\n", - "[891 rows x 12 columns]" - ] - }, - "execution_count": 14, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "# read data\n", "pd.read_pickle('train.pkl')" @@ -745,28 +169,9 @@ }, { "cell_type": "code", - "execution_count": 15, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "UserWarning: Distributing object. This may take some time.\n" - ] - }, - { - "data": { - "text/plain": [ - "array([[0. , 1. , 0.5, 0.5],\n", - " [0.5, 0.5, 0. , 1. 
]])" - ] - }, - "execution_count": 15, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "# From https://scikit-learn.org/stable/modules/generated/sklearn.compose.ColumnTransformer.html\n", "\n", @@ -786,17 +191,9 @@ }, { "cell_type": "code", - "execution_count": 16, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "UserWarning: Distributing object. This may take some time.\n" - ] - } - ], + "outputs": [], "source": [ "from sklearn.feature_extraction import FeatureHasher\n", "from sklearn.preprocessing import MinMaxScaler\n", @@ -812,27 +209,9 @@ }, { "cell_type": "code", - "execution_count": 17, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "[[ 7. 2. 3. ]\n", - " [ 4. 3.5 6. ]\n", - " [10. 3.5 9. ]]\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "UserWarning: Distributing object. This may take some time.\n", - "UserWarning: Distributing object. This may take some time.\n" - ] - } - ], + "outputs": [], "source": [ "# From https://scikit-learn.org/stable/modules/generated/sklearn.impute.SimpleImputer.html\n", "\n", @@ -847,28 +226,9 @@ }, { "cell_type": "code", - "execution_count": 18, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "UserWarning: Distributing object. This may take some time.\n", - "UserWarning: Distributing object. 
This may take some time.\n" - ] - }, - { - "data": { - "text/plain": [ - "[0, 1, 2, 3, 4]" - ] - }, - "execution_count": 18, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "# From https://scikit-learn.org/stable/modules/generated/sklearn.model_selection.train_test_split.html\n", "\n", @@ -881,7 +241,7 @@ }, { "cell_type": "code", - "execution_count": 19, + "execution_count": null, "metadata": {}, "outputs": [], "source": [ @@ -891,46 +251,18 @@ }, { "cell_type": "code", - "execution_count": 20, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "modin.pandas.dataframe.DataFrame" - ] - }, - "execution_count": 20, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "type(X_train)" ] }, { "cell_type": "code", - "execution_count": 22, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "[0 0\n", - " 1 1\n", - " 2 2\n", - " dtype: int64,\n", - " 3 3\n", - " 4 4\n", - " dtype: int64]" - ] - }, - "execution_count": 22, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "train_test_split(y, shuffle=False)" ] @@ -944,7 +276,7 @@ }, { "cell_type": "code", - "execution_count": 23, + "execution_count": null, "metadata": {}, "outputs": [], "source": [ @@ -953,17 +285,9 @@ }, { "cell_type": "code", - "execution_count": 24, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "UserWarning: Distributing object. This may take some time.\n" - ] - } - ], + "outputs": [], "source": [ "tips = sns.load_dataset(\"tips\")\n", "tips = pd.DataFrame(tips)" @@ -971,221 +295,16 @@ }, { "cell_type": "code", - "execution_count": 25, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/html": [ - "
\n", - "\n", - "\n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - "
total_billtipsizesex_Femalesmoker_Noday_Friday_Satday_Suntime_Dinner
016.991.012110011
110.341.663010011
221.013.503010011
323.683.312010011
424.593.614110011
..............................
23929.035.923010101
24027.182.002100101
24122.672.002000101
24217.821.752010101
24318.783.002110001
\n", - "

244 rows x 9 columns

\n", - "
" - ], - "text/plain": [ - " total_bill tip size sex_Female smoker_No day_Fri day_Sat day_Sun \\\n", - "0 16.99 1.01 2 1 1 0 0 1 \n", - "1 10.34 1.66 3 0 1 0 0 1 \n", - "2 21.01 3.50 3 0 1 0 0 1 \n", - "3 23.68 3.31 2 0 1 0 0 1 \n", - "4 24.59 3.61 4 1 1 0 0 1 \n", - ".. ... ... ... ... ... ... ... ... \n", - "239 29.03 5.92 3 0 1 0 1 0 \n", - "240 27.18 2.00 2 1 0 0 1 0 \n", - "241 22.67 2.00 2 0 0 0 1 0 \n", - "242 17.82 1.75 2 0 1 0 1 0 \n", - "243 18.78 3.00 2 1 1 0 0 0 \n", - "\n", - " time_Dinner \n", - "0 1 \n", - "1 1 \n", - "2 1 \n", - "3 1 \n", - "4 1 \n", - ".. ... \n", - "239 1 \n", - "240 1 \n", - "241 1 \n", - "242 1 \n", - "243 1 \n", - "\n", - "[244 rows x 9 columns]" - ] - }, - "execution_count": 25, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "pd.get_dummies(tips, drop_first=True)" ] }, { "cell_type": "code", - "execution_count": 26, + "execution_count": null, "metadata": {}, "outputs": [], "source": [ @@ -1194,7 +313,7 @@ }, { "cell_type": "code", - "execution_count": 27, + "execution_count": null, "metadata": {}, "outputs": [], "source": [ @@ -1204,20 +323,9 @@ }, { "cell_type": "code", - "execution_count": 28, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "LinearRegression()" - ] - }, - "execution_count": 28, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "# 2. 
fit the model object\n", "lr.fit(X=tips[[\"total_bill\", \"size\"]], y=tips[\"tip\"])" @@ -1225,20 +333,9 @@ }, { "cell_type": "code", - "execution_count": 29, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "array([0.09271334, 0.19259779])" - ] - }, - "execution_count": 29, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "# look at the coefficients\n", "lr.coef_" @@ -1246,20 +343,9 @@ }, { "cell_type": "code", - "execution_count": 30, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "0.6689447408125027" - ] - }, - "execution_count": 30, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "# look at the intercept\n", "lr.intercept_" @@ -1267,129 +353,9 @@ }, { "cell_type": "code", - "execution_count": 31, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/html": [ - "
\n", - "\n", - "\n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - "
tiptotal_billsmoker_No
01.0116.991
11.6610.341
23.5021.011
33.3123.681
43.6124.591
............
2395.9229.031
2402.0027.180
2412.0022.670
2421.7517.821
2433.0018.781
\n", - "

244 rows x 3 columns

\n", - "
" - ], - "text/plain": [ - " tip total_bill smoker_No\n", - "0 1.01 16.99 1\n", - "1 1.66 10.34 1\n", - "2 3.50 21.01 1\n", - "3 3.31 23.68 1\n", - "4 3.61 24.59 1\n", - ".. ... ... ...\n", - "239 5.92 29.03 1\n", - "240 2.00 27.18 0\n", - "241 2.00 22.67 0\n", - "242 1.75 17.82 1\n", - "243 3.00 18.78 1\n", - "\n", - "[244 rows x 3 columns]" - ] - }, - "execution_count": 31, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "tips_dummy = pd.get_dummies(tips, drop_first=True)[[\"tip\", \"total_bill\", \"smoker_No\"]]\n", "tips_dummy" @@ -1397,20 +363,9 @@ }, { "cell_type": "code", - "execution_count": 32, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "LinearRegression()" - ] - }, - "execution_count": 32, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "lr2 = linear_model.LinearRegression()\n", "lr2.fit(X=tips_dummy.iloc[:, 1:], y=tips_dummy[\"tip\"])" @@ -1418,98 +373,18 @@ }, { "cell_type": "code", - "execution_count": 33, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "(array([0.10572239, 0.14892431]), 0.8142993000217928)" - ] - }, - "execution_count": 33, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "lr2.coef_, lr2.intercept_" ] }, { "cell_type": "code", - "execution_count": 34, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/html": [ - "
\n", - "\n", - "\n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - "
total_billsmoker_No
23929.031
24027.180
24122.670
24217.821
24318.781
\n", - "
" - ], - "text/plain": [ - " total_bill smoker_No\n", - "239 29.03 1\n", - "240 27.18 0\n", - "241 22.67 0\n", - "242 17.82 1\n", - "243 18.78 1" - ] - }, - "execution_count": 34, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "new_data = tips_dummy[[\"total_bill\", \"smoker_No\"]].tail() # not really new data\n", "new_data" @@ -1517,7 +392,7 @@ }, { "cell_type": "code", - "execution_count": 35, + "execution_count": null, "metadata": {}, "outputs": [], "source": [ @@ -1527,104 +402,18 @@ }, { "cell_type": "code", - "execution_count": 36, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/html": [ - "
\n", - "\n", - "\n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - "
total_billsmoker_Nopredicted_tips
23929.0314.032345
24027.1803.687834
24122.6703.211026
24217.8212.847197
24318.7812.948690
\n", - "
" - ], - "text/plain": [ - " total_bill smoker_No predicted_tips\n", - "239 29.03 1 4.032345\n", - "240 27.18 0 3.687834\n", - "241 22.67 0 3.211026\n", - "242 17.82 1 2.847197\n", - "243 18.78 1 2.948690" - ] - }, - "execution_count": 36, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "new_data" ] }, { "cell_type": "code", - "execution_count": 38, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "modin.pandas.dataframe.DataFrame" - ] - }, - "execution_count": 38, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "type(new_data)" ] diff --git a/examples/jupyter/integrations/statsmodels.ipynb b/examples/jupyter/integrations/statsmodels.ipynb index 27d4038e59d..51bf90136a5 100644 --- a/examples/jupyter/integrations/statsmodels.ipynb +++ b/examples/jupyter/integrations/statsmodels.ipynb @@ -10,20 +10,9 @@ }, { "cell_type": "code", - "execution_count": 1, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "/Users/labanyamukhopadhyay/opt/anaconda3/lib/python3.9/site-packages/statsmodels/tsa/base/tsa_model.py:7: FutureWarning: pandas.Int64Index is deprecated and will be removed from pandas in a future version. Use pandas.Index with the appropriate dtype instead.\n", - " from pandas import (to_datetime, Int64Index, DatetimeIndex, Period,\n", - "/Users/labanyamukhopadhyay/opt/anaconda3/lib/python3.9/site-packages/statsmodels/tsa/base/tsa_model.py:7: FutureWarning: pandas.Float64Index is deprecated and will be removed from pandas in a future version. 
Use pandas.Index with the appropriate dtype instead.\n", - " from pandas import (to_datetime, Int64Index, DatetimeIndex, Period,\n" - ] - } - ], + "outputs": [], "source": [ "import statsmodels.api as sm\n", "import pandas\n", @@ -40,24 +29,9 @@ }, { "cell_type": "code", - "execution_count": 2, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "UserWarning: Ray execution environment not yet initialized. Initializing...\n", - "To remove this warning, run the following python code before doing dataframe operations:\n", - "\n", - " import ray\n", - " ray.init(runtime_env={'env_vars': {'__MODIN_AUTOIMPORT_PANDAS__': '1'}})\n", - "\n", - "2023-04-06 11:48:00,894\tINFO worker.py:1553 -- Started a local Ray instance.\n", - "UserWarning: Distributing object. This may take some time.\n" - ] - } - ], + "outputs": [], "source": [ "df = sm.datasets.get_rdataset(\"Guerry\", \"HistData\").data\n", "modin_df = pd.DataFrame(df)" @@ -65,96 +39,9 @@ }, { "cell_type": "code", - "execution_count": 3, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/html": [ - "
\n", - "\n", - "\n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - "
DepartmentLotteryLiteracyWealthRegion
81Vienne402568W
82Haute-Vienne551367C
83Vosges146282E
84Yonne514730C
85Corse834937NaN
\n", - "
" - ], - "text/plain": [ - " Department Lottery Literacy Wealth Region\n", - "81 Vienne 40 25 68 W\n", - "82 Haute-Vienne 55 13 67 C\n", - "83 Vosges 14 62 82 E\n", - "84 Yonne 51 47 30 C\n", - "85 Corse 83 49 37 NaN" - ] - }, - "execution_count": 3, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "vars = ['Department', 'Lottery', 'Literacy', 'Wealth', 'Region']\n", "\n", @@ -165,96 +52,9 @@ }, { "cell_type": "code", - "execution_count": 4, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/html": [ - "
\n", - "\n", - "\n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - "
DepartmentLotteryLiteracyWealthRegion
80Vendee682856W
81Vienne402568W
82Haute-Vienne551367C
83Vosges146282E
84Yonne514730C
\n", - "
" - ], - "text/plain": [ - " Department Lottery Literacy Wealth Region\n", - "80 Vendee 68 28 56 W\n", - "81 Vienne 40 25 68 W\n", - "82 Haute-Vienne 55 13 67 C\n", - "83 Vosges 14 62 82 E\n", - "84 Yonne 51 47 30 C" - ] - }, - "execution_count": 4, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "modin_df = modin_df.dropna()\n", "\n", @@ -263,7 +63,7 @@ }, { "cell_type": "code", - "execution_count": 5, + "execution_count": null, "metadata": {}, "outputs": [], "source": [ @@ -272,17 +72,9 @@ }, { "cell_type": "code", - "execution_count": 6, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "UserWarning: Distributing object. This may take some time.\n" - ] - } - ], + "outputs": [], "source": [ "y = pd.DataFrame(y)\n", "X = pd.DataFrame(X)" @@ -290,50 +82,18 @@ }, { "cell_type": "code", - "execution_count": 7, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "ename": "ValueError", - "evalue": "unrecognized data structures: / ", - "output_type": "error", - "traceback": [ - "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m", - "\u001b[0;31mValueError\u001b[0m Traceback (most recent call last)", - "\u001b[0;32m/var/folders/qj/jybppsbd2jl75s8y2q8s2xx80000gn/T/ipykernel_5691/1699330070.py\u001b[0m in \u001b[0;36m\u001b[0;34m\u001b[0m\n\u001b[0;32m----> 1\u001b[0;31m \u001b[0mmod\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0msm\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mOLS\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0my\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mX\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;31m# Describe model\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m", - "\u001b[0;32m~/opt/anaconda3/lib/python3.9/site-packages/statsmodels/regression/linear_model.py\u001b[0m in \u001b[0;36m__init__\u001b[0;34m(self, endog, exog, missing, hasconst, **kwargs)\u001b[0m\n\u001b[1;32m 
870\u001b[0m def __init__(self, endog, exog=None, missing='none', hasconst=None,\n\u001b[1;32m 871\u001b[0m **kwargs):\n\u001b[0;32m--> 872\u001b[0;31m super(OLS, self).__init__(endog, exog, missing=missing,\n\u001b[0m\u001b[1;32m 873\u001b[0m hasconst=hasconst, **kwargs)\n\u001b[1;32m 874\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0;34m\"weights\"\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_init_keys\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", - "\u001b[0;32m~/opt/anaconda3/lib/python3.9/site-packages/statsmodels/regression/linear_model.py\u001b[0m in \u001b[0;36m__init__\u001b[0;34m(self, endog, exog, weights, missing, hasconst, **kwargs)\u001b[0m\n\u001b[1;32m 701\u001b[0m \u001b[0;32melse\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 702\u001b[0m \u001b[0mweights\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mweights\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0msqueeze\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 703\u001b[0;31m super(WLS, self).__init__(endog, exog, missing=missing,\n\u001b[0m\u001b[1;32m 704\u001b[0m weights=weights, hasconst=hasconst, **kwargs)\n\u001b[1;32m 705\u001b[0m \u001b[0mnobs\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mexog\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mshape\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;36m0\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", - "\u001b[0;32m~/opt/anaconda3/lib/python3.9/site-packages/statsmodels/regression/linear_model.py\u001b[0m in \u001b[0;36m__init__\u001b[0;34m(self, endog, exog, **kwargs)\u001b[0m\n\u001b[1;32m 188\u001b[0m \"\"\"\n\u001b[1;32m 189\u001b[0m \u001b[0;32mdef\u001b[0m \u001b[0m__init__\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mendog\u001b[0m\u001b[0;34m,\u001b[0m 
\u001b[0mexog\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0mkwargs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 190\u001b[0;31m \u001b[0msuper\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mRegressionModel\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m__init__\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mendog\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mexog\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0mkwargs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 191\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_data_attr\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mextend\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;34m'pinv_wexog'\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m'weights'\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 192\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n", - "\u001b[0;32m~/opt/anaconda3/lib/python3.9/site-packages/statsmodels/base/model.py\u001b[0m in \u001b[0;36m__init__\u001b[0;34m(self, endog, exog, **kwargs)\u001b[0m\n\u001b[1;32m 235\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 236\u001b[0m \u001b[0;32mdef\u001b[0m \u001b[0m__init__\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mendog\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mexog\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;32mNone\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0mkwargs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 237\u001b[0;31m \u001b[0msuper\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mLikelihoodModel\u001b[0m\u001b[0;34m,\u001b[0m 
\u001b[0mself\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m__init__\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mendog\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mexog\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0mkwargs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 238\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0minitialize\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 239\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n", - "\u001b[0;32m~/opt/anaconda3/lib/python3.9/site-packages/statsmodels/base/model.py\u001b[0m in \u001b[0;36m__init__\u001b[0;34m(self, endog, exog, **kwargs)\u001b[0m\n\u001b[1;32m 75\u001b[0m \u001b[0mmissing\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mkwargs\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mpop\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m'missing'\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m'none'\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 76\u001b[0m \u001b[0mhasconst\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mkwargs\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mpop\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m'hasconst'\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 77\u001b[0;31m self.data = self._handle_data(endog, exog, missing, hasconst,\n\u001b[0m\u001b[1;32m 78\u001b[0m **kwargs)\n\u001b[1;32m 79\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mk_constant\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mdata\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mk_constant\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", - "\u001b[0;32m~/opt/anaconda3/lib/python3.9/site-packages/statsmodels/base/model.py\u001b[0m in \u001b[0;36m_handle_data\u001b[0;34m(self, endog, exog, missing, 
hasconst, **kwargs)\u001b[0m\n\u001b[1;32m 99\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 100\u001b[0m \u001b[0;32mdef\u001b[0m \u001b[0m_handle_data\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mendog\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mexog\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mmissing\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mhasconst\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0mkwargs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 101\u001b[0;31m \u001b[0mdata\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mhandle_data\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mendog\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mexog\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mmissing\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mhasconst\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0mkwargs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 102\u001b[0m \u001b[0;31m# kwargs arrays could have changed, easier to just attach here\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 103\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0mkey\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mkwargs\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", - "\u001b[0;32m~/opt/anaconda3/lib/python3.9/site-packages/statsmodels/base/data.py\u001b[0m in \u001b[0;36mhandle_data\u001b[0;34m(endog, exog, missing, hasconst, **kwargs)\u001b[0m\n\u001b[1;32m 669\u001b[0m \u001b[0mexog\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mnp\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0masarray\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mexog\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 670\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 671\u001b[0;31m \u001b[0mklass\u001b[0m \u001b[0;34m=\u001b[0m 
\u001b[0mhandle_data_class_factory\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mendog\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mexog\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 672\u001b[0m return klass(endog, exog=exog, missing=missing, hasconst=hasconst,\n\u001b[1;32m 673\u001b[0m **kwargs)\n", - "\u001b[0;32m~/opt/anaconda3/lib/python3.9/site-packages/statsmodels/base/data.py\u001b[0m in \u001b[0;36mhandle_data_class_factory\u001b[0;34m(endog, exog)\u001b[0m\n\u001b[1;32m 657\u001b[0m \u001b[0mklass\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mModelData\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 658\u001b[0m \u001b[0;32melse\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 659\u001b[0;31m raise ValueError('unrecognized data structures: %s / %s' %\n\u001b[0m\u001b[1;32m 660\u001b[0m (type(endog), type(exog)))\n\u001b[1;32m 661\u001b[0m \u001b[0;32mreturn\u001b[0m \u001b[0mklass\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", - "\u001b[0;31mValueError\u001b[0m: unrecognized data structures: / " - ] - } - ], + "outputs": [], "source": [ "mod = sm.OLS(y, X) # Describe model" ] }, { "cell_type": "code", - "execution_count": 8, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "ename": "NameError", - "evalue": "name 'mod' is not defined", - "output_type": "error", - "traceback": [ - "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m", - "\u001b[0;31mNameError\u001b[0m Traceback (most recent call last)", - "\u001b[0;32m/var/folders/qj/jybppsbd2jl75s8y2q8s2xx80000gn/T/ipykernel_5691/3877149832.py\u001b[0m in \u001b[0;36m\u001b[0;34m\u001b[0m\n\u001b[0;32m----> 1\u001b[0;31m \u001b[0mres\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mmod\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mfit\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;31m# Fit 
model\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 2\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 3\u001b[0m \u001b[0mprint\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mres\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0msummary\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", - "\u001b[0;31mNameError\u001b[0m: name 'mod' is not defined" - ] - } - ], + "outputs": [], "source": [ "res = mod.fit() # Fit model\n", "\n", @@ -356,37 +116,18 @@ }, { "cell_type": "code", - "execution_count": 9, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "UserWarning: Distributing object. This may take some time.\n" - ] - } - ], + "outputs": [], "source": [ "modin_df = pd.DataFrame({\"A\": [10,20,30,40,50], \"B\": [20, 30, 10, 40, 50], \"C\": [32, 234, 23, 23, 42523]})" ] }, { "cell_type": "code", - "execution_count": 10, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Intercept 14.952480\n", - "B 0.401182\n", - "C 0.000352\n", - "dtype: float64\n" - ] - } - ], + "outputs": [], "source": [ "import statsmodels.formula.api as sm\n", "result = sm.ols(formula=\"A ~ B + C\", data=modin_df).fit()\n", @@ -395,51 +136,9 @@ }, { "cell_type": "code", - "execution_count": 11, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - " OLS Regression Results \n", - "==============================================================================\n", - "Dep. Variable: A R-squared: 0.579\n", - "Model: OLS Adj. R-squared: 0.158\n", - "Method: Least Squares F-statistic: 1.375\n", - "Date: Thu, 06 Apr 2023 Prob (F-statistic): 0.421\n", - "Time: 11:48:10 Log-Likelihood: -18.178\n", - "No. 
Observations: 5 AIC: 42.36\n", - "Df Residuals: 2 BIC: 41.19\n", - "Df Model: 2 \n", - "Covariance Type: nonrobust \n", - "==============================================================================\n", - " coef std err t P>|t| [0.025 0.975]\n", - "------------------------------------------------------------------------------\n", - "Intercept 14.9525 17.764 0.842 0.489 -61.481 91.386\n", - "B 0.4012 0.650 0.617 0.600 -2.394 3.197\n", - "C 0.0004 0.001 0.650 0.583 -0.002 0.003\n", - "==============================================================================\n", - "Omnibus: nan Durbin-Watson: 1.061\n", - "Prob(Omnibus): nan Jarque-Bera (JB): 0.498\n", - "Skew: -0.123 Prob(JB): 0.780\n", - "Kurtosis: 1.474 Cond. No. 5.21e+04\n", - "==============================================================================\n", - "\n", - "Notes:\n", - "[1] Standard Errors assume that the covariance matrix of the errors is correctly specified.\n", - "[2] The condition number is large, 5.21e+04. This might indicate that there are\n", - "strong multicollinearity or other numerical problems.\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "ValueWarning: omni_normtest is not valid with less than 8 observations; 5 samples were given.\n" - ] - } - ], + "outputs": [], "source": [ "print(result.summary())" ] @@ -453,7 +152,7 @@ }, { "cell_type": "code", - "execution_count": 13, + "execution_count": null, "metadata": {}, "outputs": [], "source": [ @@ -465,7 +164,7 @@ }, { "cell_type": "code", - "execution_count": 14, + "execution_count": null, "metadata": {}, "outputs": [], "source": [ @@ -476,7 +175,7 @@ }, { "cell_type": "code", - "execution_count": 15, + "execution_count": null, "metadata": {}, "outputs": [], "source": [ @@ -485,7 +184,7 @@ }, { "cell_type": "code", - "execution_count": 16, + "execution_count": null, "metadata": {}, "outputs": [], "source": [ @@ -494,7 +193,7 @@ }, { "cell_type": "code", - "execution_count": 17, + "execution_count": 
null, "metadata": {}, "outputs": [], "source": [ @@ -504,7 +203,7 @@ }, { "cell_type": "code", - "execution_count": 18, + "execution_count": null, "metadata": {}, "outputs": [], "source": [ @@ -513,46 +212,9 @@ }, { "cell_type": "code", - "execution_count": 19, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - " OLS Regression Results \n", - "==============================================================================\n", - "Dep. Variable: Lottery R-squared: 0.338\n", - "Model: OLS Adj. R-squared: 0.287\n", - "Method: Least Squares F-statistic: 6.636\n", - "Date: Thu, 06 Apr 2023 Prob (F-statistic): 1.07e-05\n", - "Time: 11:48:36 Log-Likelihood: -375.30\n", - "No. Observations: 85 AIC: 764.6\n", - "Df Residuals: 78 BIC: 781.7\n", - "Df Model: 6 \n", - "Covariance Type: nonrobust \n", - "===============================================================================\n", - " coef std err t P>|t| [0.025 0.975]\n", - "-------------------------------------------------------------------------------\n", - "Intercept 38.6517 9.456 4.087 0.000 19.826 57.478\n", - "Region[T.E] -15.4278 9.727 -1.586 0.117 -34.793 3.938\n", - "Region[T.N] -10.0170 9.260 -1.082 0.283 -28.453 8.419\n", - "Region[T.S] -4.5483 7.279 -0.625 0.534 -19.039 9.943\n", - "Region[T.W] -10.0913 7.196 -1.402 0.165 -24.418 4.235\n", - "Literacy -0.1858 0.210 -0.886 0.378 -0.603 0.232\n", - "Wealth 0.4515 0.103 4.390 0.000 0.247 0.656\n", - "==============================================================================\n", - "Omnibus: 3.049 Durbin-Watson: 1.785\n", - "Prob(Omnibus): 0.218 Jarque-Bera (JB): 2.694\n", - "Skew: -0.340 Prob(JB): 0.260\n", - "Kurtosis: 2.454 Cond. No. 
371.\n", - "==============================================================================\n", - "\n", - "Notes:\n", - "[1] Standard Errors assume that the covariance matrix of the errors is correctly specified.\n" - ] - } - ], + "outputs": [], "source": [ "res = mod.fit() # Fit model\n", "\n", @@ -568,37 +230,18 @@ }, { "cell_type": "code", - "execution_count": 20, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "UserWarning: Distributing object. This may take some time.\n" - ] - } - ], + "outputs": [], "source": [ "pandas_df = pd.DataFrame({\"A\": [10,20,30,40,50], \"B\": [20, 30, 10, 40, 50], \"C\": [32, 234, 23, 23, 42523]})" ] }, { "cell_type": "code", - "execution_count": 21, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Intercept 14.952480\n", - "B 0.401182\n", - "C 0.000352\n", - "dtype: float64\n" - ] - } - ], + "outputs": [], "source": [ "import statsmodels.formula.api as sm\n", "result = sm.ols(formula=\"A ~ B + C\", data=pandas_df).fit()\n", @@ -607,51 +250,9 @@ }, { "cell_type": "code", - "execution_count": 22, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - " OLS Regression Results \n", - "==============================================================================\n", - "Dep. Variable: A R-squared: 0.579\n", - "Model: OLS Adj. R-squared: 0.158\n", - "Method: Least Squares F-statistic: 1.375\n", - "Date: Thu, 06 Apr 2023 Prob (F-statistic): 0.421\n", - "Time: 11:48:58 Log-Likelihood: -18.178\n", - "No. 
Observations: 5 AIC: 42.36\n", - "Df Residuals: 2 BIC: 41.19\n", - "Df Model: 2 \n", - "Covariance Type: nonrobust \n", - "==============================================================================\n", - " coef std err t P>|t| [0.025 0.975]\n", - "------------------------------------------------------------------------------\n", - "Intercept 14.9525 17.764 0.842 0.489 -61.481 91.386\n", - "B 0.4012 0.650 0.617 0.600 -2.394 3.197\n", - "C 0.0004 0.001 0.650 0.583 -0.002 0.003\n", - "==============================================================================\n", - "Omnibus: nan Durbin-Watson: 1.061\n", - "Prob(Omnibus): nan Jarque-Bera (JB): 0.498\n", - "Skew: -0.123 Prob(JB): 0.780\n", - "Kurtosis: 1.474 Cond. No. 5.21e+04\n", - "==============================================================================\n", - "\n", - "Notes:\n", - "[1] Standard Errors assume that the covariance matrix of the errors is correctly specified.\n", - "[2] The condition number is large, 5.21e+04. This might indicate that there are\n", - "strong multicollinearity or other numerical problems.\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "ValueWarning: omni_normtest is not valid with less than 8 observations; 5 samples were given.\n" - ] - } - ], + "outputs": [], "source": [ "print(result.summary())" ] diff --git a/examples/jupyter/integrations/tensorflow.ipynb b/examples/jupyter/integrations/tensorflow.ipynb index dee3f9c0dc6..2702149e604 100644 --- a/examples/jupyter/integrations/tensorflow.ipynb +++ b/examples/jupyter/integrations/tensorflow.ipynb @@ -10,7 +10,7 @@ }, { "cell_type": "code", - "execution_count": 1, + "execution_count": null, "metadata": {}, "outputs": [], "source": [ @@ -21,170 +21,9 @@ }, { "cell_type": "code", - "execution_count": 2, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "UserWarning: Ray execution environment not yet initialized. 
Initializing...\n", - "To remove this warning, run the following python code before doing dataframe operations:\n", - "\n", - " import ray\n", - " ray.init(runtime_env={'env_vars': {'__MODIN_AUTOIMPORT_PANDAS__': '1'}})\n", - "\n", - "2023-04-06 11:54:12,027\tINFO worker.py:1553 -- Started a local Ray instance.\n" - ] - }, - { - "data": { - "text/html": [ - "
\n", - "\n", - "\n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - "
agesexcptrestbpscholfbsrestecgthalachexangoldpeakslopecathaltarget
063111452331215002.330fixed0
167141602860210811.523normal1
267141202290212912.622reversible0
337131302500018703.530normal0
441021302040217201.410normal0
\n", - "
" - ], - "text/plain": [ - " age sex cp trestbps chol fbs restecg thalach exang oldpeak slope \\\n", - "0 63 1 1 145 233 1 2 150 0 2.3 3 \n", - "1 67 1 4 160 286 0 2 108 1 1.5 2 \n", - "2 67 1 4 120 229 0 2 129 1 2.6 2 \n", - "3 37 1 3 130 250 0 0 187 0 3.5 3 \n", - "4 41 0 2 130 204 0 2 172 0 1.4 1 \n", - "\n", - " ca thal target \n", - "0 0 fixed 0 \n", - "1 3 normal 1 \n", - "2 2 reversible 0 \n", - "3 0 normal 0 \n", - "4 0 normal 0 " - ] - }, - "execution_count": 2, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "SHUFFLE_BUFFER = 500\n", "BATCH_SIZE = 2\n", @@ -197,7 +36,7 @@ }, { "cell_type": "code", - "execution_count": 3, + "execution_count": null, "metadata": {}, "outputs": [], "source": [ @@ -206,96 +45,9 @@ }, { "cell_type": "code", - "execution_count": 4, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/html": [ - "
\n", - "\n", - "\n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - "
agethalachtrestbpschololdpeak
0631501452332.3
1671081602861.5
2671291202292.6
3371871302503.5
4411721302041.4
\n", - "
" - ], - "text/plain": [ - " age thalach trestbps chol oldpeak\n", - "0 63 150 145 233 2.3\n", - "1 67 108 160 286 1.5\n", - "2 67 129 120 229 2.6\n", - "3 37 187 130 250 3.5\n", - "4 41 172 130 204 1.4" - ] - }, - "execution_count": 4, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "numeric_feature_names = ['age', 'thalach', 'trestbps', 'chol', 'oldpeak']\n", "numeric_features = modin_df[numeric_feature_names]\n", @@ -304,60 +56,18 @@ }, { "cell_type": "code", - "execution_count": 5, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "2023-04-06 11:54:16.000875: I tensorflow/core/platform/cpu_feature_guard.cc:151] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA\n", - "To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags.\n" - ] - }, - { - "data": { - "text/plain": [ - "" - ] - }, - "execution_count": 5, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "tf.convert_to_tensor(numeric_features)" ] }, { "cell_type": "code", - "execution_count": 6, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "ename": "ValueError", - "evalue": "Failed to find data adapter that can handle input: , ", - "output_type": "error", - "traceback": [ - "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m", - "\u001b[0;31mValueError\u001b[0m Traceback (most recent call last)", - "\u001b[0;32m/var/folders/qj/jybppsbd2jl75s8y2q8s2xx80000gn/T/ipykernel_5722/2210982900.py\u001b[0m in \u001b[0;36m\u001b[0;34m\u001b[0m\n\u001b[1;32m 1\u001b[0m \u001b[0mnormalizer\u001b[0m \u001b[0;34m=\u001b[0m 
\u001b[0mtf\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mkeras\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mlayers\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mNormalization\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0maxis\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;34m-\u001b[0m\u001b[0;36m1\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m----> 2\u001b[0;31m \u001b[0mnormalizer\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0madapt\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mnumeric_features\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m", - "\u001b[0;32m~/opt/anaconda3/lib/python3.9/site-packages/keras/layers/preprocessing/normalization.py\u001b[0m in \u001b[0;36madapt\u001b[0;34m(self, data, batch_size, steps)\u001b[0m\n\u001b[1;32m 240\u001b[0m \u001b[0margument\u001b[0m \u001b[0;32mis\u001b[0m \u001b[0;32mnot\u001b[0m \u001b[0msupported\u001b[0m \u001b[0;32mwith\u001b[0m \u001b[0marray\u001b[0m \u001b[0minputs\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 241\u001b[0m \"\"\"\n\u001b[0;32m--> 242\u001b[0;31m \u001b[0msuper\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0madapt\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mdata\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mbatch_size\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mbatch_size\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0msteps\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0msteps\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 243\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 244\u001b[0m \u001b[0;32mdef\u001b[0m \u001b[0mupdate_state\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mdata\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", - "\u001b[0;32m~/opt/anaconda3/lib/python3.9/site-packages/keras/engine/base_preprocessing_layer.py\u001b[0m in 
\u001b[0;36madapt\u001b[0;34m(self, data, batch_size, steps)\u001b[0m\n\u001b[1;32m 236\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mbuilt\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 237\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mreset_state\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 238\u001b[0;31m data_handler = data_adapter.DataHandler(\n\u001b[0m\u001b[1;32m 239\u001b[0m \u001b[0mdata\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 240\u001b[0m \u001b[0mbatch_size\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mbatch_size\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", - "\u001b[0;32m~/opt/anaconda3/lib/python3.9/site-packages/keras/engine/data_adapter.py\u001b[0m in \u001b[0;36m__init__\u001b[0;34m(self, x, y, sample_weight, batch_size, steps_per_epoch, initial_epoch, epochs, shuffle, class_weight, max_queue_size, workers, use_multiprocessing, model, steps_per_execution, distribute)\u001b[0m\n\u001b[1;32m 1146\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_steps_per_execution\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0msteps_per_execution\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 1147\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m-> 1148\u001b[0;31m \u001b[0madapter_cls\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mselect_data_adapter\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mx\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0my\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 1149\u001b[0m self._adapter = adapter_cls(\n\u001b[1;32m 1150\u001b[0m \u001b[0mx\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", - 
"\u001b[0;32m~/opt/anaconda3/lib/python3.9/site-packages/keras/engine/data_adapter.py\u001b[0m in \u001b[0;36mselect_data_adapter\u001b[0;34m(x, y)\u001b[0m\n\u001b[1;32m 982\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0;32mnot\u001b[0m \u001b[0madapter_cls\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 983\u001b[0m \u001b[0;31m# TODO(scottzhu): This should be a less implementation-specific error.\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 984\u001b[0;31m raise ValueError(\n\u001b[0m\u001b[1;32m 985\u001b[0m \u001b[0;34m\"Failed to find data adapter that can handle \"\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 986\u001b[0m \"input: {}, {}\".format(\n", - "\u001b[0;31mValueError\u001b[0m: Failed to find data adapter that can handle input: , " - ] - } - ], + "outputs": [], "source": [ "normalizer = tf.keras.layers.Normalization(axis=-1)\n", "normalizer.adapt(numeric_features)" @@ -372,157 +82,9 @@ }, { "cell_type": "code", - "execution_count": 7, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/html": [ - "
\n", - "\n", - "\n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - "
agesexcptrestbpscholfbsrestecgthalachexangoldpeakslopecathaltarget
063111452331215002.330fixed0
167141602860210811.523normal1
267141202290212912.622reversible0
337131302500018703.530normal0
441021302040217201.410normal0
\n", - "
" - ], - "text/plain": [ - " age sex cp trestbps chol fbs restecg thalach exang oldpeak slope \\\n", - "0 63 1 1 145 233 1 2 150 0 2.3 3 \n", - "1 67 1 4 160 286 0 2 108 1 1.5 2 \n", - "2 67 1 4 120 229 0 2 129 1 2.6 2 \n", - "3 37 1 3 130 250 0 0 187 0 3.5 3 \n", - "4 41 0 2 130 204 0 2 172 0 1.4 1 \n", - "\n", - " ca thal target \n", - "0 0 fixed 0 \n", - "1 3 normal 1 \n", - "2 2 reversible 0 \n", - "3 0 normal 0 \n", - "4 0 normal 0 " - ] - }, - "execution_count": 7, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "SHUFFLE_BUFFER = 500\n", "BATCH_SIZE = 2\n", @@ -535,7 +97,7 @@ }, { "cell_type": "code", - "execution_count": 8, + "execution_count": null, "metadata": {}, "outputs": [], "source": [ @@ -544,96 +106,9 @@ }, { "cell_type": "code", - "execution_count": 9, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/html": [ - "
\n", - "\n", - "\n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - "
agethalachtrestbpschololdpeak
0631501452332.3
1671081602861.5
2671291202292.6
3371871302503.5
4411721302041.4
\n", - "
" - ], - "text/plain": [ - " age thalach trestbps chol oldpeak\n", - "0 63 150 145 233 2.3\n", - "1 67 108 160 286 1.5\n", - "2 67 129 120 229 2.6\n", - "3 37 187 130 250 3.5\n", - "4 41 172 130 204 1.4" - ] - }, - "execution_count": 9, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "numeric_feature_names = ['age', 'thalach', 'trestbps', 'chol', 'oldpeak']\n", "numeric_features = pandas_df[numeric_feature_names]\n", @@ -642,34 +117,16 @@ }, { "cell_type": "code", - "execution_count": 10, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "" - ] - }, - "execution_count": 10, - "metadata": {}, - "output_type": "execute_result" - } - ], + "outputs": [], "source": [ "tf.convert_to_tensor(numeric_features)" ] }, { "cell_type": "code", - "execution_count": 11, + "execution_count": null, "metadata": {}, "outputs": [], "source": [ diff --git a/examples/jupyter/integrations/xgboost.ipynb b/examples/jupyter/integrations/xgboost.ipynb index dda5e774240..10f452e7d23 100644 --- a/examples/jupyter/integrations/xgboost.ipynb +++ b/examples/jupyter/integrations/xgboost.ipynb @@ -16,7 +16,7 @@ }, { "cell_type": "code", - "execution_count": 1, + "execution_count": null, "metadata": {}, "outputs": [], "source": [ @@ -27,25 +27,9 @@ }, { "cell_type": "code", - "execution_count": 2, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "UserWarning: Ray execution environment not yet initialized. Initializing...\n", - "To remove this warning, run the following python code before doing dataframe operations:\n", - "\n", - " import ray\n", - " ray.init(runtime_env={'env_vars': {'__MODIN_AUTOIMPORT_PANDAS__': '1'}})\n", - "\n", - "2023-01-03 12:19:34,877\tINFO worker.py:1529 -- Started a local Ray instance. View the dashboard at \u001b[1m\u001b[32m127.0.0.1:8269 \u001b[39m\u001b[22m\n", - "UserWarning: Distributing object. 
This may take some time.\n", - "UserWarning: Distributing object. This may take some time.\n" - ] - } - ], + "outputs": [], "source": [ "data_train = pd.DataFrame(np.arange(36).reshape((12,3)), columns=['a', 'b', 'c'])\n", "label_train = pd.DataFrame(np.random.randint(2, size=12))\n", @@ -54,17 +38,9 @@ }, { "cell_type": "code", - "execution_count": 3, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "UserWarning: Distributing object. This may take some time.\n" - ] - } - ], + "outputs": [], "source": [ "data_test = pd.DataFrame(np.arange(12).reshape((4,3)), columns=['a', 'b', 'c'])\n", "label_test = pd.DataFrame(np.random.randint(2, size=4))\n", @@ -73,7 +49,7 @@ }, { "cell_type": "code", - "execution_count": 4, + "execution_count": null, "metadata": {}, "outputs": [], "source": [ @@ -84,33 +60,9 @@ }, { "cell_type": "code", - "execution_count": 5, + "execution_count": null, "metadata": {}, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "[0]\ttrain-auc:0.85714\teval-auc:0.50000\n", - "[1]\ttrain-auc:0.82857\teval-auc:0.50000\n", - "[2]\ttrain-auc:0.82857\teval-auc:0.50000\n", - "[3]\ttrain-auc:0.85714\teval-auc:0.50000\n", - "[4]\ttrain-auc:0.85714\teval-auc:0.50000\n", - "[5]\ttrain-auc:0.85714\teval-auc:0.50000\n", - "[6]\ttrain-auc:0.85714\teval-auc:0.50000\n", - "[7]\ttrain-auc:0.85714\teval-auc:0.50000\n", - "[8]\ttrain-auc:0.85714\teval-auc:0.50000\n", - "[9]\ttrain-auc:0.85714\teval-auc:0.50000\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "FutureWarning: Pass `evals` as keyword args.\n" - ] - } - ], + "outputs": [], "source": [ "evallist = [(dtrain, 'train'), (dtest, 'eval')]\n", "num_round = 10\n", @@ -119,7 +71,7 @@ }, { "cell_type": "code", - "execution_count": 6, + "execution_count": null, "metadata": {}, "outputs": [], "source": [ diff --git a/examples/quickstart.ipynb b/examples/quickstart.ipynb index 
395e7cd9f7f..0fe229f2cea 100644 --- a/examples/quickstart.ipynb +++ b/examples/quickstart.ipynb @@ -70,6 +70,7 @@ "#############################################\n", "import time\n", "import ray\n", + "# Look at the Ray documentation with respect to the Ray configuration suited to you most.\n", "ray.init()\n", "from IPython.display import Markdown, display\n", "def printmd(string):\n", diff --git a/modin/core/execution/dask/common/utils.py b/modin/core/execution/dask/common/utils.py index 3eda2a50375..160a58bbc8f 100644 --- a/modin/core/execution/dask/common/utils.py +++ b/modin/core/execution/dask/common/utils.py @@ -44,15 +44,6 @@ def _disable_warnings(): except ValueError: from distributed import Client - # The indentation here is intentional, we want the code to be indented. - ErrorMessage.not_initialized( - "Dask", - """ - from distributed import Client - - client = Client() -""", - ) num_cpus = CpuCount.get() memory_limit = Memory.get() worker_memory_limit = memory_limit // num_cpus if memory_limit else "auto" diff --git a/modin/core/execution/ray/common/utils.py b/modin/core/execution/ray/common/utils.py index f24be8fe2cf..3d954b578de 100644 --- a/modin/core/execution/ray/common/utils.py +++ b/modin/core/execution/ray/common/utils.py @@ -118,15 +118,6 @@ def initialize_ray( **extra_init_kw, ) else: - # This string is intentionally formatted this way. We want it indented in - # the warning message. 
- ErrorMessage.not_initialized( - "Ray", - f""" - import ray - ray.init({', '.join([f'{k}={v}' for k,v in extra_init_kw.items()])}) -""", - ) object_store_memory = _get_object_store_memory() ray_init_kwargs = { "num_cpus": CpuCount.get(), diff --git a/modin/core/execution/unidist/common/utils.py b/modin/core/execution/unidist/common/utils.py index 30d735945e5..c6d2b95ba22 100644 --- a/modin/core/execution/unidist/common/utils.py +++ b/modin/core/execution/unidist/common/utils.py @@ -36,15 +36,6 @@ def initialize_unidist(): modin_cfg.CpuCount.subscribe( lambda cpu_count: unidist_cfg.CpuCount.put(cpu_count.get()) ) - # This string is intentionally formatted this way. We want it indented in - # the warning message. - ErrorMessage.not_initialized( - "unidist", - """ - import unidist - unidist.init() - """, - ) unidist_cfg.MpiRuntimeEnv.put( {"env_vars": {"PYTHONWARNINGS": "ignore::FutureWarning"}} )