diff --git a/docs/samples/databricks/databricks_quickstart_nyc_taxi_demo.ipynb b/docs/samples/databricks/databricks_quickstart_nyc_taxi_demo.ipynb index 07905d591..7b47e96ad 100644 --- a/docs/samples/databricks/databricks_quickstart_nyc_taxi_demo.ipynb +++ b/docs/samples/databricks/databricks_quickstart_nyc_taxi_demo.ipynb @@ -350,7 +350,7 @@ "\n", "# Download the data file\n", "df_raw = nyc_taxi.get_spark_df(spark=spark, local_cache_path=DATA_FILE_PATH)\n", - "df_raw.limit(5).toPandas()" + "df_raw.limit(5).show()" ] }, { @@ -1203,7 +1203,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.10.4" + "version": "3.10.9 (main, Jan 11 2023, 15:21:40) [GCC 11.2.0]" }, "vscode": { "interpreter": { diff --git a/docs/samples/nyc_taxi_demo.ipynb b/docs/samples/nyc_taxi_demo.ipynb index dc47b8ea8..473604937 100644 --- a/docs/samples/nyc_taxi_demo.ipynb +++ b/docs/samples/nyc_taxi_demo.ipynb @@ -81,7 +81,7 @@ }, { "cell_type": "code", - "execution_count": 1, + "execution_count": null, "metadata": {}, "outputs": [], "source": [ @@ -417,7 +417,7 @@ "# Download the data file\n", "data_file_path = f\"{WORKING_DIR}/nyc_taxi_data.csv\"\n", "df_raw = nyc_taxi.get_spark_df(spark=spark, local_cache_path=data_file_path)\n", - "df_raw.limit(5).toPandas()" + "df_raw.limit(5).show()" ] }, { @@ -791,7 +791,7 @@ " client=client,\n", " data_format=DATA_FORMAT,\n", ")\n", - "df.select(feature_names).limit(5).toPandas()" + "df.select(feature_names).limit(5).show()" ] }, { @@ -1155,7 +1155,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.8.0 (default, Nov 6 2019, 21:49:08) \n[GCC 7.3.0]" + "version": "3.10.9" }, "vscode": { "interpreter": { diff --git a/feathr_project/setup.py b/feathr_project/setup.py index d5f13b31c..699f6d688 100644 --- a/feathr_project/setup.py +++ b/feathr_project/setup.py @@ -74,7 +74,7 @@ "pyyaml<=6.0", "Jinja2<=3.1.2", "pyarrow<=9.0.0", - "pyspark>=3.1.2", + "pyspark>=3.1.2", # TODO upgrade the version once pyspark publishes new release to resolve `AttributeError: module 'numpy' has no attribute 'bool'` "python-snappy<=0.6.1", "deltalake>=0.6.2", "graphlib_backport<=1.0.3",