{"id":9922,"date":"2025-01-26T04:42:08","date_gmt":"2025-01-26T03:42:08","guid":{"rendered":"https:\/\/myoceane.fr\/?p=9922"},"modified":"2025-01-26T04:46:22","modified_gmt":"2025-01-26T03:46:22","slug":"bigdata-pyspark-on-jupyter-lab","status":"publish","type":"post","link":"https:\/\/myoceane.fr\/index.php\/bigdata-pyspark-on-jupyter-lab\/","title":{"rendered":"[BigData] PySpark on Jupyter Lab"},"content":{"rendered":"<div id=\"fb-root\"><\/div>\n\n<p style=\"text-align: justify;\">Jupyter Notebook\/Lab \u662f\u4e00\u500b\u5e38\u7528\u7684\u4e92\u52d5\u5f0f\u4ecb\u9762\u5354\u52a9\u5404\u7a2e\u7a0b\u5f0f\u78bc\u7684\u958b\u767c\u6211\u5011\u5728\u4e0a\u4e00\u7bc7<a href=\"https:\/\/myoceane.fr\/index.php\/jupyter-notebook-server\/\">\u300e\u5efa\u7acb\u81ea\u5df1\u7684 Jupyter Notebook \u4f3a\u670d\u5668\u300f<\/a>\u6709\u7a0d\u5fae\u4ecb\u7d39\u904e\uff0c\u4e00\u822c\u5e38\u898b\u7684\u4f7f\u7528\u5834\u666f\u662f\u5728\u958b\u767c python \u7684\u7a0b\u5f0f\uff0c\u4f46\u662f Jupyter Server \u7684 Kernel \u529f\u80fd\u53ef\u4ee5\u64f4\u5145\u66f4\u591a\u7684\u4e92\u52d5\u5f0f\u958b\u767c\u74b0\u5883\uff0c\u4f8b\u5982 R, PySpark, SparkR, SparklyR \u7b49\u7b49\uff0c\u6ab8\u6aac\u7238\u6700\u65e9\u63a5\u89f8\u7684\u662f\u5c07 PySpark \u8a3b\u518a\u5230 Jupyter Lab \u88e1\u9762\uff0c\u5be6\u4f5c\u7684\u7a0b\u5f0f\u78bc\u662f\u900f\u904e AZTK \u7684 Repository \u5b78\u7fd2\u5230\u7684\uff0c\u5f8c\u4f86\u9032\u4e00\u6b65\u5c07\u5176\u64f4\u5145\u5230 R \u7b49\u7b49\u7684\u4f7f\u7528\u5834\u666f\uff0c\u672c\u7bc7\u5c07\u6703\u5448\u73fe\u5982\u4f55\u90e8\u7f72\u4e00\u500b\u6709 PySpark \u6838\u5fc3\u7684 Jupyter Lab\u3002<\/p>\n\n\n\n<blockquote class=\"wp-block-quote is-layout-flow wp-block-quote-is-layout-flow\">\n<p>AZTK \u9a45\u52d5\u5305\u542b\u6709 PySpark \u7684 Jupyter Lab \u670d\u52d9\u7bc4\u4f8b<\/p>\n<cite><a href=\"https:\/\/github.com\/Azure\/aztk\/blob\/master\/aztk\/spark\/models\/plugins\/jupyter_lab\/jupyter_lab.sh\">https:\/\/github.com\/Azure\/aztk\/blob\/master\/aztk\/spark\/models\/plugins\/jupyter_lab\/jupyter_lab.sh<\/a><\/cite><\/blockquote>\n\n\n<p>\u4e0b\u9762\u7684\u7a0b\u5f0f\u78bc\u64f7\u53d6\u91cd\u8981\u7684\u90e8\u5206\uff0c\u5176\u4e2d\u6700\u4e3b\u8981\u7684\u5730\u65b9\u5728\u65bc\uff1a<\/p>\n<ol>\n<li>\u5b9a\u7fa9 PYSPARK_DRIVER_PYTHON \u4f7f pyspark \u7a0b\u5f0f\u521d\u59cb\u5316\u6642\u9a45\u52d5 jupyter<\/li>\n<li>\u5b9a\u7fa9 PYSPARK_DRIVER_PYTHON_OPTS\u00a0\u00a0<\/li>\n<li>\u5275\u5efa\u4e00\u500b kernel.json \u6a94\u6848<\/li>\n<li>\u5229\u7528 pyspark \u7a0b\u5f0f\u78bc\u555f\u52d5<\/li>\n<\/ol>\n<pre class=\"lang:bash\">PYSPARK_DRIVER_PYTHON=\"\/opt\/conda\/bin\/jupyter\"\nJUPYTER_KERNELS=\"\/opt\/conda\/share\/jupyter\/kernels\"\n\nmkdir $JUPYTER_KERNELS\/pyspark\ntouch $JUPYTER_KERNELS\/pyspark\/kernel.json\ncat &lt;&lt; EOF &gt; $JUPYTER_KERNELS\/pyspark\/kernel.json\n{\n    \"display_name\": \"PySpark\",\n    \"language\": \"python\",\n    \"argv\": [\n        \"python\",\n        \"-m\",\n        \"ipykernel\",\n        \"-f\",\n        \"{connection_file}\"\n    ],\n    \"env\": {\n        \"SPARK_HOME\": \"$SPARK_HOME\",\n        \"PYSPARK_PYTHON\": \"python\",\n        \"PYSPARK_SUBMIT_ARGS\": \"--master spark:\/\/$MASTER_IP:7077 pyspark-shell\"\n    }\n}\nEOF\n(PYSPARK_DRIVER_PYTHON=$PYSPARK_DRIVER_PYTHON PYSPARK_DRIVER_PYTHON_OPTS=\"lab --no-browser --port=8889 --allow-root\" pyspark &amp;)<\/pre>\n<p style=\"text-align: justify;\"><strong>\u7f3a\u9ede\uff1a<\/strong>\u4f7f\u7528\u4ee5\u4e0a\u7684\u65b9\u6cd5\u90e8\u7f72 jupyter notebook \u7684\u670d\u52d9\u662f\u53ef\u4ee5\u6210\u529f\u7684\uff0c\u4f46\u662f\u7f3a\u9ede\u537b\u4e5f\u96a8\u4e4b\u800c\u4f86\uff0c\u5305\u542b pyspark \u7d81\u5b9a\u4e86 jupyter\uff0c\u7121\u6cd5\u5728 terminal \u7684\u72c0\u614b\u518d\u5229\u7528 pyspark \u505a\u5075\u932f\uff0c\u4e26\u4e14\u9032\u4e00\u6b65\u9650\u5236\u4e86 jupyter lab \u5167\u90e8\u7684\u5176\u4ed6 kernel \u5fc5\u9808\u8981\u540c\u6b65\u4f7f\u7528 pyspark\uff0c\u5728\u4f7f\u7528\u55ae\u7d14 python \u7684\u60c5\u6cc1\u4e0b\u9020\u6210\u8cc7\u6e90\u7684\u6d6a\u8cbb\u3002<\/p>\n\n\n<h4>\u6539\u826f\u9a45\u52d5 Jupyter Lab \u7684\u65b9\u5f0f<\/h4>\n<p>\u70ba\u4e86\u4e0d\u8981\u5c07\u9a45\u52d5 pyspark \u7684\u65b9\u5f0f\u7d81\u5b9a\u5728 jupyter\uff0c\u6211\u5011\u5c07 PYSPARK_DRIVER_PYTHON \u7684\u5b9a\u7fa9\u79fb\u9032 kernel.json \u4e26\u4e14\u5229\u7528\u5b9a\u7fa9\u521d\u59cb\u5316\u8173\u672c PYTHONSTARTUP \u7684\u65b9\u5f0f\u505a\u5230 SparkSession \u7684\u521d\u59cb\u5316\uff0c\u4ee5\u4e0b\u662f\u53c3\u8003\u7684\u7a0b\u5f0f\u78bc\uff1a<\/p>\n<pre class=\"lang:bash\">export JUPYTER_KERNELS=\/usr\/local\/share\/jupyter\/kernels\nmkdir $JUPYTER_KERNELS\/pyspark\ntouch $JUPYTER_KERNELS\/pyspark\/kernel.json\n\ncat &lt;&lt; EOF &gt; $JUPYTER_KERNELS\/pyspark\/kernel.json\n{\n    \"display_name\": \"PySpark\",\n    \"language\": \"python\",\n    \"argv\": [\n        \"python\",\n        \"-m\",\n        \"ipykernel\",\n        \"-f\",\n        \"{connection_file}\"\n    ],\n    \"env\": {\n        \"SPARK_HOME\": \"$SPARK_HOME\",\n        \"PYSPARK_PYTHON\": \"python\",\n        \"PYSPARK_DRIVER_PYTHON\": \"jupyter\",\n        \"PYSPARK_SUBMIT_ARGS\": \"--master spark:\/\/$MASTER_IP:7077 pyspark-shell\",\n        \"PYTHONSTARTUP\": \"$JUPYTER_KERNELS\/pyspark\/init.py\"\n    }\n}\nEOF\ncat &lt;&lt; EOF &gt; $JUPYTER_KERNELS\/pyspark\/init.py\nfrom pyspark.sql import SparkSession\nspark = SparkSession.builder.appName(\"PySpark Kernel\").config(\"spark.master\", \"spark:\/\/$MASTER_IP:7077\").getOrCreate()\nEOF\n\njupyter lab --no-browser --port=8999 --allow-root --ip=0.0.0.0 &amp;<\/pre>\n<p>\u00a0<\/p>\n","protected":false},"excerpt":{"rendered":"<p>Jupyter Notebook\/Lab \u662f\u4e00\u500b\u5e38\u7528\u7684\u4e92\u52d5\u5f0f\u4ecb\u9762\u5354\u52a9\u5404\u7a2e\u7a0b\u5f0f\u78bc\u7684\u958b\u767c\u6211\u5011\u5728\u4e0a\u4e00\u7bc7\u300e\u5efa\u7acb\u81ea\u5df1\u7684 Jupyter Notebook \u4f3a\u670d\u5668\u300f\u6709\u7a0d\u5fae\u4ecb\u7d39\u904e\uff0c\u4e00\u822c\u5e38\u898b\u7684\u4f7f\u7528\u5834\u666f\u662f\u5728\u958b\u767c python \u7684\u7a0b\u5f0f\uff0c\u4f46\u662f Jupyter Server \u7684 Kernel \u529f\u80fd\u53ef\u4ee5\u64f4\u5145\u66f4\u591a\u7684\u4e92\u52d5\u5f0f\u958b\u767c\u74b0\u5883\uff0c\u4f8b\u5982 R, PySpark, SparkR, SparklyR \u7b49\u7b49\uff0c\u6ab8\u6aac\u7238\u6700\u65e9\u63a5\u89f8\u7684\u662f\u5c07 PySpark \u8a3b\u518a\u5230 Jupyter Lab \u88e1\u9762\uff0c\u5be6\u4f5c\u7684\u7a0b\u5f0f\u78bc\u662f\u900f\u904e AZTK \u7684 Repository \u5b78\u7fd2\u5230\u7684\uff0c\u5f8c\u4f86\u9032\u4e00\u6b65\u5c07\u5176\u64f4\u5145\u5230 R \u7b49\u7b49\u7684\u4f7f\u7528\u5834\u666f\uff0c\u672c\u7bc7\u5c07\u6703\u5448\u73fe\u5982\u4f55\u90e8\u7f72\u4e00\u500b\u6709 PySpark \u6838\u5fc3\u7684 Jupyter Lab\u3002<\/p>\n","protected":false},"author":1,"featured_media":2637,"comment_status":"open","ping_status":"open","sticky":false,"template":"","format":"standard","meta":{"footnotes":""},"categories":[9],"tags":[1844,1843,1842],"class_list":["post-9922","post","type-post","status-publish","format-standard","has-post-thumbnail","hentry","category-bigdata-ml","tag-jupyter-lab","tag-kernel","tag-pyspark"],"yoast_head":"<!-- This site is optimized with the Yoast SEO plugin v24.6 - https:\/\/yoast.com\/wordpress\/plugins\/seo\/ -->\n<title>[BigData] PySpark on Jupyter Lab - \u60f3\u65b9\u6d89\u6cd5 - \u91cf\u74f6\u5916\u7684\u5929\u7a7a M-Y-Oceane<\/title>\n<meta name=\"robots\" content=\"index, follow, max-snippet:-1, max-image-preview:large, max-video-preview:-1\" \/>\n<link rel=\"canonical\" href=\"https:\/\/myoceane.fr\/index.php\/bigdata-pyspark-on-jupyter-lab\/\" \/>\n<meta property=\"og:locale\" content=\"en_US\" \/>\n<meta property=\"og:type\" content=\"article\" \/>\n<meta property=\"og:title\" content=\"[BigData] PySpark on Jupyter Lab - \u60f3\u65b9\u6d89\u6cd5 - \u91cf\u74f6\u5916\u7684\u5929\u7a7a M-Y-Oceane\" \/>\n<meta property=\"og:description\" content=\"Jupyter Notebook\/Lab \u662f\u4e00\u500b\u5e38\u7528\u7684\u4e92\u52d5\u5f0f\u4ecb\u9762\u5354\u52a9\u5404\u7a2e\u7a0b\u5f0f\u78bc\u7684\u958b\u767c\u6211\u5011\u5728\u4e0a\u4e00\u7bc7\u300e\u5efa\u7acb\u81ea\u5df1\u7684 Jupyter Notebook \u4f3a\u670d\u5668\u300f\u6709\u7a0d\u5fae\u4ecb\u7d39\u904e\uff0c\u4e00\u822c\u5e38\u898b\u7684\u4f7f\u7528\u5834\u666f\u662f\u5728\u958b\u767c python \u7684\u7a0b\u5f0f\uff0c\u4f46\u662f Jupyter Server \u7684 Kernel \u529f\u80fd\u53ef\u4ee5\u64f4\u5145\u66f4\u591a\u7684\u4e92\u52d5\u5f0f\u958b\u767c\u74b0\u5883\uff0c\u4f8b\u5982 R, PySpark, SparkR, SparklyR \u7b49\u7b49\uff0c\u6ab8\u6aac\u7238\u6700\u65e9\u63a5\u89f8\u7684\u662f\u5c07 PySpark \u8a3b\u518a\u5230 Jupyter Lab \u88e1\u9762\uff0c\u5be6\u4f5c\u7684\u7a0b\u5f0f\u78bc\u662f\u900f\u904e AZTK \u7684 Repository \u5b78\u7fd2\u5230\u7684\uff0c\u5f8c\u4f86\u9032\u4e00\u6b65\u5c07\u5176\u64f4\u5145\u5230 R \u7b49\u7b49\u7684\u4f7f\u7528\u5834\u666f\uff0c\u672c\u7bc7\u5c07\u6703\u5448\u73fe\u5982\u4f55\u90e8\u7f72\u4e00\u500b\u6709 PySpark \u6838\u5fc3\u7684 Jupyter Lab\u3002\" \/>\n<meta property=\"og:url\" content=\"https:\/\/myoceane.fr\/index.php\/bigdata-pyspark-on-jupyter-lab\/\" \/>\n<meta property=\"og:site_name\" content=\"\u60f3\u65b9\u6d89\u6cd5 - \u91cf\u74f6\u5916\u7684\u5929\u7a7a M-Y-Oceane\" \/>\n<meta property=\"article:published_time\" content=\"2025-01-26T03:42:08+00:00\" \/>\n<meta property=\"article:modified_time\" content=\"2025-01-26T03:46:22+00:00\" \/>\n<meta property=\"og:image\" content=\"https:\/\/myoceane.fr\/wp-content\/uploads\/2019\/06\/1_m87_Htb_9Pstq0UcvNJ49w.png\" \/>\n\t<meta property=\"og:image:width\" content=\"1600\" \/>\n\t<meta property=\"og:image:height\" content=\"795\" \/>\n\t<meta property=\"og:image:type\" content=\"image\/png\" \/>\n<meta name=\"author\" content=\"\u6ab8\u6aac\u7238\" \/>\n<meta name=\"twitter:card\" content=\"summary_large_image\" \/>\n<meta name=\"twitter:label1\" content=\"Written by\" \/>\n\t<meta name=\"twitter:data1\" content=\"\u6ab8\u6aac\u7238\" \/>\n\t<meta name=\"twitter:label2\" content=\"Est. reading time\" \/>\n\t<meta name=\"twitter:data2\" content=\"1 minute\" \/>\n<script type=\"application\/ld+json\" class=\"yoast-schema-graph\">{\"@context\":\"https:\/\/schema.org\",\"@graph\":[{\"@type\":\"Article\",\"@id\":\"https:\/\/myoceane.fr\/index.php\/bigdata-pyspark-on-jupyter-lab\/#article\",\"isPartOf\":{\"@id\":\"https:\/\/myoceane.fr\/index.php\/bigdata-pyspark-on-jupyter-lab\/\"},\"author\":{\"name\":\"\u6ab8\u6aac\u7238\",\"@id\":\"https:\/\/myoceane.fr\/#\/schema\/person\/4a4552fb8c27693083d465e12db7658b\"},\"headline\":\"[BigData] PySpark on Jupyter Lab\",\"datePublished\":\"2025-01-26T03:42:08+00:00\",\"dateModified\":\"2025-01-26T03:46:22+00:00\",\"mainEntityOfPage\":{\"@id\":\"https:\/\/myoceane.fr\/index.php\/bigdata-pyspark-on-jupyter-lab\/\"},\"wordCount\":81,\"commentCount\":0,\"publisher\":{\"@id\":\"https:\/\/myoceane.fr\/#\/schema\/person\/4a4552fb8c27693083d465e12db7658b\"},\"image\":{\"@id\":\"https:\/\/myoceane.fr\/index.php\/bigdata-pyspark-on-jupyter-lab\/#primaryimage\"},\"thumbnailUrl\":\"https:\/\/myoceane.fr\/wp-content\/uploads\/2019\/06\/1_m87_Htb_9Pstq0UcvNJ49w.png\",\"keywords\":[\"Jupyter Lab\",\"Kernel\",\"PySpark\"],\"articleSection\":[\"Big Data &amp; Machine Learning\"],\"inLanguage\":\"en-US\",\"potentialAction\":[{\"@type\":\"CommentAction\",\"name\":\"Comment\",\"target\":[\"https:\/\/myoceane.fr\/index.php\/bigdata-pyspark-on-jupyter-lab\/#respond\"]}]},{\"@type\":\"WebPage\",\"@id\":\"https:\/\/myoceane.fr\/index.php\/bigdata-pyspark-on-jupyter-lab\/\",\"url\":\"https:\/\/myoceane.fr\/index.php\/bigdata-pyspark-on-jupyter-lab\/\",\"name\":\"[BigData] PySpark on Jupyter Lab - \u60f3\u65b9\u6d89\u6cd5 - \u91cf\u74f6\u5916\u7684\u5929\u7a7a M-Y-Oceane\",\"isPartOf\":{\"@id\":\"https:\/\/myoceane.fr\/#website\"},\"primaryImageOfPage\":{\"@id\":\"https:\/\/myoceane.fr\/index.php\/bigdata-pyspark-on-jupyter-lab\/#primaryimage\"},\"image\":{\"@id\":\"https:\/\/myoceane.fr\/index.php\/bigdata-pyspark-on-jupyter-lab\/#primaryimage\"},\"thumbnailUrl\":\"https:\/\/myoceane.fr\/wp-content\/uploads\/2019\/06\/1_m87_Htb_9Pstq0UcvNJ49w.png\",\"datePublished\":\"2025-01-26T03:42:08+00:00\",\"dateModified\":\"2025-01-26T03:46:22+00:00\",\"breadcrumb\":{\"@id\":\"https:\/\/myoceane.fr\/index.php\/bigdata-pyspark-on-jupyter-lab\/#breadcrumb\"},\"inLanguage\":\"en-US\",\"potentialAction\":[{\"@type\":\"ReadAction\",\"target\":[\"https:\/\/myoceane.fr\/index.php\/bigdata-pyspark-on-jupyter-lab\/\"]}]},{\"@type\":\"ImageObject\",\"inLanguage\":\"en-US\",\"@id\":\"https:\/\/myoceane.fr\/index.php\/bigdata-pyspark-on-jupyter-lab\/#primaryimage\",\"url\":\"https:\/\/myoceane.fr\/wp-content\/uploads\/2019\/06\/1_m87_Htb_9Pstq0UcvNJ49w.png\",\"contentUrl\":\"https:\/\/myoceane.fr\/wp-content\/uploads\/2019\/06\/1_m87_Htb_9Pstq0UcvNJ49w.png\",\"width\":1600,\"height\":795},{\"@type\":\"BreadcrumbList\",\"@id\":\"https:\/\/myoceane.fr\/index.php\/bigdata-pyspark-on-jupyter-lab\/#breadcrumb\",\"itemListElement\":[{\"@type\":\"ListItem\",\"position\":1,\"name\":\"Home\",\"item\":\"https:\/\/myoceane.fr\/\"},{\"@type\":\"ListItem\",\"position\":2,\"name\":\"[BigData] PySpark on Jupyter Lab\"}]},{\"@type\":\"WebSite\",\"@id\":\"https:\/\/myoceane.fr\/#website\",\"url\":\"https:\/\/myoceane.fr\/\",\"name\":\"M-Y-Oceane \u60f3\u65b9\u6d89\u6cd5\u3002\u91cf\u74f6\u5916\u7684\u5929\u7a7a\",\"description\":\"\u60f3\u65b9\u6d89\u6cd5, France, Taiwan, Health, Information Technology\",\"publisher\":{\"@id\":\"https:\/\/myoceane.fr\/#\/schema\/person\/4a4552fb8c27693083d465e12db7658b\"},\"potentialAction\":[{\"@type\":\"SearchAction\",\"target\":{\"@type\":\"EntryPoint\",\"urlTemplate\":\"https:\/\/myoceane.fr\/?s={search_term_string}\"},\"query-input\":{\"@type\":\"PropertyValueSpecification\",\"valueRequired\":true,\"valueName\":\"search_term_string\"}}],\"inLanguage\":\"en-US\"},{\"@type\":[\"Person\",\"Organization\"],\"@id\":\"https:\/\/myoceane.fr\/#\/schema\/person\/4a4552fb8c27693083d465e12db7658b\",\"name\":\"\u6ab8\u6aac\u7238\",\"image\":{\"@type\":\"ImageObject\",\"inLanguage\":\"en-US\",\"@id\":\"https:\/\/myoceane.fr\/#\/schema\/person\/image\/\",\"url\":\"https:\/\/secure.gravatar.com\/avatar\/6cc678684664f8ad45a8d56a6630b183?s=96&d=mm&r=g\",\"contentUrl\":\"https:\/\/secure.gravatar.com\/avatar\/6cc678684664f8ad45a8d56a6630b183?s=96&d=mm&r=g\",\"caption\":\"\u6ab8\u6aac\u7238\"},\"logo\":{\"@id\":\"https:\/\/myoceane.fr\/#\/schema\/person\/image\/\"},\"url\":\"https:\/\/myoceane.fr\/index.php\/author\/johnny5584767gmail-com\/\"}]}<\/script>\n<!-- \/ Yoast SEO plugin. -->","yoast_head_json":{"title":"[BigData] PySpark on Jupyter Lab - \u60f3\u65b9\u6d89\u6cd5 - \u91cf\u74f6\u5916\u7684\u5929\u7a7a M-Y-Oceane","robots":{"index":"index","follow":"follow","max-snippet":"max-snippet:-1","max-image-preview":"max-image-preview:large","max-video-preview":"max-video-preview:-1"},"canonical":"https:\/\/myoceane.fr\/index.php\/bigdata-pyspark-on-jupyter-lab\/","og_locale":"en_US","og_type":"article","og_title":"[BigData] PySpark on Jupyter Lab - \u60f3\u65b9\u6d89\u6cd5 - \u91cf\u74f6\u5916\u7684\u5929\u7a7a M-Y-Oceane","og_description":"Jupyter Notebook\/Lab \u662f\u4e00\u500b\u5e38\u7528\u7684\u4e92\u52d5\u5f0f\u4ecb\u9762\u5354\u52a9\u5404\u7a2e\u7a0b\u5f0f\u78bc\u7684\u958b\u767c\u6211\u5011\u5728\u4e0a\u4e00\u7bc7\u300e\u5efa\u7acb\u81ea\u5df1\u7684 Jupyter Notebook \u4f3a\u670d\u5668\u300f\u6709\u7a0d\u5fae\u4ecb\u7d39\u904e\uff0c\u4e00\u822c\u5e38\u898b\u7684\u4f7f\u7528\u5834\u666f\u662f\u5728\u958b\u767c python \u7684\u7a0b\u5f0f\uff0c\u4f46\u662f Jupyter Server \u7684 Kernel \u529f\u80fd\u53ef\u4ee5\u64f4\u5145\u66f4\u591a\u7684\u4e92\u52d5\u5f0f\u958b\u767c\u74b0\u5883\uff0c\u4f8b\u5982 R, PySpark, SparkR, SparklyR \u7b49\u7b49\uff0c\u6ab8\u6aac\u7238\u6700\u65e9\u63a5\u89f8\u7684\u662f\u5c07 PySpark \u8a3b\u518a\u5230 Jupyter Lab \u88e1\u9762\uff0c\u5be6\u4f5c\u7684\u7a0b\u5f0f\u78bc\u662f\u900f\u904e AZTK \u7684 Repository \u5b78\u7fd2\u5230\u7684\uff0c\u5f8c\u4f86\u9032\u4e00\u6b65\u5c07\u5176\u64f4\u5145\u5230 R \u7b49\u7b49\u7684\u4f7f\u7528\u5834\u666f\uff0c\u672c\u7bc7\u5c07\u6703\u5448\u73fe\u5982\u4f55\u90e8\u7f72\u4e00\u500b\u6709 PySpark \u6838\u5fc3\u7684 Jupyter Lab\u3002","og_url":"https:\/\/myoceane.fr\/index.php\/bigdata-pyspark-on-jupyter-lab\/","og_site_name":"\u60f3\u65b9\u6d89\u6cd5 - \u91cf\u74f6\u5916\u7684\u5929\u7a7a M-Y-Oceane","article_published_time":"2025-01-26T03:42:08+00:00","article_modified_time":"2025-01-26T03:46:22+00:00","og_image":[{"width":1600,"height":795,"url":"https:\/\/myoceane.fr\/wp-content\/uploads\/2019\/06\/1_m87_Htb_9Pstq0UcvNJ49w.png","type":"image\/png"}],"author":"\u6ab8\u6aac\u7238","twitter_card":"summary_large_image","twitter_misc":{"Written by":"\u6ab8\u6aac\u7238","Est. reading time":"1 minute"},"schema":{"@context":"https:\/\/schema.org","@graph":[{"@type":"Article","@id":"https:\/\/myoceane.fr\/index.php\/bigdata-pyspark-on-jupyter-lab\/#article","isPartOf":{"@id":"https:\/\/myoceane.fr\/index.php\/bigdata-pyspark-on-jupyter-lab\/"},"author":{"name":"\u6ab8\u6aac\u7238","@id":"https:\/\/myoceane.fr\/#\/schema\/person\/4a4552fb8c27693083d465e12db7658b"},"headline":"[BigData] PySpark on Jupyter Lab","datePublished":"2025-01-26T03:42:08+00:00","dateModified":"2025-01-26T03:46:22+00:00","mainEntityOfPage":{"@id":"https:\/\/myoceane.fr\/index.php\/bigdata-pyspark-on-jupyter-lab\/"},"wordCount":81,"commentCount":0,"publisher":{"@id":"https:\/\/myoceane.fr\/#\/schema\/person\/4a4552fb8c27693083d465e12db7658b"},"image":{"@id":"https:\/\/myoceane.fr\/index.php\/bigdata-pyspark-on-jupyter-lab\/#primaryimage"},"thumbnailUrl":"https:\/\/myoceane.fr\/wp-content\/uploads\/2019\/06\/1_m87_Htb_9Pstq0UcvNJ49w.png","keywords":["Jupyter Lab","Kernel","PySpark"],"articleSection":["Big Data &amp; Machine Learning"],"inLanguage":"en-US","potentialAction":[{"@type":"CommentAction","name":"Comment","target":["https:\/\/myoceane.fr\/index.php\/bigdata-pyspark-on-jupyter-lab\/#respond"]}]},{"@type":"WebPage","@id":"https:\/\/myoceane.fr\/index.php\/bigdata-pyspark-on-jupyter-lab\/","url":"https:\/\/myoceane.fr\/index.php\/bigdata-pyspark-on-jupyter-lab\/","name":"[BigData] PySpark on Jupyter Lab - \u60f3\u65b9\u6d89\u6cd5 - \u91cf\u74f6\u5916\u7684\u5929\u7a7a M-Y-Oceane","isPartOf":{"@id":"https:\/\/myoceane.fr\/#website"},"primaryImageOfPage":{"@id":"https:\/\/myoceane.fr\/index.php\/bigdata-pyspark-on-jupyter-lab\/#primaryimage"},"image":{"@id":"https:\/\/myoceane.fr\/index.php\/bigdata-pyspark-on-jupyter-lab\/#primaryimage"},"thumbnailUrl":"https:\/\/myoceane.fr\/wp-content\/uploads\/2019\/06\/1_m87_Htb_9Pstq0UcvNJ49w.png","datePublished":"2025-01-26T03:42:08+00:00","dateModified":"2025-01-26T03:46:22+00:00","breadcrumb":{"@id":"https:\/\/myoceane.fr\/index.php\/bigdata-pyspark-on-jupyter-lab\/#breadcrumb"},"inLanguage":"en-US","potentialAction":[{"@type":"ReadAction","target":["https:\/\/myoceane.fr\/index.php\/bigdata-pyspark-on-jupyter-lab\/"]}]},{"@type":"ImageObject","inLanguage":"en-US","@id":"https:\/\/myoceane.fr\/index.php\/bigdata-pyspark-on-jupyter-lab\/#primaryimage","url":"https:\/\/myoceane.fr\/wp-content\/uploads\/2019\/06\/1_m87_Htb_9Pstq0UcvNJ49w.png","contentUrl":"https:\/\/myoceane.fr\/wp-content\/uploads\/2019\/06\/1_m87_Htb_9Pstq0UcvNJ49w.png","width":1600,"height":795},{"@type":"BreadcrumbList","@id":"https:\/\/myoceane.fr\/index.php\/bigdata-pyspark-on-jupyter-lab\/#breadcrumb","itemListElement":[{"@type":"ListItem","position":1,"name":"Home","item":"https:\/\/myoceane.fr\/"},{"@type":"ListItem","position":2,"name":"[BigData] PySpark on Jupyter Lab"}]},{"@type":"WebSite","@id":"https:\/\/myoceane.fr\/#website","url":"https:\/\/myoceane.fr\/","name":"M-Y-Oceane \u60f3\u65b9\u6d89\u6cd5\u3002\u91cf\u74f6\u5916\u7684\u5929\u7a7a","description":"\u60f3\u65b9\u6d89\u6cd5, France, Taiwan, Health, Information Technology","publisher":{"@id":"https:\/\/myoceane.fr\/#\/schema\/person\/4a4552fb8c27693083d465e12db7658b"},"potentialAction":[{"@type":"SearchAction","target":{"@type":"EntryPoint","urlTemplate":"https:\/\/myoceane.fr\/?s={search_term_string}"},"query-input":{"@type":"PropertyValueSpecification","valueRequired":true,"valueName":"search_term_string"}}],"inLanguage":"en-US"},{"@type":["Person","Organization"],"@id":"https:\/\/myoceane.fr\/#\/schema\/person\/4a4552fb8c27693083d465e12db7658b","name":"\u6ab8\u6aac\u7238","image":{"@type":"ImageObject","inLanguage":"en-US","@id":"https:\/\/myoceane.fr\/#\/schema\/person\/image\/","url":"https:\/\/secure.gravatar.com\/avatar\/6cc678684664f8ad45a8d56a6630b183?s=96&d=mm&r=g","contentUrl":"https:\/\/secure.gravatar.com\/avatar\/6cc678684664f8ad45a8d56a6630b183?s=96&d=mm&r=g","caption":"\u6ab8\u6aac\u7238"},"logo":{"@id":"https:\/\/myoceane.fr\/#\/schema\/person\/image\/"},"url":"https:\/\/myoceane.fr\/index.php\/author\/johnny5584767gmail-com\/"}]}},"amp_enabled":true,"_links":{"self":[{"href":"https:\/\/myoceane.fr\/index.php\/wp-json\/wp\/v2\/posts\/9922","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/myoceane.fr\/index.php\/wp-json\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/myoceane.fr\/index.php\/wp-json\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/myoceane.fr\/index.php\/wp-json\/wp\/v2\/users\/1"}],"replies":[{"embeddable":true,"href":"https:\/\/myoceane.fr\/index.php\/wp-json\/wp\/v2\/comments?post=9922"}],"version-history":[{"count":15,"href":"https:\/\/myoceane.fr\/index.php\/wp-json\/wp\/v2\/posts\/9922\/revisions"}],"predecessor-version":[{"id":9937,"href":"https:\/\/myoceane.fr\/index.php\/wp-json\/wp\/v2\/posts\/9922\/revisions\/9937"}],"wp:featuredmedia":[{"embeddable":true,"href":"https:\/\/myoceane.fr\/index.php\/wp-json\/wp\/v2\/media\/2637"}],"wp:attachment":[{"href":"https:\/\/myoceane.fr\/index.php\/wp-json\/wp\/v2\/media?parent=9922"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/myoceane.fr\/index.php\/wp-json\/wp\/v2\/categories?post=9922"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/myoceane.fr\/index.php\/wp-json\/wp\/v2\/tags?post=9922"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}