blob: 878b6d2ef7feb45ef82941c1e42d20deaa7e86a9 [file] [log] [blame]
{
"paragraphs": [
{
"text": "%md\n## Welcome to Zeppelin.\n##### This is a live tutorial, you can run the code yourself. (Shift-Enter to Run)",
"user": "anonymous",
"dateUpdated": "2021-07-26 04:36:10.172",
"progress": 0,
"config": {
"colWidth": 12.0,
"editorHide": true,
"results": [
{
"graph": {
"mode": "table",
"height": 300.0,
"optionOpen": false,
"keys": [],
"values": [],
"groups": [],
"scatter": {}
}
}
],
"enabled": true,
"editorSetting": {
"language": "markdown",
"editOnDblClick": true
},
"editorMode": "ace/mode/markdown",
"tableHide": false,
"fontSize": 9.0
},
"settings": {
"params": {},
"forms": {}
},
"results": {
"code": "SUCCESS",
"msg": [
{
"type": "HTML",
"data": "\u003cdiv class\u003d\"markdown-body\"\u003e\n\u003ch2\u003eWelcome to Zeppelin.\u003c/h2\u003e\n\u003ch5\u003eThis is a live tutorial, you can run the code yourself. (Shift-Enter to Run)\u003c/h5\u003e\n\n\u003c/div\u003e"
}
]
},
"apps": [],
"runtimeInfos": {},
"progressUpdateIntervalMs": 500,
"jobName": "paragraph_1423836981412_-1007008116",
"id": "20150213-231621_168813393",
"dateCreated": "2015-02-13 23:16:21.000",
"dateStarted": "2021-07-26 04:36:10.174",
"dateFinished": "2021-07-26 04:36:10.184",
"status": "FINISHED"
},
{
"title": "Load data into table",
"text": "import org.apache.commons.io.IOUtils\nimport java.net.URL\nimport java.nio.charset.Charset\n\n// Zeppelin creates and injects sc (SparkContext) and sqlContext (HiveContext or SqlContext)\n// So you don\u0027t need create them manually\n\n// load bank data\nval bankText \u003d sc.parallelize(\n IOUtils.toString(\n new URL(\"https://s3.amazonaws.com/apache-zeppelin/tutorial/bank/bank.csv\"),\n Charset.forName(\"utf8\")).split(\"\\n\"))\n\ncase class Bank(age: Integer, job: String, marital: String, education: String, balance: Integer)\n\nval bank \u003d bankText.map(s \u003d\u003e s.split(\";\")).filter(s \u003d\u003e s(0) !\u003d \"\\\"age\\\"\").map(\n s \u003d\u003e Bank(s(0).toInt, \n s(1).replaceAll(\"\\\"\", \"\"),\n s(2).replaceAll(\"\\\"\", \"\"),\n s(3).replaceAll(\"\\\"\", \"\"),\n s(5).replaceAll(\"\\\"\", \"\").toInt\n )\n).toDF()\nbank.registerTempTable(\"bank\")",
"user": "anonymous",
"dateUpdated": "2021-07-26 04:36:10.274",
"progress": 0,
"config": {
"colWidth": 12.0,
"title": true,
"enabled": true,
"editorMode": "ace/mode/scala",
"results": [
{
"graph": {
"mode": "table",
"height": 300.0,
"optionOpen": false
}
}
],
"editorSetting": {
"language": "scala",
"editOnDblClick": false,
"completionKey": "TAB",
"completionSupport": true
},
"fontSize": 9.0
},
"settings": {
"params": {},
"forms": {}
},
"results": {
"code": "SUCCESS",
"msg": [
{
"type": "TEXT",
"data": "\u001b[33mwarning: \u001b[0mthere was one deprecation warning (since 2.0.0); for details, enable `:setting -deprecation\u0027 or `:replay -deprecation\u0027\nimport sqlContext.implicits._\nimport org.apache.commons.io.IOUtils\nimport java.net.URL\nimport java.nio.charset.Charset\n\u001b[1m\u001b[34mbankText\u001b[0m: \u001b[1m\u001b[32morg.apache.spark.rdd.RDD[String]\u001b[0m \u003d ParallelCollectionRDD[505] at parallelize at \u003cconsole\u003e:32\ndefined class Bank\n\u001b[1m\u001b[34mbank\u001b[0m: \u001b[1m\u001b[32morg.apache.spark.sql.DataFrame\u001b[0m \u003d [age: int, job: string ... 3 more fields]\n"
}
]
},
"apps": [],
"runtimeInfos": {},
"progressUpdateIntervalMs": 500,
"jobName": "paragraph_1423500779206_-1502780787",
"id": "20150210-015259_1403135953",
"dateCreated": "2015-02-10 01:52:59.000",
"dateStarted": "2021-07-26 04:36:10.276",
"dateFinished": "2021-07-26 04:36:13.186",
"status": "FINISHED"
},
{
"text": "%sql \nselect age, count(1) value\nfrom bank \nwhere age \u003c 30 \ngroup by age \norder by age",
"user": "anonymous",
"dateUpdated": "2021-07-26 04:36:13.281",
"progress": 15,
"config": {
"colWidth": 4.0,
"results": [
{
"graph": {
"mode": "multiBarChart",
"height": 366.0,
"optionOpen": false,
"setting": {
"multiBarChart": {
"rotate": {
"degree": "-45"
},
"xLabelStatus": "default"
}
},
"commonSetting": {},
"keys": [
{
"name": "age",
"index": 0.0,
"aggr": "sum"
}
],
"groups": [],
"values": [
{
"name": "value",
"index": 1.0,
"aggr": "sum"
}
]
},
"helium": {}
}
],
"enabled": true,
"editorSetting": {
"language": "sql",
"editOnDblClick": false,
"completionKey": "TAB",
"completionSupport": true
},
"editorMode": "ace/mode/sql",
"fontSize": 9.0
},
"settings": {
"params": {},
"forms": {}
},
"results": {
"code": "SUCCESS",
"msg": [
{
"type": "TABLE",
"data": "age\tvalue\n19\t4\n20\t3\n21\t7\n22\t9\n23\t20\n24\t24\n25\t44\n26\t77\n27\t94\n28\t103\n29\t97\n"
}
]
},
"apps": [],
"runtimeInfos": {
"jobUrl": {
"propertyName": "jobUrl",
"label": "SPARK JOB",
"tooltip": "View in Spark web UI",
"group": "spark",
"values": [
{
"jobUrl": "http://3745c7ed824d:4040/jobs/job?id\u003d210"
}
],
"interpreterSettingId": "spark"
}
},
"progressUpdateIntervalMs": 500,
"jobName": "paragraph_1423500782552_-1439281894",
"id": "20150210-015302_1492795503",
"dateCreated": "2015-02-10 01:53:02.000",
"dateStarted": "2021-07-26 04:36:13.283",
"dateFinished": "2021-07-26 04:36:14.677",
"status": "FINISHED"
},
{
"text": "%sql \nselect age, count(1) value \nfrom bank \nwhere age \u003c ${maxAge\u003d30} \ngroup by age \norder by age",
"user": "anonymous",
"dateUpdated": "2021-07-26 04:36:14.692",
"progress": 58,
"config": {
"colWidth": 4.0,
"results": [
{
"graph": {
"mode": "multiBarChart",
"height": 294.0,
"optionOpen": false,
"setting": {
"multiBarChart": {
"rotate": {
"degree": "-45"
},
"xLabelStatus": "default"
}
},
"commonSetting": {},
"keys": [
{
"name": "age",
"index": 0.0,
"aggr": "sum"
}
],
"groups": [],
"values": [
{
"name": "value",
"index": 1.0,
"aggr": "sum"
}
]
},
"helium": {}
}
],
"enabled": true,
"editorSetting": {
"language": "sql",
"editOnDblClick": false,
"completionKey": "TAB",
"completionSupport": true
},
"editorMode": "ace/mode/sql",
"fontSize": 9.0
},
"settings": {
"params": {
"maxAge": "35"
},
"forms": {
"maxAge": {
"type": "TextBox",
"name": "maxAge",
"displayName": "maxAge",
"defaultValue": "30",
"hidden": false
}
}
},
"results": {
"code": "SUCCESS",
"msg": [
{
"type": "TABLE",
"data": "age\tvalue\n19\t4\n20\t3\n21\t7\n22\t9\n23\t20\n24\t24\n25\t44\n26\t77\n27\t94\n28\t103\n29\t97\n30\t150\n31\t199\n32\t224\n33\t186\n34\t231\n"
}
]
},
"apps": [],
"runtimeInfos": {
"jobUrl": {
"propertyName": "jobUrl",
"label": "SPARK JOB",
"tooltip": "View in Spark web UI",
"group": "spark",
"values": [
{
"jobUrl": "http://3745c7ed824d:4040/jobs/job?id\u003d211"
}
],
"interpreterSettingId": "spark"
}
},
"progressUpdateIntervalMs": 500,
"jobName": "paragraph_1423720444030_-1424110477",
"id": "20150212-145404_867439529",
"dateCreated": "2015-02-12 14:54:04.000",
"dateStarted": "2021-07-26 04:36:14.700",
"dateFinished": "2021-07-26 04:36:15.404",
"status": "FINISHED"
},
{
"text": "%sql \nselect age, count(1) value \nfrom bank \nwhere marital\u003d\"${marital\u003dsingle,single|divorced|married}\" \ngroup by age \norder by age",
"user": "anonymous",
"dateUpdated": "2021-07-26 04:36:15.497",
"progress": 51,
"config": {
"colWidth": 4.0,
"results": [
{
"graph": {
"mode": "stackedAreaChart",
"height": 280.0,
"optionOpen": false,
"setting": {
"stackedAreaChart": {
"rotate": {
"degree": "-45"
},
"xLabelStatus": "default"
}
},
"commonSetting": {},
"keys": [
{
"name": "age",
"index": 0.0,
"aggr": "sum"
}
],
"groups": [],
"values": [
{
"name": "value",
"index": 1.0,
"aggr": "sum"
}
]
},
"helium": {}
}
],
"enabled": true,
"editorSetting": {
"language": "sql",
"editOnDblClick": false,
"completionKey": "TAB",
"completionSupport": true
},
"editorMode": "ace/mode/sql",
"fontSize": 9.0,
"runOnSelectionChange": true
},
"settings": {
"params": {
"marital": "single"
},
"forms": {
"marital": {
"type": "Select",
"options": [
{
"value": "single"
},
{
"value": "divorced"
},
{
"value": "married"
}
],
"name": "marital",
"displayName": "marital",
"defaultValue": "single",
"hidden": false
}
}
},
"results": {
"code": "SUCCESS",
"msg": [
{
"type": "TABLE",
"data": "age\tvalue\n19\t4\n20\t3\n21\t7\n22\t9\n23\t17\n24\t13\n25\t33\n26\t56\n27\t64\n28\t78\n29\t56\n30\t92\n31\t86\n32\t105\n33\t61\n34\t75\n35\t46\n36\t50\n37\t43\n38\t44\n39\t30\n40\t25\n41\t19\n42\t23\n43\t21\n44\t20\n45\t15\n46\t14\n47\t12\n48\t12\n49\t11\n50\t8\n51\t6\n52\t9\n53\t4\n55\t3\n56\t3\n57\t2\n58\t7\n59\t2\n60\t5\n66\t2\n69\t1\n"
}
]
},
"apps": [],
"runtimeInfos": {
"jobUrl": {
"propertyName": "jobUrl",
"label": "SPARK JOB",
"tooltip": "View in Spark web UI",
"group": "spark",
"values": [
{
"jobUrl": "http://3745c7ed824d:4040/jobs/job?id\u003d212"
}
],
"interpreterSettingId": "spark"
}
},
"progressUpdateIntervalMs": 500,
"jobName": "paragraph_1423836262027_-210588283",
"id": "20150213-230422_1600658137",
"dateCreated": "2015-02-13 23:04:22.000",
"dateStarted": "2021-07-26 04:36:15.502",
"dateFinished": "2021-07-26 04:36:16.265",
"status": "FINISHED"
},
{
"text": "%md\n## Congratulations, it\u0027s done.\n##### You can create your own notebook in \u0027Notebook\u0027 menu. Good luck!",
"user": "anonymous",
"dateUpdated": "2021-07-26 04:36:16.300",
"progress": 0,
"config": {
"colWidth": 12.0,
"editorHide": true,
"results": [
{
"graph": {
"mode": "table",
"height": 300.0,
"optionOpen": false
}
}
],
"enabled": true,
"editorSetting": {
"language": "markdown",
"editOnDblClick": true
},
"editorMode": "ace/mode/markdown",
"tableHide": false,
"fontSize": 9.0
},
"settings": {
"params": {},
"forms": {}
},
"results": {
"code": "SUCCESS",
"msg": [
{
"type": "HTML",
"data": "\u003cdiv class\u003d\"markdown-body\"\u003e\n\u003ch2\u003eCongratulations, it\u0026rsquo;s done.\u003c/h2\u003e\n\u003ch5\u003eYou can create your own notebook in \u0026lsquo;Notebook\u0026rsquo; menu. Good luck!\u003c/h5\u003e\n\n\u003c/div\u003e"
}
]
},
"apps": [],
"runtimeInfos": {},
"progressUpdateIntervalMs": 500,
"jobName": "paragraph_1423836268492_216498320",
"id": "20150213-230428_1231780373",
"dateCreated": "2015-02-13 23:04:28.000",
"dateStarted": "2021-07-26 04:36:16.302",
"dateFinished": "2021-07-26 04:36:16.308",
"status": "FINISHED"
},
{
"text": "%md\n\nAbout bank data\n\n```\nCitation Request:\n This dataset is public available for research. The details are described in [Moro et al., 2011]. \n Please include this citation if you plan to use this database:\n\n [Moro et al., 2011] S. Moro, R. Laureano and P. Cortez. Using Data Mining for Bank Direct Marketing: An Application of the CRISP-DM Methodology. \n In P. Novais et al. (Eds.), Proceedings of the European Simulation and Modelling Conference - ESM\u00272011, pp. 117-121, GuimarĂ£es, Portugal, October, 2011. EUROSIS.\n\n Available at: [pdf] http://hdl.handle.net/1822/14838\n [bib] http://www3.dsi.uminho.pt/pcortez/bib/2011-esm-1.txt\n```",
"user": "anonymous",
"dateUpdated": "2021-07-26 04:36:16.402",
"progress": 0,
"config": {
"colWidth": 12.0,
"editorHide": true,
"results": [
{
"graph": {
"mode": "table",
"height": 300.0,
"optionOpen": false
}
}
],
"enabled": true,
"editorSetting": {
"language": "markdown",
"editOnDblClick": true
},
"editorMode": "ace/mode/markdown",
"tableHide": false,
"fontSize": 9.0
},
"settings": {
"params": {},
"forms": {}
},
"results": {
"code": "SUCCESS",
"msg": [
{
"type": "HTML",
"data": "\u003cdiv class\u003d\"markdown-body\"\u003e\n\u003cp\u003eAbout bank data\u003c/p\u003e\n\u003cpre\u003e\u003ccode\u003eCitation Request:\n This dataset is public available for research. The details are described in [Moro et al., 2011]. \n Please include this citation if you plan to use this database:\n\n [Moro et al., 2011] S. Moro, R. Laureano and P. Cortez. Using Data Mining for Bank Direct Marketing: An Application of the CRISP-DM Methodology. \n In P. Novais et al. (Eds.), Proceedings of the European Simulation and Modelling Conference - ESM\u00272011, pp. 117-121, GuimarĂ£es, Portugal, October, 2011. EUROSIS.\n\n Available at: [pdf] http://hdl.handle.net/1822/14838\n [bib] http://www3.dsi.uminho.pt/pcortez/bib/2011-esm-1.txt\n\u003c/code\u003e\u003c/pre\u003e\n\n\u003c/div\u003e"
}
]
},
"apps": [],
"runtimeInfos": {},
"progressUpdateIntervalMs": 500,
"jobName": "paragraph_1427420818407_872443482",
"id": "20150326-214658_12335843",
"dateCreated": "2015-03-26 21:46:58.000",
"dateStarted": "2021-07-26 04:36:16.404",
"dateFinished": "2021-07-26 04:36:16.413",
"status": "FINISHED"
},
{
"user": "anonymous",
"dateUpdated": "2021-07-26 04:36:16.504",
"progress": 0,
"config": {
"colWidth": 12.0,
"fontSize": 9.0,
"enabled": true,
"results": {},
"editorSetting": {
"language": "scala",
"editOnDblClick": false,
"completionKey": "TAB",
"completionSupport": true
},
"editorMode": "ace/mode/scala"
},
"settings": {
"params": {},
"forms": {}
},
"apps": [],
"runtimeInfos": {},
"progressUpdateIntervalMs": 500,
"jobName": "paragraph_1435955447812_-158639899",
"id": "20150703-133047_853701097",
"dateCreated": "2015-07-03 13:30:47.000",
"status": "FINISHED"
}
],
"name": "2. Spark Basic Features",
"id": "2A94M5J1Z",
"defaultInterpreterGroup": "spark",
"noteParams": {},
"noteForms": {},
"angularObjects": {},
"config": {
"looknfeel": "default",
"isZeppelinNotebookCronEnable": false
},
"info": {
"isRunning": true
}
}