{"paragraphs":[{"text":"%spark.pyspark\n","user":"walker","dateUpdated":"2019-10-12T05:15:04+0000","config":{"colWidth":12,"fontSize":9,"enabled":true,"results":{},"editorSetting":{"language":"python","editOnDblClick":false,"completionSupport":true},"editorMode":"ace/mode/python"},"settings":{"params":{},"forms":{}},"apps":[],"jobName":"paragraph_1570857304400_640746049","id":"20191012-051504_1791494737","dateCreated":"2019-10-12T05:15:04+0000","status":"READY","progressUpdateIntervalMs":500,"focus":true,"$$hashKey":"object:23686"},{"text":"%spark.pyspark\ndef isSick(x):\n    \"\"\"Return 0 when x is 3 or 7, otherwise 1.\"\"\"\n    return 0 if x in (3, 7) else 1","user":"walker","dateUpdated":"2019-10-12T05:13:57+0000","config":{"colWidth":12,"fontSize":9,"enabled":true,"results":{},"editorSetting":{"language":"python","editOnDblClick":false,"completionSupport":true,"completionKey":"TAB"},"editorMode":"ace/mode/python","editorHide":false},"settings":{"params":{},"forms":{}},"results":{"code":"SUCCESS","msg":[]},"apps":[],"jobName":"paragraph_1570785919759_-1457622604","id":"20191011-092519_94493470","dateCreated":"2019-10-11T09:25:19+0000","dateStarted":"2019-10-12T05:13:57+0000","dateFinished":"2019-10-12T05:13:57+0000","status":"FINISHED","progressUpdateIntervalMs":500,"$$hashKey":"object:23687"},{"text":"%spark.pyspark\n","user":"walker","dateUpdated":"2019-10-12T05:13:57+0000","config":{"colWidth":12,"fontSize":9,"enabled":true,"results":{},"editorSetting":{"language":"python","editOnDblClick":false,"completionSupport":true,"completionKey":"TAB"},"editorMode":"ace/mode/python"},"settings":{"params":{},"forms":{}},"apps":[],"jobName":"paragraph_1570857227530_1796867328","id":"20191012-051347_1396539575","dateCreated":"2019-10-12T05:13:47+0000","status":"FINISHED","progressUpdateIntervalMs":500,"$$hashKey":"object:23688"},{"text":"%spark.pyspark\n\nimport pandas as pd\nfrom pyspark.sql.types import StructType, StructField, NumericType\n\n \ncols = ('age', \n 'sex', \n 'chest pain', \n 'resting blood pressure', \n 'serum cholestoral', \n 'fasting blood sugar', \n 'resting electrocardiographic results', \n 'maximum heart rate achieved', \n 'exercise induced angina', \n 'ST depression induced by exercise relative to rest', \n 'the slope of the peak exercise ST segment', \n 'number of major vessels ', \n 'thal', \n 'last')\n \n\n \ndata = pd.read_csv('/home/ubuntu/Downloads/heart.csv', delimiter=' ', names=cols)\n\ndata = data.iloc[:,0:13]\n\n# NOTE(review): the label is derived from 'thal', and column 14 ('last') is dropped by the slice above; confirm this is the intended target.\ndata['isSick'] = data['thal'].apply(isSick)\n\ndf = spark.createDataFrame(data)\n\n \n \n \n\n ","user":"walker","dateUpdated":"2019-10-12T05:13:57+0000","config":{"colWidth":12,"fontSize":9,"enabled":true,"results":{},"editorSetting":{"language":"python","editOnDblClick":false,"completionSupport":true,"completionKey":"TAB"},"editorMode":"ace/mode/python","tableHide":false,"editorHide":false},"settings":{"params":{},"forms":{}},"results":{"code":"SUCCESS","msg":[]},"apps":[],"jobName":"paragraph_1570626673174_-397859394","id":"20191009-131113_1020772482","dateCreated":"2019-10-09T13:11:13+0000","dateStarted":"2019-10-12T05:13:57+0000","dateFinished":"2019-10-12T05:13:57+0000","status":"FINISHED","progressUpdateIntervalMs":500,"$$hashKey":"object:23689"},{"text":"%spark.pyspark\nfrom pyspark.ml.feature import StandardScaler\nfrom pyspark.ml.feature import VectorAssembler\n\nfeatures = ('age', \n 'sex', \n 'chest pain', \n 'resting blood pressure', \n 'serum cholestoral', \n 'fasting blood sugar', \n 'resting electrocardiographic results', \n 'maximum heart rate achieved', \n 'exercise induced angina', \n 'ST depression induced by exercise relative to rest', \n 'the slope of the peak exercise ST segment', \n 'number of major vessels ') \n\nassembler = VectorAssembler(inputCols=features,outputCol=\"features\")\n 
\nraw_data=assembler.transform(df)\nraw_data.select(\"features\").show(truncate=False)","user":"walker","dateUpdated":"2019-10-12T05:13:57+0000","config":{"colWidth":12,"fontSize":9,"enabled":true,"results":{},"editorSetting":{"language":"python","editOnDblClick":false,"completionSupport":true,"completionKey":"TAB"},"editorMode":"ace/mode/python"},"settings":{"params":{},"forms":{}},"results":{"code":"SUCCESS","msg":[{"type":"TEXT","data":"+--------------------------------------------------------+\n|features |\n+--------------------------------------------------------+\n|[70.0,1.0,4.0,130.0,322.0,0.0,2.0,109.0,0.0,2.4,2.0,3.0]|\n|[67.0,0.0,3.0,115.0,564.0,0.0,2.0,160.0,0.0,1.6,2.0,0.0]|\n|[57.0,1.0,2.0,124.0,261.0,0.0,0.0,141.0,0.0,0.3,1.0,0.0]|\n|[64.0,1.0,4.0,128.0,263.0,0.0,0.0,105.0,1.0,0.2,2.0,1.0]|\n|[74.0,0.0,2.0,120.0,269.0,0.0,2.0,121.0,1.0,0.2,1.0,1.0]|\n|[65.0,1.0,4.0,120.0,177.0,0.0,0.0,140.0,0.0,0.4,1.0,0.0]|\n|[56.0,1.0,3.0,130.0,256.0,1.0,2.0,142.0,1.0,0.6,2.0,1.0]|\n|[59.0,1.0,4.0,110.0,239.0,0.0,2.0,142.0,1.0,1.2,2.0,1.0]|\n|[60.0,1.0,4.0,140.0,293.0,0.0,2.0,170.0,0.0,1.2,2.0,2.0]|\n|[63.0,0.0,4.0,150.0,407.0,0.0,2.0,154.0,0.0,4.0,2.0,3.0]|\n|[59.0,1.0,4.0,135.0,234.0,0.0,0.0,161.0,0.0,0.5,2.0,0.0]|\n|[53.0,1.0,4.0,142.0,226.0,0.0,2.0,111.0,1.0,0.0,1.0,0.0]|\n|[44.0,1.0,3.0,140.0,235.0,0.0,2.0,180.0,0.0,0.0,1.0,0.0]|\n|[61.0,1.0,1.0,134.0,234.0,0.0,0.0,145.0,0.0,2.6,2.0,2.0]|\n|[57.0,0.0,4.0,128.0,303.0,0.0,2.0,159.0,0.0,0.0,1.0,1.0]|\n|[71.0,0.0,4.0,112.0,149.0,0.0,0.0,125.0,0.0,1.6,2.0,0.0]|\n|[46.0,1.0,4.0,140.0,311.0,0.0,0.0,120.0,1.0,1.8,2.0,2.0]|\n|[53.0,1.0,4.0,140.0,203.0,1.0,2.0,155.0,1.0,3.1,3.0,0.0]|\n|[64.0,1.0,1.0,110.0,211.0,0.0,2.0,144.0,1.0,1.8,2.0,0.0]|\n|[40.0,1.0,1.0,140.0,199.0,0.0,0.0,178.0,1.0,1.4,1.0,0.0]|\n+--------------------------------------------------------+\nonly showing top 20 rows\n\n"}]},"runtimeInfos":{"jobUrl":{"propertyName":"jobUrl","label":"SPARK JOB","tooltip":"View in Spark web 
UI","group":"spark","values":["http://parisx:4040/jobs/job?id=238"],"interpreterSettingId":"spark"}},"apps":[],"jobName":"paragraph_1570787472789_-2031757993","id":"20191011-095112_1692182483","dateCreated":"2019-10-11T09:51:12+0000","dateStarted":"2019-10-12T05:13:57+0000","dateFinished":"2019-10-12T05:13:57+0000","status":"FINISHED","progressUpdateIntervalMs":500,"$$hashKey":"object:23690"},{"text":"%spark.pyspark\nfrom pyspark.ml.feature import StandardScaler\n\nstandardscaler = StandardScaler().setInputCol(\"features\").setOutputCol(\"Scaled_features\")\n# raw_data is reassigned below, so on a re-run it already carries Scaled_features and the scaler\n# would reject its own output column. Dropping it first (a no-op on the first run) keeps this paragraph re-runnable.\nunscaled = raw_data.drop(\"Scaled_features\")\nraw_data = standardscaler.fit(unscaled).transform(unscaled)\nraw_data.select(\"features\", \"Scaled_features\").show(5)","user":"walker","dateUpdated":"2019-10-12T05:13:57+0000","config":{"colWidth":12,"fontSize":9,"enabled":true,"results":{},"editorSetting":{"language":"python","editOnDblClick":false,"completionSupport":true,"completionKey":"TAB"},"editorMode":"ace/mode/python"},"settings":{"params":{},"forms":{}},"results":{"code":"SUCCESS","msg":[{"type":"TEXT","data":"+--------------------+--------------------+\n| features| Scaled_features|\n+--------------------+--------------------+\n|[70.0,1.0,4.0,130...|[7.68465131046640...|\n|[67.0,0.0,3.0,115...|[7.35530911144641...|\n|[57.0,1.0,2.0,124...|[6.25750178137978...|\n|[64.0,1.0,4.0,128...|[7.02596691242642...|\n|[74.0,0.0,2.0,120...|[8.12377424249305...|\n+--------------------+--------------------+\nonly showing top 5 rows\n\n"}]},"runtimeInfos":{"jobUrl":{"propertyName":"jobUrl","label":"SPARK JOB","tooltip":"View in Spark web 
UI","group":"spark","values":["http://parisx:4040/jobs/job?id=239","http://parisx:4040/jobs/job?id=240"],"interpreterSettingId":"spark"}},"apps":[],"jobName":"paragraph_1570787532506_804248666","id":"20191011-095212_884979848","dateCreated":"2019-10-11T09:52:12+0000","dateStarted":"2019-10-12T05:13:57+0000","dateFinished":"2019-10-12T05:13:58+0000","status":"FINISHED","progressUpdateIntervalMs":500,"$$hashKey":"object:23691"},{"text":"%spark.pyspark\nfrom pyspark.ml.tuning import ParamGridBuilder, TrainValidationSplit\ntraining, test = raw_data.randomSplit([0.5, 0.5], seed=12345) ","user":"walker","dateUpdated":"2019-10-12T05:13:58+0000","config":{"colWidth":12,"fontSize":9,"enabled":true,"results":{},"editorSetting":{"language":"python","editOnDblClick":false,"completionSupport":true,"completionKey":"TAB"},"editorMode":"ace/mode/python"},"settings":{"params":{},"forms":{}},"results":{"code":"SUCCESS","msg":[]},"apps":[],"jobName":"paragraph_1570786856257_1989926248","id":"20191011-094056_1017703181","dateCreated":"2019-10-11T09:40:56+0000","dateStarted":"2019-10-12T05:13:58+0000","dateFinished":"2019-10-12T05:13:58+0000","status":"FINISHED","progressUpdateIntervalMs":500,"$$hashKey":"object:23692"},{"text":"%spark.pyspark\nfrom pyspark.ml.classification import LogisticRegression\n\nlr = LogisticRegression(labelCol=\"isSick\", featuresCol=\"Scaled_features\",maxIter=10)\nmodel=lr.fit(training)\npredict_train=model.transform(training)\npredict_test=model.transform(test)\npredict_test.select(\"isSick\",\"prediction\").show(10)\n\n","user":"walker","dateUpdated":"2019-10-12T05:13:58+0000","config":{"colWidth":12,"fontSize":9,"enabled":true,"results":{"0":{"graph":{"mode":"table","height":300,"optionOpen":false,"setting":{"table":{"tableGridState":{},"tableColumnTypeState":{"names":{"age":"string","sex":"string","chest pain":"string","resting blood pressure":"string","serum cholestoral":"string","fasting blood sugar":"string","resting electrocardiographic 
results":"string","maximum heart rate achieved":"string","exercise induced angina":"string","ST depression induced by exercise relative to rest":"string","the slope of the peak exercise ST segment":"string","number of major vessels ":"string","thal":"string","last":"string"},"updated":false},"tableOptionSpecHash":"[{\"name\":\"useFilter\",\"valueType\":\"boolean\",\"defaultValue\":false,\"widget\":\"checkbox\",\"description\":\"Enable filter for columns\"},{\"name\":\"showPagination\",\"valueType\":\"boolean\",\"defaultValue\":false,\"widget\":\"checkbox\",\"description\":\"Enable pagination for better navigation\"},{\"name\":\"showAggregationFooter\",\"valueType\":\"boolean\",\"defaultValue\":false,\"widget\":\"checkbox\",\"description\":\"Enable a footer for displaying aggregated values\"}]","tableOptionValue":{"useFilter":false,"showPagination":false,"showAggregationFooter":false},"updated":false,"initialized":false}},"commonSetting":{}}}},"editorSetting":{"language":"python","editOnDblClick":false,"completionSupport":true,"completionKey":"TAB"},"editorMode":"ace/mode/python"},"settings":{"params":{},"forms":{}},"results":{"code":"SUCCESS","msg":[{"type":"TEXT","data":"+------+----------+\n|isSick|prediction|\n+------+----------+\n| 0| 0.0|\n| 0| 0.0|\n| 0| 0.0|\n| 0| 0.0|\n| 0| 0.0|\n| 0| 0.0|\n| 0| 0.0|\n| 0| 0.0|\n| 0| 0.0|\n| 0| 0.0|\n+------+----------+\nonly showing top 10 rows\n\n"}]},"runtimeInfos":{"jobUrl":{"propertyName":"jobUrl","label":"SPARK JOB","tooltip":"View in Spark web 
UI","group":"spark","values":["http://parisx:4040/jobs/job?id=241","http://parisx:4040/jobs/job?id=242","http://parisx:4040/jobs/job?id=243","http://parisx:4040/jobs/job?id=244","http://parisx:4040/jobs/job?id=245","http://parisx:4040/jobs/job?id=246","http://parisx:4040/jobs/job?id=247","http://parisx:4040/jobs/job?id=248","http://parisx:4040/jobs/job?id=249","http://parisx:4040/jobs/job?id=250","http://parisx:4040/jobs/job?id=251","http://parisx:4040/jobs/job?id=252","http://parisx:4040/jobs/job?id=253","http://parisx:4040/jobs/job?id=254"],"interpreterSettingId":"spark"}},"apps":[],"jobName":"paragraph_1570780194447_-881313364","id":"20191011-074954_221759573","dateCreated":"2019-10-11T07:49:54+0000","dateStarted":"2019-10-12T05:13:58+0000","dateFinished":"2019-10-12T05:13:59+0000","status":"FINISHED","progressUpdateIntervalMs":500,"$$hashKey":"object:23693"},{"text":"","user":"walker","dateUpdated":"2019-10-12T05:13:59+0000","config":{"colWidth":12,"fontSize":9,"enabled":true,"results":{},"editorSetting":{"language":"python","editOnDblClick":false,"completionSupport":true,"completionKey":"TAB"},"editorMode":"ace/mode/python"},"settings":{"params":{},"forms":{}},"apps":[],"jobName":"paragraph_1570791927022_-1684254656","id":"20191011-110527_322705203","dateCreated":"2019-10-11T11:05:27+0000","dateStarted":"2019-10-11T17:18:09+0000","dateFinished":"2019-10-11T17:18:10+0000","status":"FINISHED","errorMessage":"","progressUpdateIntervalMs":500,"$$hashKey":"object:23694"},{"text":"","user":"walker","dateUpdated":"2019-10-12T05:13:59+0000","config":{"colWidth":12,"fontSize":9,"enabled":true,"results":{},"editorSetting":{"language":"python","editOnDblClick":false,"completionSupport":true,"completionKey":"TAB"},"editorMode":"ace/mode/python"},"settings":{"params":{},"forms":{}},"runtimeInfos":{"jobUrl":{"propertyName":"jobUrl","label":"SPARK JOB","tooltip":"View in Spark web 
UI","group":"spark","values":["http://parisx:4040/jobs/job?id=90"],"interpreterSettingId":"spark"}},"apps":[],"jobName":"paragraph_1570792350392_-458139160","id":"20191011-111230_1736345948","dateCreated":"2019-10-11T11:12:30+0000","dateStarted":"2019-10-11T11:39:51+0000","dateFinished":"2019-10-11T11:39:51+0000","status":"FINISHED","errorMessage":"","progressUpdateIntervalMs":500,"$$hashKey":"object:23695"},{"text":"%spark.pyspark\n \n\n\nprint(\"Multinomial coefficients: \" + str(model.coefficientMatrix))\nprint(\"Multinomial intercepts: \" + str(model.interceptVector))","user":"walker","dateUpdated":"2019-10-12T05:13:59+0000","config":{"colWidth":12,"fontSize":9,"enabled":true,"results":{},"editorSetting":{"language":"python","editOnDblClick":false,"completionSupport":true,"completionKey":"TAB"},"editorMode":"ace/mode/python"},"settings":{"params":{},"forms":{}},"results":{"code":"SUCCESS","msg":[{"type":"TEXT","data":"Multinomial coefficients: DenseMatrix([[ 0.6668908 , 1.69441174, -0.12228916, -0.4890833 , -1.12192264,\n -0.09436271, -0.94372679, -0.02751622, -0.19240091, -0.83972691,\n 1.17107336, 0.26495489]])\nMultinomial intercepts: [-2.7970145465614697]\n"}]},"apps":[],"jobName":"paragraph_1570791083763_-478407110","id":"20191011-105123_295762744","dateCreated":"2019-10-11T10:51:23+0000","dateStarted":"2019-10-12T05:13:59+0000","dateFinished":"2019-10-12T05:13:59+0000","status":"FINISHED","progressUpdateIntervalMs":500,"$$hashKey":"object:23696"},{"text":"%spark.pyspark\n# Extract the summary from the returned LogisticRegressionModel instance trained\n# in the earlier example\ntrainingSummary = model.summary\n\n# Obtain the objective per iteration\nobjectiveHistory = trainingSummary.objectiveHistory\nprint(\"objectiveHistory:\")\nfor objective in objectiveHistory:\n print(objective)\n\n# Obtain the receiver-operating characteristic as a dataframe and areaUnderROC.\n#trainingSummary.roc.show()\nprint(\"areaUnderROC: \" + 
str(trainingSummary.areaUnderROC))\n\n# Set the model threshold to maximize F-Measure\nfMeasure = trainingSummary.fMeasureByThreshold\nmaxFMeasure = fMeasure.groupBy().max('F-Measure').select('max(F-Measure)').head()\nbestThreshold = fMeasure.where(fMeasure['F-Measure'] == maxFMeasure['max(F-Measure)']) \\\n .select('threshold').head()['threshold']\nlr.setThreshold(bestThreshold)","user":"walker","dateUpdated":"2019-10-12T05:13:59+0000","config":{"colWidth":12,"fontSize":9,"enabled":true,"results":{"0":{"graph":{"mode":"table","height":300,"optionOpen":false,"setting":{"table":{"tableGridState":{},"tableColumnTypeState":{"names":{"age":"string","sex":"string","chest pain":"string","resting blood pressure":"string","serum cholestoral":"string","fasting blood sugar":"string","resting electrocardiographic results":"string","maximum heart rate achieved":"string","exercise induced angina":"string","ST depression induced by exercise relative to rest":"string","the slope of the peak exercise ST segment":"string","number of major vessels ":"string","thal":"string"},"updated":false},"tableOptionSpecHash":"[{\"name\":\"useFilter\",\"valueType\":\"boolean\",\"defaultValue\":false,\"widget\":\"checkbox\",\"description\":\"Enable filter for columns\"},{\"name\":\"showPagination\",\"valueType\":\"boolean\",\"defaultValue\":false,\"widget\":\"checkbox\",\"description\":\"Enable pagination for better navigation\"},{\"name\":\"showAggregationFooter\",\"valueType\":\"boolean\",\"defaultValue\":false,\"widget\":\"checkbox\",\"description\":\"Enable a footer for displaying aggregated 
values\"}]","tableOptionValue":{"useFilter":false,"showPagination":false,"showAggregationFooter":false},"updated":false,"initialized":false}},"commonSetting":{}}}},"editorSetting":{"language":"python","editOnDblClick":false,"completionSupport":true,"completionKey":"TAB"},"editorMode":"ace/mode/python"},"settings":{"params":{},"forms":{}},"results":{"code":"SUCCESS","msg":[{"type":"TEXT","data":"objectiveHistory:\n0.2183808333258687\n0.20816927260803536\n0.1881067217274369\n0.18205075266753093\n0.17703243938548047\n0.17640412785509704\n0.16477178254282865\n0.1630298030353237\n0.1624715046926652\n0.16229471593907993\n0.16197892605655764\nareaUnderROC: 0.8460591133004924\nLogisticRegression_4f78985a234065d79b08"}]},"runtimeInfos":{"jobUrl":{"propertyName":"jobUrl","label":"SPARK JOB","tooltip":"View in Spark web UI","group":"spark","values":["http://parisx:4040/jobs/job?id=255","http://parisx:4040/jobs/job?id=256","http://parisx:4040/jobs/job?id=257","http://parisx:4040/jobs/job?id=258","http://parisx:4040/jobs/job?id=259","http://parisx:4040/jobs/job?id=260","http://parisx:4040/jobs/job?id=261"],"interpreterSettingId":"spark"}},"apps":[],"jobName":"paragraph_1570785416983_-405639045","id":"20191011-091656_1871714335","dateCreated":"2019-10-11T09:16:56+0000","dateStarted":"2019-10-12T05:13:59+0000","dateFinished":"2019-10-12T05:14:00+0000","status":"FINISHED","progressUpdateIntervalMs":500,"$$hashKey":"object:23697"},{"text":" 
","user":"walker","dateUpdated":"2019-10-12T05:14:00+0000","config":{"colWidth":12,"fontSize":9,"enabled":true,"results":{},"editorSetting":{"language":"python","editOnDblClick":false,"completionSupport":true,"completionKey":"TAB"},"editorMode":"ace/mode/python"},"settings":{"params":{},"forms":{}},"apps":[],"jobName":"paragraph_1570810637687_831880407","id":"20191011-161717_1625998568","dateCreated":"2019-10-11T16:17:17+0000","dateStarted":"2019-10-11T17:00:00+0000","dateFinished":"2019-10-11T17:00:00+0000","status":"FINISHED","errorMessage":"","progressUpdateIntervalMs":500,"$$hashKey":"object:23698"},{"text":"%spark.pyspark\ntrainingSummary","user":"walker","dateUpdated":"2019-10-12T05:14:00+0000","config":{"colWidth":12,"fontSize":9,"enabled":true,"results":{"0":{"graph":{"mode":"table","height":300,"optionOpen":false,"setting":{"table":{"tableGridState":{},"tableColumnTypeState":{"names":{"age":"string","sex":"string","chest pain":"string","resting blood pressure":"string","serum cholestoral":"string","fasting blood sugar":"string","resting electrocardiographic results":"string","maximum heart rate achieved":"string","exercise induced angina":"string","ST depression induced by exercise relative to rest":"string","the slope of the peak exercise ST segment":"string","number of major vessels ":"string","thal":"string"},"updated":false},"tableOptionSpecHash":"[{\"name\":\"useFilter\",\"valueType\":\"boolean\",\"defaultValue\":false,\"widget\":\"checkbox\",\"description\":\"Enable filter for columns\"},{\"name\":\"showPagination\",\"valueType\":\"boolean\",\"defaultValue\":false,\"widget\":\"checkbox\",\"description\":\"Enable pagination for better navigation\"},{\"name\":\"showAggregationFooter\",\"valueType\":\"boolean\",\"defaultValue\":false,\"widget\":\"checkbox\",\"description\":\"Enable a footer for displaying aggregated 
values\"}]","tableOptionValue":{"useFilter":false,"showPagination":false,"showAggregationFooter":false},"updated":false,"initialized":false}},"commonSetting":{}}}},"editorSetting":{"language":"python","editOnDblClick":false,"completionSupport":true,"completionKey":"TAB"},"editorMode":"ace/mode/python"},"settings":{"params":{},"forms":{}},"results":{"code":"SUCCESS","msg":[{"type":"TEXT","data":""}]},"apps":[],"jobName":"paragraph_1570627395453_-1913081912","id":"20191009-132315_1652278208","dateCreated":"2019-10-09T13:23:15+0000","dateStarted":"2019-10-12T05:14:00+0000","dateFinished":"2019-10-12T05:14:00+0000","status":"FINISHED","progressUpdateIntervalMs":500,"$$hashKey":"object:23699"},{"text":"%spark.pyspark\nimport pyspark.sql.functions as F\ncheck = predict_test.withColumn('correct', F.when(F.col('isSick') == F.col('prediction'), 1).otherwise(0))\ncheck.groupby(\"correct\").count().show()\n ","user":"walker","dateUpdated":"2019-10-12T05:14:00+0000","config":{"colWidth":12,"fontSize":9,"enabled":true,"results":{"0":{"graph":{"mode":"table","height":300,"optionOpen":false,"setting":{"table":{"tableGridState":{},"tableColumnTypeState":{"names":{"Price":"string","Rooms":"string"},"updated":false},"tableOptionSpecHash":"[{\"name\":\"useFilter\",\"valueType\":\"boolean\",\"defaultValue\":false,\"widget\":\"checkbox\",\"description\":\"Enable filter for columns\"},{\"name\":\"showPagination\",\"valueType\":\"boolean\",\"defaultValue\":false,\"widget\":\"checkbox\",\"description\":\"Enable pagination for better navigation\"},{\"name\":\"showAggregationFooter\",\"valueType\":\"boolean\",\"defaultValue\":false,\"widget\":\"checkbox\",\"description\":\"Enable a footer for displaying aggregated 
values\"}]","tableOptionValue":{"useFilter":false,"showPagination":false,"showAggregationFooter":false},"updated":false,"initialized":false}},"commonSetting":{}}}},"editorSetting":{"language":"python","editOnDblClick":false,"completionSupport":true,"completionKey":"TAB"},"editorMode":"ace/mode/python"},"settings":{"params":{},"forms":{}},"results":{"code":"SUCCESS","msg":[{"type":"TEXT","data":"+-------+-----+\n|correct|count|\n+-------+-----+\n| 1| 137|\n| 0| 10|\n+-------+-----+\n\n"}]},"runtimeInfos":{"jobUrl":{"propertyName":"jobUrl","label":"SPARK JOB","tooltip":"View in Spark web UI","group":"spark","values":["http://parisx:4040/jobs/job?id=262","http://parisx:4040/jobs/job?id=263","http://parisx:4040/jobs/job?id=264","http://parisx:4040/jobs/job?id=265","http://parisx:4040/jobs/job?id=266"],"interpreterSettingId":"spark"}},"apps":[],"jobName":"paragraph_1570627594552_1531265333","id":"20191009-132634_932134512","dateCreated":"2019-10-09T13:26:34+0000","dateStarted":"2019-10-12T05:14:00+0000","dateFinished":"2019-10-12T05:14:02+0000","status":"FINISHED","progressUpdateIntervalMs":500,"$$hashKey":"object:23700"},{"text":"%spark.pyspark\nimport matplotlib.pyplot as plt\nimport numpy as np\n\n# plt.pie() draws one wedge per list element, so pass the two outcome totals\n# instead of one 0/1 flag per test row.\noutcome_counts = {int(row['correct']): int(row['count'])\n                  for row in check.groupby('correct').count().collect()}\nsizes = [outcome_counts.get(1, 0), outcome_counts.get(0, 0)]\nlabels = ['correct', 'incorrect']\n\nfig, ax = plt.subplots()\nax.pie(sizes, labels=labels, autopct='%1.1f%%')\nax.set_title('Test-set predictions')\nplt.show()\n","user":"walker","dateUpdated":"2019-10-12T05:14:02+0000","config":{"colWidth":11,"fontSize":9,"enabled":true,"results":{"0":{"graph":{"mode":"table","height":227,"optionOpen":false}}},"editorSetting":{"language":"python","editOnDblClick":false,"completionSupport":true,"completionKey":"TAB"},"editorMode":"ace/mode/python"},"settings":{"params":{},"forms":{}},"results":{"code":"SUCCESS","msg":[{"type":"TEXT","data":"
\n"},{"type":"IMG","data":"\n"}]},"runtimeInfos":{"jobUrl":{"propertyName":"jobUrl","label":"SPARK JOB","tooltip":"View in Spark web UI","group":"spark","values":["http://parisx:4040/jobs/job?id=267"],"interpreterSettingId":"spark"}},"apps":[],"jobName":"paragraph_1570627870630_-1173954090","id":"20191009-133110_294747364","dateCreated":"2019-10-09T13:31:10+0000","dateStarted":"2019-10-12T05:14:02+0000","dateFinished":"2019-10-12T05:14:03+0000","status":"FINISHED","progressUpdateIntervalMs":500,"$$hashKey":"object:23701"},{"text":"%spark.pyspark\ntype(check.groupby(\"correct\").count())","user":"walker","dateUpdated":"2019-10-12T05:14:03+0000","config":{"colWidth":12,"fontSize":9,"enabled":true,"results":{},"editorSetting":{"language":"python","editOnDblClick":false,"completionSupport":true,"completionKey":"TAB"},"editorMode":"ace/mode/python"},"settings":{"params":{},"forms":{}},"results":{"code":"SUCCESS","msg":[{"type":"TEXT","data":"pyspark.sql.dataframe.DataFrame"}]},"apps":[],"jobName":"paragraph_1570709979301_-136058291","id":"20191010-121939_338275750","dateCreated":"2019-10-10T12:19:39+0000","dateStarted":"2019-10-12T05:14:03+0000","dateFinished":"2019-10-12T05:14:03+0000","status":"FINISHED","progressUpdateIntervalMs":500,"$$hashKey":"object:23702"},{"text":"\n","user":"walker","dateUpdated":"2019-10-12T05:14:03+0000","config":{"colWidth":12,"fontSize":9,"enabled":true,"results":{},"editorSetting":{"language":"python","editOnDblClick":false,"completionSupport":true},"editorMode":"ace/mode/python"},"settings":{"params":{},"forms":{}},"apps":[],"jobName":"paragraph_1570627950251_-191653154","id":"20191009-133230_1683063558","dateCreated":"2019-10-09T13:32:30+0000","status":"FINISHED","errorMessage":"","progressUpdateIntervalMs":500,"$$hashKey":"object:23703"}],"name":"heartDisease","id":"2EQ47DXVR","noteParams":{},"noteForms":{},"angularObjects":{"python:shared_process":[],"spark:shared_process":[]},"config":{"isZeppelinNotebookCronEnable":false,"looknfeel":
"default","personalizedMode":"false"},"info":{}}