Skip to content

Commit b15edb7

Browse files
committed
Added DataFrames section and cleared outputs
1 parent d445057 commit b15edb7

File tree

2 files changed

+7
-38
lines changed

2 files changed

+7
-38
lines changed

.DS_Store

6 KB
Binary file not shown.

spark/spark.ipynb

+7 -38
Original file line number | Diff line number | Diff line change
@@ -64,19 +64,11 @@
6464
},
6565
{
6666
"cell_type": "code",
67-
"execution_count": 1,
67+
"execution_count": null,
6868
"metadata": {
6969
"collapsed": false
7070
},
71-
"outputs": [
72-
{
73-
"name": "stdout",
74-
"output_type": "stream",
75-
"text": [
76-
"/bin/sh: pyspark: command not found\r\n"
77-
]
78-
}
79-
],
71+
"outputs": [],
8072
"source": [
8173
"!pyspark"
8274
]
@@ -90,22 +82,11 @@
9082
},
9183
{
9284
"cell_type": "code",
93-
"execution_count": 2,
85+
"execution_count": null,
9486
"metadata": {
9587
"collapsed": false
9688
},
97-
"outputs": [
98-
{
99-
"data": {
100-
"text/plain": [
101-
"<pyspark.context.SparkContext at 0x103923610>"
102-
]
103-
},
104-
"execution_count": 2,
105-
"metadata": {},
106-
"output_type": "execute_result"
107-
}
108-
],
89+
"outputs": [],
10990
"source": [
11091
"sc"
11192
]
@@ -132,7 +113,7 @@
132113
},
133114
{
134115
"cell_type": "code",
135-
"execution_count": 3,
116+
"execution_count": null,
136117
"metadata": {
137118
"collapsed": false
138119
},
@@ -555,23 +536,11 @@
555536
},
556537
{
557538
"cell_type": "code",
558-
"execution_count": 5,
539+
"execution_count": null,
559540
"metadata": {
560541
"collapsed": false
561542
},
562-
"outputs": [
563-
{
564-
"ename": "NameError",
565-
"evalue": "name 'df' is not defined",
566-
"output_type": "error",
567-
"traceback": [
568-
"\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
569-
"\u001b[0;31mNameError\u001b[0m Traceback (most recent call last)",
570-
"\u001b[0;32m<ipython-input-5-af17cfa6d2c8>\u001b[0m in \u001b[0;36m<module>\u001b[0;34m()\u001b[0m\n\u001b[0;32m----> 1\u001b[0;31m \u001b[0mdf\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mgroupBy\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m\"column_name\"\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mcount\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m",
571-
"\u001b[0;31mNameError\u001b[0m: name 'df' is not defined"
572-
]
573-
}
574-
],
543+
"outputs": [],
575544
"source": [
576545
"df.groupBy(\"column_name\").count()"
577546
]

0 commit comments

Comments (0)