"""Load the terminal 5 pickups CSV into Spark and preview three of its columns."""

import numpy as np
import pandas as pd
from pyspark.sql import SparkSession

APP_NAME = "DataFrames"
# NOTE(review): defined but never passed to the session builder below.
SPARK_URL = "local[*]"

# Get the active session or create one; console progress bars are disabled.
spark = (
    SparkSession.builder.appName(APP_NAME)
    .config('spark.ui.showConsoleProgress', 'false')
    .getOrCreate()
)

# Read the CSV with its first row as the header and let Spark infer column types.
taxi = spark.read.load(
    '/datasets/pickups_terminal_5.csv',
    format='csv',
    header='true',
    inferSchema='true',
)

# Keep only the date, hour and minute columns, then print the first five rows.
taxi_select = taxi.select('date', 'hour', 'minute')
taxi_select.show(5)
SQL
From Александр Юрьевич Храмов, 4 Months ago, written in Plain Text, viewed 83 times.
URL http://codebin.org/view/5f17eff4
Embed
Download Paste or View Raw
— Expand Paste to full width of browser