Advertisement
Not a member of Pastebin yet?
Sign up, it unlocks many cool features!
- from pyspark.sql import functions as F
- (logs_df.agg(F.min(logs_df['content_size']).alias('min_content_size'),
- F.max(logs_df['content_size']).alias('max_content_size'),
- F.mean(logs_df['content_size']).alias('mean_content_size'),
- F.stddev(logs_df['content_size']).alias('std_content_size'),
- F.count(logs_df['content_size']).alias('count_content_size'))
- .toPandas())
Advertisement
Add Comment
Please sign in to add a comment
Advertisement