start new:
tmux
start new with session name:
tmux new -s myname
#! /usr/bin/python
# -*- coding: utf-8 -*-
"""vlc media player; based on the example in the vlc repo:
`http://git.videolan.org/?p=vlc/bindings/python.git;a=commit;h=HEAD`
See also:
`http://infohost.nmt.edu/tcc/help/pubs/tkinter/web/menu.html`
`http://infohost.nmt.edu/tcc/help/pubs/tkinter/web/menu-coptions.html`
# For records grouped by colA, colB and colC, keep only the groups that
# contain more than one colD value, then list those colD values one per row.
import pyspark.sql.functions as fn

# The filter must be applied to the aggregated DataFrame, not chained onto the
# count column inside agg(); the aggregated result is bound to a name so the
# 'newColD' column exists when it is exploded below.
# NOTE: collect_list keeps repeated values; switch to fn.collect_set if only
# distinct colD values are wanted.
dup_groups = (
    df.groupBy('colA', 'colB', 'colC')
    .agg(
        fn.collect_list('colD').alias('newColD'),
        fn.count('colD').alias('count'),
    )
    .filter(fn.col('count') > 1)
)
dup_groups.select(fn.explode('newColD').alias('colDUniques')).show()
# given a subset of columns, return a dataframe where duplicates exist for these columns: