Sorting a DataFrame by column: pandas and PySpark code examples
Example 1: sorting by column in pandas
# pandas: order the rows of DataFrame `df` by the values in column "col1".

# Non-mutating form: the sorted result comes back as a new DataFrame and
# `df` itself keeps its current row order.
df.sort_values(by="col1")

# Mutating form: `df` is reordered in place (the call returns None).
df.sort_values(by="col1", inplace=True)
Example 2: sorting by column in PySpark (returns a new DataFrame sorted by the specified column(s))
# PySpark (not pandas): DataFrame.sort / DataFrame.orderBy return a new
# DataFrame sorted by the specified column(s); collect() brings the rows back
# as a list of Row objects.
# The outputs shown assume `df` holds two rows, (age=2, name='Alice') and
# (age=5, name='Bob') -- TODO confirm against where `df` is created.

# Import only the helpers used below. A wildcard import of
# pyspark.sql.functions would shadow builtins such as sum, min, max and abs.
from pyspark.sql.functions import asc, desc

# Descending, using a Column expression.
df.sort(df.age.desc()).collect()
# [Row(age=5, name='Bob'), Row(age=2, name='Alice')]

# Descending, using the column name plus the `ascending` keyword.
df.sort("age", ascending=False).collect()
# [Row(age=5, name='Bob'), Row(age=2, name='Alice')]

# orderBy takes the same arguments as sort.
df.orderBy(df.age.desc()).collect()
# [Row(age=5, name='Bob'), Row(age=2, name='Alice')]

# Ascending, using the asc() helper.
df.sort(asc("age")).collect()
# [Row(age=2, name='Alice'), Row(age=5, name='Bob')]

# Several keys: age descending first, then name ascending.
df.orderBy(desc("age"), "name").collect()
# [Row(age=5, name='Bob'), Row(age=2, name='Alice')]

# Same ordering expressed as a list of column names with one boolean per
# column (False = descending, True = ascending).
df.orderBy(["age", "name"], ascending=[False, True]).collect()
# [Row(age=5, name='Bob'), Row(age=2, name='Alice')]