# Per-(post_source, host) aggregates. reset_index() turns the group keys back
# into ordinary columns instead of leaving them as the result's index.
# NOTE(review): these results are not bound to a name — presumably they are
# notebook/REPL expressions; assign them if this runs as a script.
# NOTE(review): df, trdf, tgrdf, df1 and df2 are not defined in this excerpt.
df.groupby(["post_source", "host"]).count().reset_index()
df.groupby(["post_source", "host"]).max().reset_index()
df.groupby(["post_source", "host"]).min().reset_index()
# NOTE(review): on pandas >= 2.0 mean() raises if df has non-numeric columns;
# confirm df's dtypes or pass numeric_only=True.
df.groupby(["post_source", "host"]).mean().reset_index()

# Left join: keep every row of trdf and attach the tgrdf rows that share its
# GROUP_ID. `how` is passed by keyword so the join type is explicit.
pd.merge(trdf, tgrdf, how='left', left_on='GROUP_ID', right_on='GROUP_ID')

# Stack df1 and df2 vertically. ignore_index=True renumbers the rows 0..n-1;
# sort=True sorts the columns when the two frames' columns are not aligned.
df = pd.concat([df1, df2], ignore_index=True, sort=True)
def trim(row, col='name'):
    """Return the value stored under *col* in *row*, stripped of whitespace.

    Args:
        row: Any object exposing ``.get(key)`` — for example the row passed
            by ``DataFrame.apply(..., axis=1)``, or a plain dict.
        col: Key / column label to read. Defaults to ``'name'``.

    Returns:
        ``row.get(col).strip()`` when the value has a ``strip`` method.
        Values without one (``None`` from a missing key, NaN, numbers) are
        returned unchanged instead of raising ``AttributeError``.
    """
    value = row.get(col)
    try:
        # Look the method up first so only "value cannot be stripped" is
        # caught, not an error raised while stripping.
        strip = value.strip
    except AttributeError:
        return value
    return strip()
# Run trim() on every row (axis=1); the extra keyword argument col='name' is
# forwarded by apply() to trim(), and the result replaces the 'name' column.
df['name'] = df.apply(trim, axis=1, col='name')

# The 15 rows with the highest 'score', in descending order.
df.sort_values('score', ascending=False).head(15)

# Rows whose name contains "Africa". na=False makes missing names count as
# "no match"; without it the mask contains NA and the indexing raises.
df[df['name'].str.contains('Africa', na=False)]
# Rows whose name ends with an "A" followed by five more characters.
df[df['name'].str.contains(r'A.{5}$', na=False)]

# Parse SYS_DATE using the explicit format year-month-day with no separators.
df['SYS_DATE'] = pd.to_datetime(df['SYS_DATE'], format='%Y%m%d')