df.groupBy { city }.mean { age }
Input DataFrame: rowsCount = 7, columnsCount = 5
name | | age | city | weight | isHappy |
---|---|---|---|---|---|
firstName | lastName | | | | |
Alice | Cooper | 15 | London | 54 | true |
Bob | Dylan | 45 | Dubai | 87 | true |
Charlie | Daniels | 20 | Moscow | null | false |
Charlie | Chaplin | 40 | Milan | null | true |
Bob | Marley | 30 | Tokyo | 68 | true |
Alice | Wolf | 20 | null | 55 | false |
Charlie | Byrd | 30 | Moscow | 90 | true |
Step 1: GroupBy
Output DataFrame: rowsCount = 6, columnsCount = 2
city | age |
---|---|
London | 15.0 |
Dubai | 45.0 |
Moscow | 25.0 |
Milan | 40.0 |
Tokyo | 30.0 |
null | 20.0 |
df.groupBy { city }.meanOf { age / 2 }
Input DataFrame: rowsCount = 7, columnsCount = 5
name | | age | city | weight | isHappy |
---|---|---|---|---|---|
firstName | lastName | | | | |
Alice | Cooper | 15 | London | 54 | true |
Bob | Dylan | 45 | Dubai | 87 | true |
Charlie | Daniels | 20 | Moscow | null | false |
Charlie | Chaplin | 40 | Milan | null | true |
Bob | Marley | 30 | Tokyo | 68 | true |
Alice | Wolf | 20 | null | 55 | false |
Charlie | Byrd | 30 | Moscow | 90 | true |
Step 1: GroupBy
Output DataFrame: rowsCount = 6, columnsCount = 2
city | mean |
---|---|
London | 7.0 |
Dubai | 22.0 |
Moscow | 12.5 |
Milan | 20.0 |
Tokyo | 15.0 |
null | 10.0 |