df.select { age and name }
Input DataFrame: rowsCount = 7, columnsCount = 5
name | age | city | weight | isHappy |
---|
firstName | lastName | | | | |
---|
Alice | Cooper | 15 | London | 54 | true |
Bob | Dylan | 45 | Dubai | 87 | true |
Charlie | Daniels | 20 | Moscow | null | false |
Charlie | Chaplin | 40 | Milan | null | true |
Bob | Marley | 30 | Tokyo | 68 | true |
Alice | Wolf | 20 | null | 55 | false |
Charlie | Byrd | 30 | Moscow | 90 | true |
Output DataFrame: rowsCount = 7, columnsCount = 2
age | name |
---|
| firstName | lastName |
---|
15 | Alice | Cooper |
45 | Bob | Dylan |
20 | Charlie | Daniels |
40 | Charlie | Chaplin |
30 | Bob | Marley |
20 | Alice | Wolf |
30 | Charlie | Byrd |
df.fillNaNs { colsAtAnyDepth().colsOf<Double>() }.withZero()
Input DataFrame: rowsCount = 7, columnsCount = 5
name | age | city | weight | isHappy |
---|
firstName | lastName | | | | |
---|
Alice | Cooper | 15 | London | 54 | true |
Bob | Dylan | 45 | Dubai | 87 | true |
Charlie | Daniels | 20 | Moscow | null | false |
Charlie | Chaplin | 40 | Milan | null | true |
Bob | Marley | 30 | Tokyo | 68 | true |
Alice | Wolf | 20 | null | 55 | false |
Charlie | Byrd | 30 | Moscow | 90 | true |
Step 1: Update
name | age | city | weight | isHappy |
---|
firstName | lastName | | | | |
---|
Alice | Cooper | 15 | London | 54 | true |
Bob | Dylan | 45 | Dubai | 87 | true |
Charlie | Daniels | 20 | Moscow | null | false |
Charlie | Chaplin | 40 | Milan | null | true |
Bob | Marley | 30 | Tokyo | 68 | true |
Alice | Wolf | 20 | null | 55 | false |
Charlie | Byrd | 30 | Moscow | 90 | true |
DataFrame [7 x 5]
Output DataFrame: rowsCount = 7, columnsCount = 5
name | age | city | weight | isHappy |
---|
firstName | lastName | | | | |
---|
Alice | Cooper | 15 | London | 54 | true |
Bob | Dylan | 45 | Dubai | 87 | true |
Charlie | Daniels | 20 | Moscow | null | false |
Charlie | Chaplin | 40 | Milan | null | true |
Bob | Marley | 30 | Tokyo | 68 | true |
Alice | Wolf | 20 | null | 55 | false |
Charlie | Byrd | 30 | Moscow | 90 | true |
df.remove { cols { it.hasNulls() } }
Input DataFrame: rowsCount = 7, columnsCount = 5
name | age | city | weight | isHappy |
---|
firstName | lastName | | | | |
---|
Alice | Cooper | 15 | London | 54 | true |
Bob | Dylan | 45 | Dubai | 87 | true |
Charlie | Daniels | 20 | Moscow | null | false |
Charlie | Chaplin | 40 | Milan | null | true |
Bob | Marley | 30 | Tokyo | 68 | true |
Alice | Wolf | 20 | null | 55 | false |
Charlie | Byrd | 30 | Moscow | 90 | true |
Output DataFrame: rowsCount = 7, columnsCount = 3
name | age | isHappy |
---|
firstName | lastName | | |
---|
Alice | Cooper | 15 | true |
Bob | Dylan | 45 | true |
Charlie | Daniels | 20 | false |
Charlie | Chaplin | 40 | true |
Bob | Marley | 30 | true |
Alice | Wolf | 20 | false |
Charlie | Byrd | 30 | true |
df.into { "nameless" }
Input DataFrame: rowsCount = 7, columnsCount = 5
name | age | city | weight | isHappy |
---|
firstName | lastName | | | | |
---|
Alice | Cooper | 15 | London | 54 | true |
Bob | Dylan | 45 | Dubai | 87 | true |
Charlie | Daniels | 20 | Moscow | null | false |
Charlie | Chaplin | 40 | Milan | null | true |
Bob | Marley | 30 | Tokyo | 68 | true |
Alice | Wolf | 20 | null | 55 | false |
Charlie | Byrd | 30 | Moscow | 90 | true |
Output DataFrame: rowsCount = 7, columnsCount = 2
name | nameless |
---|
firstName | lastName | age | city | weight | isHappy |
---|
Alice | Cooper | 15 | London | 54 | true |
Bob | Dylan | 45 | Dubai | 87 | true |
Charlie | Daniels | 20 | Moscow | null | false |
Charlie | Chaplin | 40 | Milan | null | true |
Bob | Marley | 30 | Tokyo | 68 | true |
Alice | Wolf | 20 | null | 55 | false |
Charlie | Byrd | 30 | Moscow | 90 | true |
df.update { city }.notNull { it.lowercase() }
Input DataFrame: rowsCount = 7, columnsCount = 5
name | age | city | weight | isHappy |
---|
firstName | lastName | | | | |
---|
Alice | Cooper | 15 | London | 54 | true |
Bob | Dylan | 45 | Dubai | 87 | true |
Charlie | Daniels | 20 | Moscow | null | false |
Charlie | Chaplin | 40 | Milan | null | true |
Bob | Marley | 30 | Tokyo | 68 | true |
Alice | Wolf | 20 | null | 55 | false |
Charlie | Byrd | 30 | Moscow | 90 | true |
Step 1: Update
name | age | city | weight | isHappy |
---|
firstName | lastName | | | | |
---|
Alice | Cooper | 15 | London | 54 | true |
Bob | Dylan | 45 | Dubai | 87 | true |
Charlie | Daniels | 20 | Moscow | null | false |
Charlie | Chaplin | 40 | Milan | null | true |
Bob | Marley | 30 | Tokyo | 68 | true |
Alice | Wolf | 20 | null | 55 | false |
Charlie | Byrd | 30 | Moscow | 90 | true |
DataFrame [7 x 5]
Output DataFrame: rowsCount = 7, columnsCount = 5
name | age | city | weight | isHappy |
---|
firstName | lastName | | | | |
---|
Alice | Cooper | 15 | london | 54 | true |
Bob | Dylan | 45 | dubai | 87 | true |
Charlie | Daniels | 20 | moscow | null | false |
Charlie | Chaplin | 40 | milan | null | true |
Bob | Marley | 30 | tokyo | 68 | true |
Alice | Wolf | 20 | null | 55 | false |
Charlie | Byrd | 30 | moscow | 90 | true |
df.gather { colsOf<Number>() }.into("key", "value")
Input DataFrame: rowsCount = 7, columnsCount = 5
name | age | city | weight | isHappy |
---|
firstName | lastName | | | | |
---|
Alice | Cooper | 15 | London | 54 | true |
Bob | Dylan | 45 | Dubai | 87 | true |
Charlie | Daniels | 20 | Moscow | null | false |
Charlie | Chaplin | 40 | Milan | null | true |
Bob | Marley | 30 | Tokyo | 68 | true |
Alice | Wolf | 20 | null | 55 | false |
Charlie | Byrd | 30 | Moscow | 90 | true |
Step 1: Gather
name | city | weight | isHappy | key | value |
---|
firstName | lastName | | | | | |
---|
Alice | Cooper | London | 54 | true | age | 15 |
Bob | Dylan | Dubai | 87 | true | age | 45 |
Charlie | Daniels | Moscow | null | false | age | 20 |
Charlie | Chaplin | Milan | null | true | age | 40 |
Bob | Marley | Tokyo | 68 | true | age | 30 |
Alice | Wolf | null | 55 | false | age | 20 |
Charlie | Byrd | Moscow | 90 | true | age | 30 |
Output DataFrame: rowsCount = 7, columnsCount = 6
name | city | weight | isHappy | key | value |
---|
firstName | lastName | | | | | |
---|
Alice | Cooper | London | 54 | true | age | 15 |
Bob | Dylan | Dubai | 87 | true | age | 45 |
Charlie | Daniels | Moscow | null | false | age | 20 |
Charlie | Chaplin | Milan | null | true | age | 40 |
Bob | Marley | Tokyo | 68 | true | age | 30 |
Alice | Wolf | null | 55 | false | age | 20 |
Charlie | Byrd | Moscow | 90 | true | age | 30 |
df.move { name.firstName and name.lastName }.after { city }
Input DataFrame: rowsCount = 7, columnsCount = 5
name | age | city | weight | isHappy |
---|
firstName | lastName | | | | |
---|
Alice | Cooper | 15 | London | 54 | true |
Bob | Dylan | 45 | Dubai | 87 | true |
Charlie | Daniels | 20 | Moscow | null | false |
Charlie | Chaplin | 40 | Milan | null | true |
Bob | Marley | 30 | Tokyo | 68 | true |
Alice | Wolf | 20 | null | 55 | false |
Charlie | Byrd | 30 | Moscow | 90 | true |
Output DataFrame: rowsCount = 7, columnsCount = 6
age | city | firstName | lastName | weight | isHappy |
---|
15 | London | Alice | Cooper | 54 | true |
45 | Dubai | Bob | Dylan | 87 | true |
20 | Moscow | Charlie | Daniels | null | false |
40 | Milan | Charlie | Chaplin | null | true |
30 | Tokyo | Bob | Marley | 68 | true |
20 | null | Alice | Wolf | 55 | false |
30 | Moscow | Charlie | Byrd | 90 | true |