In [8]:
# https://dplyr.tidyverse.org/reference/rowwise.html

from datar.datasets import iris
from datar.all import *

# Execute the helper script in this kernel's namespace
# (presumably where `nb_header` is defined -- confirm against nb_helpers.py).
%run nb_helpers.py
# Emit the documentation header for `rowwise`; the rendered markdown that
# follows shows its summary, arguments and return value.
nb_header(rowwise)

### # rowwise  

##### Compute on a data frame a row-at-a-time

See https://dplyr.tidyverse.org/reference/rowwise.html  

##### Args:
&emsp;&emsp;`_data`: The dataframe  
&emsp;&emsp;`*columns`: Variables to be preserved when calling summarise().  
&emsp;&emsp;&emsp;&emsp;This is typically a set of variables whose combination  
&emsp;&emsp;&emsp;&emsp;uniquely identifies each row.  

&emsp;&emsp;`base0_`: Whether column indexes are 0-based when columns are selected by index.  
&emsp;&emsp;&emsp;&emsp;If not given, the value of `datar.base.get_option('index.base.0')` is used.  

##### Returns:
&emsp;&emsp;A row-wise data frame  


In [9]:
# Six rows of uniform random draws in three columns. No seed is set in the
# visible cells, so the exact values presumably change from run to run.
df = tibble(
    x=runif(6),
    y=runif(6),
    z=runif(6),
)

# Row-wise mean across the explicitly listed columns x, y and z.
(
    df
    >> rowwise()
    >> mutate(m=mean(c_across(c(f.x, f.y, f.z))))
)

Unnamed: 0,x,y,z,m
,<float64>,<float64>,<float64>,<float64>
0.0,0.978019,0.409827,0.494186,0.627344
1.0,0.148053,0.267015,0.727037,0.380702
2.0,0.353099,0.932557,0.851494,0.712383
3.0,0.342744,0.497407,0.459758,0.433303
4.0,0.817116,0.301053,0.049890,0.389353
5.0,0.444922,0.769882,0.802420,0.672408


In [10]:
# Row-wise mean again, this time picking the columns with the slice
# f.x:f.z instead of naming each one.
(
    df
    >> rowwise()
    >> mutate(m=mean(c_across(f[f.x:f.z])))
)

Unnamed: 0,x,y,z,m
,<float64>,<float64>,<float64>,<float64>
0.0,0.978019,0.409827,0.494186,0.627344
1.0,0.148053,0.267015,0.727037,0.380702
2.0,0.353099,0.932557,0.851494,0.712383
3.0,0.342744,0.497407,0.459758,0.433303
4.0,0.817116,0.301053,0.049890,0.389353
5.0,0.444922,0.769882,0.802420,0.672408


In [11]:
# Row-wise minimum; the columns are handed to c_across() as a plain list.
(
    df
    >> rowwise()
    >> mutate(m=min(c_across([f.x, f.y, f.z])))
)

Unnamed: 0,x,y,z,m
,<float64>,<float64>,<float64>,<float64>
0.0,0.978019,0.409827,0.494186,0.409827
1.0,0.148053,0.267015,0.727037,0.148053
2.0,0.353099,0.932557,0.851494,0.353099
3.0,0.342744,0.497407,0.459758,0.342744
4.0,0.817116,0.301053,0.049890,0.049890
5.0,0.444922,0.769882,0.802420,0.444922


In [12]:
# Row-wise minimum with the columns selected by the slice f.x:f.z.
(
    df
    >> rowwise()
    >> mutate(m=min(c_across(f[f.x:f.z])))
)

Unnamed: 0,x,y,z,m
,<float64>,<float64>,<float64>,<float64>
0.0,0.978019,0.409827,0.494186,0.409827
1.0,0.148053,0.267015,0.727037,0.148053
2.0,0.353099,0.932557,0.851494,0.353099
3.0,0.342744,0.497407,0.459758,0.342744
4.0,0.817116,0.301053,0.049890,0.049890
5.0,0.444922,0.769882,0.802420,0.444922


In [13]:
# Minimum of x, y and z for every row via pmin(), with no rowwise() step.
(
    df
    >> mutate(m=pmin(f.x, f.y, f.z))
)

Unnamed: 0,x,y,z,m
,<float64>,<float64>,<float64>,<float64>
0.0,0.978019,0.409827,0.494186,0.409827
1.0,0.148053,0.267015,0.727037,0.148053
2.0,0.353099,0.932557,0.851494,0.353099
3.0,0.342744,0.497407,0.459758,0.342744
4.0,0.817116,0.301053,0.049890,0.049890
5.0,0.444922,0.769882,0.802420,0.444922


In [14]:
# One row per simulation: its id, and the n / mean / sd arguments for rnorm().
params = tibble(sim=[1, 2, 3], n=[1, 2, 3], mean=[1, 2, 1], sd=[1, 4, 2])

# rowwise(f.sim) keeps `sim` in the summarised result. Wrapping the rnorm()
# call in a list puts each row's draws into a single cell of `z`.
(
    params
    >> rowwise(f.sim)
    >> summarise(z=[rnorm(f.n, f.mean, f.sd)])
)

[2021-07-07 00:16:53][datar][   INFO] `summarise()` has grouped output by ['sim'] (override with `_groups` argument)


Unnamed: 0,sim,z
,<int64>,<object>
0.0,1,[0.4253793332736262]
1.0,2,"[5.685960561587633, 7.0549853098163195]"
2.0,3,"[3.2541795161080462, -0.22317530678020692, -2...."
