apache_beam.dataframe.frames module

apache_beam.dataframe.frames.populate_not_implemented(pd_type)[source]
class apache_beam.dataframe.frames.DeferredDataFrameOrSeries(expr)[source]

Bases: apache_beam.dataframe.frame_base.DeferredFrame

drop(labels, axis, index, columns, errors, **kwargs)[source]
droplevel(level, axis)[source]
fillna(value, method, axis, limit, **kwargs)[source]
ffill(**kwargs)[source]
bfill(**kwargs)[source]
pad(**kwargs)
backfill(**kwargs)
groupby(by, level, axis, as_index, group_keys, **kwargs)[source]
abs(**kwargs)
astype(**kwargs)
copy(**kwargs)
tz_localize(ambiguous, **kwargs)[source]
size
empty
bool()[source]
equals(other)[source]
sort_values(axis, **kwargs)[source]
sort_index(axis, **kwargs)[source]
dtype
ndim
dtypes
index
hist(**kwargs)
first(**kwargs)
last(**kwargs)
head(**kwargs)
tail(**kwargs)
classmethod wrap(expr, split_tuples=True)
class apache_beam.dataframe.frames.DeferredSeries(expr)[source]

Bases: apache_beam.dataframe.frames.DeferredDataFrameOrSeries

keys()[source]
append(to_append, ignore_index, verify_integrity, **kwargs)[source]
align(other, join, axis, level, method, **kwargs)[source]
array
rename(**kwargs)
between(**kwargs)
dot(other)[source]
std(*args, **kwargs)[source]
var(axis, skipna, level, ddof, **kwargs)[source]
corr(other, method, min_periods)[source]
cov(other, min_periods, ddof)[source]
dropna(**kwargs)[source]
items(**kwargs)
iteritems(**kwargs)
isin(**kwargs)
isnull(**kwargs)
isna(**kwargs)
notnull(**kwargs)
notna(**kwargs)
tolist(**kwargs)
to_numpy(**kwargs)
to_string(**kwargs)
aggregate(func, axis=0, *args, **kwargs)[source]
agg(func, axis=0, *args, **kwargs)
axes
clip(**kwargs)
all(*args, **kwargs)
any(*args, **kwargs)
count(*args, **kwargs)
min(*args, **kwargs)
max(*args, **kwargs)
prod(*args, **kwargs)
product(*args, **kwargs)
sum(*args, **kwargs)
mean(*args, **kwargs)
median(*args, **kwargs)
cummax(**kwargs)
cummin(**kwargs)
cumsum(**kwargs)
cumprod(**kwargs)
diff(**kwargs)
filter(**kwargs)
memory_usage(**kwargs)
nlargest(keep, **kwargs)[source]
nsmallest(keep, **kwargs)[source]
plot
pop(**kwargs)
rename_axis(**kwargs)
replace(to_replace, value, limit, method, **kwargs)[source]
round(**kwargs)
searchsorted(**kwargs)
shift(**kwargs)
take(**kwargs)
to_dict(**kwargs)
to_frame(**kwargs)
unique(as_series=False)[source]
update(other)[source]
unstack(**kwargs)
values
view(**kwargs)
str
apply(**kwargs)
map(**kwargs)
T
abs(**kwargs)
add(**kwargs)
add_prefix(**kwargs)
add_suffix(**kwargs)
and(**kwargs)
argmax(**kwargs)
argmin(**kwargs)
argsort(**kwargs)
asfreq(**kwargs)
asof(**kwargs)
astype(**kwargs)
at
at_time(**kwargs)
attrs
autocorr(**kwargs)
backfill(**kwargs)
between_time(**kwargs)
bfill(**kwargs)
bool()
cat
combine(**kwargs)
combine_first(**kwargs)
compare(**kwargs)
convert_dtypes(**kwargs)
copy(**kwargs)
describe(**kwargs)
div(**kwargs)
divide(**kwargs)
divmod(**kwargs)
drop(labels, axis, index, columns, errors, **kwargs)
drop_duplicates(**kwargs)
droplevel(level, axis)
dt
dtype
dtypes
duplicated(**kwargs)
empty
eq(**kwargs)
equals(other)
ewm(**kwargs)
expanding(**kwargs)
explode(**kwargs)
factorize(**kwargs)
ffill(**kwargs)
fillna(value, method, axis, limit, **kwargs)
first(**kwargs)
first_valid_index(**kwargs)
flags
floordiv(**kwargs)
ge(**kwargs)
get(**kwargs)
groupby(by, level, axis, as_index, group_keys, **kwargs)
gt(**kwargs)
hasnans
head(**kwargs)
hist(**kwargs)
iat
idxmax(**kwargs)
idxmin(**kwargs)
iloc
index
infer_objects(**kwargs)
interpolate(**kwargs)
is_monotonic
is_monotonic_decreasing
is_monotonic_increasing
is_unique
item(**kwargs)
kurt(**kwargs)
kurtosis(**kwargs)
last(**kwargs)
last_valid_index(**kwargs)
le(**kwargs)
loc
lt(**kwargs)
mad(**kwargs)
mask(**kwargs)
mod(**kwargs)
mode(**kwargs)
mul(**kwargs)
multiply(**kwargs)
name
nbytes
ndim
ne(**kwargs)
nunique(**kwargs)
or(**kwargs)
pad(**kwargs)
pct_change(**kwargs)
pipe(**kwargs)
pow(**kwargs)
quantile(**kwargs)
radd(**kwargs)
rand(**kwargs)
rank(**kwargs)
ravel(**kwargs)
rdiv(**kwargs)
rdivmod(**kwargs)
reindex(**kwargs)
reindex_like(**kwargs)
reorder_levels(**kwargs)
repeat(**kwargs)
resample(**kwargs)
reset_index(**kwargs)
rfloordiv(**kwargs)
rmod(**kwargs)
rmul(**kwargs)
rolling(**kwargs)
ror(**kwargs)
rpow(**kwargs)
rsub(**kwargs)
rtruediv(**kwargs)
sample(**kwargs)
sem(**kwargs)
set_axis(**kwargs)
set_flags(**kwargs)
shape
size
skew(**kwargs)
slice_shift(**kwargs)
sort_index(axis, **kwargs)
sort_values(axis, **kwargs)
sparse
squeeze(**kwargs)
sub(**kwargs)
subtract(**kwargs)
swapaxes(**kwargs)
swaplevel(**kwargs)
tail(**kwargs)
to_clipboard(**kwargs)
to_csv(**kwargs)
to_excel(**kwargs)
to_hdf(**kwargs)
to_json(**kwargs)
to_latex(**kwargs)
to_list(**kwargs)
to_markdown(**kwargs)
to_period(**kwargs)
to_pickle(**kwargs)
to_sql(**kwargs)
to_timestamp(**kwargs)
to_xarray(**kwargs)
transform(**kwargs)
transpose(**kwargs)
truediv(**kwargs)
truncate(**kwargs)
tshift(**kwargs)
tz_convert(**kwargs)
tz_localize(ambiguous, **kwargs)
value_counts(**kwargs)
where(**kwargs)
classmethod wrap(expr, split_tuples=True)
xs(**kwargs)
class apache_beam.dataframe.frames.DeferredDataFrame(expr)[source]

Bases: apache_beam.dataframe.frames.DeferredDataFrameOrSeries

T
columns
keys()[source]
align(other, join, axis, copy, level, method, **kwargs)[source]
append(other, ignore_index, verify_integrity, sort, **kwargs)[source]
set_index(keys, **kwargs)[source]
loc
iloc
axes
dtypes
assign(**kwargs)[source]
explode(column, ignore_index)[source]
aggregate(func, axis=0, *args, **kwargs)[source]
agg(func, axis=0, *args, **kwargs)
applymap(**kwargs)
memory_usage(**kwargs)
info(**kwargs)
clip(**kwargs)
corr(method, min_periods)[source]
cov(min_periods, ddof)[source]
corrwith(other, axis, drop, method)[source]
cummax(**kwargs)
cummin(**kwargs)
cumsum(**kwargs)
cumprod(**kwargs)
diff(**kwargs)
dot(other)[source]
mode(axis=0, *args, **kwargs)[source]
dropna(axis, **kwargs)[source]
eval(expr, inplace, **kwargs)[source]
query(expr, inplace, **kwargs)[source]
isnull(**kwargs)
isna(**kwargs)
notnull(**kwargs)
notna(**kwargs)
items(**kwargs)
itertuples(**kwargs)
iterrows(**kwargs)
iteritems(**kwargs)
join(other, on, **kwargs)[source]
merge(right, on, left_on, right_on, left_index, right_index, suffixes, **kwargs)[source]
nlargest(keep, **kwargs)[source]
nsmallest(keep, **kwargs)[source]
nunique(**kwargs)[source]
plot
pop(item)[source]
quantile(axis, **kwargs)[source]
rename(**kwargs)[source]
rename_axis(**kwargs)
replace(limit, **kwargs)[source]
reset_index(level=None, **kwargs)[source]
round(decimals, *args, **kwargs)[source]
select_dtypes(**kwargs)
shift(axis, **kwargs)[source]
shape
stack(**kwargs)
all(*args, **kwargs)
any(*args, **kwargs)
count(*args, **kwargs)
max(*args, **kwargs)
min(*args, **kwargs)
prod(*args, **kwargs)
product(*args, **kwargs)
sum(*args, **kwargs)
mean(*args, **kwargs)
median(*args, **kwargs)
take(**kwargs)
to_records(**kwargs)
to_dict(**kwargs)
to_numpy(**kwargs)
to_string(**kwargs)
to_sparse(**kwargs)
transpose(**kwargs)
unstack(*args, **kwargs)[source]
update(**kwargs)
values
abs(**kwargs)
add(**kwargs)
add_prefix(**kwargs)
add_suffix(**kwargs)
and(**kwargs)
apply(**kwargs)
asfreq(**kwargs)
asof(**kwargs)
astype(**kwargs)
at
at_time(**kwargs)
attrs
backfill(**kwargs)
between_time(**kwargs)
bfill(**kwargs)
bool()
boxplot(**kwargs)
combine(**kwargs)
combine_first(**kwargs)
compare(**kwargs)
convert_dtypes(**kwargs)
copy(**kwargs)
describe(**kwargs)
div(**kwargs)
divide(**kwargs)
divmod(**kwargs)
drop(labels, axis, index, columns, errors, **kwargs)
drop_duplicates(**kwargs)
droplevel(level, axis)
dtype
duplicated(**kwargs)
empty
eq(**kwargs)
equals(other)
ewm(**kwargs)
expanding(**kwargs)
ffill(**kwargs)
fillna(value, method, axis, limit, **kwargs)
filter(**kwargs)
first(**kwargs)
first_valid_index(**kwargs)
flags
floordiv(**kwargs)
from_dict(**kwargs)
from_records(**kwargs)
ge(**kwargs)
get(**kwargs)
groupby(by, level, axis, as_index, group_keys, **kwargs)
gt(**kwargs)
head(**kwargs)
hist(**kwargs)
iat
idxmax(**kwargs)
idxmin(**kwargs)
index
infer_objects(**kwargs)
insert(**kwargs)
interpolate(**kwargs)
isin(**kwargs)
kurt(**kwargs)
kurtosis(**kwargs)
last(**kwargs)
last_valid_index(**kwargs)
le(**kwargs)
lookup(**kwargs)
lt(**kwargs)
mad(**kwargs)
mask(**kwargs)
melt(**kwargs)
mod(**kwargs)
mul(**kwargs)
multiply(**kwargs)
ndim
ne(**kwargs)
or(**kwargs)
pad(**kwargs)
pct_change(**kwargs)
pipe(**kwargs)
pivot(**kwargs)
pivot_table(**kwargs)
pow(**kwargs)
radd(**kwargs)
rand(**kwargs)
rank(**kwargs)
rdiv(**kwargs)
rdivmod(**kwargs)
reindex(**kwargs)
reindex_like(**kwargs)
reorder_levels(**kwargs)
resample(**kwargs)
rfloordiv(**kwargs)
rmod(**kwargs)
rmul(**kwargs)
rolling(**kwargs)
ror(**kwargs)
rpow(**kwargs)
rsub(**kwargs)
rtruediv(**kwargs)
sample(**kwargs)
sem(**kwargs)
set_axis(**kwargs)
set_flags(**kwargs)
size
skew(**kwargs)
slice_shift(**kwargs)
sort_index(axis, **kwargs)
sort_values(axis, **kwargs)
sparse
squeeze(**kwargs)
std(**kwargs)
style
sub(**kwargs)
subtract(**kwargs)
swapaxes(**kwargs)
swaplevel(**kwargs)
tail(**kwargs)
to_clipboard(**kwargs)
to_csv(path, *args, **kwargs)
to_excel(path, *args, **kwargs)
to_feather(path, *args, **kwargs)
to_gbq(**kwargs)
to_hdf(**kwargs)
to_html(path, *args, **kwargs)
to_json(path, orient=None, *args, **kwargs)
to_latex(**kwargs)
to_markdown(**kwargs)
to_msgpack(**kwargs)
to_parquet(path, *args, **kwargs)
to_period(**kwargs)
to_pickle(**kwargs)
to_sql(**kwargs)
to_stata(path, *args, **kwargs)
to_timestamp(**kwargs)
to_xarray(**kwargs)
transform(**kwargs)
truediv(**kwargs)
truncate(**kwargs)
tshift(**kwargs)
tz_convert(**kwargs)
tz_localize(ambiguous, **kwargs)
value_counts(**kwargs)
var(**kwargs)
where(**kwargs)
classmethod wrap(expr, split_tuples=True)
xs(**kwargs)
class apache_beam.dataframe.frames.DeferredGroupBy(expr, kwargs, ungrouped: apache_beam.dataframe.expressions.Expression, ungrouped_with_index: apache_beam.dataframe.expressions.Expression, grouping_columns, grouping_indexes, projection=None)[source]

Bases: apache_beam.dataframe.frame_base.DeferredFrame

This object represents the result of:

ungrouped.groupby(level=[grouping_indexes + grouping_columns],
                  **kwargs)[projection]
Parameters:
  • expr – An expression to compute a pandas GroupBy object. Convenient for unliftable aggregations.
  • ungrouped – An expression to compute the DataFrame pre-grouping; the (Multi)Index contains only the grouping columns/indexes.
  • ungrouped_with_index – Same as ungrouped, except the index includes all of the original indexes as well as any grouping columns. This is important for operations that expose the original index, e.g. .apply(), but we only use it when necessary to avoid unnecessary data transfer and GBKs.
  • grouping_columns – list of column labels that were in the original groupby(..) by parameter. Only relevant for grouped DataFrames.
  • grouping_indexes – list of index names (or index level numbers) to be grouped.
  • kwargs – Keyword arguments passed to the original groupby(..) call.
agg(fn)[source]
apply(fn, *args, **kwargs)[source]
aggregate(fn)
hist(**kwargs)
plot(**kwargs)
first(**kwargs)
last(**kwargs)
head(**kwargs)
tail(**kwargs)
nth(**kwargs)
cumcount(**kwargs)
cummax(**kwargs)
cummin(**kwargs)
cumsum(**kwargs)
cumprod(**kwargs)
groups
all(*args, **kwargs)
any(*args, **kwargs)
backfill(**kwargs)
bfill(**kwargs)
boxplot(**kwargs)
corr
corrwith
count(*args, **kwargs)
cov
describe(**kwargs)
diff
dtypes
ewm(**kwargs)
expanding(**kwargs)
ffill(**kwargs)
fillna
filter(**kwargs)
get_group(**kwargs)
idxmax(**kwargs)
idxmin(**kwargs)
indices
mad
max(*args, **kwargs)
mean(*args, **kwargs)
median(*args, **kwargs)
min(*args, **kwargs)
ngroup(**kwargs)
ngroups
nunique(**kwargs)
ohlc(**kwargs)
pad(**kwargs)
pct_change(**kwargs)
pipe(**kwargs)
prod(*args, **kwargs)
quantile(**kwargs)
rank(**kwargs)
resample(**kwargs)
rolling(**kwargs)
sample(**kwargs)
sem(**kwargs)
shift(**kwargs)
size(*args, **kwargs)
skew
std(*args, **kwargs)
sum(*args, **kwargs)
take
transform(**kwargs)
tshift
var(*args, **kwargs)
classmethod wrap(expr, split_tuples=True)
apache_beam.dataframe.frames.make_str_func(method)[source]