Switch to in-place operations for large DataFrames.
This commit is contained in:
@@ -193,20 +193,20 @@ if __name__ == "__main__":
|
|||||||
# Get the frequency, PDF and CDF for each value in the series
|
# Get the frequency, PDF and CDF for each value in the series
|
||||||
|
|
||||||
# Frequency
|
# Frequency
|
||||||
stats_df = transmission_df \
|
transmission_df \
|
||||||
.groupby("goodput")["goodput"] \
|
.groupby("goodput")["goodput"] \
|
||||||
.agg("count") \
|
.agg("count") \
|
||||||
.pipe(pd.DataFrame) \
|
.pipe(pd.DataFrame) \
|
||||||
.rename(columns={"goodput": 'frequency'}, inplace=True)
|
.rename(columns={"goodput": 'frequency'}, inplace=True)
|
||||||
|
|
||||||
# PDF
|
# PDF
|
||||||
stats_df['pdf'] = stats_df['frequency'] / sum(stats_df['frequency'])
|
transmission_df['pdf'] = transmission_df['frequency'] / sum(transmission_df['frequency'])
|
||||||
|
|
||||||
# CDF
|
# CDF
|
||||||
stats_df['cdf'] = stats_df['pdf'].cumsum()
|
transmission_df['cdf'] = transmission_df['pdf'].cumsum()
|
||||||
stats_df = stats_df.reset_index()
|
transmission_df.reset_index(inplace=True)
|
||||||
|
|
||||||
stats_df.plot(x="goodput", y=["cdf"], grid=True)
|
transmission_df.plot(x="goodput", y=["cdf"], grid=True)
|
||||||
|
|
||||||
if args.save:
|
if args.save:
|
||||||
plt.savefig("{}cdf_plot.pdf".format(args.save))
|
plt.savefig("{}cdf_plot.pdf".format(args.save))
|
||||||
|
|||||||
Reference in New Issue
Block a user