Switch to in-place operations for large DataFrames.

This commit is contained in:
2023-01-11 09:44:57 +01:00
parent a72552d373
commit 53d89bad05

View File

@@ -193,20 +193,20 @@ if __name__ == "__main__":
# Get the frequency, PDF and CDF for each distinct goodput value and plot
# the CDF.
#
# The aggregation below yields a new table with one row per distinct goodput
# value, so it is kept in its own variable (stats_df) rather than written
# back onto transmission_df: nothing in this section adds a 'frequency'
# column to transmission_df, and the per-value results do not line up with
# its rows.
#
# `inplace=True` is deliberately not used at the end of the chain: in-place
# pandas methods return None, which would throw the aggregated result away.
# Frequency
stats_df = (
    transmission_df
    .groupby("goodput")["goodput"]
    .agg("count")
    .pipe(pd.DataFrame)
    .rename(columns={"goodput": "frequency"})
)
# PDF: relative frequency of each goodput value (vectorised sum instead of
# the Python-level builtin sum()).
stats_df["pdf"] = stats_df["frequency"] / stats_df["frequency"].sum()
# CDF: running total of the PDF; groupby sorts the keys by default, so the
# accumulation follows ascending goodput.
stats_df["cdf"] = stats_df["pdf"].cumsum()
# Turn the "goodput" index into a regular column so it can serve as x-axis.
stats_df = stats_df.reset_index()
stats_df.plot(x="goodput", y=["cdf"], grid=True)
if args.save:
    plt.savefig("{}cdf_plot.pdf".format(args.save))