[READY] perf improvements for strftime by smarie · Pull Request #51298 · pandas-dev/pandas (original) (raw)
@@ -6,10 +6,10 @@
class DatetimeStrftime:
timeout = 1500
params = [1000, 10000]
param_names = ["nobs"]
params = ([1000, 10000], [False, True])
param_names = ["nobs", "tz_aware"]
def setup(self, nobs):
def setup(self, nobs, tz_aware):
d = "2018-11-29"
dt = "2018-11-26 11🔞27.0"
self.data = pd.DataFrame(
@@ -19,37 +19,68 @@ def setup(self, nobs):
"r": [np.random.uniform()] * nobs,
}
)
if tz_aware:
self.data["dt"] = self.data["dt"].dt.tz_localize("UTC")
self.data["d"] = self.data["d"].dt.tz_localize("UTC")
self.data["i"] = self.data["dt"]
self.data.set_index("i", inplace=True)
def time_frame_date_to_str(self, nobs):
def time_frame_date_to_str(self, nobs, tz_aware):
self.data["d"].astype(str)
def time_frame_date_formatting_default(self, nobs):
def time_frame_date_formatting_default(self, nobs, tz_aware):
self.data["d"].dt.strftime(date_format=None)
def time_frame_date_formatting_default_explicit(self, nobs):
self.data["d"].dt.strftime(date_format="%Y-%m-%d")
def time_frame_date_formatting_index_to_str(self, nobs, tz_aware):
self.data.index.astype(str)
def time_frame_date_formatting_index_default(self, nobs, tz_aware):
self.data.index.strftime(date_format=None)
def time_frame_date_formatting_custom(self, nobs):
def time_frame_date_formatting_custom(self, nobs, tz_aware):
self.data["d"].dt.strftime(date_format="%Y---%m---%d")
def time_frame_datetime_to_str(self, nobs):
def time_frame_date_formatting_index_custom(self, nobs, tz_aware):
self.data.index.strftime(date_format="%Y---%m---%d")
def time_frame_datetime_to_str(self, nobs, tz_aware):
self.data["dt"].astype(str)
def time_frame_datetime_formatting_default(self, nobs):
def time_frame_datetime_formatting_default(self, nobs, tz_aware):
self.data["dt"].dt.strftime(date_format=None)
def time_frame_datetime_formatting_default_explicit_date_only(self, nobs):
def time_frame_datetime_formatting_default_explicit_date_only(self, nobs, tz_aware):
self.data["dt"].dt.strftime(date_format="%Y-%m-%d")
def time_frame_datetime_formatting_default_explicit(self, nobs):
def time_frame_datetime_formatting_default_explicit(self, nobs, tz_aware):
self.data["dt"].dt.strftime(date_format="%Y-%m-%d %H:%M:%S")
def time_frame_datetime_formatting_default_with_float(self, nobs):
def time_frame_datetime_formatting_default_with_float(self, nobs, tz_aware):
self.data["dt"].dt.strftime(date_format="%Y-%m-%d %H:%M:%S.%f")
def time_frame_datetime_formatting_custom(self, nobs):
def time_frame_datetime_formatting_index_to_str(self, nobs, tz_aware):
self.data.set_index("dt").index.astype(str)
def time_frame_datetime_formatting_index_default(self, nobs, tz_aware):
self.data.set_index("dt").index.strftime(date_format=None)
def time_frame_datetime_formatting_custom(self, nobs, tz_aware):
self.data["dt"].dt.strftime(date_format="%Y-%m-%d --- %H:%M:%S")
def time_frame_datetime_formatting_index_custom(self, nobs, tz_aware):
self.data.set_index("dt").index.strftime(date_format="%Y-%m-%d --- %H:%M:%S")
def time_frame_datetime_formatting_iso8601_map(self, nobs, tz_aware):
self.data["dt"].map(lambda timestamp: timestamp.isoformat())
def time_frame_datetime_formatting_iso8601_strftime_Z(self, nobs, tz_aware):
self.data["dt"].dt.strftime(date_format="%Y-%m-%dT%H:%M:%SZ")
def time_frame_datetime_formatting_iso8601_strftime_offset(self, nobs, tz_aware):
"""Not optimized yet as %z is not supported by `convert_strftime_format`"""
self.data["dt"].dt.strftime(date_format="%Y-%m-%dT%H:%M:%S%z")
class PeriodStrftime:
timeout = 1500
@@ -73,6 +104,12 @@ def setup(self, nobs, freq):
def time_frame_period_to_str(self, nobs, freq):
self.data["p"].astype(str)
def time_frame_period_str(self, nobs, freq):
self.data["p"].apply(str)
def time_frame_period_repr(self, nobs, freq):
self.data["p"].apply(repr)
def time_frame_period_formatting_default(self, nobs, freq):
self.data["p"].dt.strftime(date_format=None)