[READY] perf improvements for strftime by smarie · Pull Request #51298 · pandas-dev/pandas (original) (raw)

Expand Up

@@ -6,10 +6,10 @@

class DatetimeStrftime:

timeout = 1500

params = [1000, 10000]

param_names = ["nobs"]

params = ([1000, 10000], [False, True])

param_names = ["nobs", "tz_aware"]

def setup(self, nobs):

def setup(self, nobs, tz_aware):

d = "2018-11-29"

dt = "2018-11-26 11🔞27.0"

self.data = pd.DataFrame(

Expand All

@@ -19,37 +19,68 @@ def setup(self, nobs):

"r": [np.random.uniform()] * nobs,

}

)

if tz_aware:

self.data["dt"] = self.data["dt"].dt.tz_localize("UTC")

self.data["d"] = self.data["d"].dt.tz_localize("UTC")

self.data["i"] = self.data["dt"]

self.data.set_index("i", inplace=True)

def time_frame_date_to_str(self, nobs):

def time_frame_date_to_str(self, nobs, tz_aware):

self.data["d"].astype(str)

def time_frame_date_formatting_default(self, nobs):

def time_frame_date_formatting_default(self, nobs, tz_aware):

self.data["d"].dt.strftime(date_format=None)

def time_frame_date_formatting_default_explicit(self, nobs):

self.data["d"].dt.strftime(date_format="%Y-%m-%d")

def time_frame_date_formatting_index_to_str(self, nobs, tz_aware):

self.data.index.astype(str)

def time_frame_date_formatting_index_default(self, nobs, tz_aware):

self.data.index.strftime(date_format=None)

def time_frame_date_formatting_custom(self, nobs):

def time_frame_date_formatting_custom(self, nobs, tz_aware):

self.data["d"].dt.strftime(date_format="%Y---%m---%d")

def time_frame_datetime_to_str(self, nobs):

def time_frame_date_formatting_index_custom(self, nobs, tz_aware):

self.data.index.strftime(date_format="%Y---%m---%d")

def time_frame_datetime_to_str(self, nobs, tz_aware):

self.data["dt"].astype(str)

def time_frame_datetime_formatting_default(self, nobs):

def time_frame_datetime_formatting_default(self, nobs, tz_aware):

self.data["dt"].dt.strftime(date_format=None)

def time_frame_datetime_formatting_default_explicit_date_only(self, nobs):

def time_frame_datetime_formatting_default_explicit_date_only(self, nobs, tz_aware):

self.data["dt"].dt.strftime(date_format="%Y-%m-%d")

def time_frame_datetime_formatting_default_explicit(self, nobs):

def time_frame_datetime_formatting_default_explicit(self, nobs, tz_aware):

self.data["dt"].dt.strftime(date_format="%Y-%m-%d %H:%M:%S")

def time_frame_datetime_formatting_default_with_float(self, nobs):

def time_frame_datetime_formatting_default_with_float(self, nobs, tz_aware):

self.data["dt"].dt.strftime(date_format="%Y-%m-%d %H:%M:%S.%f")

def time_frame_datetime_formatting_custom(self, nobs):

def time_frame_datetime_formatting_index_to_str(self, nobs, tz_aware):

self.data.set_index("dt").index.astype(str)

def time_frame_datetime_formatting_index_default(self, nobs, tz_aware):

self.data.set_index("dt").index.strftime(date_format=None)

def time_frame_datetime_formatting_custom(self, nobs, tz_aware):

self.data["dt"].dt.strftime(date_format="%Y-%m-%d --- %H:%M:%S")

def time_frame_datetime_formatting_index_custom(self, nobs, tz_aware):

self.data.set_index("dt").index.strftime(date_format="%Y-%m-%d --- %H:%M:%S")

def time_frame_datetime_formatting_iso8601_map(self, nobs, tz_aware):

self.data["dt"].map(lambda timestamp: timestamp.isoformat())

def time_frame_datetime_formatting_iso8601_strftime_Z(self, nobs, tz_aware):

self.data["dt"].dt.strftime(date_format="%Y-%m-%dT%H:%M:%SZ")

def time_frame_datetime_formatting_iso8601_strftime_offset(self, nobs, tz_aware):

"""Not optimized yet as %z is not supported by `convert_strftime_format`"""

self.data["dt"].dt.strftime(date_format="%Y-%m-%dT%H:%M:%S%z")

class PeriodStrftime:

timeout = 1500

Expand All

@@ -73,6 +104,12 @@ def setup(self, nobs, freq):

def time_frame_period_to_str(self, nobs, freq):

self.data["p"].astype(str)

def time_frame_period_str(self, nobs, freq):

self.data["p"].apply(str)

def time_frame_period_repr(self, nobs, freq):

self.data["p"].apply(repr)

def time_frame_period_formatting_default(self, nobs, freq):

self.data["p"].dt.strftime(date_format=None)

Expand Down