Better handling of the "medium" category: when it is not removed, map low/medium/high to 0/1/2.
parent
8a9595c615
commit
70232949c3
|
@ -82,11 +82,15 @@ print(model_input["target"].value_counts())
|
||||||
REMOVE_MEDIUM = True
|
REMOVE_MEDIUM = True
|
||||||
if ("medium" in model_input["target"]) and REMOVE_MEDIUM:
|
if ("medium" in model_input["target"]) and REMOVE_MEDIUM:
|
||||||
model_input = model_input[model_input["target"] != "medium"]
|
model_input = model_input[model_input["target"] != "medium"]
|
||||||
print(model_input["target"].value_counts())
|
|
||||||
|
|
||||||
model_input["target"] = (
|
model_input["target"] = (
|
||||||
model_input["target"].astype(str).apply(lambda x: 0 if x == "low" else 1)
|
model_input["target"].astype(str).apply(lambda x: 0 if x == "low" else 1)
|
||||||
)
|
)
|
||||||
|
else:
|
||||||
|
model_input["target"] = model_input["target"].map(
|
||||||
|
{"low": 0, "medium": 1, "high": 2}
|
||||||
|
)
|
||||||
|
print(model_input["target"].value_counts())
|
||||||
|
|
||||||
|
|
||||||
# %% jupyter={"outputs_hidden": false, "source_hidden": false}
|
# %% jupyter={"outputs_hidden": false, "source_hidden": false}
|
||||||
# UnderSampling
|
# UnderSampling
|
||||||
|
|
Loading…
Reference in New Issue