Skip to content

Commit

Permalink
fix: fix variable name inconsistency.
Browse files Browse the repository at this point in the history
  • Loading branch information
Aiko committed Jan 12, 2024
1 parent f13f6b0 commit 46605dc
Show file tree
Hide file tree
Showing 2 changed files with 16 additions and 9 deletions.
Original file line number Diff line number Diff line change
Expand Up @@ -12,7 +12,7 @@ class Command(BaseCommand):
def __init__(self):
self.detection = SpamDetector()
self.processor = self.detection.processor
self.user_meta_classifier = self.detection.user_metadata_classifier
self.user_meta_classifier = self.detection.usermeta_classifier
self.text_classifier = self.detection.text_classifier

def add_arguments(self, parser):
Expand Down
23 changes: 15 additions & 8 deletions django/curator/spam_classifiers.py
Original file line number Diff line number Diff line change
Expand Up @@ -176,6 +176,7 @@ def __init__(self):

def fit(self):
print("Training TextSpamClassifier...")
model_metrics = None
model = Pipeline(
[
("cleaner", FunctionTransformer(self.preprocess)),
Expand All @@ -187,15 +188,15 @@ def fit(self):
all_df = self.processor.get_all_users_df()

if all_df.empty:
return None
return model_metrics # = None

data_x, data_y = self.concat_pd(all_df)
if data_x.empty:
return None
return model_metrics # = None

if len(data_y.value_counts()) != 2:
print("Cannot create a binary classifier!!")
return None
return model_metrics # = None

(
train_x,
Expand All @@ -218,14 +219,16 @@ def fit(self):

def predict(self):
print("TextSpamClassifier is making predictions...")
evaluated_user_ids = []
spam_user_ids = []
df = self.processor.get_unlabelled_by_curator_df()
if df.empty: # no-op if no data found
return []
return evaluated_user_ids, spam_user_ids

model = self.load_model(self.MODEL_FILE_PATH)
data_x, data_y = self.concat_pd(df)
if data_x.empty:
return []
return evaluated_user_ids, spam_user_ids

predictions, confidences = self.get_predictions(model, data_x["text"])

Expand Down Expand Up @@ -282,6 +285,7 @@ def __init__(self):

def fit(self):
print("Training UserMetadataSpamClassifier...")
model_metrics = None
model = Pipeline(
[
("cleaner", FunctionTransformer(self.preprocess)),
Expand All @@ -292,11 +296,11 @@ def fit(self):
# obtain df from pipleline
df = self.processor.get_all_users_df()
if df.empty:
return None # if no untrained data found
return model_metrics # None if no untrained data found

if len(df["labelled_by_curator"].value_counts()) != 2:
print("Cannot create a binary classifier!!")
return None
return model_metrics

feats, targets = self.__input_df_transformation(df)
(
Expand All @@ -321,9 +325,11 @@ def fit(self):

def predict(self):
print("UserMetadataSpamClassifier is making predictions...")
evaluated_user_ids = []
spam_user_ids = []
df = self.processor.get_unlabelled_by_curator_df()
if df.empty: # no-op if no data found
return []
return evaluated_user_ids, spam_user_ids

model = self.load_model(self.MODEL_FILE_PATH)

Expand Down Expand Up @@ -396,6 +402,7 @@ def __input_df_transformation(self, df: pd.DataFrame):
].fillna(
""
)

df.loc[:, ["user_id", "labelled_by_curator"]] = df[
["user_id", "labelled_by_curator"]
].fillna(0)
Expand Down

0 comments on commit 46605dc

Please sign in to comment.