Created
November 4, 2022 16:51
-
-
Save Polaris000/e6f6a18fed69cdc49f914dc38631242d to your computer and use it in GitHub Desktop.
Revisions
-
Polaris000 created this gist
Nov 4, 2022 .There are no files selected for viewing
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters. Learn more about bidirectional Unicode charactersOriginal file line number Diff line number Diff line change @@ -0,0 +1,36 @@ def auc_recall_at_k_np(y_true, y_conf): """ Experiment #2: -------------- Compute AUC under the Recall@k curve using numpy's functions. y_true: A numpy array of expected predictions y_conf: A numpy array of the model's confidence scores for each datapoint Returns: AUC-Recall@k (float) """ # if there are no positive targets (good leads), # auc becomes invalid if y_true.count(1) == 0: return np.nan conf_df = pd.DataFrame() conf_df["conf"] = y_conf conf_df["expected"] = y_true conf_df.columns = ["conf", "expected"] conf_df = conf_df.sort_values("conf", ascending=False) ranking = conf_df["expected"].to_numpy() recall_at_k = (ranking == 1).cumsum() / (ranking == 1).sum() # calculating ideal recall@k ideal_recall_at_k = np.minimum( np.ones(len(ranking)), np.array(list(range(1, len(ranking) + 1)))/ (ranking == 1).sum() ) return np.trapz(recall_at_k) / np.trapz(ideal_recall_at_k)