# test.py
# Evaluation script: runs a trained model on the test split and logs
# accuracy, F1 and AUROC.
import torch
from tqdm import tqdm
from randomGuess import random_guess_baseline
from sklearn.metrics import f1_score, accuracy_score
import torchmetrics
import parse_arg
import logging
from datetime import datetime
from utils import setup_logging
# from utils import setup_logging
from models.model_utils import get_models
import sys
# Run-level setup, executed at import time. `args`, `time` and
# `output_folder` are module-level names and are kept as such.
args = parse_arg.parse_arguments()

# Timestamp of this run; it names the per-run output directory.
time = datetime.now().strftime("%Y-%m-%d_%H-%M-%S")
output_folder = "{}/{}".format(args.save_dir, time)

# NOTE(review): setup_logging is commented out, so unless logging is
# configured elsewhere the root logger keeps its default WARNING level and
# the INFO records below are dropped.
# setup_logging(output_folder=output_folder, console_level="info", debug_filename="info.log")

# Record how the script was invoked and where its outputs go.
for _startup_message in (
    " ".join(sys.argv),
    f"Arguments: {args}",
    f"The testing outputs are being saved in {output_folder}",
):
    logging.info(_startup_message)
def test(model, model_type, data):
    """Evaluate ``model`` on the test split of ``data`` and log the metrics.

    The model and the inputs it needs are moved to CUDA when available
    (otherwise CPU), one forward pass is run without gradients, and accuracy,
    macro/micro F1 and multiclass AUROC are computed on the nodes selected by
    ``data.test_mask``. The result of ``random_guess_baseline`` is logged
    alongside for comparison.

    Args:
        model: Module to evaluate. It is moved to the evaluation device for
            the forward pass and back to the CPU before returning.
        model_type: Model family name. ``"hgnn"`` and ``"hgnnp"`` are called
            as ``model(data.node_features, data.hg)``; any other value is
            called as ``model(data)``.
        data: Dataset object providing ``node_features``, ``y`` and
            ``test_mask`` (plus ``hg`` for the hypergraph models).
            ``data.node_features`` (and ``data.hg`` for the hypergraph
            models) are reassigned to their on-device copies, so the object
            is modified in place.

    Returns:
        Tuple ``(test_acc, test_f1, micro_f1, auc_score)``: accuracy, macro
        F1 and micro F1 from scikit-learn, and the value returned by the
        torchmetrics AUROC ``compute()`` call (not converted to a Python
        float, so existing callers keep receiving the same type).
    """
    device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
    is_hypergraph = model_type in ("hgnn", "hgnnp")

    model = model.to(device)
    data.node_features = data.node_features.to(device)
    if is_hypergraph:
        data.hg = data.hg.to(device)

    # Single forward pass over the whole graph; the test nodes are selected
    # afterwards with data.test_mask.
    model.eval()
    with torch.no_grad():
        if is_hypergraph:
            out = model(data.node_features, data.hg)
        else:
            out = model(data)
        pred = torch.softmax(out, dim=1)
    logging.info(f"Shape and dim of pred: {pred.shape}, {pred.dim()}")

    # reshape(-1) instead of squeeze(): squeeze() would collapse a test split
    # containing a single node to a 0-dim tensor, which the metrics reject.
    target = data.y[data.test_mask].reshape(-1).long().to(device)
    logging.info(f"Shape and dim of target: {target.shape}, {target.dim()}")

    test_pred = pred[data.test_mask]
    y_true = target.cpu().numpy()
    # Vectorised arg-max over the class axis (replaces a per-row Python loop).
    y_pred = test_pred.cpu().numpy().argmax(axis=1)

    # Take the class count from the model output instead of hard-coding it,
    # so the metric matches whatever number of classes the model predicts.
    num_classes = pred.shape[1]
    auroc = torchmetrics.AUROC(num_classes=num_classes, task="multiclass").to(device)
    auroc.update(test_pred, target)
    auc_score = auroc.compute()

    micro_f1 = f1_score(y_true, y_pred, average="micro")
    test_f1 = f1_score(y_true, y_pred, average="macro")
    test_acc = accuracy_score(y_true, y_pred)

    rand_acc, rand_f1_micro, rand_auc, rand_f1 = random_guess_baseline(y_true)
    # NOTE(review): the "Precision"/"Recall" labels below do not match the
    # variable names (rand_f1_micro, rand_auc). Confirm the return order of
    # random_guess_baseline and fix whichever side is wrong.
    logging.info(
        "Random Guess Metrics\n"
        f"Accuracy: {rand_acc:.4f},\n"
        f"Precision: {rand_f1_micro:.4f},\n"
        f"Recall: {rand_auc:.4f},\n"
        f"F1 Score: {rand_f1:.4f}\n"
    )
    logging.info(
        f"Test Accuracy: {test_acc:.4f},\n"
        f"Test F1 Score (Macro): {test_f1:.4f},\n"
        f"Test Micro F1 Score: {micro_f1:.4f},\n"
        f"Test AUC Score: {auc_score:.4f}"
    )

    # Move the model off the accelerator and release cached CUDA memory.
    model = model.to("cpu")
    torch.cuda.empty_cache()
    return test_acc, test_f1, micro_f1, auc_score
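# NOTE: disabled entry point. The call below passes `model_path`, which does
# not match the signature `test(model, model_type, data)`; update it before
# re-enabling.
# if __name__ == "__main__":
#     args = parse_arg.parse_arguments()
#     test(model_path=args.test_model_path)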