forked from VumBleBot/odqa_baseline_code
-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathrun_retrieval.py
120 lines (89 loc) · 3.76 KB
/
run_retrieval.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
import random
from itertools import product
from collections import defaultdict
import wandb
import numpy as np
import matplotlib.pyplot as plt
from transformers import set_seed
from fuzzywuzzy import fuzz
from utils.tools import get_args, update_args
from utils.slack_api import report_retriever_to_slack
from utils.prepare import get_dataset, get_retriever
def get_topk_fig(args, topk_result):
dup = set()
colors = ["#ED5934", "#A3ED40", "#ED2867", "#11EDA4", "#C91CED"]
markers = ["8", "*", "^", "D", "X", "+"]
linestyles = ["solid", "dashed", "dashdot", "dotted"]
def get_cml():
tries = 10
while tries:
co = random.choice(colors)
mk = random.choice(markers)
li = random.choice(linestyles)
if tuple((co, mk, li)) not in dup:
return co, mk, li
dup.add(tuple((co, mk, li)))
tries -= 1
raise TimeoutError("운이 안 좋으면 일어날 수 있는 에러")
fig, ax = plt.subplots(ncols=1, nrows=1, figsize=(10, 10))
ax.set_title("Compare TOP-K", loc="left", fontsize=12, va="bottom", fontweight="semibold")
ax.spines["top"].set_visible(False)
ax.spines["right"].set_visible(False)
ax.set_ylim([0, 1])
x_pos = list(range(1, args.retriever.topk + 1))
term = args.retriever.topk // 10 if args.retriever.topk >= 10 else args.retriever.topk
x_tick = x_pos[:-1][::term] + [x_pos[-1]]
ax.set_xticks(x_tick)
for name, topk in topk_result.items():
co, mk, li = get_cml()
ax.plot(x_pos, topk, color=co, marker=mk, linestyle=li, label=name)
ax.text(
x_pos[-1] + 0.1,
topk[-1],
s=name,
fontweight="bold",
va="center",
ha="left",
bbox=dict(boxstyle="round,pad=0.3", fc=co, ec="black", alpha=0.3),
)
ax.legend(loc="lower right")
return fig
def train_retriever(args):
strategies = args.strategies
seeds = args.seeds[: args.run_cnt]
topk_result = defaultdict(list)
wandb.init(project="p-stage-3", reinit=True)
wandb.run.name = "COMPARE RETRIEVER"
for idx, (seed, strategy) in enumerate(product(seeds, strategies)):
args = update_args(args, strategy)
set_seed(seed)
datasets = get_dataset(args, is_train=True)
retriever = get_retriever(args)
valid_datasets = retriever.retrieve(datasets["validation"], topk=args.retriever.topk)
print(f"전략: {strategy} RETRIEVER: {args.model.retriever_name}")
legend_name = "_".join([strategy, args.model.retriever_name])
topk = args.retriever.topk
cur_cnt, tot_cnt = 0, len(datasets["validation"])
indexes = np.array(range(tot_cnt * topk))
print("total_cnt:", tot_cnt)
print("valid_datasets:", valid_datasets)
qc_dict = defaultdict(bool)
for idx, fancy_index in enumerate(zip([indexes[i::topk] for i in range(topk)])):
topk_dataset = valid_datasets["validation"][fancy_index[0]]
for question, real, pred in zip(
topk_dataset["question"], topk_dataset["original_context"], topk_dataset["context"]
):
# if two texts overlaps more than 65%,
if fuzz.ratio(real, pred) > 85 and not qc_dict[question]:
qc_dict[question] = True
cur_cnt += 1
topk_acc = cur_cnt / tot_cnt
topk_result[legend_name].append(topk_acc)
print(f"TOPK: {idx + 1} ACC: {topk_acc * 100:.2f}")
fig = get_topk_fig(args, topk_result)
wandb.log({"retriever topk result": wandb.Image(fig)})
if args.report is True:
report_retriever_to_slack(args, fig)
if __name__ == "__main__":
args = get_args()
train_retriever(args)