xlm-roberta-large / src /utils /combine_preds_3cls.py
shayekh's picture
Upload 61 files
cc9c7ee
raw
history blame
2.11 kB
import os
import argparse
from omegaconf import OmegaConf
def binary_intersection(lst1, lst2):
    """Return the distinct values that occur in both ``lst1`` and ``lst2``.

    Args:
        lst1: First collection of hashable values.
        lst2: Second collection of hashable values.

    Returns:
        A list containing each common value exactly once. The order is
        whatever set iteration yields and must not be relied upon.
    """
    # A set intersection avoids rescanning lst2 for every element of lst1.
    return list(set(lst1).intersection(lst2))
def binary_union(lst1, lst2):
    """Return the distinct values found in either ``lst1`` or ``lst2``.

    The two lists are concatenated and de-duplicated through a set, so the
    order of the returned list is not specified.
    """
    merged = lst1 + lst2
    distinct = set(merged)
    return list(distinct)
def _combine_column(files, mode, column):
    """Merge one tab-separated column across several prediction files.

    Each non-blank line is split on tabs. Field 0 is parsed as an integer
    id and field ``column`` is evaluated as a Python expression (expected to
    be a list). Values that share an id, whether across files or within
    one file, are merged pairwise in the order they are read.

    Args:
        files: Iterable of paths to the files to read.
        mode: ``"union"`` merges with ``binary_union``; any other value
            merges with ``binary_intersection``.
        column: Zero-based index of the tab-separated field to merge.

    Returns:
        A dict mapping each integer id to its merged list of values.
    """
    merge = binary_union if mode == "union" else binary_intersection
    combined = {}
    for path in files:
        with open(path, "r") as handle:
            for line in handle:
                # A blank line (e.g. a stray newline at the end of the
                # file) carries no record and would make int() fail.
                if not line.strip():
                    continue
                fields = line.split("\t")
                key = int(fields[0])
                # NOTE(review): eval() executes arbitrary code found in the
                # input files. If they only ever hold list literals,
                # ast.literal_eval would be a safer drop-in -- confirm the
                # file format before switching.
                values = eval(fields[column])
                if key in combined:
                    combined[key] = merge(combined[key], values)
                else:
                    combined[key] = values
    return combined


def combine(files, type="union"):
    """Merge the second tab-separated field (index 1) of every file by id.

    Args:
        files: Iterable of paths to the files to read.
        type: ``"union"`` to keep values seen in any file; any other value
            keeps only the values common to all occurrences of an id.

    Returns:
        A dict mapping each integer id to its merged list of values.
    """
    return _combine_column(files, type, 1)


def combine_I(files, type="union"):
    """Merge the third tab-separated field (index 2) of every file by id.

    Args:
        files: Iterable of paths to the files to read.
        type: ``"union"`` to keep values seen in any file; any other value
            keeps only the values common to all occurrences of an id.

    Returns:
        A dict mapping each integer id to its merged list of values.
    """
    return _combine_column(files, type, 2)
def write_dict_to_file(text, text_I, path):
    """Write the two merged mappings to ``path`` as tab-separated lines.

    One line is written per key of ``text``, in the dict's iteration order:
    the key, ``str()`` of its value in ``text``, and ``str()`` of the value
    stored under the same key in ``text_I``. Every line, including the last
    one, ends with a newline.

    Args:
        text: Mapping from id to the values for the second column.
        text_I: Mapping from id to the values for the third column; it
            must contain every key of ``text``.
        path: Destination file; overwritten if it already exists.
    """
    with open(path, "w") as out:
        for key, spans in text.items():
            out.write(f"{key}\t{spans!s}\t{text_I[key]!s}\n")
if __name__ == "__main__":
    # Command-line entry point: load a config that names the input files,
    # the merge type and the output path, merge both value columns, and
    # write the result.
    parser = argparse.ArgumentParser(
        prog="combine_preds.py", description="Combine span predictions."
    )
    parser.add_argument(
        "--config",
        type=str,
        action="store",
        # The script cannot do anything without a configuration file, so
        # let argparse report a missing one with a usage message.
        required=True,
        help="The configuration for combining predictions.",
    )
    args = parser.parse_args()

    combine_config = OmegaConf.load(args.config)
    text = combine(combine_config.files, combine_config.type)
    text_I = combine_I(combine_config.files, combine_config.type)

    # A bare filename has no directory component; os.makedirs("") would
    # raise, so only create the parent directory when there is one.
    out_dir = os.path.dirname(combine_config.path)
    if out_dir:
        os.makedirs(out_dir, exist_ok=True)

    write_dict_to_file(text, text_I, combine_config.path)