"""Run ``process_sample`` over a loaded dataset and write a parquet submission.

The dataset is obtained from ``load_hoho_dataset(testing=True)``; every sample
of every subset is passed to ``process_sample`` and the collected results are
saved to ``submission.parquet`` in the current working directory.
"""

import gc

import pandas as pd
from tqdm import tqdm

from dataset import load_hoho_dataset
from process_sample import process_sample

# A garbage-collection pass is forced each time this many samples have been
# processed (counted across all subsets, not per subset).
GC_INTERVAL = 10


def main():
    """Predict every sample of every subset and save the results as parquet."""
    dataset = load_hoho_dataset(testing=True)

    # One entry per processed sample. Each entry is handed to pandas as a row
    # for the three submission columns below, so process_sample is presumably
    # returning (order_id, wf_vertices, wf_edges) -- confirm against its
    # definition.
    solution = []

    for subset_name in dataset.keys():
        print(f"Predicting {subset_name}")
        for sample in tqdm(dataset[subset_name]):
            solution.append(process_sample(sample))

            # Exactly one result is appended per sample, so len(solution) is
            # the running sample count across all subsets.
            if len(solution) % GC_INTERVAL == 0:
                gc.collect()

    print("------------ Saving results ---------------")
    sub = pd.DataFrame(solution, columns=["order_id", "wf_vertices", "wf_edges"])
    sub.to_parquet("submission.parquet")
    print("------------ Done ------------ ")


if __name__ == "__main__":
    main()