"""Inference entry point: score audio clips from the evaluation dataset as
synthetic ("generated") vs. real ("pristine") and write submission.csv.

Thread-count environment variables are pinned *before* any numeric library is
imported, because BLAS/OpenMP back ends read them at import time.
"""
import io
import os
import time

# Limit every numeric backend to a single thread. Must happen before the
# torch/numpy imports below, which read these variables at import time.
os.environ['OMP_NUM_THREADS'] = '1'
os.environ['OPENBLAS_NUM_THREADS'] = '1'
os.environ['MKL_NUM_THREADS'] = '1'
os.environ['NUMEXPR_NUM_THREADS'] = '1'

from glob import glob

import numpy as np
import pandas as pd
import torch
import tqdm.auto as tqdm
from datasets import load_dataset

from models import Model
from preprocess import preprocess, preprocess_FS
from src.rawnet_model import RawNet
from src.lcnn_model import LCNN
from src.resnet_model import ResNet_LogSpec, ResNet_MelSpec
from src.moe_model import UltimateMOE, MOE_attention, MOE_attention_FS

# Import your model and anything else you want. You can even install other
# packages included in your repo. However, during the evaluation the container
# will not have access to the internet, so you must include everything you need
# in your model repo; common Python libraries will be installed. Feel free to
# contact us to add dependencies to the requirements.txt.
# For testing, this is the docker image that will be used:
#   https://github.com/huggingface/competitions/blob/main/Dockerfile
# It can be pulled here: https://hub.docker.com/r/huggingface/competitions/tags
# Load the dataset. It is automatically downloaded to /tmp/data during
# evaluation; streaming avoids materialising the whole split up front.
print('Load Dataset')

# Local-testing variant (reads raw files instead of the hub dataset):
# DATASET_PATH = "/tmp/data_test"
# dataset_remote = glob(os.path.join(DATASET_PATH, '*'))

DATASET_PATH = "/tmp/data"
dataset_remote = load_dataset(DATASET_PATH, split="test", streaming=True)

# Evaluation runs on GPU; flip to "cpu" for local debugging.
device = "cuda:0"
# device = "cpu"
print('Define Model')

# Active configuration: mixture-of-experts over three spectral front ends.
# Each expert returns embeddings (return_emb=True); MOE_attention fuses them.
expert_1 = LCNN(return_emb=True, fs=24000)
expert_2 = ResNet_LogSpec(return_emb=True, sample_rate=24000)
expert_3 = ResNet_MelSpec(return_emb=True, sample_rate=24000)
model = MOE_attention(experts=[expert_1, expert_2, expert_3], device=device)
model_path = './checkpoints/MOE_TRANSF_3EXP_MODELS_AUG.pth'

# --- Alternative configurations, kept for reference -------------------------
# RAWNET2:
# config = {
#     "first_conv": 1024, "in_channels": 1, "filts": [20, [20, 20], [20, 128], [128, 128]],
#     "blocks": [2, 4], "nb_fc_node": 1024, "gru_node": 1024, "nb_gru_layer": 3, "nb_classes": 2
# }
# model = RawNet(config, device).to(device)
# model_path = './checkpoints/RAWNET_ASVSPOOF_FOR_INTHEWILD_PURDUE.pth'
#
# RESNET:
# model = ResNet_LogSpec(sample_rate=24000, return_emb=False).to(device)
# model_path = './checkpoints/RESNET_LOGSPEC_ALL_DATA_FS_24000.pth'
# model = ResNet_MelSpec(sample_rate=24000, return_emb=False).to(device)
# model_path = './checkpoints/RESNET_MELSPEC_ALL_DATA_FS_24000.pth'
#
# LCNN (pick one checkpoint):
# model = LCNN(return_emb=False, fs=24000).to(device)
# model_path = './checkpoints/LCNN_ASVSPOOF_FOR_INTHEWILD_PURDUE.pth'
# model_path = './checkpoints/LCNN_ALL_DATA.pth'
# model_path = './checkpoints/LCNN_ALL_DATA_AUG.pth'
# model_path = './checkpoints/LCNN_ALL_DATA_TTS_AUG.pth'
# model_path = './checkpoints/LCNN_ALL_DATA_TTS_MOD.pth'
# model_path = './checkpoints/LCNN_ALL_DATA_HI_FREQ_22050.pth'
# model_path = './checkpoints/LCNN_ALL_DATA_FS_16000.pth'
# model_path = './checkpoints/LCNN_ALL_DATA_FS_22050.pth'
# model_path = './checkpoints/LCNN_ALL_DATA_FS_24000.pth'
# model.load_state_dict(torch.load(model_path, map_location=device))
#
# MOE over per-sample-rate LCNN experts:
# expert_1 = LCNN(return_emb=True, fs=16000).to(device)
# expert_2 = LCNN(return_emb=True, fs=22050).to(device)
# expert_3 = LCNN(return_emb=True, fs=24000).to(device)
# model = MOE_attention_FS(experts=[expert_1, expert_2, expert_3], device=device)
# model_path = './checkpoints/MOE_TRANSF_3EXP_FS_AUG_NO_FREEZE.pth'
#
# Larger ensembles (6/7/8 LCNN experts, optionally frozen) and UltimateMOE
# were also tried; their checkpoints: MOE_ULTIMATE.pth, MOE_ATTENTION.pth,
# MOE_TRANSF.pth, MOE_TRANSF_7EXP[_AUG][_NO_FREEZE].pth,
# MOE_TRANSF_8EXP_AUG[_NO_FREEZE].pth
# ----------------------------------------------------------------------------

model = model.to(device)
# NOTE(review): torch.load unpickles arbitrary objects. The checkpoint is a
# trusted local file here, but prefer weights_only=True where supported.
model.load_state_dict(torch.load(model_path, map_location=device))
model.eval()  # inference mode: disable dropout, use running batch-norm stats
print('Loaded Weights')
# An earlier baseline re-created Model() here and encoded the first-seen input
# sampling rate into the reported "time" field via a SAMPLING_RATE_CODES table
# ({8000: 2, 16000: 3, 22050: 5, 24000: 7, 32000: 11, 44100: 13, 48000: 17,
# "other": 19}); that diagnostic path is retired.

# Iterate over the streamed dataset and score every clip.
# Each element is a dict:
#   el["id"]             -> example id
#   el["audio"]["bytes"] -> raw bytes of the audio file
#   el["audio"]["path"]  -> filename, for reference only (cannot be opened).
# Libraries that expect a file object can be fed the BytesIO wrapper below.
out = []
for el in tqdm.tqdm(dataset_remote):
    start_time = time.time()
    try:
        # RUNNING ON HUGGINGFACE
        file_like = io.BytesIO(el["audio"]["bytes"])
        tensor, sr = preprocess(file_like, target_sr=24000)
        # Multi-rate variant:
        # tensor_16, tensor_22, tensor_24 = preprocess_FS(file_like)
        # RUNNING LOCALLY: tensor = preprocess(el)
        with torch.no_grad():
            # Soft decision (log-likelihood-style score): positive means
            # synthetic, negative means pristine. Column 1 of the model
            # output is the "generated" score.
            score = model(tensor.to(device))[:, 1].cpu()
            # Multi-rate variant:
            # score = model(tensor_16.to(device), tensor_22.to(device), tensor_24.to(device))[:, 1].cpu()
        # Average over segments/batch entries to obtain one scalar per clip.
        score = score.mean().item()
        # A hard decision is required for submission, so threshold the score.
        pred = "generated" if score > model.threshold else "pristine"
        total_time = time.time() - start_time
        # "id" and "pred" are required. "score" is not used in scoring but is
        # included as encouraged — it is used for analysis of the results.
        out.append(dict(id=el["id"], pred=pred, score=score, time=total_time))
    except Exception as e:
        # Best effort: never let a single corrupt clip abort the whole run.
        print(e)
        print("failed", el["id"])
        out.append(dict(id=el["id"], pred="none", score=None))

# Save the final result and that's it.
pd.DataFrame(out).to_csv("submission.csv", index=False)