# dr-studio / model / code / ECGRecoverDatasetRandomMaskWithRS2V3.py
# NOTE: the following lines are Hugging Face upload-page residue, kept as
# comments so the module parses:
#   wogh2012's picture / Upload Dash Docker Space / 12f8999 verified
from scipy import signal
import numpy as np
import scipy
import inspect
from mai.data.util.misc import LeadType
def adjust_channel_dependency(ecg):
    """Recompute the derived limb leads from leads I and II, in place.

    Row layout assumed by this file: row 0 = I, row 1 = II, row 2 = III,
    row 3 = aVR, row 4 = aVL, row 5 = aVF.  III and the augmented leads are
    linear combinations of I and II, so they are rebuilt here after any
    augmentation that touched I/II.  Returns the same (mutated) array.
    """
    lead_i, lead_ii = ecg[0], ecg[1]
    ecg[2] = lead_ii - lead_i          # III = II - I
    ecg[3] = -(lead_ii + lead_i) / 2   # aVR = -(I + II) / 2
    ecg[4] = lead_i - lead_ii / 2      # aVL = I - II / 2
    ecg[5] = lead_ii - lead_i / 2      # aVF = II - I / 2
    return ecg
def get_mag_range():
    """Return the per-augmentation magnitude lookup table.

    Maps each augmentation class name to a dict keyed by integer intensity
    level (0-10), giving the concrete magnitude handed to that augmentation
    at that level.  Units depend on the augmentation (amplitude, ratio,
    count, window length, degrees, ...).  Consumed by ``aug_mod`` to turn a
    RandAugment-style integer intensity into per-augmentation parameters.
    """
    return {
        "PowerlineNoise": {
            0: 0.0,
            1: 0.0062,
            2: 0.0116,
            3: 0.0168,
            4: 0.0222,
            5: 0.0278,
            6: 0.033,
            7: 0.0381,
            8: 0.0436,
            9: 0.049,
            10: 0.0543,
        },
        "BaselineWander": {
            0: 0.0,
            1: 0.01,
            2: 0.022,
            3: 0.035,
            4: 0.045,
            5: 0.06,
            6: 0.064,
            7: 0.086,
            8: 0.09,
            9: 0.1,
            10: 0.12,
        },
        "BaselineShift": {
            0: 0.0,
            1: 0.0317,
            2: 0.0631,
            3: 0.0966,
            4: 0.1286,
            5: 0.1584,
            6: 0.1924,
            7: 0.2257,
            8: 0.2514,
            9: 0.2869,
            10: 0.32,
        },
        "EMGNoise": {
            0: 0.0,
            1: 0.007,
            2: 0.013,
            3: 0.018,
            4: 0.022,
            5: 0.027,
            6: 0.032,
            7: 0.037,
            8: 0.042,
            9: 0.045,
            10: 0.05,
        },
        "RandomCropResize": {
            0: 1.0,
            1: 1.0,
            2: 1.001,
            3: 1.001,
            4: 1.002,
            5: 1.002,
            6: 1.003,
            7: 1.004,
            8: 1.005,
            9: 1.007,
            10: 1.01,
        },
        "TimeWarp": {
            0: 0.0,
            1: 0.014,
            2: 0.027,
            3: 0.041,
            4: 0.055,
            5: 0.07,
            6: 0.086,
            7: 0.103,
            8: 0.142,
            9: 0.202,
            10: 0.5,
        },
        "DynamicTimeWarp": {
            0: 0.0,
            1: 0.146,
            2: 0.292,
            3: 0.439,
            4: 0.585,
            5: 0.731,
            6: 0.877,
            7: 1.0,
            8: 1.239,
            9: 1.633,
            10: 2.0,
        },
        "GaussianSmoothing": {
            0: 1.0,
            1: 1.5,
            2: 1.9,
            3: 2.681,
            4: 3.526,
            5: 3.75,
            6: 4.0,
            7: 4.786,
            8: 5.573,
            9: 5.786,
            10: 6.0,
        },
        "MagnitudeWarping": {
            0: 0.0,
            1: 0.02,
            2: 0.037,
            3: 0.055,
            4: 0.071,
            5: 0.088,
            6: 0.105,
            7: 0.122,
            8: 0.139,
            9: 0.156,
            10: 0.172,
        },
        "AngleRotation": {
            0: 0.533,
            1: 3.742,
            2: 6.231,
            3: 8.839,
            4: 11.26,
            5: 14.112,
            6: 15.868,
            7: 18.057,
            8: 20.816,
            9: 22.954,
            10: 24.0,
        },
        "TimeMask": {
            0: 0.0,
            1: 0.01,
            2: 0.021,
            3: 0.037,
            4: 0.061,
            5: 0.088,
            6: 0.124,
            7: 0.169,
            8: 0.216,
            9: 0.279,
            10: 0.344,
        },
        "ChannelMask": {
            0: 0.0,
            1: 0.33,
            2: 0.67,
            3: 1.0,
            4: 1.5,
            5: 2.0,
            6: 2.25,
            7: 2.5,
            8: 2.75,
            9: 3.0,
            10: 3.5,
        },
        "RandomSpectrogramMask": {
            0: 0.0,
            1: 0.002,
            2: 0.005,
            3: 0.009,
            4: 0.014,
            5: 0.02,
            6: 0.028,
            7: 0.036,
            8: 0.046,
            9: 0.057,
            10: 0.072,
        },
        "FrequencyWarping": {
            0: 0.0075,
            1: 0.018,
            2: 0.0225,
            3: 0.024,
            4: 0.0285,
            5: 0.03,
            6: 0.0345,
            7: 0.0345,
            8: 0.0375,
            9: 0.0375,
            10: 0.039,
        },
        "LowPassFilter": {
            0: 0.0,
            1: 0.043,
            2: 0.154,
            3: 0.271,
            4: 0.371,
            5: 0.429,
            6: 0.484,
            7: 0.552,
            8: 0.599,
            9: 0.636,
            10: 0.667,
        },
        "PartialWhiteNoise": {
            0: 0.0,
            1: 0.019,
            2: 0.03,
            3: 0.039,
            4: 0.047,
            5: 0.055,
            6: 0.061,
            7: 0.068,
            8: 0.074,
            9: 0.08,
            10: 0.086,
        },
        "PermuteWaveSegment": {
            0: 0.0,
            1: 0.284,
            2: 0.568,
            3: 0.852,
            4: 1.486,
            5: 2.1,
            6: 2.815,
            7: 3.399,
            8: 4.45,
            9: 5.994,
            10: 8.0,
        },
        "ConcatWaveSegment": {
            0: 0.0,
            1: 1,
            2: 1,
            3: 2,
            4: 2,
            5: 3,
            6: 3,
            7: 4,
            8: 4,
            9: 5,
            10: 6,
        },
        "Flip": {
            0: 0.0,
            1: 1.0,
            2: 1.0,
            3: 1.0,
            4: 1.0,
            5: 1.0,
            6: 1.0,
            7: 1.0,
            8: 1.0,
            9: 1.0,
            10: 1.0,
        },
        "RandomSpike": {
            0: 0,
            1: 1,
            2: 2,
            3: 3,
            4: 4,
            5: 5,
            6: 6,
            7: 7,
            8: 8,
            9: 9,
            10: 10,
        },
        "DigitizedLeadName": {
            0: 0,
            1: 1,
            2: 2,
            3: 3,
            4: 4,
            5: 5,
            6: 6,
            7: 7,
            8: 8,
            9: 9,
            10: 10,
        },
    }
def aug_mod(aug_list, params):
    """Instantiate the augmentations named in *aug_list* (RandAugment setup).

    For each augmentation class name: keep only the entries of *params* its
    ``__init__`` accepts, translate the integer ``mag`` level into a concrete
    magnitude range via ``get_mag_range()`` when a table entry exists, and
    build the instance.  Returns the list of ready-to-call augmentations.
    """
    mag_table = get_mag_range()
    instances = []
    for aug_name in aug_list:
        aug_cls = globals()[aug_name]
        accepted = inspect.getfullargspec(aug_cls.__init__).args
        kwargs = {name: value for name, value in params.items() if name in accepted}
        if aug_name in mag_table:
            level_to_mag = mag_table[aug_name]
            kwargs["mag"] = {
                "max": level_to_mag[int(params["mag"]["max"])],
                "min": level_to_mag[max(int(params["mag"]["min"]), 0)],
            }
        instances.append(aug_cls(**kwargs))
    return instances
## PowerlineNoise
class PowerlineNoise(object):
    """Add simulated mains interference (a 50 or 60 Hz cosine) to the signal.

    Args:
        mag: dict with "max"/"min" bounds for the noise amplitude.
        p: probability of applying the augmentation.
        freq: sampling rate of the input signal in Hz.
        dependency: if True, rebuild the derived limb leads afterwards.
    """

    def __init__(self, mag={"max": 0.5, "min": 0}, p=1.0, freq=500, dependency=True):
        self.max_amplitude = mag["max"]
        self.min_amplitude = mag["min"]
        self.freq = freq
        self.p = p
        self.dependency = dependency

    def __call__(self, sample):
        if self.p > np.random.uniform(0, 1):
            # copy() for consistency with the other augmentations, so the
            # caller's array is never aliased.
            new_sample = sample.copy()
            C, T = new_sample.shape
            # Single amplitude shared by all channels (mains noise is common-mode).
            amp = np.random.uniform(self.min_amplitude, self.max_amplitude, size=(1, 1))
            # Mains frequency: 50 Hz or 60 Hz with equal probability.
            f = 50 if np.random.uniform(0, 1) > 0.5 else 60
            noise = self.apply_powerline_noise(T, f)
            new_sample = new_sample + noise * amp
            if self.dependency:
                new_sample = adjust_channel_dependency(new_sample)
        else:
            new_sample = sample
        return new_sample

    def apply_powerline_noise(self, T, f):
        """Return a length-T cosine at f Hz (sampled at self.freq) with random phase."""
        t = np.linspace(0, T - 1, T)
        # BUGFIX: use np.pi instead of the 3.14 approximation so the tone is
        # exactly at the mains frequency and the phase spans the full [0, 2*pi).
        phase = np.random.uniform(0, 2 * np.pi)
        noise = np.cos(2 * np.pi * f * (t / self.freq) + phase)
        return noise
## BaselineWander
class BaselineWander(object):
    """Add low-frequency baseline drift: a sum of k slow random cosines.

    Args:
        mag: dict with "max"/"min" bounds for each cosine's amplitude.
        p: probability of applying the augmentation.
        aug_freq: dict with "max"/"min" drift frequency bounds in Hz.
        k: number of cosines summed into the drift.
        freq: sampling rate of the input signal in Hz.
        dependency: if True, rebuild the derived limb leads afterwards.
    """

    def __init__(
        self,
        mag={"max": 0.5, "min": 0},
        p=1.0,
        aug_freq={"max": 0.2, "min": 0.01},
        k=3,
        freq=500,
        dependency=True,
    ):
        self.min_amplitude = mag["min"]
        self.max_amplitude = mag["max"]
        self.min_freq = aug_freq["min"]
        self.max_freq = aug_freq["max"]
        self.k = k
        self.freq = freq
        self.p = p
        self.dependency = dependency

    def __call__(self, sample):
        if self.p > np.random.uniform(0, 1):
            new_sample = sample.copy()
            C, T = new_sample.shape
            # Per-channel gain around 1 so the drift differs slightly per lead.
            amp_channel = np.random.normal(1, 0.5, size=(C, 1))
            amp_general = np.random.uniform(
                self.min_amplitude, self.max_amplitude, size=self.k
            )
            noise = np.zeros(shape=(1, T))
            for k in range(self.k):
                noise += self.apply_baseline_wander(T) * amp_general[k]
            noise = noise * amp_channel
            new_sample[:, :] = new_sample[:, :] + noise[:, :]
            if self.dependency:
                new_sample = adjust_channel_dependency(new_sample)
        else:
            new_sample = sample
        return new_sample

    def apply_baseline_wander(self, T):
        """Return one length-T cosine with random frequency and phase."""
        f = np.random.uniform(self.min_freq, self.max_freq)
        t = np.linspace(0, T - 1, T)
        # BUGFIX: use np.pi instead of the 3.14 approximation so the drift is
        # exactly at frequency f and the phase spans the full [0, 2*pi).
        r = np.random.uniform(0, 2 * np.pi)
        noise = np.cos(2 * np.pi * f * (t / self.freq) + r)
        return noise
## BaselineShift
class BaselineShift(object):
    """Shift random time segments of the record by a flat offset.

    Each of ``num_segment`` segments (length ~ shift_ratio * T, jittered by a
    normal draw) gets a constant offset; the sign is drawn per channel and
    the magnitude once per call.
    """

    def __init__(
        self,
        mag={"max": 0.5, "min": 0},
        shift_ratio=0.2,
        num_segment=1,
        freq=500,
        dependency=False,
        p=1.0,
    ):
        self.max_amplitude = mag["max"]
        self.min_amplitude = mag["min"]
        self.shift_ratio = shift_ratio
        self.num_segment = num_segment
        self.freq = freq
        self.p = p
        self.dependency = dependency

    def __call__(self, sample):
        if not (self.p > np.random.uniform(0, 1)):
            return sample
        shifted = sample.copy()
        C, T = shifted.shape
        shift_length = T * self.shift_ratio
        # Per-channel sign, single magnitude shared by every channel.
        sign_per_channel = np.random.choice([1, -1], size=(C, 1))
        magnitude = np.random.uniform(
            self.min_amplitude, self.max_amplitude, size=(1, 1)
        )
        offset = sign_per_channel * magnitude
        segment_mask = np.zeros(shape=(C, T))
        for _ in range(self.num_segment):
            seg_len = np.random.normal(shift_length, shift_length * 0.2)
            start = int(np.random.uniform(0, T - seg_len))
            stop = int(start + seg_len)
            segment_mask[:, start:stop] = 1
        shifted = shifted + segment_mask * offset
        if self.dependency:
            shifted = adjust_channel_dependency(shifted)
        return shifted
# EMGNoise
class EMGNoise(object):
    """Add white Gaussian noise (muscle-artifact model) with a per-channel gain."""

    def __init__(
        self,
        mag={"max": 0.5, "min": 0},
        dependency=True,
        p=1.0,
    ):
        self.max_amplitude = mag["max"]
        self.min_amplitude = mag["min"]
        self.p = p
        self.dependency = dependency

    def __call__(self, sample):
        if not (self.p > np.random.uniform(0, 1)):
            return sample
        noisy = sample.copy()
        C, T = noisy.shape
        # Independent amplitude per channel: EMG artifacts are not common-mode.
        per_channel_amp = np.random.uniform(
            self.min_amplitude, self.max_amplitude, size=(C, 1)
        )
        gaussian = np.random.normal(0, 1, [C, T])
        noisy = noisy + gaussian * per_channel_amp
        if self.dependency:
            noisy = adjust_channel_dependency(noisy)
        return noisy
# RandomCropResize
class RandomCropResize(object):
    """Crop a random window and resample it back to the original length.

    The window length is T * rate with rate drawn between the configured
    bounds (inverted with 50% probability), which stretches or squeezes the
    signal in time.  Any error falls back to returning the input untouched.
    """

    def __init__(
        self,
        mag={"max": 1.2, "min": 1.1},
        dependency=False,
        p=1.0,
    ):
        self.min_rate = mag["min"]
        self.max_rate = mag["max"]
        self.dependency = dependency
        self.p = p

    def __call__(self, sample):
        if not (self.p > np.random.uniform(0, 1)):
            return sample
        try:
            cropped = sample.copy()
            C, T = cropped.shape
            rate = np.random.uniform(self.min_rate, self.max_rate)
            if np.random.uniform(0, 1) > 0.5:
                rate = 1 / rate
            if self.max_rate > 1:
                # Tile the record so a window longer than T can be cut out.
                cropped = np.concatenate([cropped] * 3, 1)
            window = int(T * rate)
            start = np.random.randint(cropped.shape[1] - window)
            cropped = cropped[:, start : start + window]
            cropped = signal.resample(cropped, T, axis=1)
            if self.dependency:
                cropped = adjust_channel_dependency(cropped)
            return cropped
        except Exception:
            # Best-effort augmentation: never fail the pipeline.
            return sample
# TimeWarp
class TimeWarp(object):
    """Warp the whole time axis with a smooth random monotone mapping.

    A random walk is turned into a strictly positive density; its CDF,
    normalized onto [0, T-1], gives the new time indices.  This locally
    speeds up or slows down the signal while keeping its length.
    """

    def __init__(
        self,
        mag={"max": 20, "min": 0},
        dependency=False,
        p=1.0,
    ):
        # epsilon shrinks as the magnitude grows, so larger magnitudes make
        # the density (and hence the warp) less uniform.
        self.epsilon_max = 10 / np.max([mag["max"], 0.001])
        self.epsilon_min = 10 / np.max([mag["min"], 0.001])
        self.scale_max = mag["max"]
        self.scale_min = mag["min"]
        self.iteration = 1
        self.dependency = dependency
        self.p = p

    def __call__(self, sample):
        if not (self.p > np.random.uniform(0, 1)):
            return sample
        warped = sample.copy()
        C, T = warped.shape
        for _ in range(self.iteration):
            epsilon = np.random.uniform(self.epsilon_min, self.epsilon_max)
            scale = np.random.uniform(self.scale_min, self.scale_max)
            density = np.random.normal(loc=0, scale=scale, size=T)
            density = np.cumsum(density)                   # random walk
            density = density - np.min(density) + epsilon  # strictly positive
            cdf = np.cumsum(density)                       # monotone increasing
            # Normalize the CDF onto [0, T-1] to obtain the new indices.
            t_new = (cdf - cdf[0]) / (cdf[-1] - cdf[0]) * (len(cdf) - 1)
            warped = warped[:, t_new.astype(int)]
        if self.dependency:
            warped = adjust_channel_dependency(warped)
        return warped
# DynamicTimeWarp
class DynamicTimeWarp(object):
    """Warp several local time windows with smooth random monotone maps.

    The record is split into ``num_of_warps`` sections; inside each section a
    window of ``radius`` samples receives new time indices derived from the
    CDF of a positive random-walk density (same construction as ``TimeWarp``
    but applied locally).
    """

    def __init__(
        self,
        mag={"max": 3, "min": 3},
        freq=500,
        scale=1,
        epsilon=10,
        dependency=True,
        p=1.0,
    ):
        # mag gives the min/max number of local warp windows.
        self.num_of_warps_min = mag["min"]
        self.num_of_warps_max = mag["max"]
        # The sampling rate doubles as the warp window size, in samples.
        self.radius = freq
        # NOTE(review): the scale/epsilon constructor arguments are ignored;
        # both are hard-coded to 0.1 — confirm this is intentional.
        self.scale = 0.1
        self.epsilon = 0.1
        self.dependency = dependency
        self.p = p

    def __call__(self, sample):
        if self.p > np.random.uniform(0, 1):
            new_sample = sample.copy()
            C, T = new_sample.shape
            radius = self.radius
            t_new = np.arange(T)
            num_of_warps = np.random.randint(
                self.num_of_warps_min, self.num_of_warps_max + 1
            )
            for i in range(num_of_warps):
                section_length = T // num_of_warps
                # Random anchor point inside this section.
                point = np.random.randint(section_length * i, section_length * (i + 1))
                # Clamp the warp window so it stays inside the section.
                warp_from = (
                    point - radius // 2
                    if point - radius // 2 > section_length * i
                    else section_length * i
                )
                warp_from = (
                    warp_from
                    if point + radius // 2 < section_length * (i + 1)
                    else section_length * (i + 1) - radius - 1
                )
                warp_to = warp_from + radius
                pmf = np.random.normal(loc=0, scale=self.scale, size=radius)
                pmf = np.cumsum(pmf)  # random walk
                pmf = pmf - np.min(pmf) + self.epsilon  # make it positive
                cdf = np.cumsum(pmf)  # by definition monotonically increasing
                # Remap the window's indices via the normalized CDF.
                t_new[warp_from:warp_to] = warp_from + (cdf - cdf[0]) / (
                    cdf[-1] - cdf[0]
                ) * (len(cdf) - 1)
            new_sample = new_sample[:, t_new.astype(int)]
            if self.dependency:
                new_sample = adjust_channel_dependency(new_sample)
        else:
            new_sample = sample
        return new_sample
# GaussianSmoothing
class GaussianSmoothing(object):
    """Low-pass the signal by convolving each channel with a Gaussian window.

    The window length is drawn uniformly between mag["min"] and mag["max"]
    (inclusive); its std is half the window length.
    """

    def __init__(
        self,
        mag={"max": 15, "min": 3},
        p=1.0,
        dependency=False,
    ):
        self.min_window_length = mag["min"]
        self.max_window_length = mag["max"]
        self.dependency = dependency
        self.p = p

    def __call__(self, sample):
        if not (self.p > np.random.uniform(0, 1)):
            return sample
        smoothed = sample.copy()
        C, T = smoothed.shape
        window_length = np.random.randint(
            self.min_window_length, self.max_window_length + 1
        )
        smoothed = self.apply_gaussian_smoothing(smoothed, window_length)
        if self.dependency:
            smoothed = adjust_channel_dependency(smoothed)
        return smoothed

    def apply_gaussian_smoothing(self, wave, window_length):
        """Convolve every channel of *wave* with a normalized Gaussian kernel."""
        C, T = wave.shape
        kernel = scipy.signal.windows.gaussian(window_length, std=window_length // 2)
        kernel = kernel / kernel.sum()
        return np.stack([np.convolve(kernel, wave[ch], "same") for ch in range(C)])
# MagnitudeWarping
class MagnitudeWarping(object):
    """Multiply every sample point by Gaussian noise centered at 1."""

    def __init__(self, mag={"max": 0.5, "min": 0.1}, dependency=True, p=1.0):
        self.std_max = mag["max"]
        self.std_min = mag["min"]
        self.dependency = dependency
        self.p = p

    def __call__(self, sample):
        if not (self.p > np.random.uniform(0, 1)):
            return sample
        warped = sample.copy()
        # One std per call; then an independent gain per channel and sample.
        std = np.random.uniform(self.std_min, self.std_max)
        C, T = warped.shape
        gain = np.random.normal(1, std, size=(C, T))
        warped = warped * gain
        if self.dependency:
            warped = adjust_channel_dependency(warped)
        return warped
# AngleRotation
class AngleRotation(object):
    """Rotate the heart's electrical axis in vectorcardiogram (VCG) space.

    The 8 independent leads (rows [6..11, 0, 1] of the 12-lead array —
    presumably V1-V6 plus I, II; confirm the lead ordering) are projected to
    3D VCG space with ``trans_inv``, rotated by random angles about x/y/z,
    and projected back with the pseudo-inverse ``trans``.  ``method``
    selects which inverse-Dower-style transform matrix is used.
    """

    def __init__(
        self, mag={"max": 45, "min": 0}, method="dower", dependency=True, p=1.0
    ):
        assert method in ["dower", "plsv", "qlsv", "kors"]
        # mag gives the min/max rotation angle in degrees.
        self.min_rotation = mag["min"]
        self.max_rotation = mag["max"]
        # self.max_rotation = mag
        self.dependency = dependency
        self.p = p
        # 3x8 matrix mapping the 8 independent leads to VCG x/y/z.
        if method == "dower":
            self.trans_inv = np.array(
                [
                    [-0.172, -0.073, 0.122, 0.231, 0.239, 0.193, 0.156, -0.009],
                    [0.057, -0.019, -0.106, -0.022, 0.040, 0.048, -0.227, 0.886],
                    [-0.228, -0.310, -0.245, -0.063, 0.054, 0.108, 0.021, 0.102],
                ]
            )
        elif method == "plsv":
            self.trans_inv = np.array(
                [
                    [-0.266, 0.027, 0.065, 0.131, 0.203, 0.220, 0.370, -0.154],
                    [0.088, -0.088, 0.003, 0.042, 0.047, 0.067, -0.131, 0.717],
                    [-0.319, -0.198, -0.167, -0.099, -0.009, 0.060, 0.184, -0.114],
                ]
            )
        elif method == "qlsv":
            self.trans_inv = np.array(
                [
                    [-0.147, -0.058, 0.037, 0.139, 0.232, 0.226, 0.199, -0.018],
                    [0.023, -0.085, -0.003, 0.033, 0.060, 0.104, -0.146, 0.503],
                    [-0.184, -0.163, -0.190, -0.119, -0.023, 0.043, 0.085, -0.130],
                ]
            )
        elif method == "kors":
            self.trans_inv = np.array(
                [
                    [-0.130, 0.050, -0.010, 0.140, 0.060, 0.540, 0.380, -0.070],
                    [0.060, -0.020, -0.050, 0.060, -0.170, 0.130, -0.070, 0.930],
                    [-0.430, -0.060, -0.140, -0.200, -0.110, 0.310, 0.110, -0.230],
                ]
            )
        # 8x3 pseudo-inverse: VCG space back to the 8 leads.
        self.trans = np.linalg.pinv(self.trans_inv)

    def __call__(self, sample):
        if self.p > np.random.uniform(0, 1):
            new_sample = sample.copy()
            C, T = new_sample.shape
            # One random integer angle (degrees) per axis.
            theta = np.random.randint(self.min_rotation, self.max_rotation + 1, 3)
            if C == 12:
                # Pick the 8 independent leads; the remaining 4 limb leads
                # are recomputed by adjust_channel_dependency below.
                new_sample_8lead = new_sample[[6, 7, 8, 9, 10, 11, 0, 1], :]
                rot_x = np.array(
                    [
                        [1, 0, 0],
                        [
                            0,
                            np.cos(theta[0] * np.pi / 180),
                            -np.sin(theta[0] * np.pi / 180),
                        ],
                        [
                            0,
                            np.sin(theta[0] * np.pi / 180),
                            np.cos(theta[0] * np.pi / 180),
                        ],
                    ]
                )
                rot_y = np.array(
                    [
                        [
                            np.cos(theta[1] * np.pi / 180),
                            0,
                            -np.sin(theta[1] * np.pi / 180),
                        ],
                        [0, 1, 0],
                        [
                            np.sin(theta[1] * np.pi / 180),
                            0,
                            np.cos(theta[1] * np.pi / 180),
                        ],
                    ]
                )
                rot_z = np.array(
                    [
                        [
                            np.cos(theta[2] * np.pi / 180),
                            -np.sin(theta[2] * np.pi / 180),
                            0,
                        ],
                        [
                            np.sin(theta[2] * np.pi / 180),
                            np.cos(theta[2] * np.pi / 180),
                            0,
                        ],
                        [0, 0, 1],
                    ]
                )
                # Combined rotation, then leads -> VCG -> rotate -> leads.
                rot = np.einsum("ab,bc,cd->ad", rot_x, rot_y, rot_z)
                mtx1 = np.einsum("ab,bc->ac", self.trans, rot)
                mtx2 = np.einsum("ab,bc->ac", self.trans_inv, new_sample_8lead)
                new_sample_8lead = np.einsum("ab,bc->ac", mtx1, mtx2)
                new_sample_12lead = np.zeros([C, T])
                new_sample_12lead[[6, 7, 8, 9, 10, 11, 0, 1], :] = new_sample_8lead
                new_sample = adjust_channel_dependency(new_sample_12lead)
            if self.dependency:
                new_sample = adjust_channel_dependency(new_sample)
            # Blend rotated and original signal: the rotated share grows with
            # the mean angle and reaches 100% at 30 degrees.
            new_sample = (np.mean(theta) / 30) * new_sample + (
                30 - np.mean(theta)
            ) / 30 * sample
        else:
            new_sample = sample
        return new_sample
# TimeMask
class TimeMask(object):
    """Zero out ``num`` random time bands of the record.

    The band length is drawn (as a fraction of T) between mag["min"] and
    mag["max"]; the band start is drawn so the band fits inside the record.

    Args:
        mag: dict with "min"/"max" band-length fractions in [0, 1].
        num: number of independent bands to mask.
        dependency: if True, rebuild the derived limb leads afterwards.
        p: probability of applying the augmentation.
    """

    def __init__(
        self,
        mag={"max": 0.3, "min": 0.0},
        num=1,
        dependency=True,
        p=1.0,
    ):
        # BUGFIX: min/max were assigned swapped (min_band_part took
        # mag["max"]), which made t0 range over [0, 1 - mag["min"]) so bands
        # could run past the end of the record and get clipped.
        self.min_band_part = mag["min"]
        self.max_band_part = mag["max"]
        self.num = num
        self.dependency = dependency
        self.p = p

    def __call__(self, sample):
        if self.p > np.random.uniform(0, 1):
            new_sample = sample.copy()
            C, T = new_sample.shape
            for _ in range(self.num):
                # Start fraction leaves room for the longest possible band.
                t0 = np.random.uniform(0, 1 - self.max_band_part)
                t = np.random.uniform(self.min_band_part, self.max_band_part)
                mask_from = int(t0 * T)
                mask_to = int((t0 + t) * T)
                new_sample[:, mask_from:mask_to] = 0
            if self.dependency:
                new_sample = adjust_channel_dependency(new_sample)
        else:
            new_sample = sample
        return new_sample
# ChannelMask
class ChannelMask(object):
    """Zero out a random subset of channels."""

    def __init__(
        self,
        mag={"max": 4, "min": 1},
        dependency=False,
        p=1.0,
    ):
        self.min_num_channel = mag["min"]
        self.max_num_channel = mag["max"]
        self.dependency = dependency
        self.p = p

    def __call__(self, sample):
        if not (self.p > np.random.uniform(0, 1)):
            return sample
        masked = sample.copy()
        C, T = masked.shape
        num_channel = np.random.randint(
            self.min_num_channel, self.max_num_channel + 1
        )
        # Never request more channels than exist.
        num_channel = min(num_channel, C)
        chosen = np.random.choice(list(range(C)), num_channel, replace=False)
        masked[chosen, :] = 0
        if self.dependency:
            masked = adjust_channel_dependency(masked)
        return masked
# RandomSpectrogramMask
class RandomSpectrogramMask(object):
    """Drop random time-frequency bins of the signal's STFT.

    The record is transformed with a short-time Fourier transform, each
    complex bin is kept with probability 1 - mask_prob, and the result is
    inverted back to the time domain and cropped to the input length.
    """

    def __init__(self, mag={"max": 0.5, "min": 0.2}, freq=500, dependency=False, p=1.0):
        self.random_mask_prob_min = mag["min"]
        self.random_mask_prob_max = mag["max"]
        self.freq = freq
        self.dependency = dependency
        self.p = p

    def __call__(self, sample):
        if not (self.p > np.random.uniform(0, 1)):
            return sample
        spec_input = sample.copy()
        _, _, spectrum = scipy.signal.stft(
            spec_input, fs=self.freq, nperseg=self.freq // 5
        )
        drop_prob = np.random.uniform(
            self.random_mask_prob_min, self.random_mask_prob_max
        )
        # 0 = dropped bin, 1 = kept bin.
        keep = np.random.choice(
            [0, 1], size=spectrum.shape, p=[drop_prob, 1 - drop_prob]
        )
        _, recon = scipy.signal.istft(
            spectrum * keep, fs=self.freq, nperseg=self.freq // 5
        )
        if self.dependency:
            recon = adjust_channel_dependency(recon)
        # istft may return a slightly longer signal; crop to the input length.
        return recon[:, : sample.shape[-1]]
## FrequencyWarping
class FrequencyWarping(object):
    """Warp the frequency axis with a random monotone remapping of FFT bins."""

    def __init__(self, mag, scale=0.1, dependency=True, p=1.0):
        self.scale_max = mag["max"]
        self.scale_min = mag["min"]
        self.dependency = dependency
        self.p = p

    def __call__(self, sample):
        if not (self.p > np.random.uniform(0, 1)):
            return sample
        warped = sample.copy()
        spectrum = np.fft.fft(warped)
        C, F = spectrum.shape
        scale = np.random.uniform(self.scale_min, self.scale_max)
        # A positive density around 1 yields a roughly monotone bin mapping.
        density = np.random.normal(loc=1, scale=scale, size=F)
        cdf = np.cumsum(density)
        remapped = (cdf - cdf[0]) / (cdf[-1] - cdf[0]) * (len(cdf) - 1)
        spectrum = spectrum[:, np.round(remapped).astype(int)]
        warped = np.real(np.fft.ifft(spectrum))
        if self.dependency:
            warped = adjust_channel_dependency(warped)
        return warped
## LowPassFilter
class LowPassFilter(object):
    """Zero a random band of high-frequency FFT bins (crude low-pass filter)."""

    def __init__(
        self,
        mag={"max": 0.8, "min": 0.5},
        dependency=False,
        p=1.0,
    ):
        self.cutoff_ratio_min = mag["min"]
        self.cutoff_ratio_max = mag["max"]
        self.dependency = dependency
        self.p = p

    def __call__(self, sample):
        if not (self.p > np.random.uniform(0, 1)):
            return sample
        filtered = sample.copy()
        spectrum = np.fft.fft(filtered)
        C, F = spectrum.shape
        cut_ratio = np.random.uniform(self.cutoff_ratio_min, self.cutoff_ratio_max)
        # Zero a symmetric band around the middle of the FFT (the highest
        # frequencies, given the FFT's wrap-around ordering).
        band = int((F * cut_ratio) // 2)
        keep = np.ones([C, F])
        keep[:, F // 2 - band : F // 2 + band] = 0
        filtered = np.real(np.fft.ifft(spectrum * keep))
        if self.dependency:
            filtered = adjust_channel_dependency(filtered)
        return filtered
## PartialWhiteNoise
class PartialWhiteNoise(object):
    """Add white noise to ``num`` random time bands only.

    The noise std grows with the band's fractional length (band * 2.7) and
    is weighted per channel by the square root of that channel's std.
    """

    def __init__(
        self,
        mag={"max": 0.3, "min": 0.0},
        num=1,
        dependency=True,
        p=1.0,
    ):
        self.min_band_part = mag["min"]
        self.max_band_part = mag["max"]
        self.num = num
        self.dependency = dependency
        self.p = p

    def __call__(self, sample):
        if not (self.p > np.random.uniform(0, 1)):
            return sample
        noisy = sample.copy()
        C, T = noisy.shape
        for _ in range(self.num):
            band_start = np.random.uniform(0, 1 - self.max_band_part)
            band_part = np.random.uniform(self.min_band_part, self.max_band_part)
            lo = int(band_start * T)
            hi = lo + int(band_part * T)
            noise_scale = band_part * 2.7
            # Channel weight follows each channel's current spread.
            channel_weight = np.std(noisy, 1, keepdims=True) ** 0.5
            noisy[:, lo:hi] = (
                noisy[:, lo:hi]
                + np.random.normal(0, noise_scale, [C, hi - lo]) * channel_weight
            )
        if self.dependency:
            noisy = adjust_channel_dependency(noisy)
        return noisy
# PermuteWaveSegment
class PermuteWaveSegment(object):
    """Cut the record at random time points and shuffle the pieces.

    ``mag`` controls how many cut points are drawn.  The permuted pieces are
    tiled twice and a window of the original length T is cropped out, so the
    output always has the input's length.
    """

    def __init__(
        self,
        mag={"max": 4, "min": 0},
        # min_num_segment=0,
        # max_num_segment=4,
        sampling_rate=500,
        dependency=False,
        p=1.0,
    ):
        # mag holds the min/max number of random cut points.
        self.min_num_segment = mag["min"]
        self.max_num_segment = mag["max"]
        self.sampling_rate = sampling_rate
        self.dependency = dependency
        self.p = p

    def __call__(self, sample):
        if self.p > np.random.uniform(0, 1):
            sample = sample.copy()
            C, T = sample.shape
            num_segment = np.random.randint(
                self.min_num_segment, self.max_num_segment + 1
            )
            # Draw candidate cut points, then thin them to num_segment + 1
            # evenly spaced picks over the sorted candidates.
            segment_point = np.sort(np.random.randint(0, T, num_segment + 1))
            seg_index = segment_point[
                [
                    int(x)
                    for x in np.linspace(0, len(segment_point) - 1, num_segment + 1)
                ]
            ]
            # Close the partition with the record boundaries [0, ..., T].
            seg_index = np.concatenate([[0], seg_index, [T]], 0)
            # Shuffle the (start, end) pairs of consecutive boundaries.
            seg_index = np.random.permutation(
                [[i, j] for i, j in zip(seg_index[:-1], seg_index[1:])]
            )
            new_sample = []
            for start, end in seg_index:
                new_sample.append(sample[:, start:end])
            # NOTE(review): np.random.randint raises ValueError when the cut
            # points span the whole record (T - span == 0); unlike
            # ConcatWaveSegment there is no try/except here — confirm.
            crop_start = np.random.randint(T - (segment_point[-1] - segment_point[0]))
            new_sample = np.concatenate(new_sample * 2, axis=1)[
                :, crop_start : crop_start + T
            ]
            if self.dependency:
                new_sample = adjust_channel_dependency(new_sample)
        else:
            new_sample = sample
        return new_sample
# ConcatWaveSegment
class ConcatWaveSegment(object):
    """Replace the record with one random segment tiled to full length.

    A random slice of the signal is repeated end-to-end until it covers the
    original duration T.  Any failure falls back to the untouched input.
    """

    def __init__(
        self,
        mag={"max": 4, "min": 0},
        # min_num_segment=0,
        # max_num_segment=4,
        sampling_rate=500,
        dependency=True,
        p=1.0,
    ):
        # mag holds the min/max number of random cut points.
        self.min_num_segment = mag["min"]
        self.max_num_segment = mag["max"]
        self.sampling_rate = sampling_rate
        self.dependency = dependency
        self.p = p

    def __call__(self, sample):
        if self.p > np.random.uniform(0, 1):
            try:
                C, T = sample.shape
                num_segment = np.random.randint(
                    self.min_num_segment, self.max_num_segment + 1
                )
                # Draw candidate cut points, thinned to num_segment + 1 picks.
                segment_point = np.sort(np.random.randint(0, T, num_segment + 1))
                seg_point = segment_point[
                    [
                        int(x)
                        for x in np.linspace(0, len(segment_point) - 1, num_segment + 1)
                    ]
                ]
                # Pick one segment between two consecutive cut points ...
                index = np.random.randint(0, len(seg_point) - 1, 1)[0]
                sample_segment = sample[:, seg_point[index] : seg_point[index + 1]]
                # ... and tile it to cover at least T samples, then crop.
                new_sample = np.concatenate(
                    [sample_segment] * (T // len(sample_segment[0]) + 1), 1
                )[:, :T]
                if self.dependency:
                    new_sample = adjust_channel_dependency(new_sample)
                # Guard against a too-short result.
                if new_sample.shape[1] < T:
                    new_sample = sample
            except Exception:
                # Best-effort augmentation: any error (e.g. an empty segment)
                # returns the input as-is.
                new_sample = sample
        else:
            new_sample = sample
        return new_sample
class Flip(object):
    """Invert the signal polarity (multiply by -1) with probability p."""

    def __init__(self, mag={"max": 0.5, "min": 0.1}, p=0.1):
        self.std_max = mag["max"]
        self.std_min = mag["min"]
        # Flip is intentionally rare: the default probability is 10%.
        self.p = p

    def __call__(self, sample):
        if not (self.p > np.random.uniform(0, 1)):
            return sample
        flipped = sample.copy()
        # A zero max magnitude disables the flip entirely.
        return -flipped if self.std_max != 0 else flipped
class RandomSpike(object):
    """Insert short flat spikes into the visible quarter of each lead.

    Assumes a 12-lead printout layout where each group of three leads is
    only visible in one quarter of the record (see
    ``_visible_segment_for_channel``).  Spike amplitude is proportional to
    the lead's own half peak-to-peak range, with random sign and gain.
    """

    def __init__(self, mag={"max": 2, "min": 1}, p=1.0, freq=500):
        self.max_ratio = mag["max"]
        self.min_ratio = mag["min"]
        self.p = p
        self.freq = freq

    def _visible_segment_for_channel(self, c: int, T: int):
        """Return the (start, end) time range where channel *c* is visible.

        With T=5000 the segment length is 1250:
            leads 0-2  (I, II, III)    -> [0, 1250)
            leads 3-5  (aVR, aVL, aVF) -> [1250, 2500)
            leads 6-8  (V1, V2, V3)    -> [2500, 3750)
            leads 9-11 (V4, V5, V6)    -> [3750, 5000)
        """
        segment_len = T // 4
        if c <= 2:
            return 0, segment_len
        if c <= 5:
            return segment_len, 2 * segment_len
        if c <= 8:
            return 2 * segment_len, 3 * segment_len
        return 3 * segment_len, 4 * segment_len

    def __call__(self, sample):
        if self.p <= np.random.uniform(0, 1):
            return sample
        spiked = np.copy(sample)
        C, T = spiked.shape
        assert C == 12, f"이 구현은 12리드를 가정합니다. 현재 C={C}"
        # Spike length and count both scale with the magnitude level.
        spike_len = int(np.random.uniform(0, self.max_ratio) * 1.2) + 1
        n_spikes = self.max_ratio // 2
        for _ in range(n_spikes):
            for ch in range(C):
                seg_start, seg_end = self._visible_segment_for_channel(ch, T)
                # Random start position, restricted to this lead's visible segment.
                start = np.random.randint(seg_start, seg_end - spike_len)
                # Amplitude: half the lead's peak-to-peak range, randomly
                # scaled and signed.
                half_range = (spiked[ch].max() - spiked[ch].min()) / 2
                gain = np.random.uniform(0.5, 1.5)
                polarity = np.random.choice([-1.0, 1.0])
                spiked[ch, start : start + spike_len] = polarity * half_range * gain
        return spiked
import os
class DigitizedLeadName(object):
    """Overlay digitized lead-name text templates onto the waveform.

    place: 1 -> upper template, -1 -> under template
    height: vertical shift added to the whole template (place * height)
    width_scale: time-axis scaling factor (1: unchanged, 2: double length)
    p: augmentation probability
    """

    def __init__(self, mag={"max": 2, "min": 1}, p=1.0, freq=500):
        # NOTE(review): the ranges are keyed 1..10, so mag["max"] == 0 would
        # raise KeyError here — confirm level 0 is never requested.
        mag_to_param_range = {
            "width_scale_range": {
                1: (1, 1.000000001),
                2: (0.9, 1.1),
                3: (0.85, 1.2),
                4: (0.8, 1.3),
                5: (0.75, 1.4),
                6: (0.7, 1.5),
                7: (0.65, 1.6),
                8: (0.6, 1.7),
                9: (0.55, 1.8),
                10: (0.5, 1.9),
            },
            "height_scale_range": {
                1: (1, 1.000000001),
                2: (0.94, 1.06),
                3: (0.88, 1.12),
                4: (0.82, 1.18),
                5: (0.76, 1.24),
                6: (0.70, 1.30),
                7: (0.64, 1.36),
                8: (0.58, 1.42),
                9: (0.52, 1.48),
                10: (0.5, 1.54),
            },
            "height_shift_range": {
                1: (0, 0.000000001),
                2: (0.0, 0.1),
                3: (0.0, 0.2),
                4: (0.0, 0.3),
                5: (0.0, 0.4),
                6: (0.0, 0.5),
                7: (0.0, 0.6),
                8: (0.0, 0.7),
                9: (0.0, 0.8),
                10: (0.0, 0.9),
            },
            "text_space_range": {
                1: (0, 2),
                2: (0, 2),
                3: (0, 2),
                4: (0, 3),
                5: (0, 3),
                6: (0, 3),
                7: (0, 4),
                8: (0, 4),
                9: (0, 4),
                10: (0, 5),
            },
        }
        self.p = p
        self.mag = int(mag["max"])
        self.height_shift_range = mag_to_param_range["height_shift_range"][self.mag]
        self.height_scale_range = mag_to_param_range["height_scale_range"][self.mag]
        self.width_scale_range = mag_to_param_range["width_scale_range"][self.mag]
        self.text_space_range = mag_to_param_range["text_space_range"][self.mag]
        self.upper_template, self.under_template = self._load_and_split_templates(
            "DigitizedLeadNameTemplate.npz"
        )
        self.lead_order = [lead.name for lead in LeadType]

    # -------------------- template loading -------------------- #
    def _load_and_split_templates(self, filename):
        """
        Read the upper/under templates from the .npz file and split each
        lead template (1D: values + NaN) into per-character chunks at the
        NaN boundaries.
        Returns:
            upper_split: {lead_name: [char0, char1, ...]}
            under_split: {lead_name: [char0, char1, ...]}
        """
        path = os.path.join(os.path.dirname(__file__), "datasets", filename)
        data = np.load(path, allow_pickle=True)
        upper_raw = {
            k: v.astype(np.float32)
            for k, v in zip(data["upper_keys"], data["upper_values"])
        }
        under_raw = {
            k: v.astype(np.float32)
            for k, v in zip(data["under_keys"], data["under_values"])
        }

        def _split_dict(tpl_dict):
            out = {}
            for lead_name, tpl in tpl_dict.items():
                tpl = np.asarray(tpl, dtype=np.float32)
                L = len(tpl)
                chars = []
                i = 0
                while i < L:
                    # skip NaN gap
                    if np.isnan(tpl[i]):
                        i += 1
                        continue
                    # start of a non-NaN run
                    j = i + 1
                    while j < L and not np.isnan(tpl[j]):
                        j += 1
                    seg = tpl[i:j]
                    if seg.size > 0:
                        chars.append(seg)
                    i = j
                out[lead_name] = chars
            return out

        upper_split = _split_dict(upper_raw)
        under_split = _split_dict(under_raw)
        return upper_split, under_split

    # -------------------- width scaling (1D, no NaN) -------------------- #
    def _scale_width(self, tpl, scale: float):
        """
        tpl: 1D float32 ndarray
        scale: >0; 1 keeps the length, 2 doubles it, etc.
        """
        L = len(tpl)
        if L <= 1 or scale == 1.0:
            return tpl
        new_L = max(2, int(round(L * scale)))
        # Nearest-neighbor resampling via integer index lookup.
        idx_old = (np.arange(new_L) / scale).astype(int)
        idx_old = np.clip(idx_old, 0, L - 1)
        return tpl[idx_old]

    # ---- per-character transform + random spacing to assemble the lead template ---- #
    def _build_lead_template(self, char_list, place: int):
        """
        char_list: [char0, char1, ...], each char a non-NaN float32 1D array
        place: 1 or -1 (upper/under template direction)
        """
        segments = []
        n_chars = len(char_list)
        for idx, char_tpl in enumerate(char_list):
            w_scale = np.random.uniform(*self.width_scale_range)
            h_scale = np.random.uniform(*self.height_scale_range)
            h_shift = np.random.uniform(*self.height_shift_range)
            char_scaled = self._scale_width(char_tpl, w_scale)
            char_scaled = char_scaled * h_scale
            char_scaled = char_scaled + (place * h_shift)
            segments.append(char_scaled)
            # gap between characters (NaN)
            if idx < n_chars - 1:
                gap_len = np.random.randint(*self.text_space_range)
                segments.append(np.full(gap_len, np.nan, dtype=np.float32))
        if not segments:
            return np.zeros(0, dtype=np.float32)
        return np.concatenate(segments)

    # -------------------- main -------------------- #
    def __call__(self, sample: np.ndarray):
        if self.p <= np.random.uniform(0, 1):
            return sample
        # from here on, work on a plain copy (original comment said "fix to
        # float32"; the copy keeps the input's dtype — confirm if cast needed)
        new_sample = np.copy(sample)
        C, T = new_sample.shape
        if C < 12:
            return new_sample
        seg_len = T // 4
        global_start = np.random.randint(0, seg_len)
        place = 1 if self.mag % 2 == 1 else -1
        tpl_source = self.upper_template if place == 1 else self.under_template
        for lead_idx, lead_name in enumerate(self.lead_order):
            char_list = tpl_source.get(lead_name)
            tpl_scaled = self._build_lead_template(char_list, place)
            L = len(tpl_scaled)
            group = lead_idx // 3  # 0: I~III, 1: aVR~aVF, 2: V1~V3, 3: V4~V6
            base = group * seg_len
            insert_start = base + global_start
            seg_end = base + seg_len
            max_L_in_seg = seg_end - insert_start
            # Truncate the template so it never leaves the visible segment.
            if L > max_L_in_seg:
                tpl_seg = tpl_scaled[:max_L_in_seg]
            else:
                tpl_seg = tpl_scaled
            target = new_sample[lead_idx, insert_start : insert_start + len(tpl_seg)]
            # NaN positions are gaps; only overwrite the character samples.
            mask = ~np.isnan(tpl_seg)
            target[mask] = tpl_seg[mask]
        return new_sample
import numpy as np
import pandas as pd
import torch
import logging
from torch.utils.data import Dataset
from mai.data.util.load import load_mai_data
from mai.sigproc.sigproc_composer import SigprocComposer
from mai.sigproc.datamodel import SigprocConfig
from torchvision import transforms
import traceback as tb
class BaseDatasetV3(Dataset):
    """Base dataset: loads waveform JSON, preprocesses it, and yields
    ((object_id, offset), [signal, aux], label) tuples.

    Subclasses implement ``preprocessing`` / ``parse_signal_json`` for a
    concrete signal type.
    """

    def __init__(
        self, table=pd.DataFrame([]), label="label", stage="test", dataset_params=None
    ):
        self.table = table.reset_index(drop=True)
        self.len = len(table)
        self.stage = stage
        # Random behavior is only enabled for the training split.
        self.randomness = self.stage.upper() == "TRAIN"
        self.label = label
        # Index of the last successfully read row; used as a fallback when
        # reading another row fails.
        self.success_idx = 0
        self.dataset_params = dataset_params
        self.aux_data = self.dataset_params.aux_data
        self.num_aux = len(self.aux_data)
        self.wave_type = self.dataset_params.wave_type
        self.wave_config_list = self.dataset_params.wave_config
        self.preprocessor = dict()
        self.sampling_rate = dict()
        # Build one preprocessor per requested wave type from its config.
        for wave_type in self.wave_type:
            for wave_config in self.wave_config_list:
                if wave_config.name == wave_type:
                    preproc_config = wave_config.params.preproc_config
                    preproc_config = SigprocConfig(preproc_config)
                    composer = SigprocComposer(
                        getattr(wave_config.params, "additional_module_path", None)
                    )
                    self.preprocessor[wave_type] = composer.create(preproc_config)
                    # necessary params: sampling_rate_target
                    for preproc in preproc_config:
                        proc_name, proc_config = preproc
                        if proc_name == "ResampleSignal":
                            self.sampling_rate[
                                wave_type
                            ] = proc_config.params.sampling_rate_target

    def __len__(self):
        return self.len

    def __getitem__(self, index):
        try:
            obj_id, input, label = self._read_signal(index)
            self.success_idx = index
        except Exception:
            # Fall back to the last row that read successfully so training
            # never dies on a single corrupt record.
            logging.getLogger().error(
                f"Failed to _read_signal in Dataset. Using fallback index {self.success_idx}. {tb.format_exc()}"
            )
            obj_id, input, label = self._read_signal(self.success_idx)
        (obj_id, offset) = obj_id
        return (obj_id, offset), input, label

    def _read_signal(self, index):
        """Read one row: load the raw waveform, preprocess, gather aux + label."""
        row = self.table.loc[index]
        obj_id, mai_json = self._get_mai_json(row)
        meta, sig = self.preprocessing(mai_json)
        aux = self._get_aux_data(row, meta)
        label = torch.tensor(row[self.label], dtype=torch.float32)
        return obj_id, [sig, aux], label

    def _get_mai_json(self, row):
        """Load the raw waveform JSON for this row's object id and window."""
        obj_id = row["objectid"]
        start, length = row["start"], row["length"]
        mai_json = load_mai_data(obj_id, self.wave_type, (start, length))
        return (obj_id, start), mai_json

    def preprocessing(self, signal_json, required_lead_type=None):
        raise NotImplementedError

    def parse_signal_json(self, signal_json):
        raise NotImplementedError

    def _get_aux_data(self, row, meta=None):
        """Collect the configured aux columns that are present in *row*.

        BUGFIX: ``_read_signal`` passes the preprocessing metadata as a
        second argument, which previously raised TypeError because this
        method only accepted *row*; *meta* is now accepted (and currently
        unused) so both call styles work.
        """
        return {col: row[col] for col in self.aux_data if col in row}

    def normalize_aux(self, aux):
        """Min-max normalize the known aux fields; pass others through unchanged."""
        aux_norm_params = {
            "age": {"min": 0, "max": 90},
            "gender": {"min": -1, "max": 1},
            "weight": {"min": 25, "max": 125},
            "height": {"min": 120, "max": 200},
        }
        aux_list = list()
        for k in aux.keys():
            if k in aux_norm_params:
                mn = aux_norm_params[k]["min"]
                mx = aux_norm_params[k]["max"]
                aux[k] = (aux[k] - mn) / (mx - mn)
                # BUGFIX: nan_to_num's second positional parameter is `copy`,
                # not the fill value; use the keyword so NaNs are explicitly
                # mapped to 0 (the previous call only worked because 0.0 is
                # also the default fill).
                aux[k] = np.nan_to_num(aux[k], nan=0.0)
                aux_list.append(aux[k])
            else:
                aux_list.append(aux[k])
        return np.array(aux_list)

    def apply_augmentation(self, sig, aug_params, wave_type="ecg"):
        """Apply N randomly chosen augmentations at intensity I during training."""
        # NOTE(review): this compares `stage == "train"` case-sensitively
        # while __init__ compares case-insensitively — confirm intended.
        if (self.stage == "train") and (aug_params != {}):
            N, I = aug_params["number"], aug_params["intensity"]  # noqa: E741
            aug_setup_params = {
                "mag": {"max": I, "min": I - 1},
                "freq": self.sampling_rate[wave_type],
                "p": aug_params["prob"],
                "dependency": aug_params["lead_dependency"],
            }
            # this import statement must be here. see https://git.medicalai.com:50001/team-ai/solver/solver2/-/issues/273
            DAList = aug_mod(self.get_aug_list(aug_params["list"]), aug_setup_params)
            if len(DAList) > 0:
                ops = np.random.choice(DAList, N)
                if len(ops) > 0:
                    augment = transforms.Compose(ops)
                    sig = augment(sig)
        return sig

    def get_aug_list(self, aug_params):
        """Expand the config list: plain names are always included; dict
        entries {name: prob} are included with the given probability."""
        aug_list = list()
        for aug_item in aug_params:
            if isinstance(aug_item, dict):
                for aug, value in aug_item.items():
                    if value > np.random.uniform(0, 1):
                        aug_list.append(aug)
            else:
                aug_list.append(aug_item)
        return aug_list
import numpy as np
import pandas as pd
import torch
import ast
from mai.data.util.misc import LeadType
class ECGDatasetV3(BaseDatasetV3):
    """ECG dataset: loads a waveform window per table row, preprocesses it,
    and returns ((obj_id, offset), [ecg_tensor, aux_tensor], label)."""

    def __init__(
        self, table=pd.DataFrame([]), label="label", stage="test", dataset_params=None
    ):
        super(ECGDatasetV3, self).__init__(table, label, stage, dataset_params)

    def _read_signal(self, index):
        """Build one example from table row *index*."""
        row = self.table.loc[index]
        obj_id, mai_json = self._get_mai_json(row)
        aux_dict = self._get_aux_data(row)
        # Use the row's lead list when present; otherwise request every LeadType member.
        required_lead_type = (
            ast.literal_eval(row["lead_type"])
            if hasattr(row, "lead_type")
            else LeadType.__dict__["_member_names_"]
        )
        if self.label == "label":
            label = torch.tensor(row[self.label], dtype=torch.float32)
        else:  # multi-label: self.label is a list of column names
            label = torch.tensor(
                [row[_label] for _label in self.label], dtype=torch.float32
            )
        _, ecg, aux = self.preprocessing(mai_json, aux_dict, required_lead_type)
        return obj_id, [ecg, aux], label

    def preprocessing(
        self, mai_json, aux_dict: dict = None, required_lead_type: list = None
    ):
        """Convert raw waveform json into (meta, ecg_tensor, aux_tensor).

        BUGFIX: ``aux_dict`` previously defaulted to a shared mutable ``{}``;
        a ``None`` sentinel is used instead (observably identical to callers).
        """
        if aux_dict is None:
            aux_dict = {}
        meta, wave = mai_json
        sampling_rate_input = wave["ecg"].sampling_rate
        mv_unit = wave["ecg"].unit
        waveform_data = wave["ecg"].waveform.data
        wave_params = self.wave_config_list[0].params
        if required_lead_type is None:
            required_lead_type = list(waveform_data.keys())
        # Scale raw samples by the unit factor, keeping only requested leads
        # that actually exist in the payload.
        waveform_dict = {
            lead_name: np.array(waveform_data[lead_name], dtype=np.float32) * mv_unit
            for lead_name in required_lead_type
            if lead_name in waveform_data
        }
        ecg_dict, _ = self.preprocessor["ecg"](
            waveform_dict, sampling_rate_input, self.randomness
        )
        ecg_array = np.array(list(ecg_dict.values()))
        ecg_array = self.apply_augmentation(ecg_array, wave_params.augmentation, "ecg")
        ecg_array = torch.tensor(ecg_array, dtype=torch.float32)
        aux = self.normalize_aux(aux_dict)
        aux = torch.tensor(aux, dtype=torch.float32)
        return meta, ecg_array, aux
import ast
import hashlib
import json
import numpy as np
import pandas as pd
import torch
from mai.data.util.misc import LeadType
class ECGRecoverDatasetRandomMaskWithRS2V3(ECGDatasetV3):
    """Unlike ECGRecoverDatasetRandomMaskWithRSV3, the rhythm strip (Lead II)
    is not returned as a 13th lead; it is written into the Lead II slot of the
    returned 12-lead array instead."""

    def __init__(
        self, table=pd.DataFrame([]), label="label", stage="test", dataset_params=None
    ):
        super(ECGRecoverDatasetRandomMaskWithRS2V3, self).__init__(
            table, label, stage, dataset_params
        )

    def test(self, obj_id=["6116253a31ee975e584d1dad"]):
        # Debug helper: load a digitized PTB-XL json by object id and mask it.
        # NOTE(review): path is hard-coded to a shared NFS export — dev use only.
        print(obj_id)
        path = f"/bfai/nfs_export/workspace/share/data/ecg_recover/ptbxl_wo_leadname/{obj_id[0][18:22]}/{obj_id[0]}.json"
        with open(path, "rb") as digitized_file:
            digitized = np.array(json.load(digitized_file))
        # if len(digitized) > 12:
        #     digitized = digitized[:12]
        return self.apply_random_mask(digitized, obj_id=obj_id[0])

    def _read_signal(self, index):
        """Return ((obj_id, offset), [masked_12lead, mask_12lead], clean_target)
        for table row *index*."""
        row = self.table.loc[index]
        obj_id, origin_json = self._get_mai_json(row)
        aux_dict = self._get_aux_data(row)
        required_lead_type = (
            ast.literal_eval(row["lead_type"])
            if hasattr(row, "lead_type")
            else LeadType.__dict__["_member_names_"]
        )
        # Clean (un-masked) preprocessed signal is the reconstruction target.
        _, origin, _ = self.preprocessing(origin_json, aux_dict, required_lead_type)
        with open(row["digitized_path"], "rb") as digitized_file:
            digitized = np.array(json.load(digitized_file))
        # 12 leads + rhythm strip expected (NOTE: assert is stripped under -O).
        assert len(digitized) == 13
        digitized, mask = self.apply_random_mask(
            digitized,
            obj_id=obj_id[0],
            deterministic=self.dataset_params.deterministic_masking,
        )
        digitized = torch.tensor(digitized, dtype=torch.float32)
        mask = torch.tensor(mask, dtype=torch.float32)
        return obj_id, [digitized, mask], origin

    def apply_random_mask(
        self, digitized: np.ndarray, obj_id: str = "", deterministic: bool = False
    ):
        """
        digitized: (13, 5000)
        return:
            masked_signal: (12, 5000)
            mask: (12, 5000) (1 = invisible, 0 = visible)
        """

        def _seed_rng(s: str):
            # Hash the object id into a stable 32-bit seed for reproducible masks.
            h = hashlib.sha256(s.encode()).hexdigest()
            return np.random.default_rng(int(h[:16], 16) % (2**32))

        # -------------------------
        # RNG selection
        # -------------------------
        if deterministic:
            rng = _seed_rng(obj_id)  # -> deterministic masking
        else:
            # -> draw a fresh mask every time while training
            if self.stage == "train":
                rng = np.random.default_rng()
            else:
                rng = _seed_rng(obj_id)
        fs = 500
        group_len = 1250  # 2.5s * fs
        total_len = 5000  # 10s * fs
        visible = np.zeros_like(digitized, dtype=np.float16)
        # each lead masking: per 2.5s column group, one random visible window
        # (>= 1.25s) shared by that group's three leads
        for g in range(4):
            vis_len = int(rng.uniform(1.25 * fs, group_len + 1))
            max_offset = group_len - vis_len
            offset = int(rng.uniform(0, max_offset + 1))
            start = g * group_len + offset
            end = start + vis_len
            for lead in range(g * 3, g * 3 + 3):
                visible[lead, start:end] = 1
        # rhythm strip masking: hide up to 1s at each end of lead 13
        left_mask = int(rng.uniform(0, 1 * fs + 1))
        right_mask = int(rng.uniform(0, 1 * fs + 1))
        rs_start = left_mask
        rs_end = total_len - right_mask
        visible[12, rs_start:rs_end] = 1
        masked = digitized * visible
        mask = 1 - visible
        # Replace Lead II with the (masked) rhythm strip.
        target_lead = 1  # Lead II
        masked[target_lead] = masked[12]
        mask[target_lead] = mask[12]
        # -------------------------
        # return only the final 12 leads
        # -------------------------
        masked = masked[:12]
        mask = mask[:12]
        return masked, mask