PierreHanna commited on
Commit
8d66428
·
1 Parent(s): e628964

Delete models.py

Browse files
Files changed (1) hide show
  1. models.py +0 -382
models.py DELETED
@@ -1,382 +0,0 @@
1
- import tensorflow as tf
2
- from tensorflow.keras.layers import BatchNormalization, Concatenate
3
- from tensorflow.keras.layers import Lambda, Flatten, Dense
4
- from tensorflow.keras.initializers import glorot_uniform, RandomNormal, Zeros, HeNormal, Constant
5
- from tensorflow.keras.layers import Input, Subtract, Dense, Lambda, Dropout,LeakyReLU, ReLU, PReLU, Attention
6
- from tensorflow.keras.models import Sequential
7
- from tensorflow.keras.layers import Conv2D, Conv1D, ZeroPadding2D, Activation, Input, concatenate, ConvLSTM2D, LSTM
8
- from tensorflow.keras.layers import AveragePooling1D, MaxPooling1D, GlobalMaxPooling1D, GlobalMaxPooling2D, TimeDistributed, GlobalAveragePooling1D
9
- from tensorflow.keras.layers import MaxPooling2D, AveragePooling2D, GlobalAveragePooling2D, UpSampling1D, Reshape
10
- from tensorflow.keras.models import Model
11
- from tensorflow.keras.layers import Conv2D, Conv1D, ZeroPadding2D, Activation, Multiply, Add, MaxPool1D, Permute
12
- from keras import backend as K
13
- import tensorflow_addons as tfa
14
- import numpy as np
15
-
16
-
17
- MARGIN = 0.5
18
- DIM_OUT = 1024
19
-
20
- def triplet_loss_new(y_true, y_pred):
21
- anchor, positive, negative = y_pred[:,:DIM_OUT], y_pred[:,DIM_OUT:2*DIM_OUT], y_pred[:,2*DIM_OUT:]
22
- positive_dist = K.sum(K.square(anchor-positive), axis=-1)
23
- negative_dist = K.sum(K.square(anchor-negative), axis=-1)
24
- return K.sum(K.maximum(positive_dist - negative_dist + MARGIN, 0), axis=0)
25
-
26
-
27
-
28
- # Define the contrastive loss function, NT_Xent (Tensorflow version)
29
- def nt_xent_loss_4(y_true, y_pred, tau=0.07):
30
- '''call
31
-
32
- Calculates the infonce loss described in SimCLR
33
- https://arxiv.org/abs/2002.05709
34
-
35
- Args:
36
- z1 (tf.Tensor): The embeddings, view 1 (half of batch)
37
- z2 (tf.Tensor): The embeddings, view 2 (half of batch)
38
-
39
- Returns:
40
- tf.Tensor: The loss
41
- '''
42
- z1 = y_pred[:,:DIM_OUT]
43
- z2 = y_pred[:,DIM_OUT:2*DIM_OUT]
44
-
45
- # Combine the two embeddings
46
- z = tf.concat([z1, z2], axis=0)
47
-
48
- # Normalize each row
49
- z = tf.math.l2_normalize(z, axis=1)
50
-
51
- batch_size = tf.shape(z)[0]
52
- ones = tf.ones((batch_size // 2, ))
53
- labels = tf.experimental.numpy.diagflat(ones, batch_size // 2) + \
54
- tf.experimental.numpy.diagflat(ones, -batch_size // 2)
55
-
56
- # Similarity matrix
57
- sim_m = z @ tf.transpose(z)
58
-
59
- # Setting diagonal to -1
60
- sim_m = tf.linalg.set_diag(sim_m, -tf.ones((batch_size, )))
61
-
62
- # Crossentropy
63
- sim_m = sim_m / tau
64
- entropy = tf.multiply(-labels, tf.nn.log_softmax(sim_m, axis=1))
65
-
66
- return tf.reduce_mean(tf.reduce_sum(entropy, axis=1))
67
-
68
-
69
- # Define the contrastive loss function, NT_Xent (Tensorflow version)
70
- def nt_xent_loss_3(y_true, y_pred, tau=0.07):
71
- """ Calculates the contrastive loss of the input data using NT_Xent. The
72
- equation can be found in the paper: https://arxiv.org/pdf/2002.05709.pdf
73
- (This is the Tensorflow implementation of the standard numpy version found
74
- in the NT_Xent function).
75
-
76
- Args:
77
- zi: One half of the input data, shape = (batch_size, feature_1, feature_2, ..., feature_N)
78
- zj: Other half of the input data, must have the same shape as zi
79
- tau: Temperature parameter (a constant), default = 1.
80
-
81
- Returns:
82
- loss: The complete NT_Xent constrastive loss
83
- """
84
- zi = y_pred[:,:DIM_OUT]
85
- zj = y_pred[:,DIM_OUT:2*DIM_OUT]
86
-
87
- z = tf.cast(tf.concat((zi, zj), 0), dtype=tf.float32)
88
- loss = 0
89
- for k in range(zi.shape[0]):
90
- # Numerator (compare i,j & j,i)
91
- i = k
92
- j = k + zi.shape[0]
93
- # Instantiate the cosine similarity loss function
94
- cosine_sim = tf.keras.losses.CosineSimilarity(axis=-1, reduction=tf.keras.losses.Reduction.NONE)
95
- sim = tf.squeeze(- cosine_sim(tf.reshape(z[i], (1, -1)), tf.reshape(z[j], (1, -1))))
96
- numerator = tf.math.exp(sim / tau)
97
-
98
- # Denominator (compare i & j to all samples apart from themselves)
99
- sim_ik = - cosine_sim(tf.reshape(z[i], (1, -1)), z[tf.range(z.shape[0]) != i])
100
- sim_jk = - cosine_sim(tf.reshape(z[j], (1, -1)), z[tf.range(z.shape[0]) != j])
101
- denominator_ik = tf.reduce_sum(tf.math.exp(sim_ik / tau))
102
- denominator_jk = tf.reduce_sum(tf.math.exp(sim_jk / tau))
103
-
104
- # Calculate individual and combined losses
105
- loss_ij = - tf.math.log(numerator / denominator_ik)
106
- loss_ji = - tf.math.log(numerator / denominator_jk)
107
- loss += loss_ij + loss_ji
108
-
109
- # Divide by the total number of samples
110
- loss /= z.shape[0]
111
-
112
- return loss
113
-
114
- def nt_xent_loss_2(y_true, y_pred, temperature=0.07):
115
- # InfoNCE loss (information noise-contrastive estimation)
116
- # NT-Xent loss (normalized temperature-scaled cross entropy)
117
-
118
- projections_1 = y_pred[:,:DIM_OUT]
119
- projections_2 = y_pred[:,DIM_OUT:2*DIM_OUT]
120
-
121
- # Cosine similarity: the dot product of the l2-normalized feature vectors
122
- projections_1 = tf.math.l2_normalize(projections_1, axis=1)
123
- projections_2 = tf.math.l2_normalize(projections_2, axis=1)
124
- similarities = (
125
- tf.matmul(projections_1, projections_2, transpose_b=True) / temperature
126
- )
127
-
128
- # The similarity between the representations of two augmented views of the
129
- # same image should be higher than their similarity with other views
130
- batch_size = tf.shape(projections_1)[0]
131
- contrastive_labels = tf.range(batch_size)
132
- contrastive_accuracy = tf.keras.metrics.SparseCategoricalAccuracy()
133
- contrastive_accuracy.update_state(contrastive_labels, similarities)
134
- contrastive_accuracy.update_state(
135
- contrastive_labels, tf.transpose(similarities)
136
- )
137
-
138
- # The temperature-scaled similarities are used as logits for cross-entropy
139
- # a symmetrized version of the loss is used here
140
- loss_1_2 = tf.keras.losses.sparse_categorical_crossentropy(
141
- contrastive_labels, similarities, from_logits=True
142
- )
143
- loss_2_1 = tf.keras.losses.sparse_categorical_crossentropy(
144
- contrastive_labels, tf.transpose(similarities), from_logits=True
145
- )
146
- return (loss_1_2 + loss_2_1) / 2
147
-
148
-
149
- #def contrastive_loss(xi, xj, tau=1, normalize=False):
150
- ################# ERROR IN THIS VERSION ???
151
- def nt_xent_loss(y_true, y_pred, tau=0.07, normalize=False):
152
- ''' this loss is the modified torch implementation by M Diephuis here: https://github.com/mdiephuis/SimCLR/
153
- the inputs:
154
- xi, xj: image features extracted from a batch of images 2N, composed of N matching paints
155
- tau: temperature parameter
156
- normalize: normalize or not. seem to not be very useful, so better to try without.
157
- '''
158
-
159
- xi = y_pred[:,:DIM_OUT]
160
- xj = y_pred[:,DIM_OUT:2*DIM_OUT]
161
-
162
- #xi=tf.transpose(xi)
163
- #xj=tf.transpose(xj)
164
- x = tf.keras.backend.concatenate((xi, xj), axis=0)
165
-
166
- #print(xi.shape)
167
- #print(x.shape)
168
-
169
- sim_mat = tf.keras.backend.dot(x, tf.keras.backend.transpose(x))
170
-
171
- if normalize:
172
- sim_mat_denom = tf.keras.backend.dot(tf.keras.backend.l2_normalize(x, axis=1).unsqueeze(1), tf.keras.backend.l2_normalize(x, axis=1).unsqueeze(1).T)
173
- sim_mat = sim_mat / sim_mat_denom.clamp(min=1e-16)
174
-
175
- sim_mat = tf.keras.backend.exp(sim_mat /tau)
176
-
177
-
178
- if normalize:
179
- sim_mat_denom = tf.keras.backend.l2_normalize(xi, dim=1) * tf.keras.backend.l2_normalize(xj, axis=1)
180
- sim_match = tf.keras.backend.exp(tf.keras.backend.sum(xi * xj, axis=-1) / sim_mat_denom / tau)
181
- else:
182
- sim_match = tf.keras.backend.exp(tf.keras.backend.sum(xi * xj, axis=-1) / tau)
183
-
184
-
185
- sim_match = tf.keras.backend.concatenate((sim_match, sim_match), axis=0)
186
-
187
- #print(tf.keras.backend.shape(x)[0])
188
- norm_sum = tf.keras.backend.exp(tf.keras.backend.ones(tf.keras.backend.shape(x)[0]) / tau)
189
-
190
- #norm_sum = tf.keras.backend.ones(12) # NON
191
- #norm_sum = tf.keras.backend.exp(32/ tau) #OK
192
- #norm_sum = tf.keras.backend.shape(x)[0] #OK
193
-
194
-
195
- #return K.sum(xi)
196
- return tf.math.reduce_mean(-tf.keras.backend.log(sim_match / (tf.keras.backend.sum(sim_mat, axis=-1) - norm_sum)))
197
-
198
-
199
-
200
-
201
- def create_encoder_model_audio(in_shape, dim, final_activ):
202
- #return create_encoder_model_resnet_byte_1d(in_shape)
203
- return create_encoder_model_mlp(in_shape, dim, final_activ=final_activ) #1024
204
-
205
- def create_encoder_model_text(in_shape, dim, final_activ):
206
- #return create_encoder_model_resnet_byte_1d(in_shape)
207
- return create_encoder_model_mlp(in_shape, dim, final_activ=final_activ) #1024
208
-
209
-
210
-
211
-
212
- ######### RESNET 1D
213
- def residual_block_byte_1d(x, filters, activation="relu"):
214
- # Shortcut
215
- s = Conv1D(filters, 1, padding="same")(x)
216
- y = BatchNormalization()(s)
217
- y = Activation(activation)(y)
218
-
219
- y = Conv1D(filters, 3, padding="same")(y)
220
- y = BatchNormalization()(y)
221
- y = Conv1D(filters, 1, padding="same")(y)
222
- y = BatchNormalization()(y)
223
-
224
- y = Add()([y, s])
225
- y = Activation(activation)(y)
226
- return y
227
- #return MaxPool1D(pool_size=2, strides=2)(x)
228
-
229
- def create_encoder_model_resnet_byte_1d(input_shape):
230
-
231
- inputs = Input(shape=input_shape)
232
- x = Conv1D(32, 7, strides = 2, padding="same")(inputs)
233
- x = MaxPooling1D(pool_size=3, strides=2)(x)
234
-
235
- for i in range(3):
236
- x = residual_block_byte_1d(x, 32)
237
-
238
- for i in range(4):
239
- x = residual_block_byte_1d(x, 64)
240
-
241
- for i in range(6):
242
- x = residual_block_byte_1d(x, 128)
243
-
244
- for i in range(3):
245
- x = residual_block_byte_1d(x, 256)
246
-
247
- #print(x.shape)
248
-
249
- x = AveragePooling1D(pool_size=3, strides=3)(x)
250
-
251
- x = GlobalAveragePooling1D()(x)
252
- #x = Flatten()(x)
253
- x = Dense(DIM_OUT, activation="relu")(x)
254
-
255
- model = Dense(DIM_OUT, activation='sigmoid')(x)
256
- model = BatchNormalization()(model)
257
- model = Lambda(lambda x: K.l2_normalize(x,axis=-1))(model)
258
- model = Model(inputs=inputs,outputs=model)
259
- #model.summary()
260
-
261
- return model
262
-
263
- # simple MLP
264
- def create_encoder_model_mlp(input_shape, size1, final_activ=None):
265
-
266
- inputs = Input(shape=input_shape)
267
- x = Dense(size1, activation="relu")(inputs)
268
- x = Dropout(0.1)(x)
269
- #x = BatchNormalization()(x)
270
-
271
- '''
272
- x = Dense(1024, activation="relu")(x)
273
- x = Dropout(0.1)(x)
274
- x = Dense(1024, activation="relu")(x)
275
- x = Dropout(0.1)(x)
276
- x = Dense(1024, activation="relu")(x)
277
- x = Dropout(0.1)(x)
278
- x = Dense(1024, activation="relu")(x)
279
- x = Dropout(0.1)(x)
280
- '''
281
- #x = BatchNormalization()(x)
282
- #x = Dense(512, activation="relu")(x)
283
- #x = BatchNormalization()(x)
284
- '''
285
- if final_activ != None :
286
- model = Dense(DIM_OUT)(x)#, activation='sigmoid')(x)
287
- else :
288
- model = Dense(DIM_OUT, activation=final_activ)(x)
289
- '''
290
- model = Dense(DIM_OUT, activation=final_activ)(x)
291
- model = Dropout(0.1)(model)
292
- #model = BatchNormalization()(model)
293
- model = Lambda(lambda x: K.l2_normalize(x,axis=-1))(model)
294
- model = Model(inputs=inputs,outputs=model)
295
- model.summary()
296
-
297
- return model
298
-
299
- def make_bert_preprocess_model(sentence_features, tfhub_handle_preprocess, seq_length=128):
300
- """Returns Model mapping string features to BERT inputs.
301
- """
302
-
303
- input_segments = [
304
- tf.keras.layers.Input(shape=(), dtype=tf.string, name=ft)
305
- for ft in sentence_features]
306
-
307
- bert_preprocess = hub.load(tfhub_handle_preprocess)
308
- tokenizer = hub.KerasLayer(bert_preprocess.tokenize, name='tokenizer')
309
- segments = [tokenizer(s) for s in input_segments]
310
-
311
- truncated_segments = segments
312
- packer = hub.KerasLayer(bert_preprocess.bert_pack_inputs,
313
- arguments=dict(seq_length=seq_length),
314
- name='packer')
315
- model_inputs = packer(truncated_segments)
316
- return tf.keras.Model(input_segments, model_inputs)
317
-
318
- def process(prompt, lang):
319
-
320
- # Getting prompt user
321
- #prompt = input("Audio Search - enter text : ")
322
- #print(prompt)
323
-
324
- # prompt embedding
325
- bert_model_name = 'small_bert/bert_en_uncased_L-4_H-512_A-8'
326
- tfhub_handle_encoder = 'https://tfhub.dev/tensorflow/small_bert/bert_en_uncased_L-4_H-512_A-8/1'
327
- tfhub_handle_preprocess = 'https://tfhub.dev/tensorflow/bert_en_uncased_preprocess/3'
328
-
329
- MAX_LENGTH = 130 # MAX de 512 !!! TENSORFLOW !!!
330
- TOP = 10
331
-
332
-
333
- bert_preprocess_model = make_bert_preprocess_model(['my_input'], tfhub_handle_preprocess, seq_length = MAX_LENGTH)
334
- bert_model = hub.KerasLayer(tfhub_handle_encoder)
335
-
336
- now = datetime.datetime.now()
337
- print()
338
- print('*************')
339
- print("Current Time: ", str(now))
340
- print("Text input : ", prompt)
341
- print('*************')
342
- print()
343
- prompt=[prompt]
344
- text_preprocessed = bert_preprocess_model([np.array(prompt)])
345
- embed_prompt = bert_model(text_preprocessed)
346
- print(" text representation computed.")
347
-
348
- # Embed text
349
- #from models import *
350
- encoder_text = tf.keras.models.load_model(encoder_text_path)
351
- embed_query = encoder_text.predict(embed_prompt["pooled_output"])
352
- faiss.normalize_L2(embed_query)
353
- print(" text embed computed.")
354
-
355
- # load embed audio catalog
356
- index = faiss.read_index("BMG_221022.index")
357
-
358
- # distance computing
359
- D, I = index.search(embed_query, TOP)
360
-
361
- # names index
362
- import joblib
363
- audio_names = joblib.load(open('BMG_221022_names.index', 'rb'))
364
-
365
- #url
366
- url_dict={}
367
- with open("bmg_clean.csv") as csv_file:
368
- csv_reader = csv.reader(csv_file, delimiter=';')
369
- for row in csv_reader:
370
- f = row[2].split('/')[-1]
371
- url_dict[f.split('/')[-1][:-4]] = row[2]
372
-
373
- # output : top N audio file names
374
- print(I)
375
- print(D)
376
- print("----")
377
- for i in range(len(I[0])):
378
- print(audio_names[I[0][i]], " with distance ", D[0][i])
379
- print(" url : ", url_dict[audio_names[I[0][i]]])
380
-
381
-
382
- return [url_dict[audio_names[I[0][0]]], url_dict[audio_names[I[0][1]]], url_dict[audio_names[I[0][2]]], url_dict[audio_names[I[0][3]]], url_dict[audio_names[I[0][4]]]]