Taykhoom committed on
Commit
fc7070b
·
verified ·
1 Parent(s): 5c51c76

Upload README.md with huggingface_hub

Browse files
Files changed (1) hide show
  1. README.md +3 -0
README.md CHANGED
@@ -65,6 +65,9 @@ sequences = [
65
  "GGGUGCGAUCAUACCAGCACUAAUGCCCUCCUGGGAAGUCCUCGUGUUGCACCCCU",
66
  "AUCGGGCUUAGCAUAGCUU",
67
  ]
 
 
 
68
  enc = tokenizer(sequences, return_tensors="pt", padding=True)
69
 
70
  with torch.no_grad():
 
65
  "GGGUGCGAUCAUACCAGCACUAAUGCCCUCCUGGGAAGUCCUCGUGUUGCACCCCU",
66
  "AUCGGGCUUAGCAUAGCUU",
67
  ]
68
+ # RNA-FM was trained on RNA sequences (U not T). T is not in the vocabulary.
69
+ # If your sequences use DNA notation, convert first:
70
+ # sequences = [s.replace("T", "U") for s in sequences]
71
  enc = tokenizer(sequences, return_tensors="pt", padding=True)
72
 
73
  with torch.no_grad():