Compare commits

...

1 Commit

Author SHA1 Message Date
coolneng 07776a0538
Perform one hot encoding on the sequences 2021-06-25 00:04:01 +02:00
1 changed file with 2 additions and 2 deletions

View File

@@ -3,8 +3,7 @@ from typing import Dict, List, Tuple
from Bio.pairwise2 import align from Bio.pairwise2 import align
from Bio.SeqIO import parse from Bio.SeqIO import parse
from numpy.random import random from numpy.random import random
from tensorflow import Tensor, int64 from tensorflow import Tensor, int64, one_hot
from tensorflow.data import TFRecordDataset
from tensorflow.data import AUTOTUNE, TFRecordDataset from tensorflow.data import AUTOTUNE, TFRecordDataset
from tensorflow.io import TFRecordWriter, VarLenFeature, parse_single_example from tensorflow.io import TFRecordWriter, VarLenFeature, parse_single_example
from tensorflow.sparse import to_dense from tensorflow.sparse import to_dense
@@ -84,6 +83,7 @@ def transform_features(parsed_features) -> Dict[str, Tensor]:
sparse_features = ["sequence", "label"] sparse_features = ["sequence", "label"]
for element in sparse_features: for element in sparse_features:
features[element] = to_dense(parsed_features[element]) features[element] = to_dense(parsed_features[element])
features[element] = one_hot(features[element], depth=len(BASES))
return features return features