Notebook
# Removing invalid samples - already done duplicate_dict = {} rows_to_delete = [] count = 0 for i in range(seqs.shape[0]): if 'X' in seqs[i] \ or 'U' in seqs[i] \ or '3CO' in target[i]\ or '3NI' in target[i] \ or 'FE2'in target[i] \ or 'CU1'in target[i]\ or 'MN3' in target[i] \ or np.isnan(cluster_numbers[i]): rows_to_delete.append(i) count +=1 elif seqs[i] not in duplicate_dict.keys(): duplicate_dict[seqs[i]] = target[i] else: if target[i] != duplicate_dict[seqs[i]]: rows_to_delete.append(i) count +=1 # df = df.drop(df.index[rows_to_delete]) # df.to_parquet('Metal_all_20180601.parquet') seqs = np.delete(seqs, rows_to_delete, 0) target = np.delete(target, rows_to_delete) cluster_numbers = np.delete(cluster_numbers, rows_to_delete)
from keras.models import model_from_json # load json and create model json_file = open('./models/metal_predict.json', 'r') loaded_model_json = json_file.read() json_file.close() model = model_from_json(loaded_model_json) # load weights into new model model.load_weights("./models/metal_predict.h5") print("Loaded model from disk")