Skip to content

Commit 305ec02

Browse files
committed
Speed up sampling
1 parent e950d08 commit 305ec02

File tree

1 file changed

+2
-2
lines changed

1 file changed

+2
-2
lines changed

sample.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -110,10 +110,10 @@ def do_sample(source, train_ratio, sorting="random", tw=None):
110110
num_train_logs = math.ceil(train_ratio * len(sequences_extracted['Normal']))
111111
if sorting == "random":
112112
print('Randomly selecting ' + str(num_train_logs) + ' sequences from ' + str(len(sequences_extracted['Normal'])) + ' normal sequences for training')
113-
train_seq_id_list = random.sample(list(sequences_extracted['Normal'].keys()), num_train_logs)
113+
train_seq_id_list = set(random.sample(list(sequences_extracted['Normal'].keys()), num_train_logs))
114114
elif sorting == "chronological":
115115
print('Chronologically selecting ' + str(num_train_logs) + ' sequences from ' + str(len(sequences_extracted['Normal'])) + ' normal sequences for training')
116-
train_seq_id_list = list(sequences_extracted['Normal'].keys())[:num_train_logs]
116+
train_seq_id_list = set(list(sequences_extracted['Normal'].keys())[:num_train_logs])
117117
else:
118118
print("Warning: Unknown sorting mode!")
119119
print('Write vector files ...')

0 commit comments

Comments
 (0)