diff --git a/orcasong_contrib/data_tools/make_data_split/make_data_split.py b/orcasong_contrib/data_tools/make_data_split/make_data_split.py
index f278fa3b125e282c36158e43e3bac7544c323092..65e68a01198a6afbe37d25190d00f2f0311cc6aa 100644
--- a/orcasong_contrib/data_tools/make_data_split/make_data_split.py
+++ b/orcasong_contrib/data_tools/make_data_split/make_data_split.py
@@ -22,7 +22,7 @@ import toml
 import docopt
 import natsort as ns
 import h5py
-
+import random
 
 def parse_input():
     """
@@ -92,7 +92,9 @@ def get_h5_filepaths(dirpath):
         if f.endswith('.h5'):
             filepaths.append(dirpath + '/' + f)
 
-    filepaths = ns.natsorted(filepaths)  # TODO should not be necessary actually!
+    # Shuffle with a fixed seed (42): randomized, but repeatable for the same input order.
+    random.Random(42).shuffle(filepaths)
+    
     return filepaths