auditok: demos/audio_tokenize

comparison demos/audio_tokenize_demo.py @ 10:9be2d0ca4c00

Python 3.x support

author	Amine Sehili <amine.sehili@gmail.com>
date	Tue, 24 Nov 2015 01:57:53 +0100
parents	edee860b9f61
children	421d2f534c14

comparison

equal deleted inserted replaced

-:c2ddae4d2c36
+:9be2d0ca4c00
 @author: Amine SEHILI <amine.sehili@gmail.com>
 September, 2015
 """
 from auditok import ADSFactory, AudioEnergyValidator, StreamTokenizer, player_for, dataset
+import sys
-# We set the `record` argument to True so that we can rewind the source
+try:
-asource = ADSFactory.ads(filename=dataset.one_to_six_arabic_16000_mono_bc_noise, record=True)
-validator = AudioEnergyValidator(sample_width=asource.get_sample_width(), energy_threshold=65)
+# We set the `record` argument to True so that we can rewind the source
+asource = ADSFactory.ads(filename=dataset.one_to_six_arabic_16000_mono_bc_noise, record=True)
-# Defalut analysis window is 10 ms (float(asource.get_block_size()) / asource.get_sampling_rate())
+validator = AudioEnergyValidator(sample_width=asource.get_sample_width(), energy_threshold=65)
-# min_length=20 : minimum length of a valid audio activity is 20 * 10 == 200 ms
-# max_length=400 :  maximum length of a valid audio activity is 400 * 10 == 4000 ms == 4 seconds
-# max_continuous_silence=30 : maximum length of a tolerated  silence within a valid audio activity is 30 * 30 == 300 ms
-tokenizer = StreamTokenizer(validator=validator, min_length=20, max_length=400, max_continuous_silence=30)
-asource.open()
+# Defalut analysis window is 10 ms (float(asource.get_block_size()) / asource.get_sampling_rate())
-tokens = tokenizer.tokenize(asource)
+# min_length=20 : minimum length of a valid audio activity is 20 * 10 == 200 ms
+# max_length=400 :  maximum length of a valid audio activity is 400 * 10 == 4000 ms == 4 seconds
+# max_continuous_silence=30 : maximum length of a tolerated  silence within a valid audio activity is 30 * 30 == 300 ms
+tokenizer = StreamTokenizer(validator=validator, min_length=20, max_length=400, max_continuous_silence=30)
-# Play detected regions back
+asource.open()
+tokens = tokenizer.tokenize(asource)
-player = player_for(asource)
+# Play detected regions back
-# Rewind and read the whole signal
+player = player_for(asource)
-asource.rewind()
-original_signal = []
-while True:
+# Rewind and read the whole signal
-w = asource.read()
+asource.rewind()
-if w is None:
+original_signal = []
-break
-original_signal.append(w)
-original_signal = ''.join(original_signal)
+while True:
+w = asource.read()
+if w is None:
+break
+original_signal.append(w)
-print("\n ** Playing original file...")
+original_signal = b''.join(original_signal)
 player.play(original_signal)
 print("\n ** playing detected regions...\n")
 for i,t in enumerate(tokens):
 print("Token [{0}] starts at {1} and ends at {2}".format(i+1, t[1], t[2]))
-data = ''.join(t[0])
+data = b''.join(t[0])
 player.play(data)
 assert len(tokens) == 8
 asource.close()
 player.stop()
+except KeyboardInterrupt:
+player.stop()
+asource.close()
+sys.exit(0)
+"""
+except Exception as e:
+sys.stderr.write(str(e) + "\n")
+sys.exit(1)
+"""

Mercurial > hg > auditok

comparison demos/audio_tokenize_demo.py @ 10:9be2d0ca4c00