annotate tests/test_core.py @ 236:8c92420d15d5

Raise ValueError for too small analysis window
author Amine Sehili <amine.sehili@gmail.com>
date Fri, 19 Jul 2019 23:24:17 +0100
parents d8267b3334f0
children c684f90cc3cd
rev   line source
amine@192 1 import os
amine@221 2 import math
amine@88 3 from random import random
amine@192 4 from tempfile import TemporaryDirectory
amine@221 5 from unittest import TestCase
amine@86 6 from genty import genty, genty_dataset
amine@207 7 from auditok import split, AudioRegion, AudioParameterError
amine@215 8 from auditok.core import _duration_to_nb_windows
amine@212 9 from auditok.util import AudioDataSource
amine@210 10 from auditok.io import (
amine@210 11 _normalize_use_channel,
amine@210 12 _extract_selected_channel,
amine@210 13 get_audio_source,
amine@210 14 )
amine@86 15
amine@86 16
amine@88 17 def _make_random_length_regions(
amine@88 18 byte_seq, sampling_rate, sample_width, channels
amine@88 19 ):
amine@88 20 regions = []
amine@88 21 for b in byte_seq:
amine@88 22 duration = round(random() * 10, 6)
amine@95 23 data = b * int(duration * sampling_rate) * sample_width * channels
amine@88 24 start = round(random() * 13, 3)
amine@88 25 region = AudioRegion(
amine@88 26 data, start, sampling_rate, sample_width, channels
amine@88 27 )
amine@88 28 regions.append(region)
amine@88 29 return regions
amine@88 30
amine@88 31
@genty
class TestFunctions(TestCase):
    """Tests for the private helper `_duration_to_nb_windows`."""

    @genty_dataset(
        zero_duration=(0, 1, None, 0),
        multiple=(0.3, 0.1, round, 3),
        not_multiple_ceil=(0.35, 0.1, math.ceil, 4),
        not_multiple_floor=(0.35, 0.1, math.floor, 3),
        small_duration=(0.05, 0.1, round, 0),
        small_duration_ceil=(0.05, 0.1, math.ceil, 1),
        with_round_error=(0.3, 0.1, math.floor, 3, {"epsilon": 1e-6}),
        negative_duration=(-0.5, 0.1, math.ceil, ValueError),
        negative_analysis_window=(0.5, -0.1, math.ceil, ValueError),
    )
    def test_duration_to_nb_windows(
        self, duration, analysis_window, round_fn, expected, kwargs=None
    ):
        """Check the window count, or the ValueError, for one dataset entry.

        When `expected` is `ValueError` the call (made without `kwargs`)
        must raise it; otherwise the value returned with `kwargs` applied
        must equal `expected`.
        """
        if expected != ValueError:
            extra = {} if kwargs is None else kwargs
            nb_windows = _duration_to_nb_windows(
                duration, analysis_window, round_fn, **extra
            )
            self.assertEqual(nb_windows, expected)
            return

        with self.assertRaises(expected):
            _duration_to_nb_windows(duration, analysis_window, round_fn)
amine@215 58
amine@215 59
amine@215 60 @genty
amine@207 61 class TestSplit(TestCase):
amine@207 62 @genty_dataset(
amine@207 63 simple=(
amine@207 64 0.2,
amine@207 65 5,
amine@207 66 0.2,
amine@207 67 False,
amine@207 68 False,
amine@207 69 {"eth": 50},
amine@207 70 [(2, 16), (17, 31), (34, 76)],
amine@207 71 ),
amine@214 72 short_max_dur=(
amine@214 73 0.3,
amine@214 74 2,
amine@214 75 0.2,
amine@214 76 False,
amine@214 77 False,
amine@214 78 {"eth": 50},
amine@214 79 [(2, 16), (17, 31), (34, 54), (54, 74), (74, 76)],
amine@214 80 ),
amine@214 81 long_min_dur=(3, 5, 0.2, False, False, {"eth": 50}, [(34, 76)]),
amine@214 82 long_max_silence=(0.2, 80, 10, False, False, {"eth": 50}, [(2, 76)]),
amine@214 83 zero_max_silence=(
amine@214 84 0.2,
amine@214 85 5,
amine@214 86 0.0,
amine@214 87 False,
amine@214 88 False,
amine@214 89 {"eth": 50},
amine@214 90 [(2, 14), (17, 24), (26, 29), (34, 76)],
amine@214 91 ),
amine@207 92 low_energy_threshold=(
amine@207 93 0.2,
amine@207 94 5,
amine@207 95 0.2,
amine@207 96 False,
amine@207 97 False,
amine@207 98 {"energy_threshold": 40},
amine@207 99 [(0, 50), (50, 76)],
amine@207 100 ),
amine@207 101 high_energy_threshold=(
amine@207 102 0.2,
amine@207 103 5,
amine@207 104 0.2,
amine@207 105 False,
amine@207 106 False,
amine@207 107 {"energy_threshold": 60},
amine@207 108 [],
amine@207 109 ),
amine@207 110 trim_leading_and_trailing_silence=(
amine@207 111 0.2,
amine@207 112 10, # use long max_dur
amine@207 113 0.5, # and a max_silence longer than any inter-region silence
amine@207 114 True,
amine@207 115 False,
amine@207 116 {"eth": 50},
amine@207 117 [(2, 76)],
amine@207 118 ),
amine@207 119 drop_trailing_silence=(
amine@207 120 0.2,
amine@207 121 5,
amine@207 122 0.2,
amine@207 123 True,
amine@207 124 False,
amine@207 125 {"eth": 50},
amine@207 126 [(2, 14), (17, 29), (34, 76)],
amine@207 127 ),
amine@207 128 drop_trailing_silence_2=(
amine@207 129 1.5,
amine@207 130 5,
amine@207 131 0.2,
amine@207 132 True,
amine@207 133 False,
amine@207 134 {"eth": 50},
amine@207 135 [(34, 76)],
amine@207 136 ),
amine@207 137 strict_min_dur=(
amine@207 138 0.3,
amine@207 139 2,
amine@207 140 0.2,
amine@207 141 False,
amine@207 142 True,
amine@207 143 {"eth": 50},
amine@207 144 [(2, 16), (17, 31), (34, 54), (54, 74)],
amine@207 145 ),
amine@207 146 )
def test_split_params(
    self,
    min_dur,
    max_dur,
    max_silence,
    drop_trailing_silence,
    strict_min_dur,
    kwargs,
    expected,
):
    """Split the mono fixture positionally and compare every region.

    `expected` is a list of `(onset, offset)` pairs expressed in samples;
    each detected region must hold exactly the fixture bytes of the
    corresponding sample range.
    """
    with open("tests/data/test_split_10HZ_mono.raw", "rb") as fp:
        data = fp.read()

    detected = list(
        split(
            data,
            min_dur,
            max_dur,
            max_silence,
            drop_trailing_silence,
            strict_min_dur,
            analysis_window=0.1,
            sr=10,
            sw=2,
            ch=1,
            **kwargs
        )
    )
    err_msg = (
        "Wrong number of regions after split, expected: "
        "{}, found: {}".format(len(expected), len(detected))
    )
    self.assertEqual(len(detected), len(expected), err_msg)

    sample_width = 2
    for region, (onset, offset) in zip(detected, expected):
        # sample indices are converted to byte offsets in the raw data
        first_byte = onset * sample_width
        last_byte = offset * sample_width
        self.assertEqual(bytes(region), data[first_byte:last_byte])
amine@207 183
amine@211 184 @genty_dataset(
amine@211 185 stereo_all_default=(2, {}, [(2, 16), (17, 31), (34, 76)]),
amine@213 186 mono_max_read=(1, {"max_read": 5}, [(2, 16), (17, 31), (34, 50)]),
amine@213 187 mono_max_read_short_name=(1, {"mr": 5}, [(2, 16), (17, 31), (34, 50)]),
amine@211 188 mono_use_channel_1=(
amine@211 189 1,
amine@211 190 {"eth": 50, "use_channel": 1},
amine@211 191 [(2, 16), (17, 31), (34, 76)],
amine@211 192 ),
amine@211 193 mono_uc_1=(1, {"eth": 50, "uc": 1}, [(2, 16), (17, 31), (34, 76)]),
amine@211 194 mono_use_channel_left=(
amine@211 195 1,
amine@211 196 {"eth": 50, "use_channel": "left"},
amine@211 197 [(2, 16), (17, 31), (34, 76)],
amine@211 198 ),
amine@211 199 mono_uc_left=(
amine@211 200 1,
amine@211 201 {"eth": 50, "uc": "left"},
amine@211 202 [(2, 16), (17, 31), (34, 76)],
amine@211 203 ),
amine@211 204 mono_use_channel_None=(
amine@211 205 1,
amine@211 206 {"eth": 50, "use_channel": None},
amine@211 207 [(2, 16), (17, 31), (34, 76)],
amine@211 208 ),
amine@211 209 stereo_use_channel_1=(
amine@211 210 2,
amine@211 211 {"eth": 50, "use_channel": 1},
amine@211 212 [(2, 16), (17, 31), (34, 76)],
amine@211 213 ),
amine@211 214 stereo_use_channel_left=(
amine@211 215 2,
amine@211 216 {"eth": 50, "use_channel": "left"},
amine@211 217 [(2, 16), (17, 31), (34, 76)],
amine@211 218 ),
amine@211 219 stereo_use_channel_no_use_channel_given=(
amine@211 220 2,
amine@211 221 {"eth": 50},
amine@211 222 [(2, 16), (17, 31), (34, 76)],
amine@211 223 ),
amine@211 224 stereo_use_channel_minus_2=(
amine@211 225 2,
amine@211 226 {"eth": 50, "use_channel": -2},
amine@211 227 [(2, 16), (17, 31), (34, 76)],
amine@211 228 ),
amine@211 229 stereo_uc_2=(2, {"eth": 50, "uc": 2}, [(10, 32), (36, 76)]),
amine@211 230 stereo_use_channel_right=(
amine@211 231 2,
amine@211 232 {"eth": 50, "use_channel": "right"},
amine@211 233 [(10, 32), (36, 76)],
amine@211 234 ),
amine@211 235 stereo_uc_minus_1=(2, {"eth": 50, "uc": -1}, [(10, 32), (36, 76)]),
amine@213 236 mono_uc_mix=(
amine@213 237 1,
amine@213 238 {"eth": 50, "uc": "mix"},
amine@213 239 [(2, 16), (17, 31), (34, 76)],
amine@213 240 ),
amine@213 241 stereo_use_channel_mix=(
amine@213 242 2,
amine@213 243 {"energy_threshold": 53.5, "use_channel": "mix"},
amine@213 244 [(54, 76)],
amine@213 245 ),
amine@213 246 stereo_uc_mix=(2, {"eth": 52, "uc": "mix"}, [(17, 26), (54, 76)]),
amine@213 247 stereo_uc_mix_default_eth=(
amine@213 248 2,
amine@213 249 {"uc": "mix"},
amine@213 250 [(10, 16), (17, 31), (36, 76)],
amine@213 251 ),
amine@211 252 )
def test_split_kwargs(self, channels, kwargs, expected):
    """Check `split` with keyword-only options on mono or stereo data.

    The fixture file is chosen from `channels` (1 -> mono, otherwise
    stereo). `kwargs` carries the options under test (e.g. energy
    threshold, `use_channel`/`uc`, `max_read`/`mr`) and `expected` is a
    list of `(onset, offset)` pairs in samples.
    """
    mono_or_stereo = "mono" if channels == 1 else "stereo"
    filename = "tests/data/test_split_10HZ_{}.raw".format(mono_or_stereo)
    with open(filename, "rb") as fp:
        data = fp.read()

    regions = split(
        data,
        min_dur=0.2,
        max_dur=5,
        max_silence=0.2,
        drop_trailing_silence=False,
        strict_min_dur=False,
        analysis_window=0.1,
        sr=10,
        sw=2,
        ch=channels,
        **kwargs
    )
    regions = list(regions)
    sample_width = 2

    # extract channel of interest: for multichannel input the reference
    # data is replaced by the output of `_extract_selected_channel` so that
    # the expected sample offsets can be applied to it directly
    if channels != 1:
        use_channel = kwargs.get("use_channel", kwargs.get("uc"))
        use_channel = _normalize_use_channel(use_channel)
        data = _extract_selected_channel(
            data, channels, sample_width, use_channel=use_channel
        )
    err_msg = "Wrong number of regions after split, expected: "
    err_msg += "{}, found: {}".format(expected, regions)
    self.assertEqual(len(regions), len(expected), err_msg)
    for reg, exp in zip(regions, expected):
        onset, offset = exp
        exp_data = data[onset * sample_width : offset * sample_width]
        self.assertEqual(bytes(reg), exp_data)
amine@211 292
amine@212 293 @genty_dataset(
amine@220 294 mono_aw_0_2_max_silence_0_2=(
amine@220 295 0.2,
amine@220 296 5,
amine@220 297 0.2,
amine@220 298 1,
amine@220 299 {"uc": 1, "aw": 0.2},
amine@220 300 [(2, 30), (34, 76)],
amine@220 301 ),
amine@220 302 mono_aw_0_2_max_silence_0_3=(
amine@220 303 0.2,
amine@220 304 5,
amine@220 305 0.3,
amine@220 306 1,
amine@220 307 {"uc": 1, "aw": 0.2},
amine@227 308 [(2, 30), (34, 76)],
amine@220 309 ),
amine@220 310 mono_aw_0_2_max_silence_0_4=(
amine@220 311 0.2,
amine@220 312 5,
amine@227 313 0.4,
amine@220 314 1,
amine@220 315 {"uc": 1, "aw": 0.2},
amine@220 316 [(2, 32), (34, 76)],
amine@220 317 ),
amine@231 318 mono_aw_0_2_max_silence_0=(
amine@231 319 0.2,
amine@231 320 5,
amine@231 321 0,
amine@231 322 1,
amine@231 323 {"uc": 1, "aw": 0.2},
amine@231 324 [(2, 14), (16, 24), (26, 28), (34, 76)],
amine@231 325 ),
amine@220 326 mono_aw_0_2=(
amine@220 327 0.2,
amine@220 328 5,
amine@220 329 0.2,
amine@220 330 1,
amine@220 331 {"uc": 1, "aw": 0.2},
amine@220 332 [(2, 30), (34, 76)],
amine@220 333 ),
amine@231 334 mono_aw_0_3_max_silence_0=(
amine@231 335 0.3,
amine@231 336 5,
amine@231 337 0,
amine@231 338 1,
amine@231 339 {"uc": 1, "aw": 0.3},
amine@231 340 [(3, 12), (15, 24), (36, 76)],
amine@231 341 ),
amine@231 342 mono_aw_0_3_max_silence_0_3=(
amine@231 343 0.3,
amine@231 344 5,
amine@231 345 0.3,
amine@231 346 1,
amine@231 347 {"uc": 1, "aw": 0.3},
amine@231 348 [(3, 27), (36, 76)],
amine@231 349 ),
amine@231 350 mono_aw_0_3_max_silence_0_5=(
amine@231 351 0.3,
amine@231 352 5,
amine@231 353 0.5,
amine@231 354 1,
amine@231 355 {"uc": 1, "aw": 0.3},
amine@231 356 [(3, 27), (36, 76)],
amine@231 357 ),
amine@231 358 mono_aw_0_3_max_silence_0_6=(
amine@231 359 0.3,
amine@231 360 5,
amine@231 361 0.6,
amine@231 362 1,
amine@231 363 {"uc": 1, "aw": 0.3},
amine@231 364 [(3, 30), (36, 76)],
amine@231 365 ),
amine@231 366 mono_aw_0_4_max_silence_0=(
amine@231 367 0.2,
amine@231 368 5,
amine@232 369 0,
amine@231 370 1,
amine@231 371 {"uc": 1, "aw": 0.4},
amine@231 372 [(4, 12), (16, 24), (36, 76)],
amine@231 373 ),
amine@231 374 mono_aw_0_4_max_silence_0_3=(
amine@231 375 0.2,
amine@231 376 5,
amine@231 377 0.3,
amine@231 378 1,
amine@231 379 {"uc": 1, "aw": 0.4},
amine@231 380 [(4, 12), (16, 24), (36, 76)],
amine@231 381 ),
amine@231 382 mono_aw_0_4_max_silence_0_4=(
amine@231 383 0.2,
amine@231 384 5,
amine@231 385 0.4,
amine@231 386 1,
amine@231 387 {"uc": 1, "aw": 0.4},
amine@231 388 [(4, 28), (36, 76)],
amine@231 389 ),
amine@220 390 stereo_uc_1_analysis_window_0_2=(
amine@220 391 0.2,
amine@220 392 5,
amine@220 393 0.2,
amine@220 394 2,
amine@220 395 {"uc": 1, "analysis_window": 0.2},
amine@220 396 [(2, 30), (34, 76)],
amine@220 397 ),
amine@231 398 stereo_uc_2_analysis_window_0_2=(
amine@231 399 0.2,
amine@231 400 5,
amine@231 401 0.2,
amine@231 402 2,
amine@231 403 {"uc": 2, "analysis_window": 0.2},
amine@231 404 [(10, 32), (36, 76)],
amine@231 405 ),
amine@233 406 stereo_uc_mix_aw_0_1_max_silence_0=(
amine@233 407 0.2,
amine@233 408 5,
amine@233 409 0,
amine@233 410 2,
amine@233 411 {"uc": "mix", "analysis_window": 0.1},
amine@233 412 [(10, 14), (17, 24), (26, 29), (36, 76)],
amine@233 413 ),
amine@233 414 stereo_uc_mix_aw_0_1_max_silence_0_1=(
amine@233 415 0.2,
amine@233 416 5,
amine@233 417 0.1,
amine@233 418 2,
amine@233 419 {"uc": "mix", "analysis_window": 0.1},
amine@233 420 [(10, 15), (17, 25), (26, 30), (36, 76)],
amine@233 421 ),
amine@233 422 stereo_uc_mix_aw_0_1_max_silence_0_2=(
amine@233 423 0.2,
amine@233 424 5,
amine@233 425 0.2,
amine@233 426 2,
amine@233 427 {"uc": "mix", "analysis_window": 0.1},
amine@233 428 [(10, 16), (17, 31), (36, 76)],
amine@233 429 ),
amine@233 430 stereo_uc_mix_aw_0_1_max_silence_0_3=(
amine@233 431 0.2,
amine@233 432 5,
amine@233 433 0.3,
amine@233 434 2,
amine@233 435 {"uc": "mix", "analysis_window": 0.1},
amine@233 436 [(10, 32), (36, 76)],
amine@233 437 ),
amine@233 438 stereo_uc_mix_aw_0_2_max_silence_0_min_dur_0_3=(
amine@233 439 0.3,
amine@233 440 5,
amine@233 441 0,
amine@233 442 2,
amine@233 443 {"uc": "mix", "analysis_window": 0.2},
amine@233 444 [(10, 14), (16, 24), (36, 76)],
amine@233 445 ),
amine@233 446 stereo_uc_mix_aw_0_2_max_silence_0_min_dur_0_41=(
amine@233 447 0.41,
amine@233 448 5,
amine@233 449 0,
amine@233 450 2,
amine@233 451 {"uc": "mix", "analysis_window": 0.2},
amine@233 452 [(16, 24), (36, 76)],
amine@233 453 ),
amine@233 454 stereo_uc_mix_aw_0_2_max_silence_0_1=(
amine@233 455 0.2,
amine@233 456 5,
amine@233 457 0.1,
amine@233 458 2,
amine@233 459 {"uc": "mix", "analysis_window": 0.2},
amine@233 460 [(10, 14), (16, 24), (26, 28), (36, 76)],
amine@233 461 ),
amine@233 462 stereo_uc_mix_aw_0_2_max_silence_0_2=(
amine@233 463 0.2,
amine@233 464 5,
amine@233 465 0.2,
amine@233 466 2,
amine@233 467 {"uc": "mix", "analysis_window": 0.2},
amine@233 468 [(10, 30), (36, 76)],
amine@233 469 ),
amine@233 470 stereo_uc_mix_aw_0_2_max_silence_0_4=(
amine@233 471 0.2,
amine@233 472 5,
amine@233 473 0.4,
amine@233 474 2,
amine@233 475 {"uc": "mix", "analysis_window": 0.2},
amine@233 476 [(10, 32), (36, 76)],
amine@233 477 ),
amine@233 478 stereo_uc_mix_aw_0_2_max_silence_0_5=(
amine@233 479 0.2,
amine@233 480 5,
amine@233 481 0.5,
amine@233 482 2,
amine@233 483 {"uc": "mix", "analysis_window": 0.2},
amine@233 484 [(10, 32), (36, 76)],
amine@233 485 ),
amine@233 486 stereo_uc_mix_aw_0_2_max_silence_0_6=(
amine@233 487 0.2,
amine@233 488 5,
amine@233 489 0.6,
amine@233 490 2,
amine@233 491 {"uc": "mix", "analysis_window": 0.2},
amine@233 492 [(10, 34), (36, 76)],
amine@233 493 ),
amine@233 494 stereo_uc_mix_aw_0_3_max_silence_0=(
amine@233 495 0.2,
amine@233 496 5,
amine@233 497 0,
amine@233 498 2,
amine@233 499 {"uc": "mix", "analysis_window": 0.3},
amine@233 500 [(9, 24), (27, 30), (36, 76)],
amine@233 501 ),
amine@233 502 stereo_uc_mix_aw_0_3_max_silence_0_min_dur_0_3=(
amine@233 503 0.4,
amine@233 504 5,
amine@233 505 0,
amine@233 506 2,
amine@233 507 {"uc": "mix", "analysis_window": 0.3},
amine@233 508 [(9, 24), (36, 76)],
amine@233 509 ),
amine@233 510 stereo_uc_mix_aw_0_3_max_silence_0_6=(
amine@233 511 0.2,
amine@233 512 5,
amine@233 513 0.6,
amine@233 514 2,
amine@233 515 {"uc": "mix", "analysis_window": 0.3},
amine@233 516 [(9, 57), (57, 76)],
amine@233 517 ),
amine@233 518 stereo_uc_mix_aw_0_3_max_silence_0_6_max_dur_5_1=(
amine@233 519 0.2,
amine@233 520 5.1,
amine@233 521 0.6,
amine@233 522 2,
amine@233 523 {"uc": "mix", "analysis_window": 0.3},
amine@233 524 [(9, 60), (60, 76)],
amine@233 525 ),
amine@233 526 stereo_uc_mix_aw_0_3_max_silence_0_6_max_dur_5_2=(
amine@233 527 0.2,
amine@233 528 5.2,
amine@233 529 0.6,
amine@233 530 2,
amine@233 531 {"uc": "mix", "analysis_window": 0.3},
amine@233 532 [(9, 60), (60, 76)],
amine@233 533 ),
amine@233 534 stereo_uc_mix_aw_0_3_max_silence_0_6_max_dur_5_3=(
amine@233 535 0.2,
amine@233 536 5.3,
amine@233 537 0.6,
amine@233 538 2,
amine@233 539 {"uc": "mix", "analysis_window": 0.3},
amine@233 540 [(9, 60), (60, 76)],
amine@233 541 ),
amine@233 542 stereo_uc_mix_aw_0_3_max_silence_0_6_max_dur_5_4=(
amine@233 543 0.2,
amine@233 544 5.4,
amine@233 545 0.6,
amine@233 546 2,
amine@233 547 {"uc": "mix", "analysis_window": 0.3},
amine@233 548 [(9, 63), (63, 76)],
amine@233 549 ),
amine@233 550 stereo_uc_mix_aw_0_4_max_silence_0=(
amine@233 551 0.2,
amine@233 552 5,
amine@233 553 0,
amine@233 554 2,
amine@233 555 {"uc": "mix", "analysis_window": 0.4},
amine@233 556 [(16, 24), (36, 76)],
amine@233 557 ),
amine@233 558 stereo_uc_mix_aw_0_4_max_silence_0_3=(
amine@233 559 0.2,
amine@233 560 5,
amine@233 561 0.3,
amine@233 562 2,
amine@233 563 {"uc": "mix", "analysis_window": 0.4},
amine@233 564 [(16, 24), (36, 76)],
amine@233 565 ),
amine@233 566 stereo_uc_mix_aw_0_4_max_silence_0_4=(
amine@233 567 0.2,
amine@233 568 5,
amine@233 569 0.4,
amine@233 570 2,
amine@233 571 {"uc": "mix", "analysis_window": 0.4},
amine@233 572 [(16, 28), (36, 76)],
amine@233 573 ),
amine@220 574 )
def test_split_analysis_window(
    self, min_dur, max_dur, max_silence, channels, kwargs, expected
):
    """Check `split` for several analysis window sizes.

    The analysis window (`aw`/`analysis_window`) and the channel to use
    are supplied through `kwargs`; the fixture file is chosen from
    `channels` (1 -> mono, otherwise stereo). `expected` is a list of
    `(onset, offset)` pairs in samples.
    """
    mono_or_stereo = "mono" if channels == 1 else "stereo"
    filename = "tests/data/test_split_10HZ_{}.raw".format(mono_or_stereo)
    with open(filename, "rb") as fp:
        data = fp.read()

    regions = split(
        data,
        min_dur=min_dur,
        max_dur=max_dur,
        max_silence=max_silence,
        drop_trailing_silence=False,
        strict_min_dur=False,
        sr=10,
        sw=2,
        ch=channels,
        **kwargs
    )
    regions = list(regions)
    sample_width = 2

    # extract channel of interest: for multichannel input the reference
    # data is replaced by the output of `_extract_selected_channel` so that
    # the expected sample offsets can be applied to it directly
    if channels != 1:
        use_channel = kwargs.get("use_channel", kwargs.get("uc"))
        use_channel = _normalize_use_channel(use_channel)
        data = _extract_selected_channel(
            data, channels, sample_width, use_channel=use_channel
        )
    err_msg = "Wrong number of regions after split, expected: "
    err_msg += "{}, found: {}".format(expected, regions)
    self.assertEqual(len(regions), len(expected), err_msg)
    for reg, exp in zip(regions, expected):
        onset, offset = exp
        exp_data = data[onset * sample_width : offset * sample_width]
        self.assertEqual(bytes(reg), exp_data)
amine@220 615
amine@220 616 @genty_dataset(
amine@212 617 filename_audio_format=(
amine@212 618 "tests/data/test_split_10HZ_stereo.raw",
amine@212 619 {"audio_format": "raw", "sr": 10, "sw": 2, "ch": 2},
amine@212 620 ),
amine@212 621 filename_audio_format_short_name=(
amine@212 622 "tests/data/test_split_10HZ_stereo.raw",
amine@212 623 {"fmt": "raw", "sr": 10, "sw": 2, "ch": 2},
amine@212 624 ),
amine@212 625 filename_no_audio_format=(
amine@212 626 "tests/data/test_split_10HZ_stereo.raw",
amine@212 627 {"sr": 10, "sw": 2, "ch": 2},
amine@212 628 ),
amine@212 629 filename_no_long_audio_params=(
amine@212 630 "tests/data/test_split_10HZ_stereo.raw",
amine@212 631 {"sampling_rate": 10, "sample_width": 2, "channels": 2},
amine@212 632 ),
amine@212 633 bytes_=(
amine@212 634 open("tests/data/test_split_10HZ_stereo.raw", "rb").read(),
amine@212 635 {"sr": 10, "sw": 2, "ch": 2},
amine@212 636 ),
amine@212 637 audio_reader=(
amine@212 638 AudioDataSource(
amine@212 639 "tests/data/test_split_10HZ_stereo.raw",
amine@212 640 sr=10,
amine@212 641 sw=2,
amine@212 642 ch=2,
amine@212 643 block_dur=0.1,
amine@212 644 ),
amine@212 645 {},
amine@212 646 ),
amine@212 647 audio_region=(
amine@212 648 AudioRegion(
amine@212 649 open("tests/data/test_split_10HZ_stereo.raw", "rb").read(),
amine@212 650 0,
amine@212 651 10,
amine@212 652 2,
amine@212 653 2,
amine@212 654 ),
amine@212 655 {},
amine@212 656 ),
amine@212 657 audio_source=(
amine@212 658 get_audio_source(
amine@212 659 "tests/data/test_split_10HZ_stereo.raw", sr=10, sw=2, ch=2
amine@212 660 ),
amine@212 661 {},
amine@212 662 ),
amine@212 663 )
def test_split_input_type(self, input, kwargs):
    """Check that `split` yields the same regions for every input type.

    `input` is whatever the dataset supplies (file name, bytes or an
    audio object) and `kwargs` the audio parameters that input needs.
    The regions are compared against the mono fixture file.
    """
    expected = [(2, 16), (17, 31), (34, 76)]
    sample_width = 2

    with open("tests/data/test_split_10HZ_mono.raw", "rb") as fp:
        data = fp.read()

    detected = list(
        split(
            input,
            min_dur=0.2,
            max_dur=5,
            max_silence=0.2,
            drop_trailing_silence=False,
            strict_min_dur=False,
            analysis_window=0.1,
            **kwargs
        )
    )
    err_msg = (
        "Wrong number of regions after split, expected: "
        "{}, found: {}".format(expected, detected)
    )
    self.assertEqual(len(detected), len(expected), err_msg)
    for region, (onset, offset) in zip(detected, expected):
        reference = data[onset * sample_width : offset * sample_width]
        self.assertEqual(bytes(region), reference)
amine@211 689
amine@223 690 @genty_dataset(
amine@223 691 min_dur_greater_than_max_dur=(0.5, 0.4, 0.1),
amine@223 692 durations_OK_but_wrong_number_of_analysis_windows=(0.44, 0.49, 0.1),
amine@223 693 )
def test_split_wrong_min_max_dur(self, min_dur, max_dur, analysis_window):
    """`split` must raise ValueError when `min_dur` needs more analysis
    windows than `max_dur` allows, and the message must spell out both
    window counts.
    """
    with self.assertRaises(ValueError) as val_err:
        split(
            b"0" * 16,
            min_dur=min_dur,
            max_dur=max_dur,
            max_silence=0.2,
            sr=16000,
            sw=1,
            ch=1,
            analysis_window=analysis_window,
        )

    template = (
        "'min_dur' ({0} sec.) results in {1} analysis "
        "window(s) ({1} == ceil({0} / {2})) which is "
        "higher than the number of analysis window(s) for "
        "'max_dur' ({3} == floor({4} / {2}))"
    )
    nb_min_windows = math.ceil(min_dur / analysis_window)
    nb_max_windows = math.floor(max_dur / analysis_window)
    err_msg = template.format(
        min_dur, nb_min_windows, analysis_window, nb_max_windows, max_dur
    )
    self.assertEqual(err_msg, str(val_err.exception))
amine@223 721
amine@224 722 @genty_dataset(
amine@224 723 max_silence_equals_max_dur=(0.5, 0.5, 0.1),
amine@224 724 max_silence_greater_than_max_dur=(0.5, 0.4, 0.1),
amine@224 725 durations_OK_but_wrong_number_of_analysis_windows=(0.44, 0.49, 0.1),
amine@224 726 )
def test_split_wrong_max_silence_max_dur(
    self, max_silence, max_dur, analysis_window
):
    """`split` must raise ValueError when `max_silence` covers at least as
    many analysis windows as `max_dur`, and the message must spell out
    both window counts.
    """
    with self.assertRaises(ValueError) as val_err:
        split(
            b"0" * 16,
            min_dur=0.2,
            max_dur=max_dur,
            max_silence=max_silence,
            sr=16000,
            sw=1,
            ch=1,
            analysis_window=analysis_window,
        )

    template = (
        "'max_silence' ({0} sec.) results in {1} analysis "
        "window(s) ({1} == floor({0} / {2})) which is "
        "higher or equal to the number of analysis window(s) for "
        "'max_dur' ({3} == floor({4} / {2}))"
    )
    nb_silence_windows = math.floor(max_silence / analysis_window)
    nb_max_windows = math.floor(max_dur / analysis_window)
    err_msg = template.format(
        max_silence,
        nb_silence_windows,
        analysis_window,
        nb_max_windows,
        max_dur,
    )
    self.assertEqual(err_msg, str(val_err.exception))
amine@224 756
amine@226 757 @genty_dataset(
amine@226 758 negative_min_dur=({"min_dur": -1},),
amine@226 759 zero_min_dur=({"min_dur": 0},),
amine@226 760 negative_max_dur=({"max_dur": -1},),
amine@226 761 zero_max_dur=({"max_dur": 0},),
amine@226 762 negative_max_silence=({"max_silence": -1},),
amine@226 763 )
def test_split_negative_temporal_params(self, wrong_param):
    """`split` must reject an out-of-range temporal parameter.

    `wrong_param` is a one-item dict overriding one of the otherwise
    valid `min_dur`, `max_dur` and `max_silence` values. The expected
    message uses ">=" for `max_silence` and ">" for the other two.
    """
    params = dict(
        {"min_dur": 0.2, "max_dur": 0.5, "max_silence": 0.1}, **wrong_param
    )
    with self.assertRaises(ValueError) as val_err:
        split(None, **params)

    name = set(wrong_param).pop()
    value = wrong_param[name]
    if name == "max_silence":
        or_equal = "="
    else:
        or_equal = ""
    err_msg = "'{}' ({}) must be >{} 0".format(name, value, or_equal)
    self.assertEqual(err_msg, str(val_err.exception))
amine@226 777
def test_split_too_small_analysis_window(self):
    """`split` must raise ValueError when the analysis window (0.09 s) is
    smaller than the 1/10 s named in the expected message for a 10 Hz
    sampling rate.
    """
    expected_msg = (
        "Too small 'analysis_windows' (0.09) for sampling rate (10)."
        " Analysis windows should at least be 1/10 to cover one "
        "single data sample"
    )
    with self.assertRaises(ValueError) as val_err:
        split(b"", sr=10, sw=1, ch=1, analysis_window=0.09)
    self.assertEqual(expected_msg, str(val_err.exception))
amine@236 785
amine@207 786
amine@207 787 @genty
amine@207 788 class TestAudioRegion(TestCase):
amine@86 789 @genty_dataset(
amine@86 790 simple=(b"\0" * 8000, 0, 8000, 1, 1, 1, 1, 1000),
amine@86 791 one_ms_less_than_1_sec=(
amine@86 792 b"\0" * 7992,
amine@86 793 0,
amine@86 794 8000,
amine@86 795 1,
amine@86 796 1,
amine@86 797 0.999,
amine@86 798 0.999,
amine@86 799 999,
amine@86 800 ),
amine@86 801 tree_quarter_ms_less_than_1_sec=(
amine@86 802 b"\0" * 7994,
amine@86 803 0,
amine@86 804 8000,
amine@86 805 1,
amine@86 806 1,
amine@86 807 0.99925,
amine@86 808 0.99925,
amine@86 809 999,
amine@86 810 ),
amine@86 811 half_ms_less_than_1_sec=(
amine@86 812 b"\0" * 7996,
amine@86 813 0,
amine@86 814 8000,
amine@86 815 1,
amine@86 816 1,
amine@86 817 0.9995,
amine@86 818 0.9995,
amine@86 819 1000,
amine@86 820 ),
amine@86 821 quarter_ms_less_than_1_sec=(
amine@86 822 b"\0" * 7998,
amine@86 823 0,
amine@86 824 8000,
amine@86 825 1,
amine@86 826 1,
amine@86 827 0.99975,
amine@86 828 0.99975,
amine@86 829 1000,
amine@86 830 ),
amine@86 831 simple_sample_width_2=(b"\0" * 8000 * 2, 0, 8000, 2, 1, 1, 1, 1000),
amine@86 832 simple_stereo=(b"\0" * 8000 * 2, 0, 8000, 1, 2, 1, 1, 1000),
amine@86 833 simple_multichannel=(b"\0" * 8000 * 5, 0, 8000, 1, 5, 1, 1, 1000),
amine@86 834 simple_sample_width_2_multichannel=(
amine@86 835 b"\0" * 8000 * 2 * 5,
amine@86 836 0,
amine@86 837 8000,
amine@86 838 2,
amine@86 839 5,
amine@86 840 1,
amine@86 841 1,
amine@86 842 1000,
amine@86 843 ),
amine@86 844 one_ms_less_than_1s_sw_2_multichannel=(
amine@86 845 b"\0" * 7992 * 2 * 5,
amine@86 846 0,
amine@86 847 8000,
amine@86 848 2,
amine@86 849 5,
amine@86 850 0.999,
amine@86 851 0.999,
amine@86 852 999,
amine@86 853 ),
amine@86 854 tree_qrt_ms_lt_1_s_sw_2_multichannel=(
amine@86 855 b"\0" * 7994 * 2 * 5,
amine@86 856 0,
amine@86 857 8000,
amine@86 858 2,
amine@86 859 5,
amine@86 860 0.99925,
amine@86 861 0.99925,
amine@86 862 999,
amine@86 863 ),
amine@86 864 half_ms_lt_1s_sw_2_multichannel=(
amine@86 865 b"\0" * 7996 * 2 * 5,
amine@86 866 0,
amine@86 867 8000,
amine@86 868 2,
amine@86 869 5,
amine@86 870 0.9995,
amine@86 871 0.9995,
amine@86 872 1000,
amine@86 873 ),
amine@86 874 quarter_ms_lt_1s_sw_2_multichannel=(
amine@86 875 b"\0" * 7998 * 2 * 5,
amine@86 876 0,
amine@86 877 8000,
amine@86 878 2,
amine@86 879 5,
amine@86 880 0.99975,
amine@86 881 0.99975,
amine@86 882 1000,
amine@86 883 ),
amine@86 884 arbitrary_length_1=(
amine@86 885 b"\0" * int(8000 * 1.33),
amine@86 886 2.7,
amine@86 887 8000,
amine@86 888 1,
amine@86 889 1,
amine@86 890 4.03,
amine@86 891 1.33,
amine@86 892 1330,
amine@86 893 ),
amine@86 894 arbitrary_length_2=(
amine@86 895 b"\0" * int(8000 * 0.476),
amine@86 896 11.568,
amine@86 897 8000,
amine@86 898 1,
amine@86 899 1,
amine@86 900 12.044,
amine@86 901 0.476,
amine@86 902 476,
amine@86 903 ),
amine@86 904 arbitrary_length_sw_2_multichannel=(
amine@86 905 b"\0" * int(8000 * 1.711) * 2 * 3,
amine@86 906 9.415,
amine@86 907 8000,
amine@86 908 2,
amine@86 909 3,
amine@86 910 11.126,
amine@86 911 1.711,
amine@86 912 1711,
amine@86 913 ),
amine@86 914 arbitrary_samplig_rate=(
amine@86 915 b"\0" * int(3172 * 1.318),
amine@86 916 17.236,
amine@86 917 3172,
amine@86 918 1,
amine@86 919 1,
amine@86 920 17.236 + int(3172 * 1.318) / 3172,
amine@86 921 int(3172 * 1.318) / 3172,
amine@86 922 1318,
amine@86 923 ),
amine@86 924 arbitrary_sr_sw_2_multichannel=(
amine@86 925 b"\0" * int(11317 * 0.716) * 2 * 3,
amine@86 926 18.811,
amine@86 927 11317,
amine@86 928 2,
amine@86 929 3,
amine@86 930 18.811 + int(11317 * 0.716) / 11317,
amine@86 931 int(11317 * 0.716) / 11317,
amine@86 932 716,
amine@86 933 ),
amine@86 934 )
def test_creation(
    self,
    data,
    start,
    sampling_rate,
    sample_width,
    channels,
    expected_end,
    expected_duration_s,
    expected_duration_ms,
):
    """Create an AudioRegion and verify its attributes.

    Checks the audio parameters (long and short names), `start`, `end`,
    `duration`, the length of the region (compared with the expected
    duration in milliseconds) and the raw bytes.
    """
    region = AudioRegion(
        data, start, sampling_rate, sample_width, channels
    )
    # attributes are checked in a fixed order so that the first failing
    # assertion is always the same one
    attribute_checks = (
        ("sampling_rate", sampling_rate),
        ("sr", sampling_rate),
        ("sample_width", sample_width),
        ("sw", sample_width),
        ("channels", channels),
        ("ch", channels),
        ("start", start),
        ("end", expected_end),
        ("duration", expected_duration_s),
    )
    for attribute, wanted in attribute_checks:
        self.assertEqual(getattr(region, attribute), wanted)
    self.assertEqual(len(region), expected_duration_ms)
    self.assertEqual(bytes(region), data)
amine@88 960
def test_creation_invalid_data_exception(self):
    """Creating a region from 9 bytes of data with a 2-byte sample width
    must raise AudioParameterError with the expected message.
    """
    expected_msg = (
        "The length of audio data must be an integer "
        "multiple of `sample_width * channels`"
    )
    with self.assertRaises(AudioParameterError) as audio_param_err:
        AudioRegion(
            data=b"ABCDEFGHI",
            start=0,
            sampling_rate=8,
            sample_width=2,
            channels=1,
        )
    self.assertEqual(expected_msg, str(audio_param_err.exception))
amine@97 975
@genty_dataset(
    # Plain file name, no placeholder.
    simple=("output.wav", 1.230, "output.wav"),
    # `{start}` placeholder, with and without an explicit format spec.
    start=("output_{start}.wav", 1.230, "output_1.23.wav"),
    start_2=("output_{start}.wav", 1.233712, "output_1.233712.wav"),
    start_3=("output_{start}.wav", 1.2300001, "output_1.23.wav"),
    start_4=("output_{start:.3f}.wav", 1.233712, "output_1.234.wav"),
    start_5=(
        "output_{start:.8f}.wav",
        1.233712345,
        "output_1.23371200.wav",
    ),
    # All three placeholders combined.
    start_end_duration=(
        "output_{start}_{end}_{duration}.wav",
        1.455,
        "output_1.455_2.455_1.0.wav",
    ),
    start_end_duration_2=(
        "output_{start}_{end}_{duration}.wav",
        1.455321,
        "output_1.455321_2.455321_1.0.wav",
    ),
)
def test_save(self, format, start, expected):
    # Save a region into a scratch directory and compare the file name
    # returned by `save` (directory prefix removed) with the expected one.
    with TemporaryDirectory() as tmpdir:
        region = AudioRegion(b"0" * 160, start, 160, 1, 1)
        path_template = os.path.join(tmpdir, format)
        saved_path = region.save(path_template)
        # Drop "<tmpdir><separator>" from the front of the returned path.
        prefix_length = len(tmpdir) + 1
        filename = saved_path[prefix_length:]
        self.assertEqual(filename, expected)
amine@192 1004
def test_save_file_exists_exception(self):
    # Saving onto a path that already exists must raise FileExistsError
    # when `exists_ok` is False.
    with TemporaryDirectory() as tmpdir:
        target = os.path.join(tmpdir, "output.wav")
        # Create an empty file so that the target is already present.
        with open(target, "w"):
            pass
        region = AudioRegion(b"0" * 160, 0, 160, 1, 1)
        self.assertRaises(
            FileExistsError, region.save, target, exists_ok=False
        )
amine@193 1012
@genty_dataset(
    # --- halves of a 160-byte region sampled at 160 Hz ---
    first_half=(
        AudioRegion(b"a" * 80 + b"b" * 80, 0, 160, 1, 1),
        slice(0, 500),
        0,
        b"a" * 80,
    ),
    second_half=(
        AudioRegion(b"a" * 80 + b"b" * 80, 0, 160, 1, 1),
        slice(500, None),
        0.5,
        b"b" * 80,
    ),
    second_half_negative=(
        AudioRegion(b"a" * 80 + b"b" * 80, 0, 160, 1, 1),
        slice(-500, None),
        0.5,
        b"b" * 80,
    ),
    # --- middle portion, for several sample widths / channel counts ---
    middle=(
        AudioRegion(b"a" * 80 + b"b" * 80, 0, 160, 1, 1),
        slice(200, 750),
        0.2,
        b"a" * 48 + b"b" * 40,
    ),
    middle_negative=(
        AudioRegion(b"a" * 80 + b"b" * 80, 0, 160, 1, 1),
        slice(-800, -250),
        0.2,
        b"a" * 48 + b"b" * 40,
    ),
    middle_sw2=(
        AudioRegion(b"a" * 160 + b"b" * 160, 0, 160, 2, 1),
        slice(200, 750),
        0.2,
        b"a" * 96 + b"b" * 80,
    ),
    middle_ch2=(
        AudioRegion(b"a" * 160 + b"b" * 160, 0, 160, 1, 2),
        slice(200, 750),
        0.2,
        b"a" * 96 + b"b" * 80,
    ),
    middle_sw2_ch2=(
        AudioRegion(b"a" * 320 + b"b" * 320, 0, 160, 2, 2),
        slice(200, 750),
        0.2,
        b"a" * 192 + b"b" * 160,
    ),
    # --- one millisecond trimmed at either end (8 bytes at 8000 Hz) ---
    but_first_sample=(
        AudioRegion(b"a" * 4000 + b"b" * 4000, 0, 8000, 1, 1),
        slice(1, None),
        0.001,
        b"a" * (4000 - 8) + b"b" * 4000,
    ),
    but_first_sample_negative=(
        AudioRegion(b"a" * 4000 + b"b" * 4000, 0, 8000, 1, 1),
        slice(-999, None),
        0.001,
        b"a" * (4000 - 8) + b"b" * 4000,
    ),
    but_last_sample=(
        AudioRegion(b"a" * 4000 + b"b" * 4000, 0, 8000, 1, 1),
        slice(0, 999),
        0,
        b"a" * 4000 + b"b" * (4000 - 8),
    ),
    but_last_sample_negative=(
        AudioRegion(b"a" * 4000 + b"b" * 4000, 0, 8000, 1, 1),
        slice(0, -1),
        0,
        b"a" * 4000 + b"b" * (4000 - 8),
    ),
    # --- negative bounds reaching beyond the region ---
    big_negative_start=(
        AudioRegion(b"a" * 160, 0, 160, 1, 1),
        slice(-5000, None),
        0,
        b"a" * 160,
    ),
    big_negative_stop=(
        AudioRegion(b"a" * 160, 0, 160, 1, 1),
        slice(None, -1500),
        0,
        b"",
    ),
    # --- slices expected to produce no data ---
    empty=(
        AudioRegion(b"a" * 80 + b"b" * 80, 0, 160, 1, 1),
        slice(0, 0),
        0,
        b"",
    ),
    empty_start_stop_reversed=(
        AudioRegion(b"a" * 80 + b"b" * 80, 0, 160, 1, 1),
        slice(200, 100),
        0.2,
        b"",
    ),
    empty_big_positive_start=(
        AudioRegion(b"a" * 80 + b"b" * 80, 0, 160, 1, 1),
        slice(2000, 3000),
        2,
        b"",
    ),
    empty_negative_reversed=(
        AudioRegion(b"a" * 80 + b"b" * 80, 0, 160, 1, 1),
        slice(-100, -200),
        0.9,
        b"",
    ),
    empty_big_negative_stop=(
        AudioRegion(b"a" * 80 + b"b" * 80, 0, 160, 1, 1),
        slice(0, -2000),
        0,
        b"",
    ),
    # --- sampling rate that does not divide evenly into milliseconds ---
    arbitrary_sampling_rate=(
        AudioRegion(b"a" * 124 + b"b" * 376, 0, 1234, 1, 1),
        slice(100, 200),
        123 / 1234,
        b"a" + b"b" * 123,
    ),
)
def test_region_temporal_slicing(
    self, region, slice_, expected_start, expected_data
):
    # The same time span is requested twice: in milliseconds through
    # `region.millis`, then in seconds through `region.sec`. Both must
    # give a sub-region with the expected start and bytes.

    def to_seconds(millis):
        # Open-ended bounds (None) must stay None.
        return None if millis is None else millis / 1000

    by_millis = region.millis[slice_]
    self.assertEqual(by_millis.start, expected_start)
    self.assertEqual(bytes(by_millis), expected_data)

    start_sec = to_seconds(slice_.start)
    stop_sec = to_seconds(slice_.stop)

    by_seconds = region.sec[start_sec:stop_sec]
    self.assertEqual(by_seconds.start, expected_start)
    self.assertEqual(bytes(by_seconds), expected_data)
amine@229 1148
@genty_dataset(
    # --- halves of a 160-sample region ---
    first_half=(
        AudioRegion(b"a" * 80 + b"b" * 80, 0, 160, 1, 1),
        slice(0, 80),
        0,
        b"a" * 80,
    ),
    second_half=(
        AudioRegion(b"a" * 80 + b"b" * 80, 0, 160, 1, 1),
        slice(80, None),
        0.5,
        b"b" * 80,
    ),
    second_half_negative=(
        AudioRegion(b"a" * 80 + b"b" * 80, 0, 160, 1, 1),
        slice(-80, None),
        0.5,
        b"b" * 80,
    ),
    # --- middle portion, for several sample widths / channel counts ---
    middle=(
        AudioRegion(b"a" * 80 + b"b" * 80, 0, 160, 1, 1),
        slice(160 // 5, 160 // 4 * 3),
        0.2,
        b"a" * 48 + b"b" * 40,
    ),
    middle_negative=(
        AudioRegion(b"a" * 80 + b"b" * 80, 0, 160, 1, 1),
        slice(-160 // 5 * 4, -160 // 4),
        0.2,
        b"a" * 48 + b"b" * 40,
    ),
    middle_sw2=(
        AudioRegion(b"a" * 160 + b"b" * 160, 0, 160, 2, 1),
        slice(160 // 5, 160 // 4 * 3),
        0.2,
        b"a" * 96 + b"b" * 80,
    ),
    middle_ch2=(
        AudioRegion(b"a" * 160 + b"b" * 160, 0, 160, 1, 2),
        slice(160 // 5, 160 // 4 * 3),
        0.2,
        b"a" * 96 + b"b" * 80,
    ),
    middle_sw2_ch2=(
        AudioRegion(b"a" * 320 + b"b" * 320, 0, 160, 2, 2),
        slice(160 // 5, 160 // 4 * 3),
        0.2,
        b"a" * 192 + b"b" * 160,
    ),
    # --- exactly one sample trimmed at either end ---
    but_first_sample=(
        AudioRegion(b"a" * 4000 + b"b" * 4000, 0, 8000, 1, 1),
        slice(1, None),
        1 / 8000,
        b"a" * (4000 - 1) + b"b" * 4000,
    ),
    but_first_sample_negative=(
        AudioRegion(b"a" * 4000 + b"b" * 4000, 0, 8000, 1, 1),
        slice(-7999, None),
        1 / 8000,
        b"a" * (4000 - 1) + b"b" * 4000,
    ),
    but_last_sample=(
        AudioRegion(b"a" * 4000 + b"b" * 4000, 0, 8000, 1, 1),
        slice(0, 7999),
        0,
        b"a" * 4000 + b"b" * (4000 - 1),
    ),
    but_last_sample_negative=(
        AudioRegion(b"a" * 4000 + b"b" * 4000, 0, 8000, 1, 1),
        slice(0, -1),
        0,
        b"a" * 4000 + b"b" * (4000 - 1),
    ),
    # --- negative bounds reaching beyond the region ---
    big_negative_start=(
        AudioRegion(b"a" * 160, 0, 160, 1, 1),
        slice(-1600, None),
        0,
        b"a" * 160,
    ),
    big_negative_stop=(
        AudioRegion(b"a" * 160, 0, 160, 1, 1),
        slice(None, -1600),
        0,
        b"",
    ),
    # --- slices expected to produce no data ---
    empty=(
        AudioRegion(b"a" * 80 + b"b" * 80, 0, 160, 1, 1),
        slice(0, 0),
        0,
        b"",
    ),
    empty_start_stop_reversed=(
        AudioRegion(b"a" * 80 + b"b" * 80, 0, 160, 1, 1),
        slice(80, 40),
        0.5,
        b"",
    ),
    empty_big_positive_start=(
        AudioRegion(b"a" * 80 + b"b" * 80, 0, 160, 1, 1),
        slice(1600, 3000),
        10,
        b"",
    ),
    empty_negative_reversed=(
        AudioRegion(b"a" * 80 + b"b" * 80, 0, 160, 1, 1),
        slice(-16, -32),
        0.9,
        b"",
    ),
    empty_big_negative_stop=(
        AudioRegion(b"a" * 80 + b"b" * 80, 0, 160, 1, 1),
        slice(0, -2000),
        0,
        b"",
    ),
    # --- non-round sampling rate ---
    arbitrary_sampling_rate=(
        AudioRegion(b"a" * 124 + b"b" * 376, 0, 1235, 1, 1),
        slice(100, 200),
        100 / 1235,
        b"a" * 24 + b"b" * 76,
    ),
    arbitrary_sampling_rate_middle_sw2_ch2=(
        AudioRegion(b"a" * 124 + b"b" * 376, 0, 1235, 2, 2),
        slice(25, 50),
        25 / 1235,
        b"a" * 24 + b"b" * 76,
    ),
)
def test_region_sample_slicing(
    self, region, slice_, expected_start, expected_data
):
    # Index the region directly with a slice and check the start and the
    # bytes of the resulting sub-region.
    sliced = region[slice_]
    actual_start, actual_data = sliced.start, bytes(sliced)
    self.assertEqual(actual_start, expected_start)
    self.assertEqual(actual_data, expected_data)
amine@231 1283
@genty_dataset(
    simple=(8000, 1, 1),
    stereo_sw_2=(8000, 2, 2),
    arbitrary_sr_multichannel=(5413, 2, 3),
)
def test_concatenation(self, sampling_rate, sample_width, channels):
    # `first + second` must keep the start of `first`, add up both
    # durations and hold the bytes of both regions back to back.
    first, second = _make_random_length_regions(
        [b"a", b"b"], sampling_rate, sample_width, channels
    )

    # Expected values are computed before the concatenation takes place.
    start = first.start
    total_duration = first.duration + second.duration
    end = start + total_duration
    payload = bytes(first) + bytes(second)

    joined = first + second

    self.assertEqual(joined.start, start)
    # Times are floats: compare to 6 decimal places only.
    self.assertAlmostEqual(joined.end, end, places=6)
    self.assertAlmostEqual(joined.duration, total_duration, places=6)
    self.assertEqual(bytes(joined), payload)
amine@88 1307
@genty_dataset(
    simple=(8000, 1, 1),
    stereo_sw_2=(8000, 2, 2),
    arbitrary_sr_multichannel=(5413, 2, 3),
)
def test_concatenation_many(self, sampling_rate, sample_width, channels):
    # The built-in `sum` over three regions must behave like chained `+`.
    regions = _make_random_length_regions(
        [b"a", b"b", b"c"], sampling_rate, sample_width, channels
    )

    start = regions[0].start
    total_duration = sum(region.duration for region in regions)
    end = start + total_duration
    payload = b"".join(map(bytes, regions))

    joined = sum(regions)

    self.assertEqual(joined.start, start)
    # Times are floats: compare to 6 decimal places only.
    self.assertAlmostEqual(joined.end, end, places=6)
    self.assertAlmostEqual(joined.duration, total_duration, places=6)
    self.assertEqual(bytes(joined), payload)
amine@88 1330
def test_concatenation_different_sampling_rate_error(self):
    # Regions sampled at 8000 Hz and 3000 Hz must refuse to concatenate.
    expected_message = (
        "Can only concatenate AudioRegions of the same "
        "sampling rate (8000 != 3000)"
    )
    left = AudioRegion(b"a" * 100, 0, 8000, 1, 1)
    right = AudioRegion(b"b" * 100, 0, 3000, 1, 1)

    with self.assertRaises(ValueError) as raised:
        left + right
    self.assertEqual(expected_message, str(raised.exception))
amine@88 1343
def test_concatenation_different_sample_width_error(self):
    # Regions with sample widths of 2 and 4 must refuse to concatenate.
    expected_message = (
        "Can only concatenate AudioRegions of the same "
        "sample width (2 != 4)"
    )
    left = AudioRegion(b"a" * 100, 0, 8000, 2, 1)
    right = AudioRegion(b"b" * 100, 0, 8000, 4, 1)

    with self.assertRaises(ValueError) as raised:
        left + right
    self.assertEqual(expected_message, str(raised.exception))
amine@88 1356
def test_concatenation_different_number_of_channels_error(self):
    # A mono region and a stereo region must refuse to concatenate.
    expected_message = (
        "Can only concatenate AudioRegions of the same "
        "number of channels (1 != 2)"
    )
    left = AudioRegion(b"a" * 100, 0, 8000, 1, 1)
    right = AudioRegion(b"b" * 100, 0, 8000, 1, 2)

    with self.assertRaises(ValueError) as raised:
        left + right
    self.assertEqual(expected_message, str(raised.exception))
amine@196 1369
@genty_dataset(
    simple=(0.01, 0.03, 30),
    rounded_len_floor=(0.00575, 0.01725, 17),
    rounded_len_ceil=(0.00625, 0.01875, 19),
)
def test_multiplication(
    self, duration, expected_duration, expected_length
):
    # Repeating a region three times must triple its data while leaving
    # the audio parameters untouched.
    sampling_rate, sample_width, channels = 8000, 2, 1
    payload = b"0" * int(duration * sampling_rate * sample_width)
    region = AudioRegion(payload, 0, sampling_rate, sample_width, channels)

    # An int on the left and an int on the right: both operand orders
    # are exercised in a single expression.
    tripled = 1 * region * 3

    self.assertEqual(bytes(tripled), payload * 3)
    self.assertEqual(tripled.sr, sampling_rate)
    self.assertEqual(tripled.sw, sample_width)
    self.assertEqual(tripled.ch, channels)
    self.assertEqual(tripled.duration, expected_duration)
    self.assertEqual(len(tripled), expected_length)
amine@197 1388
@genty_dataset(_str=("x", "str"), _float=(1.4, "float"))
def test_multiplication_non_int(self, factor, _type):
    # Multiplying a region by anything other than an int must raise a
    # TypeError whose message names the offending type.
    with self.assertRaises(TypeError) as raised:
        AudioRegion(b"0" * 80, 0, 8000, 1, 1) * factor
    # The message is checked once the context manager has captured the
    # exception.
    template = "Can't multiply AudioRegion by a non-int of type '{}'"
    expected_message = template.format(_type)
    self.assertEqual(expected_message, str(raised.exception))