annotate tests/test_core.py @ 233:d8267b3334f0

Add more tests for different analysis windows with channel mixing in split
author Amine Sehili <amine.sehili@gmail.com>
date Fri, 19 Jul 2019 21:43:01 +0100
parents 4282cea451d6
children 8c92420d15d5
rev   line source
amine@192 1 import os
amine@221 2 import math
amine@88 3 from random import random
amine@192 4 from tempfile import TemporaryDirectory
amine@221 5 from unittest import TestCase
amine@86 6 from genty import genty, genty_dataset
amine@207 7 from auditok import split, AudioRegion, AudioParameterError
amine@215 8 from auditok.core import _duration_to_nb_windows
amine@212 9 from auditok.util import AudioDataSource
amine@210 10 from auditok.io import (
amine@210 11 _normalize_use_channel,
amine@210 12 _extract_selected_channel,
amine@210 13 get_audio_source,
amine@210 14 )
amine@86 15
amine@86 16
def _make_random_length_regions(
    byte_seq, sampling_rate, sample_width, channels
):
    """Create one ``AudioRegion`` of random length and start per item.

    For every item of ``byte_seq`` a duration is drawn in [0, 10) seconds
    (rounded to 6 decimals) and a start time in [0, 13) seconds (rounded to
    3 decimals). The item is repeated so that the region holds
    ``int(duration * sampling_rate)`` samples of ``sample_width * channels``
    bytes each (assuming each item is one byte long -- TODO confirm against
    callers).

    Returns the list of regions, in the same order as ``byte_seq``.
    """

    def _build_region(item):
        # The duration is drawn before the start so that the sequence of
        # random() calls per item is duration first, start second.
        length_s = round(random() * 10, 6)
        n_samples = int(length_s * sampling_rate)
        payload = item * n_samples * sample_width * channels
        onset = round(random() * 13, 3)
        return AudioRegion(
            payload, onset, sampling_rate, sample_width, channels
        )

    return [_build_region(item) for item in byte_seq]
amine@88 30
amine@88 31
@genty
class TestFunctions(TestCase):
    """Parametrized checks for ``_duration_to_nb_windows``."""

    @genty_dataset(
        zero_duration=(0, 1, None, 0),
        multiple=(0.3, 0.1, round, 3),
        not_multiple_ceil=(0.35, 0.1, math.ceil, 4),
        not_multiple_floor=(0.35, 0.1, math.floor, 3),
        small_duration=(0.05, 0.1, round, 0),
        small_duration_ceil=(0.05, 0.1, math.ceil, 1),
        with_round_error=(0.3, 0.1, math.floor, 3, {"epsilon": 1e-6}),
        negative_duration=(-0.5, 0.1, math.ceil, ValueError),
        negative_analysis_window=(0.5, -0.1, math.ceil, ValueError),
    )
    def test_duration_to_nb_windows(
        self, duration, analysis_window, round_fn, expected, kwargs=None
    ):
        """Check the window count, or the error, for one dataset row.

        Each row is ``(duration, analysis_window, round_fn, expected)`` with
        an optional trailing dict of extra keyword arguments. When
        ``expected`` is ``ValueError`` the call must raise it; otherwise the
        returned value must equal ``expected``.
        """
        if expected is ValueError:
            # Extra keyword arguments are not forwarded on the error path.
            self.assertRaises(
                expected,
                _duration_to_nb_windows,
                duration,
                analysis_window,
                round_fn,
            )
            return

        extra = {} if kwargs is None else kwargs
        nb_windows = _duration_to_nb_windows(
            duration, analysis_window, round_fn, **extra
        )
        self.assertEqual(nb_windows, expected)
amine@215 58
amine@215 59
amine@215 60 @genty
amine@207 61 class TestSplit(TestCase):
amine@207 62 @genty_dataset(
amine@207 63 simple=(
amine@207 64 0.2,
amine@207 65 5,
amine@207 66 0.2,
amine@207 67 False,
amine@207 68 False,
amine@207 69 {"eth": 50},
amine@207 70 [(2, 16), (17, 31), (34, 76)],
amine@207 71 ),
amine@214 72 short_max_dur=(
amine@214 73 0.3,
amine@214 74 2,
amine@214 75 0.2,
amine@214 76 False,
amine@214 77 False,
amine@214 78 {"eth": 50},
amine@214 79 [(2, 16), (17, 31), (34, 54), (54, 74), (74, 76)],
amine@214 80 ),
amine@214 81 long_min_dur=(3, 5, 0.2, False, False, {"eth": 50}, [(34, 76)]),
amine@214 82 long_max_silence=(0.2, 80, 10, False, False, {"eth": 50}, [(2, 76)]),
amine@214 83 zero_max_silence=(
amine@214 84 0.2,
amine@214 85 5,
amine@214 86 0.0,
amine@214 87 False,
amine@214 88 False,
amine@214 89 {"eth": 50},
amine@214 90 [(2, 14), (17, 24), (26, 29), (34, 76)],
amine@214 91 ),
amine@207 92 low_energy_threshold=(
amine@207 93 0.2,
amine@207 94 5,
amine@207 95 0.2,
amine@207 96 False,
amine@207 97 False,
amine@207 98 {"energy_threshold": 40},
amine@207 99 [(0, 50), (50, 76)],
amine@207 100 ),
amine@207 101 high_energy_threshold=(
amine@207 102 0.2,
amine@207 103 5,
amine@207 104 0.2,
amine@207 105 False,
amine@207 106 False,
amine@207 107 {"energy_threshold": 60},
amine@207 108 [],
amine@207 109 ),
amine@207 110 trim_leading_and_trailing_silence=(
amine@207 111 0.2,
amine@207 112 10, # use long max_dur
amine@207 113 0.5, # and a max_silence longer than any inter-region silence
amine@207 114 True,
amine@207 115 False,
amine@207 116 {"eth": 50},
amine@207 117 [(2, 76)],
amine@207 118 ),
amine@207 119 drop_trailing_silence=(
amine@207 120 0.2,
amine@207 121 5,
amine@207 122 0.2,
amine@207 123 True,
amine@207 124 False,
amine@207 125 {"eth": 50},
amine@207 126 [(2, 14), (17, 29), (34, 76)],
amine@207 127 ),
amine@207 128 drop_trailing_silence_2=(
amine@207 129 1.5,
amine@207 130 5,
amine@207 131 0.2,
amine@207 132 True,
amine@207 133 False,
amine@207 134 {"eth": 50},
amine@207 135 [(34, 76)],
amine@207 136 ),
amine@207 137 strict_min_dur=(
amine@207 138 0.3,
amine@207 139 2,
amine@207 140 0.2,
amine@207 141 False,
amine@207 142 True,
amine@207 143 {"eth": 50},
amine@207 144 [(2, 16), (17, 31), (34, 54), (54, 74)],
amine@207 145 ),
amine@207 146 )
def test_split_params(
    self,
    min_dur,
    max_dur,
    max_silence,
    drop_trailing_silence,
    strict_min_dur,
    kwargs,
    expected,
):
    """Split the mono 10 Hz fixture and compare regions with ``expected``.

    ``expected`` is a list of ``(onset, offset)`` sample indices into the
    raw fixture; each detected region must hold exactly the bytes of the
    corresponding slice (2 bytes per sample).
    """
    sample_width = 2
    with open("tests/data/test_split_10HZ_mono.raw", "rb") as fp:
        data = fp.read()

    regions = list(
        split(
            data,
            min_dur,
            max_dur,
            max_silence,
            drop_trailing_silence,
            strict_min_dur,
            analysis_window=0.1,
            sr=10,
            sw=2,
            ch=1,
            **kwargs
        )
    )

    # The first literal contains no placeholders, so formatting the joined
    # template yields the same message as formatting the tail alone.
    err_msg = (
        "Wrong number of regions after split, expected: "
        "{}, found: {}"
    ).format(len(expected), len(regions))
    self.assertEqual(len(regions), len(expected), err_msg)

    for region, (onset, offset) in zip(regions, expected):
        wanted = data[onset * sample_width : offset * sample_width]
        self.assertEqual(bytes(region), wanted)
amine@207 183
amine@211 184 @genty_dataset(
amine@211 185 stereo_all_default=(2, {}, [(2, 16), (17, 31), (34, 76)]),
amine@213 186 mono_max_read=(1, {"max_read": 5}, [(2, 16), (17, 31), (34, 50)]),
amine@213 187 mono_max_read_short_name=(1, {"mr": 5}, [(2, 16), (17, 31), (34, 50)]),
amine@211 188 mono_use_channel_1=(
amine@211 189 1,
amine@211 190 {"eth": 50, "use_channel": 1},
amine@211 191 [(2, 16), (17, 31), (34, 76)],
amine@211 192 ),
amine@211 193 mono_uc_1=(1, {"eth": 50, "uc": 1}, [(2, 16), (17, 31), (34, 76)]),
amine@211 194 mono_use_channel_left=(
amine@211 195 1,
amine@211 196 {"eth": 50, "use_channel": "left"},
amine@211 197 [(2, 16), (17, 31), (34, 76)],
amine@211 198 ),
amine@211 199 mono_uc_left=(
amine@211 200 1,
amine@211 201 {"eth": 50, "uc": "left"},
amine@211 202 [(2, 16), (17, 31), (34, 76)],
amine@211 203 ),
amine@211 204 mono_use_channel_None=(
amine@211 205 1,
amine@211 206 {"eth": 50, "use_channel": None},
amine@211 207 [(2, 16), (17, 31), (34, 76)],
amine@211 208 ),
amine@211 209 stereo_use_channel_1=(
amine@211 210 2,
amine@211 211 {"eth": 50, "use_channel": 1},
amine@211 212 [(2, 16), (17, 31), (34, 76)],
amine@211 213 ),
amine@211 214 stereo_use_channel_left=(
amine@211 215 2,
amine@211 216 {"eth": 50, "use_channel": "left"},
amine@211 217 [(2, 16), (17, 31), (34, 76)],
amine@211 218 ),
amine@211 219 stereo_use_channel_no_use_channel_given=(
amine@211 220 2,
amine@211 221 {"eth": 50},
amine@211 222 [(2, 16), (17, 31), (34, 76)],
amine@211 223 ),
amine@211 224 stereo_use_channel_minus_2=(
amine@211 225 2,
amine@211 226 {"eth": 50, "use_channel": -2},
amine@211 227 [(2, 16), (17, 31), (34, 76)],
amine@211 228 ),
amine@211 229 stereo_uc_2=(2, {"eth": 50, "uc": 2}, [(10, 32), (36, 76)]),
amine@211 230 stereo_use_channel_right=(
amine@211 231 2,
amine@211 232 {"eth": 50, "use_channel": "right"},
amine@211 233 [(10, 32), (36, 76)],
amine@211 234 ),
amine@211 235 stereo_uc_minus_1=(2, {"eth": 50, "uc": -1}, [(10, 32), (36, 76)]),
amine@213 236 mono_uc_mix=(
amine@213 237 1,
amine@213 238 {"eth": 50, "uc": "mix"},
amine@213 239 [(2, 16), (17, 31), (34, 76)],
amine@213 240 ),
amine@213 241 stereo_use_channel_mix=(
amine@213 242 2,
amine@213 243 {"energy_threshold": 53.5, "use_channel": "mix"},
amine@213 244 [(54, 76)],
amine@213 245 ),
amine@213 246 stereo_uc_mix=(2, {"eth": 52, "uc": "mix"}, [(17, 26), (54, 76)]),
amine@213 247 stereo_uc_mix_default_eth=(
amine@213 248 2,
amine@213 249 {"uc": "mix"},
amine@213 250 [(10, 16), (17, 31), (36, 76)],
amine@213 251 ),
amine@211 252 )
def test_split_kwargs(self, channels, kwargs, expected):
    """Check ``split`` keyword arguments (long and short names).

    The mono or stereo 10 Hz fixture is chosen from ``channels`` and split
    with fixed temporal parameters plus the dataset's ``kwargs``.
    ``expected`` lists ``(onset, offset)`` sample indices. For multichannel
    input these index into the single channel obtained by applying the
    requested ``use_channel``/``uc`` value to the raw data; for mono input
    they index into the raw data directly.
    """
    mono_or_stereo = "mono" if channels == 1 else "stereo"
    filename = "tests/data/test_split_10HZ_{}.raw".format(mono_or_stereo)
    with open(filename, "rb") as fp:
        data = fp.read()

    regions = split(
        data,
        min_dur=0.2,
        max_dur=5,
        max_silence=0.2,
        drop_trailing_silence=False,
        strict_min_dur=False,
        analysis_window=0.1,
        sr=10,
        sw=2,
        ch=channels,
        **kwargs
    )
    regions = list(regions)
    sample_width = 2

    # extract channel of interest
    if channels != 1:
        # The long name wins over the short one when both are given.
        use_channel = kwargs.get("use_channel", kwargs.get("uc"))
        use_channel = _normalize_use_channel(use_channel)
        data = _extract_selected_channel(
            data, channels, sample_width, use_channel=use_channel
        )
    err_msg = "Wrong number of regions after split, expected: "
    err_msg += "{}, found: {}".format(expected, regions)
    self.assertEqual(len(regions), len(expected), err_msg)
    for reg, exp in zip(regions, expected):
        onset, offset = exp
        exp_data = data[onset * sample_width : offset * sample_width]
        self.assertEqual(bytes(reg), exp_data)
amine@211 292
amine@212 293 @genty_dataset(
amine@220 294 mono_aw_0_2_max_silence_0_2=(
amine@220 295 0.2,
amine@220 296 5,
amine@220 297 0.2,
amine@220 298 1,
amine@220 299 {"uc": 1, "aw": 0.2},
amine@220 300 [(2, 30), (34, 76)],
amine@220 301 ),
amine@220 302 mono_aw_0_2_max_silence_0_3=(
amine@220 303 0.2,
amine@220 304 5,
amine@220 305 0.3,
amine@220 306 1,
amine@220 307 {"uc": 1, "aw": 0.2},
amine@227 308 [(2, 30), (34, 76)],
amine@220 309 ),
amine@220 310 mono_aw_0_2_max_silence_0_4=(
amine@220 311 0.2,
amine@220 312 5,
amine@227 313 0.4,
amine@220 314 1,
amine@220 315 {"uc": 1, "aw": 0.2},
amine@220 316 [(2, 32), (34, 76)],
amine@220 317 ),
amine@231 318 mono_aw_0_2_max_silence_0=(
amine@231 319 0.2,
amine@231 320 5,
amine@231 321 0,
amine@231 322 1,
amine@231 323 {"uc": 1, "aw": 0.2},
amine@231 324 [(2, 14), (16, 24), (26, 28), (34, 76)],
amine@231 325 ),
amine@220 326 mono_aw_0_2=(
amine@220 327 0.2,
amine@220 328 5,
amine@220 329 0.2,
amine@220 330 1,
amine@220 331 {"uc": 1, "aw": 0.2},
amine@220 332 [(2, 30), (34, 76)],
amine@220 333 ),
amine@231 334 mono_aw_0_3_max_silence_0=(
amine@231 335 0.3,
amine@231 336 5,
amine@231 337 0,
amine@231 338 1,
amine@231 339 {"uc": 1, "aw": 0.3},
amine@231 340 [(3, 12), (15, 24), (36, 76)],
amine@231 341 ),
amine@231 342 mono_aw_0_3_max_silence_0_3=(
amine@231 343 0.3,
amine@231 344 5,
amine@231 345 0.3,
amine@231 346 1,
amine@231 347 {"uc": 1, "aw": 0.3},
amine@231 348 [(3, 27), (36, 76)],
amine@231 349 ),
amine@231 350 mono_aw_0_3_max_silence_0_5=(
amine@231 351 0.3,
amine@231 352 5,
amine@231 353 0.5,
amine@231 354 1,
amine@231 355 {"uc": 1, "aw": 0.3},
amine@231 356 [(3, 27), (36, 76)],
amine@231 357 ),
amine@231 358 mono_aw_0_3_max_silence_0_6=(
amine@231 359 0.3,
amine@231 360 5,
amine@231 361 0.6,
amine@231 362 1,
amine@231 363 {"uc": 1, "aw": 0.3},
amine@231 364 [(3, 30), (36, 76)],
amine@231 365 ),
amine@231 366 mono_aw_0_4_max_silence_0=(
amine@231 367 0.2,
amine@231 368 5,
amine@232 369 0,
amine@231 370 1,
amine@231 371 {"uc": 1, "aw": 0.4},
amine@231 372 [(4, 12), (16, 24), (36, 76)],
amine@231 373 ),
amine@231 374 mono_aw_0_4_max_silence_0_3=(
amine@231 375 0.2,
amine@231 376 5,
amine@231 377 0.3,
amine@231 378 1,
amine@231 379 {"uc": 1, "aw": 0.4},
amine@231 380 [(4, 12), (16, 24), (36, 76)],
amine@231 381 ),
amine@231 382 mono_aw_0_4_max_silence_0_4=(
amine@231 383 0.2,
amine@231 384 5,
amine@231 385 0.4,
amine@231 386 1,
amine@231 387 {"uc": 1, "aw": 0.4},
amine@231 388 [(4, 28), (36, 76)],
amine@231 389 ),
amine@220 390 stereo_uc_1_analysis_window_0_2=(
amine@220 391 0.2,
amine@220 392 5,
amine@220 393 0.2,
amine@220 394 2,
amine@220 395 {"uc": 1, "analysis_window": 0.2},
amine@220 396 [(2, 30), (34, 76)],
amine@220 397 ),
amine@231 398 stereo_uc_2_analysis_window_0_2=(
amine@231 399 0.2,
amine@231 400 5,
amine@231 401 0.2,
amine@231 402 2,
amine@231 403 {"uc": 2, "analysis_window": 0.2},
amine@231 404 [(10, 32), (36, 76)],
amine@231 405 ),
amine@233 406 stereo_uc_mix_aw_0_1_max_silence_0=(
amine@233 407 0.2,
amine@233 408 5,
amine@233 409 0,
amine@233 410 2,
amine@233 411 {"uc": "mix", "analysis_window": 0.1},
amine@233 412 [(10, 14), (17, 24), (26, 29), (36, 76)],
amine@233 413 ),
amine@233 414 stereo_uc_mix_aw_0_1_max_silence_0_1=(
amine@233 415 0.2,
amine@233 416 5,
amine@233 417 0.1,
amine@233 418 2,
amine@233 419 {"uc": "mix", "analysis_window": 0.1},
amine@233 420 [(10, 15), (17, 25), (26, 30), (36, 76)],
amine@233 421 ),
amine@233 422 stereo_uc_mix_aw_0_1_max_silence_0_2=(
amine@233 423 0.2,
amine@233 424 5,
amine@233 425 0.2,
amine@233 426 2,
amine@233 427 {"uc": "mix", "analysis_window": 0.1},
amine@233 428 [(10, 16), (17, 31), (36, 76)],
amine@233 429 ),
amine@233 430 stereo_uc_mix_aw_0_1_max_silence_0_3=(
amine@233 431 0.2,
amine@233 432 5,
amine@233 433 0.3,
amine@233 434 2,
amine@233 435 {"uc": "mix", "analysis_window": 0.1},
amine@233 436 [(10, 32), (36, 76)],
amine@233 437 ),
amine@233 438 stereo_uc_mix_aw_0_2_max_silence_0_min_dur_0_3=(
amine@233 439 0.3,
amine@233 440 5,
amine@233 441 0,
amine@233 442 2,
amine@233 443 {"uc": "mix", "analysis_window": 0.2},
amine@233 444 [(10, 14), (16, 24), (36, 76)],
amine@233 445 ),
amine@233 446 stereo_uc_mix_aw_0_2_max_silence_0_min_dur_0_41=(
amine@233 447 0.41,
amine@233 448 5,
amine@233 449 0,
amine@233 450 2,
amine@233 451 {"uc": "mix", "analysis_window": 0.2},
amine@233 452 [(16, 24), (36, 76)],
amine@233 453 ),
amine@233 454 stereo_uc_mix_aw_0_2_max_silence_0_1=(
amine@233 455 0.2,
amine@233 456 5,
amine@233 457 0.1,
amine@233 458 2,
amine@233 459 {"uc": "mix", "analysis_window": 0.2},
amine@233 460 [(10, 14), (16, 24), (26, 28), (36, 76)],
amine@233 461 ),
amine@233 462 stereo_uc_mix_aw_0_2_max_silence_0_2=(
amine@233 463 0.2,
amine@233 464 5,
amine@233 465 0.2,
amine@233 466 2,
amine@233 467 {"uc": "mix", "analysis_window": 0.2},
amine@233 468 [(10, 30), (36, 76)],
amine@233 469 ),
amine@233 470 stereo_uc_mix_aw_0_2_max_silence_0_4=(
amine@233 471 0.2,
amine@233 472 5,
amine@233 473 0.4,
amine@233 474 2,
amine@233 475 {"uc": "mix", "analysis_window": 0.2},
amine@233 476 [(10, 32), (36, 76)],
amine@233 477 ),
amine@233 478 stereo_uc_mix_aw_0_2_max_silence_0_5=(
amine@233 479 0.2,
amine@233 480 5,
amine@233 481 0.5,
amine@233 482 2,
amine@233 483 {"uc": "mix", "analysis_window": 0.2},
amine@233 484 [(10, 32), (36, 76)],
amine@233 485 ),
amine@233 486 stereo_uc_mix_aw_0_2_max_silence_0_6=(
amine@233 487 0.2,
amine@233 488 5,
amine@233 489 0.6,
amine@233 490 2,
amine@233 491 {"uc": "mix", "analysis_window": 0.2},
amine@233 492 [(10, 34), (36, 76)],
amine@233 493 ),
amine@233 494 stereo_uc_mix_aw_0_3_max_silence_0=(
amine@233 495 0.2,
amine@233 496 5,
amine@233 497 0,
amine@233 498 2,
amine@233 499 {"uc": "mix", "analysis_window": 0.3},
amine@233 500 [(9, 24), (27, 30), (36, 76)],
amine@233 501 ),
amine@233 502 stereo_uc_mix_aw_0_3_max_silence_0_min_dur_0_3=(
amine@233 503 0.4,
amine@233 504 5,
amine@233 505 0,
amine@233 506 2,
amine@233 507 {"uc": "mix", "analysis_window": 0.3},
amine@233 508 [(9, 24), (36, 76)],
amine@233 509 ),
amine@233 510 stereo_uc_mix_aw_0_3_max_silence_0_6=(
amine@233 511 0.2,
amine@233 512 5,
amine@233 513 0.6,
amine@233 514 2,
amine@233 515 {"uc": "mix", "analysis_window": 0.3},
amine@233 516 [(9, 57), (57, 76)],
amine@233 517 ),
amine@233 518 stereo_uc_mix_aw_0_3_max_silence_0_6_max_dur_5_1=(
amine@233 519 0.2,
amine@233 520 5.1,
amine@233 521 0.6,
amine@233 522 2,
amine@233 523 {"uc": "mix", "analysis_window": 0.3},
amine@233 524 [(9, 60), (60, 76)],
amine@233 525 ),
amine@233 526 stereo_uc_mix_aw_0_3_max_silence_0_6_max_dur_5_2=(
amine@233 527 0.2,
amine@233 528 5.2,
amine@233 529 0.6,
amine@233 530 2,
amine@233 531 {"uc": "mix", "analysis_window": 0.3},
amine@233 532 [(9, 60), (60, 76)],
amine@233 533 ),
amine@233 534 stereo_uc_mix_aw_0_3_max_silence_0_6_max_dur_5_3=(
amine@233 535 0.2,
amine@233 536 5.3,
amine@233 537 0.6,
amine@233 538 2,
amine@233 539 {"uc": "mix", "analysis_window": 0.3},
amine@233 540 [(9, 60), (60, 76)],
amine@233 541 ),
amine@233 542 stereo_uc_mix_aw_0_3_max_silence_0_6_max_dur_5_4=(
amine@233 543 0.2,
amine@233 544 5.4,
amine@233 545 0.6,
amine@233 546 2,
amine@233 547 {"uc": "mix", "analysis_window": 0.3},
amine@233 548 [(9, 63), (63, 76)],
amine@233 549 ),
amine@233 550 stereo_uc_mix_aw_0_4_max_silence_0=(
amine@233 551 0.2,
amine@233 552 5,
amine@233 553 0,
amine@233 554 2,
amine@233 555 {"uc": "mix", "analysis_window": 0.4},
amine@233 556 [(16, 24), (36, 76)],
amine@233 557 ),
amine@233 558 stereo_uc_mix_aw_0_4_max_silence_0_3=(
amine@233 559 0.2,
amine@233 560 5,
amine@233 561 0.3,
amine@233 562 2,
amine@233 563 {"uc": "mix", "analysis_window": 0.4},
amine@233 564 [(16, 24), (36, 76)],
amine@233 565 ),
amine@233 566 stereo_uc_mix_aw_0_4_max_silence_0_4=(
amine@233 567 0.2,
amine@233 568 5,
amine@233 569 0.4,
amine@233 570 2,
amine@233 571 {"uc": "mix", "analysis_window": 0.4},
amine@233 572 [(16, 28), (36, 76)],
amine@233 573 ),
amine@220 574 )
def test_split_analysis_window(
    self, min_dur, max_dur, max_silence, channels, kwargs, expected
):
    """Check ``split`` with various analysis windows and channel choices.

    The analysis window (``aw``/``analysis_window``) and the channel
    selection (``uc``) come from ``kwargs``; the temporal parameters are
    passed explicitly. ``expected`` lists ``(onset, offset)`` sample
    indices. For multichannel input these index into the single channel
    obtained by applying the requested ``use_channel``/``uc`` value to the
    raw data; for mono input they index into the raw data directly.
    """
    mono_or_stereo = "mono" if channels == 1 else "stereo"
    filename = "tests/data/test_split_10HZ_{}.raw".format(mono_or_stereo)
    with open(filename, "rb") as fp:
        data = fp.read()

    regions = split(
        data,
        min_dur=min_dur,
        max_dur=max_dur,
        max_silence=max_silence,
        drop_trailing_silence=False,
        strict_min_dur=False,
        sr=10,
        sw=2,
        ch=channels,
        **kwargs
    )
    regions = list(regions)
    sample_width = 2

    # extract channel of interest
    if channels != 1:
        # The long name wins over the short one when both are given.
        use_channel = kwargs.get("use_channel", kwargs.get("uc"))
        use_channel = _normalize_use_channel(use_channel)
        data = _extract_selected_channel(
            data, channels, sample_width, use_channel=use_channel
        )
    err_msg = "Wrong number of regions after split, expected: "
    err_msg += "{}, found: {}".format(expected, regions)
    self.assertEqual(len(regions), len(expected), err_msg)
    for reg, exp in zip(regions, expected):
        onset, offset = exp
        exp_data = data[onset * sample_width : offset * sample_width]
        self.assertEqual(bytes(reg), exp_data)
amine@220 615
amine@220 616 @genty_dataset(
amine@212 617 filename_audio_format=(
amine@212 618 "tests/data/test_split_10HZ_stereo.raw",
amine@212 619 {"audio_format": "raw", "sr": 10, "sw": 2, "ch": 2},
amine@212 620 ),
amine@212 621 filename_audio_format_short_name=(
amine@212 622 "tests/data/test_split_10HZ_stereo.raw",
amine@212 623 {"fmt": "raw", "sr": 10, "sw": 2, "ch": 2},
amine@212 624 ),
amine@212 625 filename_no_audio_format=(
amine@212 626 "tests/data/test_split_10HZ_stereo.raw",
amine@212 627 {"sr": 10, "sw": 2, "ch": 2},
amine@212 628 ),
amine@212 629 filename_no_long_audio_params=(
amine@212 630 "tests/data/test_split_10HZ_stereo.raw",
amine@212 631 {"sampling_rate": 10, "sample_width": 2, "channels": 2},
amine@212 632 ),
amine@212 633 bytes_=(
amine@212 634 open("tests/data/test_split_10HZ_stereo.raw", "rb").read(),
amine@212 635 {"sr": 10, "sw": 2, "ch": 2},
amine@212 636 ),
amine@212 637 audio_reader=(
amine@212 638 AudioDataSource(
amine@212 639 "tests/data/test_split_10HZ_stereo.raw",
amine@212 640 sr=10,
amine@212 641 sw=2,
amine@212 642 ch=2,
amine@212 643 block_dur=0.1,
amine@212 644 ),
amine@212 645 {},
amine@212 646 ),
amine@212 647 audio_region=(
amine@212 648 AudioRegion(
amine@212 649 open("tests/data/test_split_10HZ_stereo.raw", "rb").read(),
amine@212 650 0,
amine@212 651 10,
amine@212 652 2,
amine@212 653 2,
amine@212 654 ),
amine@212 655 {},
amine@212 656 ),
amine@212 657 audio_source=(
amine@212 658 get_audio_source(
amine@212 659 "tests/data/test_split_10HZ_stereo.raw", sr=10, sw=2, ch=2
amine@212 660 ),
amine@212 661 {},
amine@212 662 ),
amine@212 663 )
def test_split_input_type(self, input, kwargs):
    """Check that ``split`` accepts each kind of ``input`` in the dataset.

    Whatever the input object is, the detected regions are compared with
    fixed ``(onset, offset)`` slices of the mono fixture.
    NOTE(review): the dataset inputs are built from the stereo fixture, so
    this presumably relies on the default channel selection matching the
    mono recording -- confirm.
    """
    sample_width = 2
    expected = [(2, 16), (17, 31), (34, 76)]

    with open("tests/data/test_split_10HZ_mono.raw", "rb") as fp:
        data = fp.read()

    regions = list(
        split(
            input,
            min_dur=0.2,
            max_dur=5,
            max_silence=0.2,
            drop_trailing_silence=False,
            strict_min_dur=False,
            analysis_window=0.1,
            **kwargs
        )
    )

    # The first literal contains no placeholders, so formatting the joined
    # template yields the same message as formatting the tail alone.
    err_msg = (
        "Wrong number of regions after split, expected: "
        "{}, found: {}"
    ).format(expected, regions)
    self.assertEqual(len(regions), len(expected), err_msg)

    for region, (onset, offset) in zip(regions, expected):
        wanted = data[onset * sample_width : offset * sample_width]
        self.assertEqual(bytes(region), wanted)
amine@211 689
amine@223 690 @genty_dataset(
amine@223 691 min_dur_greater_than_max_dur=(0.5, 0.4, 0.1),
amine@223 692 durations_OK_but_wrong_number_of_analysis_windows=(0.44, 0.49, 0.1),
amine@223 693 )
def test_split_wrong_min_max_dur(self, min_dur, max_dur, analysis_window):
    """``split`` must raise ``ValueError`` with the exact message below.

    The expected message reports the window counts for ``min_dur``
    (``ceil``) and ``max_dur`` (``floor``) for the given analysis window.
    """
    with self.assertRaises(ValueError) as val_err:
        split(
            b"0" * 16,
            min_dur=min_dur,
            max_dur=max_dur,
            max_silence=0.2,
            sr=16000,
            sw=1,
            ch=1,
            analysis_window=analysis_window,
        )

    template = (
        "'min_dur' ({0} sec.) results in {1} analysis "
        "window(s) ({1} == ceil({0} / {2})) which is "
        "higher than the number of analysis window(s) for "
        "'max_dur' ({3} == floor({4} / {2}))"
    )
    nb_min_windows = math.ceil(min_dur / analysis_window)
    nb_max_windows = math.floor(max_dur / analysis_window)
    expected_msg = template.format(
        min_dur, nb_min_windows, analysis_window, nb_max_windows, max_dur
    )
    self.assertEqual(expected_msg, str(val_err.exception))
amine@223 721
amine@224 722 @genty_dataset(
amine@224 723 max_silence_equals_max_dur=(0.5, 0.5, 0.1),
amine@224 724 max_silence_greater_than_max_dur=(0.5, 0.4, 0.1),
amine@224 725 durations_OK_but_wrong_number_of_analysis_windows=(0.44, 0.49, 0.1),
amine@224 726 )
def test_split_wrong_max_silence_max_dur(
    self, max_silence, max_dur, analysis_window
):
    """``split`` must raise ``ValueError`` with the exact message below.

    The expected message reports the window counts for ``max_silence`` and
    ``max_dur`` (both ``floor``) for the given analysis window.
    """
    with self.assertRaises(ValueError) as val_err:
        split(
            b"0" * 16,
            min_dur=0.2,
            max_dur=max_dur,
            max_silence=max_silence,
            sr=16000,
            sw=1,
            ch=1,
            analysis_window=analysis_window,
        )

    template = (
        "'max_silence' ({0} sec.) results in {1} analysis "
        "window(s) ({1} == floor({0} / {2})) which is "
        "higher or equal to the number of analysis window(s) for "
        "'max_dur' ({3} == floor({4} / {2}))"
    )
    nb_silence_windows = math.floor(max_silence / analysis_window)
    nb_max_windows = math.floor(max_dur / analysis_window)
    expected_msg = template.format(
        max_silence,
        nb_silence_windows,
        analysis_window,
        nb_max_windows,
        max_dur,
    )
    self.assertEqual(expected_msg, str(val_err.exception))
amine@224 756
amine@226 757 @genty_dataset(
amine@226 758 negative_min_dur=({"min_dur": -1},),
amine@226 759 zero_min_dur=({"min_dur": 0},),
amine@226 760 negative_max_dur=({"max_dur": -1},),
amine@226 761 zero_max_dur=({"max_dur": 0},),
amine@226 762 negative_max_silence=({"max_silence": -1},),
amine@226 763 )
def test_split_negative_temporal_params(self, wrong_param):
    """An out-of-range temporal parameter must raise ``ValueError``.

    ``wrong_param`` is a one-entry dict overriding one of the otherwise
    valid defaults. The message uses ``>=`` for ``max_silence`` and ``>``
    for the other parameters.
    """
    params = dict(
        {"min_dur": 0.2, "max_dur": 0.5, "max_silence": 0.1}, **wrong_param
    )
    with self.assertRaises(ValueError) as val_err:
        split(None, **params)

    # Every dataset row carries exactly one key.
    name = next(iter(wrong_param))
    value = wrong_param[name]
    if name == "max_silence":
        equal_sign = "="
    else:
        equal_sign = ""
    expected_msg = "'{}' ({}) must be >{} 0".format(name, value, equal_sign)
    self.assertEqual(expected_msg, str(val_err.exception))
amine@226 777
amine@207 778
amine@207 779 @genty
amine@207 780 class TestAudioRegion(TestCase):
amine@86 781 @genty_dataset(
amine@86 782 simple=(b"\0" * 8000, 0, 8000, 1, 1, 1, 1, 1000),
amine@86 783 one_ms_less_than_1_sec=(
amine@86 784 b"\0" * 7992,
amine@86 785 0,
amine@86 786 8000,
amine@86 787 1,
amine@86 788 1,
amine@86 789 0.999,
amine@86 790 0.999,
amine@86 791 999,
amine@86 792 ),
amine@86 793 tree_quarter_ms_less_than_1_sec=(
amine@86 794 b"\0" * 7994,
amine@86 795 0,
amine@86 796 8000,
amine@86 797 1,
amine@86 798 1,
amine@86 799 0.99925,
amine@86 800 0.99925,
amine@86 801 999,
amine@86 802 ),
amine@86 803 half_ms_less_than_1_sec=(
amine@86 804 b"\0" * 7996,
amine@86 805 0,
amine@86 806 8000,
amine@86 807 1,
amine@86 808 1,
amine@86 809 0.9995,
amine@86 810 0.9995,
amine@86 811 1000,
amine@86 812 ),
amine@86 813 quarter_ms_less_than_1_sec=(
amine@86 814 b"\0" * 7998,
amine@86 815 0,
amine@86 816 8000,
amine@86 817 1,
amine@86 818 1,
amine@86 819 0.99975,
amine@86 820 0.99975,
amine@86 821 1000,
amine@86 822 ),
amine@86 823 simple_sample_width_2=(b"\0" * 8000 * 2, 0, 8000, 2, 1, 1, 1, 1000),
amine@86 824 simple_stereo=(b"\0" * 8000 * 2, 0, 8000, 1, 2, 1, 1, 1000),
amine@86 825 simple_multichannel=(b"\0" * 8000 * 5, 0, 8000, 1, 5, 1, 1, 1000),
amine@86 826 simple_sample_width_2_multichannel=(
amine@86 827 b"\0" * 8000 * 2 * 5,
amine@86 828 0,
amine@86 829 8000,
amine@86 830 2,
amine@86 831 5,
amine@86 832 1,
amine@86 833 1,
amine@86 834 1000,
amine@86 835 ),
amine@86 836 one_ms_less_than_1s_sw_2_multichannel=(
amine@86 837 b"\0" * 7992 * 2 * 5,
amine@86 838 0,
amine@86 839 8000,
amine@86 840 2,
amine@86 841 5,
amine@86 842 0.999,
amine@86 843 0.999,
amine@86 844 999,
amine@86 845 ),
amine@86 846 tree_qrt_ms_lt_1_s_sw_2_multichannel=(
amine@86 847 b"\0" * 7994 * 2 * 5,
amine@86 848 0,
amine@86 849 8000,
amine@86 850 2,
amine@86 851 5,
amine@86 852 0.99925,
amine@86 853 0.99925,
amine@86 854 999,
amine@86 855 ),
amine@86 856 half_ms_lt_1s_sw_2_multichannel=(
amine@86 857 b"\0" * 7996 * 2 * 5,
amine@86 858 0,
amine@86 859 8000,
amine@86 860 2,
amine@86 861 5,
amine@86 862 0.9995,
amine@86 863 0.9995,
amine@86 864 1000,
amine@86 865 ),
amine@86 866 quarter_ms_lt_1s_sw_2_multichannel=(
amine@86 867 b"\0" * 7998 * 2 * 5,
amine@86 868 0,
amine@86 869 8000,
amine@86 870 2,
amine@86 871 5,
amine@86 872 0.99975,
amine@86 873 0.99975,
amine@86 874 1000,
amine@86 875 ),
amine@86 876 arbitrary_length_1=(
amine@86 877 b"\0" * int(8000 * 1.33),
amine@86 878 2.7,
amine@86 879 8000,
amine@86 880 1,
amine@86 881 1,
amine@86 882 4.03,
amine@86 883 1.33,
amine@86 884 1330,
amine@86 885 ),
amine@86 886 arbitrary_length_2=(
amine@86 887 b"\0" * int(8000 * 0.476),
amine@86 888 11.568,
amine@86 889 8000,
amine@86 890 1,
amine@86 891 1,
amine@86 892 12.044,
amine@86 893 0.476,
amine@86 894 476,
amine@86 895 ),
amine@86 896 arbitrary_length_sw_2_multichannel=(
amine@86 897 b"\0" * int(8000 * 1.711) * 2 * 3,
amine@86 898 9.415,
amine@86 899 8000,
amine@86 900 2,
amine@86 901 3,
amine@86 902 11.126,
amine@86 903 1.711,
amine@86 904 1711,
amine@86 905 ),
amine@86 906 arbitrary_samplig_rate=(
amine@86 907 b"\0" * int(3172 * 1.318),
amine@86 908 17.236,
amine@86 909 3172,
amine@86 910 1,
amine@86 911 1,
amine@86 912 17.236 + int(3172 * 1.318) / 3172,
amine@86 913 int(3172 * 1.318) / 3172,
amine@86 914 1318,
amine@86 915 ),
amine@86 916 arbitrary_sr_sw_2_multichannel=(
amine@86 917 b"\0" * int(11317 * 0.716) * 2 * 3,
amine@86 918 18.811,
amine@86 919 11317,
amine@86 920 2,
amine@86 921 3,
amine@86 922 18.811 + int(11317 * 0.716) / 11317,
amine@86 923 int(11317 * 0.716) / 11317,
amine@86 924 716,
amine@86 925 ),
amine@86 926 )
def test_creation(
    self,
    data,
    start,
    sampling_rate,
    sample_width,
    channels,
    expected_end,
    expected_duration_s,
    expected_duration_ms,
):
    """Build an ``AudioRegion`` and verify its attributes.

    Checks the audio parameters under both their long and short names,
    the start, end and duration attributes, ``len(region)`` against the
    expected millisecond count, and that ``bytes(region)`` returns the
    original data.
    """
    region = AudioRegion(
        data, start, sampling_rate, sample_width, channels
    )

    # Checked in this order; attributes are read lazily, one per iteration.
    attribute_checks = (
        ("sampling_rate", sampling_rate),
        ("sr", sampling_rate),
        ("sample_width", sample_width),
        ("sw", sample_width),
        ("channels", channels),
        ("ch", channels),
        ("start", start),
        ("end", expected_end),
        ("duration", expected_duration_s),
    )
    for attr_name, wanted in attribute_checks:
        self.assertEqual(getattr(region, attr_name), wanted)

    self.assertEqual(len(region), expected_duration_ms)
    self.assertEqual(bytes(region), data)
amine@88 952
def test_creation_invalid_data_exception(self):
    """Data that is not a multiple of the frame size must be rejected.

    Nine bytes with ``sample_width=2`` and ``channels=1`` is not a multiple
    of ``sample_width * channels``; ``AudioParameterError`` is expected
    with the exact message below.
    """
    expected_msg = (
        "The length of audio data must be an integer "
        "multiple of `sample_width * channels`"
    )
    with self.assertRaises(AudioParameterError) as audio_param_err:
        AudioRegion(
            data=b"ABCDEFGHI",
            start=0,
            sampling_rate=8,
            sample_width=2,
            channels=1,
        )
    self.assertEqual(expected_msg, str(audio_param_err.exception))
amine@97 967
@genty_dataset(
    # (file name template, region start, expected file name)
    simple=("output.wav", 1.230, "output.wav"),
    start=("output_{start}.wav", 1.230, "output_1.23.wav"),
    start_2=("output_{start}.wav", 1.233712, "output_1.233712.wav"),
    start_3=("output_{start}.wav", 1.2300001, "output_1.23.wav"),
    start_4=("output_{start:.3f}.wav", 1.233712, "output_1.234.wav"),
    start_5=(
        "output_{start:.8f}.wav",
        1.233712345,
        "output_1.23371200.wav",
    ),
    start_end_duration=(
        "output_{start}_{end}_{duration}.wav",
        1.455,
        "output_1.455_2.455_1.0.wav",
    ),
    start_end_duration_2=(
        "output_{start}_{end}_{duration}.wav",
        1.455321,
        "output_1.455321_2.455321_1.0.wav",
    ),
)
def test_save(self, format, start, expected):
    """Check the file name produced by ``AudioRegion.save``.

    ``format`` is a file name template that may contain ``{start}``,
    ``{end}`` and ``{duration}`` placeholders. The region is saved under a
    temporary directory and the value returned by ``save``, with the
    directory prefix removed, is compared to ``expected``.
    """
    with TemporaryDirectory() as tmpdir:
        region = AudioRegion(b"0" * 160, start, 160, 1, 1)
        target = os.path.join(tmpdir, format)
        saved_path = region.save(target)
        # Skip "<tmpdir>" plus the path separator that follows it.
        prefix_length = len(tmpdir) + 1
        self.assertEqual(saved_path[prefix_length:], expected)
amine@192 996
def test_save_file_exists_exception(self):
    """Check that ``save(..., exists_ok=False)`` refuses an existing file.

    An empty ``output.wav`` is created first; saving a region to the same
    path with ``exists_ok=False`` must raise ``FileExistsError``.
    """
    with TemporaryDirectory() as tmpdir:
        existing_path = os.path.join(tmpdir, "output.wav")
        # Create an empty placeholder so the target is already present.
        with open(existing_path, "w"):
            pass
        region = AudioRegion(b"0" * 160, 0, 160, 1, 1)
        with self.assertRaises(FileExistsError):
            region.save(existing_path, exists_ok=False)
amine@193 1004
@genty_dataset(
    # Each entry: (region, slice in milliseconds, expected start of the
    # sub-region, expected bytes of the sub-region).
    #
    # --- halves and middle parts -------------------------------------
    first_half=(
        AudioRegion(b"a" * 80 + b"b" * 80, 0, 160, 1, 1),
        slice(0, 500),
        0,
        b"a" * 80,
    ),
    second_half=(
        AudioRegion(b"a" * 80 + b"b" * 80, 0, 160, 1, 1),
        slice(500, None),
        0.5,
        b"b" * 80,
    ),
    second_half_negative=(
        AudioRegion(b"a" * 80 + b"b" * 80, 0, 160, 1, 1),
        slice(-500, None),
        0.5,
        b"b" * 80,
    ),
    middle=(
        AudioRegion(b"a" * 80 + b"b" * 80, 0, 160, 1, 1),
        slice(200, 750),
        0.2,
        b"a" * 48 + b"b" * 40,
    ),
    middle_negative=(
        AudioRegion(b"a" * 80 + b"b" * 80, 0, 160, 1, 1),
        slice(-800, -250),
        0.2,
        b"a" * 48 + b"b" * 40,
    ),
    # --- wider samples and/or several channels -----------------------
    middle_sw2=(
        AudioRegion(b"a" * 160 + b"b" * 160, 0, 160, 2, 1),
        slice(200, 750),
        0.2,
        b"a" * 96 + b"b" * 80,
    ),
    middle_ch2=(
        AudioRegion(b"a" * 160 + b"b" * 160, 0, 160, 1, 2),
        slice(200, 750),
        0.2,
        b"a" * 96 + b"b" * 80,
    ),
    middle_sw2_ch2=(
        AudioRegion(b"a" * 320 + b"b" * 320, 0, 160, 2, 2),
        slice(200, 750),
        0.2,
        b"a" * 192 + b"b" * 160,
    ),
    # --- dropping one millisecond at either end ----------------------
    but_first_sample=(
        AudioRegion(b"a" * 4000 + b"b" * 4000, 0, 8000, 1, 1),
        slice(1, None),
        0.001,
        b"a" * (4000 - 8) + b"b" * 4000,
    ),
    but_first_sample_negative=(
        AudioRegion(b"a" * 4000 + b"b" * 4000, 0, 8000, 1, 1),
        slice(-999, None),
        0.001,
        b"a" * (4000 - 8) + b"b" * 4000,
    ),
    but_last_sample=(
        AudioRegion(b"a" * 4000 + b"b" * 4000, 0, 8000, 1, 1),
        slice(0, 999),
        0,
        b"a" * 4000 + b"b" * (4000 - 8),
    ),
    but_last_sample_negative=(
        AudioRegion(b"a" * 4000 + b"b" * 4000, 0, 8000, 1, 1),
        slice(0, -1),
        0,
        b"a" * 4000 + b"b" * (4000 - 8),
    ),
    # --- bounds far outside of the region ----------------------------
    big_negative_start=(
        AudioRegion(b"a" * 160, 0, 160, 1, 1),
        slice(-5000, None),
        0,
        b"a" * 160,
    ),
    big_negative_stop=(
        AudioRegion(b"a" * 160, 0, 160, 1, 1),
        slice(None, -1500),
        0,
        b"",
    ),
    # --- slices expected to yield no data ----------------------------
    empty=(
        AudioRegion(b"a" * 80 + b"b" * 80, 0, 160, 1, 1),
        slice(0, 0),
        0,
        b"",
    ),
    empty_start_stop_reversed=(
        AudioRegion(b"a" * 80 + b"b" * 80, 0, 160, 1, 1),
        slice(200, 100),
        0.2,
        b"",
    ),
    empty_big_positive_start=(
        AudioRegion(b"a" * 80 + b"b" * 80, 0, 160, 1, 1),
        slice(2000, 3000),
        2,
        b"",
    ),
    empty_negative_reversed=(
        AudioRegion(b"a" * 80 + b"b" * 80, 0, 160, 1, 1),
        slice(-100, -200),
        0.9,
        b"",
    ),
    empty_big_negative_stop=(
        AudioRegion(b"a" * 80 + b"b" * 80, 0, 160, 1, 1),
        slice(0, -2000),
        0,
        b"",
    ),
    # --- sampling rate that is not a multiple of 1000 ----------------
    arbitrary_sampling_rate=(
        AudioRegion(b"a" * 124 + b"b" * 376, 0, 1234, 1, 1),
        slice(100, 200),
        123 / 1234,
        b"a" + b"b" * 123,
    ),
)
def test_region_temporal_slicing(
    self, region, slice_, expected_start, expected_data
):
    """Check time-based slicing through ``region.millis`` and ``region.sec``.

    ``slice_`` holds bounds in milliseconds. It is applied as is to the
    ``millis`` view and, with both bounds divided by 1000, to the ``sec``
    view. Both resulting sub-regions must have ``expected_start`` as start
    and ``expected_data`` as content.
    """

    def to_seconds(bound):
        # Open-ended bounds (None) must stay open-ended.
        return None if bound is None else bound / 1000

    seconds_slice = slice(to_seconds(slice_.start), to_seconds(slice_.stop))
    # The views are looked up by name so that each one is only accessed
    # right before it is sliced, millis first and sec second.
    for view_name, bounds in (("millis", slice_), ("sec", seconds_slice)):
        sub_region = getattr(region, view_name)[bounds]
        self.assertEqual(sub_region.start, expected_start)
        self.assertEqual(bytes(sub_region), expected_data)
amine@229 1140
@genty_dataset(
    # Each entry: (region, slice in samples, expected start of the
    # sub-region, expected bytes of the sub-region).
    #
    # --- halves and middle parts -------------------------------------
    first_half=(
        AudioRegion(b"a" * 80 + b"b" * 80, 0, 160, 1, 1),
        slice(0, 80),
        0,
        b"a" * 80,
    ),
    second_half=(
        AudioRegion(b"a" * 80 + b"b" * 80, 0, 160, 1, 1),
        slice(80, None),
        0.5,
        b"b" * 80,
    ),
    second_half_negative=(
        AudioRegion(b"a" * 80 + b"b" * 80, 0, 160, 1, 1),
        slice(-80, None),
        0.5,
        b"b" * 80,
    ),
    middle=(
        AudioRegion(b"a" * 80 + b"b" * 80, 0, 160, 1, 1),
        slice(160 // 5, 160 // 4 * 3),
        0.2,
        b"a" * 48 + b"b" * 40,
    ),
    middle_negative=(
        AudioRegion(b"a" * 80 + b"b" * 80, 0, 160, 1, 1),
        slice(-160 // 5 * 4, -160 // 4),
        0.2,
        b"a" * 48 + b"b" * 40,
    ),
    # --- wider samples and/or several channels -----------------------
    middle_sw2=(
        AudioRegion(b"a" * 160 + b"b" * 160, 0, 160, 2, 1),
        slice(160 // 5, 160 // 4 * 3),
        0.2,
        b"a" * 96 + b"b" * 80,
    ),
    middle_ch2=(
        AudioRegion(b"a" * 160 + b"b" * 160, 0, 160, 1, 2),
        slice(160 // 5, 160 // 4 * 3),
        0.2,
        b"a" * 96 + b"b" * 80,
    ),
    middle_sw2_ch2=(
        AudioRegion(b"a" * 320 + b"b" * 320, 0, 160, 2, 2),
        slice(160 // 5, 160 // 4 * 3),
        0.2,
        b"a" * 192 + b"b" * 160,
    ),
    # --- dropping a single sample at either end ----------------------
    but_first_sample=(
        AudioRegion(b"a" * 4000 + b"b" * 4000, 0, 8000, 1, 1),
        slice(1, None),
        1 / 8000,
        b"a" * (4000 - 1) + b"b" * 4000,
    ),
    but_first_sample_negative=(
        AudioRegion(b"a" * 4000 + b"b" * 4000, 0, 8000, 1, 1),
        slice(-7999, None),
        1 / 8000,
        b"a" * (4000 - 1) + b"b" * 4000,
    ),
    but_last_sample=(
        AudioRegion(b"a" * 4000 + b"b" * 4000, 0, 8000, 1, 1),
        slice(0, 7999),
        0,
        b"a" * 4000 + b"b" * (4000 - 1),
    ),
    but_last_sample_negative=(
        AudioRegion(b"a" * 4000 + b"b" * 4000, 0, 8000, 1, 1),
        slice(0, -1),
        0,
        b"a" * 4000 + b"b" * (4000 - 1),
    ),
    # --- bounds far outside of the region ----------------------------
    big_negative_start=(
        AudioRegion(b"a" * 160, 0, 160, 1, 1),
        slice(-1600, None),
        0,
        b"a" * 160,
    ),
    big_negative_stop=(
        AudioRegion(b"a" * 160, 0, 160, 1, 1),
        slice(None, -1600),
        0,
        b"",
    ),
    # --- slices expected to yield no data ----------------------------
    empty=(
        AudioRegion(b"a" * 80 + b"b" * 80, 0, 160, 1, 1),
        slice(0, 0),
        0,
        b"",
    ),
    empty_start_stop_reversed=(
        AudioRegion(b"a" * 80 + b"b" * 80, 0, 160, 1, 1),
        slice(80, 40),
        0.5,
        b"",
    ),
    empty_big_positive_start=(
        AudioRegion(b"a" * 80 + b"b" * 80, 0, 160, 1, 1),
        slice(1600, 3000),
        10,
        b"",
    ),
    empty_negative_reversed=(
        AudioRegion(b"a" * 80 + b"b" * 80, 0, 160, 1, 1),
        slice(-16, -32),
        0.9,
        b"",
    ),
    empty_big_negative_stop=(
        AudioRegion(b"a" * 80 + b"b" * 80, 0, 160, 1, 1),
        slice(0, -2000),
        0,
        b"",
    ),
    # --- sampling rate that is not a round number --------------------
    arbitrary_sampling_rate=(
        AudioRegion(b"a" * 124 + b"b" * 376, 0, 1235, 1, 1),
        slice(100, 200),
        100 / 1235,
        b"a" * 24 + b"b" * 76,
    ),
    arbitrary_sampling_rate_middle_sw2_ch2=(
        AudioRegion(b"a" * 124 + b"b" * 376, 0, 1235, 2, 2),
        slice(25, 50),
        25 / 1235,
        b"a" * 24 + b"b" * 76,
    ),
)
def test_region_sample_slicing(
    self, region, slice_, expected_start, expected_data
):
    """Check slicing an ``AudioRegion`` directly with ``region[slice_]``.

    The datasets express ``slice_`` bounds as sample indices. The
    sub-region must start at ``expected_start`` and contain exactly
    ``expected_data``.
    """
    sliced = region[slice_]
    self.assertEqual(sliced.start, expected_start)
    self.assertEqual(bytes(sliced), expected_data)
amine@231 1275
@genty_dataset(
    # (sampling_rate, sample_width, channels)
    simple=(8000, 1, 1),
    stereo_sw_2=(8000, 2, 2),
    arbitrary_sr_multichannel=(5413, 2, 3),
)
def test_concatenation(self, sampling_rate, sample_width, channels):
    """Check that ``region_1 + region_2`` joins two regions.

    The result must start where the first region starts, last as long as
    both regions together and contain the bytes of the first region
    followed by those of the second. End and duration are compared to 6
    decimal places.
    """
    first, second = _make_random_length_regions(
        [b"a", b"b"], sampling_rate, sample_width, channels
    )

    wanted_start = first.start
    wanted_duration = first.duration + second.duration
    wanted_end = wanted_start + wanted_duration
    wanted_data = bytes(first) + bytes(second)

    joined = first + second

    self.assertEqual(joined.start, wanted_start)
    self.assertAlmostEqual(joined.end, wanted_end, places=6)
    self.assertAlmostEqual(joined.duration, wanted_duration, places=6)
    self.assertEqual(bytes(joined), wanted_data)
amine@88 1299
@genty_dataset(
    # (sampling_rate, sample_width, channels)
    simple=(8000, 1, 1),
    stereo_sw_2=(8000, 2, 2),
    arbitrary_sr_multichannel=(5413, 2, 3),
)
def test_concatenation_many(self, sampling_rate, sample_width, channels):
    """Check that ``sum()`` concatenates a list of regions.

    The result must start where the first region starts, last as long as
    all regions together and contain their bytes in order. End and
    duration are compared to 6 decimal places.
    """
    parts = _make_random_length_regions(
        [b"a", b"b", b"c"], sampling_rate, sample_width, channels
    )

    wanted_start = parts[0].start
    wanted_duration = sum(part.duration for part in parts)
    wanted_end = wanted_start + wanted_duration
    wanted_data = b"".join(bytes(part) for part in parts)

    # Built-in sum() is used on purpose: it begins the addition with the
    # integer 0, so the regions must cope with that first operand.
    joined = sum(parts)

    self.assertEqual(joined.start, wanted_start)
    self.assertAlmostEqual(joined.end, wanted_end, places=6)
    self.assertAlmostEqual(joined.duration, wanted_duration, places=6)
    self.assertEqual(bytes(joined), wanted_data)
amine@88 1322
def test_concatenation_different_sampling_rate_error(self):
    """Adding regions with different sampling rates must raise ValueError."""
    expected_message = (
        "Can only concatenate AudioRegions of the same "
        "sampling rate (8000 != 3000)"
    )
    at_8000_hz = AudioRegion(b"a" * 100, 0, 8000, 1, 1)
    at_3000_hz = AudioRegion(b"b" * 100, 0, 3000, 1, 1)

    with self.assertRaises(ValueError) as raised:
        at_8000_hz + at_3000_hz
    self.assertEqual(expected_message, str(raised.exception))
amine@88 1335
def test_concatenation_different_sample_width_error(self):
    """Adding regions with different sample widths must raise ValueError."""
    expected_message = (
        "Can only concatenate AudioRegions of the same "
        "sample width (2 != 4)"
    )
    two_byte_samples = AudioRegion(b"a" * 100, 0, 8000, 2, 1)
    four_byte_samples = AudioRegion(b"b" * 100, 0, 8000, 4, 1)

    with self.assertRaises(ValueError) as raised:
        two_byte_samples + four_byte_samples
    self.assertEqual(expected_message, str(raised.exception))
amine@88 1348
def test_concatenation_different_number_of_channels_error(self):
    """Adding regions with different channel counts must raise ValueError."""
    expected_message = (
        "Can only concatenate AudioRegions of the same "
        "number of channels (1 != 2)"
    )
    mono = AudioRegion(b"a" * 100, 0, 8000, 1, 1)
    stereo = AudioRegion(b"b" * 100, 0, 8000, 1, 2)

    with self.assertRaises(ValueError) as raised:
        mono + stereo
    self.assertEqual(expected_message, str(raised.exception))
amine@196 1361
@genty_dataset(
    # (duration of the base region in seconds,
    #  expected duration after tripling, expected len() after tripling)
    simple=(0.01, 0.03, 30),
    rounded_len_floor=(0.00575, 0.01725, 17),
    rounded_len_ceil=(0.00625, 0.01875, 19),
)
def test_multiplication(
    self, duration, expected_duration, expected_length
):
    """Check multiplying an ``AudioRegion`` by an integer on both sides.

    A mono region at 8000 Hz with 2-byte samples is built for ``duration``
    seconds and evaluated as ``1 * region * 3``. The result must hold the
    original data three times, keep the audio parameters and report the
    expected duration and length.
    """
    sampling_rate = 8000
    sample_width = 2
    payload = b"0" * int(duration * sampling_rate * sample_width)
    base_region = AudioRegion(payload, 0, sampling_rate, sample_width, 1)

    # Integer on the left and on the right of the region in one expression.
    tripled = 1 * base_region * 3

    self.assertEqual(bytes(tripled), payload * 3)
    self.assertEqual(tripled.sr, sampling_rate)
    self.assertEqual(tripled.sw, sample_width)
    self.assertEqual(tripled.ch, 1)
    self.assertEqual(tripled.duration, expected_duration)
    self.assertEqual(len(tripled), expected_length)
amine@197 1380
@genty_dataset(
    # (factor, name of the factor's type as it appears in the message)
    _str=("x", "str"),
    _float=(1.4, "float"),
)
def test_multiplication_non_int(self, factor, _type):
    """Multiplying a region by a non-integer factor must raise TypeError."""
    message_template = "Can't multiply AudioRegion by a non-int of type '{}'"
    with self.assertRaises(TypeError) as raised:
        AudioRegion(b"0" * 80, 0, 8000, 1, 1) * factor
    expected_message = message_template.format(_type)
    self.assertEqual(expected_message, str(raised.exception))