From b2ef31a93615d55173f6d6f05a3cf76d44d4c20d Mon Sep 17 00:00:00 2001 From: Vladimir Malenovsky Date: Tue, 30 May 2023 13:56:19 +0200 Subject: [PATCH 1/3] new naming convention from IVAS-7a in ISM-1 and ISM-2 --- item_gen_configs/P800-1.yml | 90 +++++++++++++++++++++---------------- item_gen_configs/P800-2.yml | 89 ++++++++++++++++++++---------------- 2 files changed, 103 insertions(+), 76 deletions(-) diff --git a/item_gen_configs/P800-1.yml b/item_gen_configs/P800-1.yml index d3e79309..a597eaef 100644 --- a/item_gen_configs/P800-1.yml +++ b/item_gen_configs/P800-1.yml @@ -45,257 +45,271 @@ add_low_level_random_noise: true ### Specify the mono source filenames (the program will search for it in the input_path folder) ### Specify the stereo IR source filenames (the program will search for it in the input_path_IR folder) ### Specify the overlap length in seconds for each input source (negative value creates a gap) -### Note 1: use [val1, val2, ...] for multiple sources in a scene -### Note 2: use the "start:step:stop" notation for moving sources, where step will be applied in 20ms frames +### Note 1: use brackets [val1, val2, ...] for multiple sources in a scene +### Note 2: use the Matlab notation "start:step:stop" to create moving sources (step will be applied in 20ms frames) + +### Naming convention for P.800 items +### The filenames of the input content samples are represented by: +### leeeayszz.wav +### The filenames of the accompanying metadata files (applicable to metadata-assisted spatial audio, object-based audio) are represented by: +### leeeayszz.met for metadata-assisted spatial audio +### leeeayszz.wav.o.csv for object-based audio +### where: +### l stands for the listening lab designator (a through d according to Table 2) +### eee stands for the experiment designator, e.g. 
p01 (see Table 1) +### a stands for audio, and y is the per experiment category according to IVAS-8a +### s stands for sample and zz is the sample number; 01, 02, 03, 04, 05, 06, 07, where 07 is the preliminary +### o stands for object number; 0, 1, 2, 3 + scenes: cat1_1: - name: "C1P1.wav" + name: "lp01a1s01" description: "Small anechoic room with AB microphone pickup, partial overlap between the talkers." source: ["f1_s1.wav", "m1_s1.wav"] IR: ["SAABP01.wav", "SAABP07.wav"] overlap: 1.0 cat1_2: - name: "C1P2.wav" + name: "lp01a1s02" description: "Small anechoic room with AB microphone pickup, partial overlap between the talkers." source: ["m2_s1.wav", "f2_s1.wav"] IR: ["SAABP05.wav", "SAABP03.wav"] overlap: 1.0 cat1_3: - name: "C1P3.wav" + name: "lp01a1s03" description: "Small anechoic room with AB microphone pickup, partial overlap between the talkers." source: ["f3_s1.wav", "m3_s1.wav"] IR: ["SAABP02.wav", "SAABP06.wav"] overlap: 1.0 cat1_4: - name: "C1P4.wav" + name: "lp01a1s04" description: "Small anechoic room with AB microphone pickup, partial overlap between the talkers." source: ["m1_s2.wav", "f1_s2.wav"] IR: ["SAABP04.wav", "SAABP01.wav"] overlap: 1.0 cat1_5: - name: "C1P5.wav" + name: "lp01a1s05" description: "Small anechoic room with AB microphone pickup, partial overlap between the talkers." source: ["f2_s2.wav", "m2_s2.wav"] IR: ["SAABP03.wav", "SAABP04.wav"] overlap: 1.0 cat1_6: - name: "C1P6.wav" + name: "lp01a1s06" description: "Small anechoic room with AB microphone pickup, partial overlap between the talkers." source: ["m3_s2.wav", "f3_s2.wav"] IR: ["SAABP07.wav", "SAABP02.wav"] overlap: 1.0 cat2_1: - name: "C2P1.wav" + name: "lp01a2s01" description: "Large anechoic room with AB microphone pickup, no overlap between the talkers."
source: ["m3_s3.wav", "f3_s3.wav"] IR: ["LAABP05.wav", "LAABP11.wav"] overlap: -1.0 cat2_2: - name: "C2P2.wav" + name: "lp01a2s02" description: "Large anechoic room with AB microphone pickup, no overlap between the talkers." source: ["f1_s3.wav", "m1.wav"] IR: ["LAABP01.wav", "LAABP06.wav"] overlap: -1.0 cat2_3: - name: "C2P3.wav" + name: "lp01a2s03" description: "Large anechoic room with AB microphone pickup, no overlap between the talkers." source: ["m2_s3.wav", "f2_s3.wav"] IR: ["LAABP03.wav", "LAABP07.wav"] overlap: -1.0 cat2_4: - name: "C2P4.wav" + name: "lp01a2s04" description: "Large anechoic room with AB microphone pickup, no overlap between the talkers." source: ["f3_s4.wav", "m3_s4.wav"] IR: ["LAABP05.wav", "LAABP08.wav"] overlap: -1.0 cat2_5: - name: "C2P5.wav" + name: "lp01a2s05" description: "Large anechoic room with AB microphone pickup, no overlap between the talkers." source: ["m1_s4.wav", "f1_s4.wav"] IR: ["LAABP09.wav", "LAABP07.wav"] overlap: -1.0 cat2_6: - name: "C2P6.wav" + name: "lp01a2s06" description: "Large anechoic room with AB microphone pickup, no overlap between the talkers." source: ["f2_s4.wav", "m2_s4.wav"] IR: ["LAABP10.wav", "LAABP09.wav"] overlap: -1.0 cat3_1: - name: "C3P1.wav" + name: "lp01a3s01" description: "Small anechoic room with MS microphone pickup, no overlap between the talkers." source: ["f2_s5.wav", "m2_s5.wav"] IR: ["SAMSP01.wav", "SAMSP07.wav"] overlap: -1.0 cat3_2: - name: "C3P2.wav" + name: "lp01a3s02" description: "Small anechoic room with MS microphone pickup, no overlap between the talkers." source: ["m3_s5.wav", "f3_s5.wav"] IR: ["SAMSP05.wav", "SAMSP03.wav"] overlap: -1.0 cat3_3: - name: "C3P3.wav" + name: "lp01a3s03" description: "Small anechoic room with MS microphone pickup, no overlap between the talkers." 
source: ["f1_s5.wav", "m1_s5.wav"] IR: ["SAMSP02.wav", "SAMSP06.wav"] overlap: -1.0 cat3_4: - name: "C3P4.wav" + name: "lp01a3s04" description: "Small anechoic room with MS microphone pickup, no overlap between the talkers." source: ["m2_s6.wav", "f2_s6.wav"] IR: ["SAMSP04.wav", "SAMSP01.wav"] overlap: -1.0 cat3_5: - name: "C3P5.wav" + name: "lp01a3s05" description: "Small anechoic room with MS microphone pickup, no overlap between the talkers." source: ["f3_s6.wav", "m3_s6.wav"] IR: ["SAMSP03.wav", "SAMSP04.wav"] overlap: -1.0 cat3_6: - name: "C3P6.wav" + name: "lp01a3s06" description: "Small anechoic room with MS microphone pickup, no overlap between the talkers." source: ["m1_s6.wav", "f1_s6.wav"] IR: ["SAMSP07.wav", "SAMSP02.wav"] overlap: -1.0 cat4_1: - name: "C4P1.wav" + name: "lp01a4s01" description: "Small echoic room with AB microphone pickup, partial overlap between the talkers." source: ["m1_s7.wav", "f1_s7.wav"] IR: ["SEABP01.wav", "SEABP07.wav"] overlap: 1.0 cat4_2: - name: "C4P2.wav" + name: "lp01a4s02" description: "Small echoic room with AB microphone pickup, partial overlap between the talkers." source: ["f2_s7.wav", "m2_s7.wav"] IR: ["SEABP05.wav", "SEABP03.wav"] overlap: 1.0 cat4_3: - name: "C4P3.wav" + name: "lp01a4s03" description: "Small echoic room with AB microphone pickup, partial overlap between the talkers." source: ["m3_s7.wav", "f3_s7.wav"] IR: ["SEABP02.wav", "SEABP06.wav"] overlap: 1.0 cat4_4: - name: "C4P4.wav" + name: "lp01a4s04" description: "Small echoic room with AB microphone pickup, partial overlap between the talkers." source: ["f1_s8.wav", "m1_s8.wav"] IR: ["SEABP04.wav", "SEABP01.wav"] overlap: 1.0 cat4_5: - name: "C4P5.wav" + name: "lp01a4s05" description: "Small echoic room with AB microphone pickup, partial overlap between the talkers." 
source: ["m2_s8.wav", "f2_s8.wav"] IR: ["SEABP03.wav", "SEABP04.wav"] overlap: 1.0 cat4_6: - name: "C4P6.wav" + name: "lp01a4s06" description: "Small echoic room with AB microphone pickup, partial overlap between the talkers." source: ["f3_s8.wav", "m3_s8.wav"] IR: ["SEABP07.wav", "SEABP02.wav"] overlap: 1.0 cat5_1: - name: "C5P1.wav" + name: "lp01a5s01" description: "Large echoic room with AB microphone pickup, partial overlap between the talkers." source: ["f3_s9.wav", "m3_s9.wav"] IR: ["LEABP02.wav", "LEABP08.wav"] overlap: 1.0 cat5_2: - name: "C5P2.wav" + name: "lp01a5s02" description: "Large echoic room with AB microphone pickup, partial overlap between the talkers." source: ["m1_s9.wav", "f1_s9.wav"] IR: ["LEABP09.wav", "LEABP04.wav"] overlap: 1.0 cat5_3: - name: "C5P3.wav" + name: "lp01a5s03" description: "Large echoic room with AB microphone pickup, partial overlap between the talkers." source: ["f2_s9.wav", "m2_s9.wav"] IR: ["LEABP06.wav", "LEABP10.wav"] overlap: 1.0 cat5_4: - name: "C5P4.wav" + name: "lp01a5s04" description: "Large echoic room with AB microphone pickup, partial overlap between the talkers." source: ["m3_s10.wav", "f3_s10.wav"] IR: ["LEABP11.wav", "LEABP08.wav"] overlap: 1.0 cat5_5: - name: "C5P5.wav" + name: "lp01a5s05" description: "Large echoic room with AB microphone pickup, partial overlap between the talkers." source: ["f1_s10.wav", "m1_s10.wav"] IR: ["LEABP10.wav", "LEABP12.wav"] overlap: 1.0 cat5_6: - name: "C5P6.wav" + name: "lp01a5s06" description: "Large echoic room with AB microphone pickup, partial overlap between the talkers." source: ["m2_s10.wav", "f2_s10.wav"] IR: ["LEABP12.wav", "LEABP01.wav"] overlap: 1.0 cat6_1: - name: "C6P1.wav" + name: "lp01a6s01" description: "Small echoic room with binaural microphone pickup, no overlap between the talkers." 
source: ["m2_s11.wav", "f2_s11.wav"] IR: ["SEABP01.wav", "SEABP07.wav"] overlap: -1.0 cat6_2: - name: "C6P2.wav" + name: "lp01a6s02" description: "Small echoic room with binaural microphone pickup, no overlap between the talkers." source: ["f3_s11.wav", "m3_s11.wav"] IR: ["SEABP05.wav", "SEABP03.wav"] overlap: -1.0 cat6_3: - name: "C6P3.wav" + name: "lp01a6s03" description: "Small echoic room with binaural microphone pickup, no overlap between the talkers." source: ["m1_s11.wav", "f1_s11.wav"] IR: ["SEABP02.wav", "SEABP06.wav"] overlap: -1.0 cat6_4: - name: "C6P4.wav" + name: "lp01a6s04" description: "Small echoic room with binaural microphone pickup, no overlap between the talkers." source: ["f2_s12.wav", "m2_s12.wav"] IR: ["SEABP04.wav", "SEABP01.wav"] overlap: -1.0 cat6_5: - name: "C6P5.wav" + name: "lp01a6s05" description: "Small echoic room with binaural microphone pickup, no overlap between the talkers." source: ["m3_s12.wav", "f3_s12.wav"] IR: ["SEABP03.wav", "SEABP04.wav"] overlap: -1.0 cat6_6: - name: "C6P6.wav" + name: "lp01a6s06" description: "Small echoic room with binaural microphone pickup, no overlap between the talkers." source: ["f1_s12.wav", "m1_s12.wav"] IR: ["SEABP07.wav", "SEABP02.wav"] diff --git a/item_gen_configs/P800-2.yml b/item_gen_configs/P800-2.yml index 33ffa837..422eb55a 100644 --- a/item_gen_configs/P800-2.yml +++ b/item_gen_configs/P800-2.yml @@ -45,257 +45,270 @@ add_low_level_random_noise: true ### Specify the mono source filenames (the program will search for it in the input_path folder) ### Specify the stereo IR source filenames (the program will search for it in the input_path_IR folder) ### Specify the overlap length in seconds for each input source (negative value creates a gap) -### Note 1: use [val1, val2, ...] for multiple sources in a scene -### Note 2: use the "start:step:stop" notation for moving sources, where step will be applied in 20ms frames +### Note 1: use brackets [val1, val2, ...] 
for multiple sources in a scene +### Note 2: use the Matlab notation "start:step:stop" to create moving sources (step will be applied in 20ms frames) + +### Naming convention for P.800 items +### The filenames of the input content samples are represented by: +### leeeayszz.wav +### The filenames of the accompanying metadata files (applicable to metadata-assisted spatial audio, object-based audio) are represented by: +### leeeayszz.met for metadata-assisted spatial audio +### leeeayszz.wav.o.csv for object-based audio +### where: +### l stands for the listening lab designator (a through d according to Table 2) +### eee stands for the experiment designator, e.g. p01 (see Table 1) +### a stands for audio, and y is the per experiment category according to IVAS-8a +### s stands for sample and zz is the sample number; 01, 02, 03, 04, 05, 06, 07, where 07 is the preliminary +### o stands for object number; 0, 1, 2, 3 scenes: cat1_1: - name: "C1P1.wav" + name: "lp02a1s01" description: "Car with AB microphone pickup, no overlap between the talkers, car noise." source: ["f1_s1.wav", "m1_s1.wav"] IR: ["Car_TalkPos5_Stereo_M5_SinSweep_2chn.wav", "Car_TalkPos1_Stereo_M5_SinSweep_2chn.wav"] overlap: -1.0 cat1_2: - name: "C1P2.wav" + name: "lp02a1s02" description: "Car with AB microphone pickup, no overlap between the talkers, car noise." source: ["m2_s1.wav", "f2_s1.wav"] IR: ["Car_TalkPos2_Stereo_M5_SinSweep_2chn.wav", "Car_TalkPos5_Stereo_M5_SinSweep_2chn.wav"] overlap: -1.0 cat1_3: - name: "C1P3.wav" + name: "lp02a1s03" description: "Car with AB microphone pickup, no overlap between the talkers, car noise." source: ["f3_s1.wav", "m3_s1.wav"] IR: ["Car_TalkPos5_Stereo_M5_SinSweep_2chn.wav", "Car_TalkPos3_Stereo_M5_SinSweep_2chn.wav"] overlap: -1.0 cat1_4: - name: "C1P4.wav" + name: "lp02a1s04" description: "Car with AB microphone pickup, no overlap between the talkers, car noise."
source: ["m1_s2.wav", "f1_s2.wav"] IR: ["Car_TalkPos4_Stereo_M5_SinSweep_2chn.wav", "Car_TalkPos5_Stereo_M5_SinSweep_2chn.wav"] overlap: -1.0 cat1_5: - name: "C1P5.wav" + name: "lp02a1s05" description: "Car with AB microphone pickup, no overlap between the talkers, car noise." source: ["f2_s2.wav", "m2_s2.wav"] IR: ["Car_TalkPos2_Stereo_M5_SinSweep_2chn.wav", "Car_TalkPos4_Stereo_M5_SinSweep_2chn.wav"] overlap: -1.0 cat1_6: - name: "C1P6.wav"u + name: "lp02a1s06" description: "Car with AB microphone pickup, no overlap between the talkers, car noise." source: ["m3_s2.wav", "f3_s2.wav"] IR: ["Car_TalkPos3_Stereo_M5_SinSweep_2chn.wav", "Car_TalkPos2_Stereo_M5_SinSweep_2chn.wav"] overlap: -1.0 cat2_1: - name: "C2P1.wav" + name: "lp02a2s01" description: "Car with AB microphone pickup, no overlap between the talkers, street noise." source: ["m3_s3.wav", "f3_s3.wav"] IR: ["", ""] overlap: -1.0 cat2_2: - name: "C2P2.wav" + name: "lp02a2s02" description: "Car with AB microphone pickup, no overlap between the talkers, street noise." source: ["f1_s3.wav", "m1.wav"] IR: ["", ""] overlap: -1.0 cat2_3: - name: "C2P3.wav" + name: "lp02a2s03" description: "Car with AB microphone pickup, no overlap between the talkers, street noise." source: ["m2_s3.wav", "f2_s3.wav"] IR: ["", ""] overlap: -1.0 cat2_4: - name: "C2P4.wav" + name: "lp02a2s04" description: "Car with AB microphone pickup, no overlap between the talkers, street noise." source: ["f3_s4.wav", "m3_s4.wav"] IR: ["", ""] overlap: -1.0 cat2_5: - name: "C2P5.wav" + name: "lp02a2s05" description: "Car with AB microphone pickup, no overlap between the talkers, street noise." source: ["m1_s4.wav", "f1_s4.wav"] IR: ["", ""] overlap: -1.0 cat2_6: - name: "C2P6.wav" + name: "lp02a2s06" description: "Car with AB microphone pickup, no overlap between the talkers, street noise." 
source: ["f2_s4.wav", "m2_s4.wav"] IR: ["", ""] overlap: -1.0 cat3_1: - name: "C3P1.wav" + name: "lp02a3s01" description: "Small echoic room with MS microphone pickup, no overlap between the talkers, office noise." source: ["f2_s5.wav", "m2_s5.wav"] IR: ["SEMSP01.wav", "SEMSP07.wav"] overlap: -1.0 cat3_2: - name: "C3P2.wav" + name: "lp02a3s02" description: "Small echoic room with MS microphone pickup, no overlap between the talkers, office noise." source: ["m3_s5.wav", "f3_s5.wav"] IR: ["SEMSP05.wav", "SEMSP03.wav"] overlap: -1.0 cat3_3: - name: "C3P3.wav" + name: "lp02a3s03" description: "Small echoic room with MS microphone pickup, no overlap between the talkers, office noise." source: ["f1_s5.wav", "m1_s5.wav"] IR: ["SEMSP02.wav", "SEMSP06.wav"] overlap: -1.0 cat3_4: - name: "C3P4.wav" + name: "lp02a3s04" description: "Small echoic room with MS microphone pickup, no overlap between the talkers, office noise." source: ["m2_s6.wav", "f2_s6.wav"] IR: ["SEMSP04.wav", "SEMSP01.wav"] overlap: -1.0 cat3_5: - name: "C3P5.wav" + name: "lp02a3s05" description: "Small echoic room with MS microphone pickup, no overlap between the talkers, office noise." source: ["f3_s6.wav", "m3_s6.wav"] IR: ["SEMSP03.wav", "SEMSP04.wav"] overlap: -1.0 cat3_6: - name: "C3P6.wav" + name: "lp02a3s06" description: "Small echoic room with MS microphone pickup, no overlap between the talkers, office noise." source: ["m1_s6.wav", "f1_s6.wav"] IR: ["SEMSP07.wav", "SEMSP02.wav"] overlap: -1.0 cat4_1: - name: "C4P1.wav" + name: "lp02a4s01" description: "Small echoic room with AB microphone pickup, partial overlap between the talkers, office noise." source: ["m1_s7.wav", "f1_s7.wav"] IR: ["SEABP01.wav", "SEABP07.wav"] overlap: -1.0 cat4_2: - name: "C4P2.wav" + name: "lp02a4s02" description: "Small echoic room with AB microphone pickup, partial overlap between the talkers, office noise." 
source: ["f2_s7.wav", "m2_s7.wav"] IR: ["SEABP05.wav", "SEABP03.wav"] overlap: -1.0 cat4_3: - name: "C4P3.wav" + name: "lp02a4s03" description: "Small echoic room with AB microphone pickup, partial overlap between the talkers, office noise." source: ["m3_s7.wav", "f3_s7.wav"] IR: ["SEABP02.wav", "SEABP06.wav"] overlap: -1.0 cat4_4: - name: "C4P4.wav" + name: "lp02a4s04" description: "Small echoic room with AB microphone pickup, partial overlap between the talkers, office noise." source: ["f1_s8.wav", "m1_s8.wav"] IR: ["SEABP04.wav", "SEABP01.wav"] overlap: -1.0 cat4_5: - name: "C4P5.wav" + name: "lp02a4s05" description: "Small echoic room with AB microphone pickup, partial overlap between the talkers, office noise." source: ["m2_s8.wav", "f2_s8.wav"] IR: ["SEABP03.wav", "SEABP04.wav"] overlap: -1.0 cat4_6: - name: "C4P6.wav" + name: "lp02a4s06" description: "Small echoic room with AB microphone pickup, partial overlap between the talkers, office noise." source: ["f3_s8.wav", "m3_s8.wav"] IR: ["SEABP07.wav", "SEABP02.wav"] overlap: -1.0 cat5_1: - name: "C5P1.wav" + name: "lp02a5s01" description: "Large echoic room with AB microphone pickup, partial overlap between the talkers, office noise." source: ["f3_s9.wav", "m3_s9.wav"] IR: ["LEABP02.wav", "LEABP08.wav"] overlap: -1.0 cat5_2: - name: "C5P2.wav" + name: "lp02a5s02" description: "Large echoic room with AB microphone pickup, partial overlap between the talkers, office noise." source: ["m1_s9.wav", "f1_s9.wav"] IR: ["LEABP09.wav", "LEABP04.wav"] overlap: -1.0 cat5_3: - name: "C5P3.wav" + name: "lp02a5s03" description: "Large echoic room with AB microphone pickup, partial overlap between the talkers, office noise." source: ["f2_s9.wav", "m2_s9.wav"] IR: ["LEABP06.wav", "LEABP10.wav"] overlap: -1.0 cat5_4: - name: "C5P4.wav" + name: "lp02a5s04" description: "Large echoic room with AB microphone pickup, partial overlap between the talkers, office noise." 
source: ["m3_s10.wav", "f3_s10.wav"] IR: ["LEABP11.wav", "LEABP08.wav"] overlap: -1.0 cat5_5: - name: "C5P5.wav" + name: "lp02a5s05" description: "Large echoic room with AB microphone pickup, partial overlap between the talkers, office noise." source: ["f1_s10.wav", "m1_s10.wav"] IR: ["LEABP10.wav", "LEABP12.wav"] overlap: -1.0 cat5_6: - name: "C5P6.wav" + name: "lp02a5s06" description: "Large echoic room with AB microphone pickup, partial overlap between the talkers, office noise." source: ["m2_s10.wav", "f2_s10.wav"] IR: ["LEABP12.wav", "LEABP01.wav"] overlap: -1.0 cat6_1: - name: "C6P1.wav" + name: "lp02a6s01" description: "Small echoic room with binaural microphone pickup, no overlap between the talkers, office noise." source: ["m2_s11.wav", "f2_s11.wav"] IR: ["SEBIP01.wav", "SEBIP07.wav"] overlap: -1.0 cat6_2: - name: "C6P2.wav" + name: "lp02a6s02" description: "Small echoic room with binaural microphone pickup, no overlap between the talkers, office noise." source: ["f3_s11.wav", "m3_s11.wav"] IR: ["SEBIP05.wav", "SEBIP03.wav"] overlap: -1.0 cat6_3: - name: "C6P3.wav" + name: "lp02a6s03" description: "Small echoic room with binaural microphone pickup, no overlap between the talkers, office noise." source: ["m1_s11.wav", "f1_s11.wav"] IR: ["SEBIP02.wav", "SEBIP06.wav"] overlap: -1.0 cat6_4: - name: "C6P4.wav" + name: "lp02a6s04" description: "Small echoic room with binaural microphone pickup, no overlap between the talkers, office noise." source: ["f2_s12.wav", "m2_s12.wav"] IR: ["SEBIP04.wav", "SEBIP01.wav"] overlap: -1.0 cat6_5: - name: "C6P5.wav" + name: "lp02a6s05" description: "Small echoic room with binaural microphone pickup, no overlap between the talkers, office noise." source: ["m3_s12.wav", "f3_s12.wav"] IR: ["SEBIP03.wav", "SEBIP04.wav"] overlap: -1.0 cat6_6: - name: "C6P6.wav" + name: "lp02a6s06" description: "Small echoic room with binaural microphone pickup, no overlap between the talkers, office noise." 
source: ["f1_s12.wav", "m1_s12.wav"] IR: ["SEBIP07.wav", "SEBIP02.wav"] -- GitLab From f21915ae87ee3bc9a14e94e511bfdb9e0835b8a0 Mon Sep 17 00:00:00 2001 From: Vladimir Malenovsky Date: Tue, 30 May 2023 14:46:53 +0200 Subject: [PATCH 2/3] new naming convention from IVAS-7a in STERO tests --- item_gen_configs/P800-6.yml | 90 ++++++++++++++++++++---------------- item_gen_configs/P800-7.yml | 91 ++++++++++++++++++++----------------- 2 files changed, 100 insertions(+), 81 deletions(-) diff --git a/item_gen_configs/P800-6.yml b/item_gen_configs/P800-6.yml index 59003a44..689697f5 100644 --- a/item_gen_configs/P800-6.yml +++ b/item_gen_configs/P800-6.yml @@ -35,7 +35,7 @@ add_low_level_random_noise: true ### Scene description ################################################ -### Each scene must start with the sceneN tag +### Each scene must start with a unique tag ### Specify the mono source filename (the program will search for it in the input_path folder) ### Specify azimuth and elevation for each input source ### Note 1: use [val1, val2, ...] for multiple sources in a scene @@ -44,13 +44,23 @@ add_low_level_random_noise: true ### Note 3: we're using right-handed coordinate system with azi = 0 pointing from the nose to the screen ### azimuth: float, [-180,180]; positive indicates left ### elevation: float, [-90,90]; positive indicates up -### distance: float, tbd: default: 1 -### spread: float, [0,360]; spread in angles from 0 ... 360˚ -### gain: float, [0,1] + +### Naming convention for P.800 items +### The filenames of the input content samples are represented by: +### leeeayszz.wav +### The filenames of the accompanying metadata files (applicable to metadata-assisted spatial audio, object-based audio) are represented by: +### leeeayszz.met for metadata-assisted spatial audio +### leeeayszz.wav.o.csv for object-based audio +### where: +### l stands for the listening lab designator (a through d according to Table 2) +### eee stands for the experiment designator, e.g. 
p01 (see Table 1) +### a stands for audio, and y is the per experiment category according to IVAS-8a +### s stands for sample and zz is the sample number; 01, 02, 03, 04, 05, 06, 07, where 07 is the preliminary +### o stands for object number; 0, 1, 2, 3 scenes: a1: - name: "G1S1.wav" + name: "lp06a1s01" description: "Talker sitting at a table" source: ["m1_s1.wav", "m1_s7.wav"] azimuth: 0 @@ -58,7 +68,7 @@ scenes: overlap: -0.5 a2: - name: "G6S2.wav" + name: "lp06a1s02" description: "Talker sitting at a table" source: ["f3_s2.wav", "f3_s8.wav"] azimuth: 60 @@ -66,238 +76,238 @@ scenes: overlap: -0.5 a3: - name: "G5S3.wav" + name: "lp06a1s03" description: "Talker sitting at a table" source: ["m3_s3.wav", "m3_s9.wav"] azimuth: 120 elevation: 0 a4: - name: "G4S4.wav" + name: "lp06a1s04" description: "Talker sitting at a table" source: ["f2_s4.wav", "f2_s10.wav"] azimuth: 180 elevation: 0 a5: - name: "G3S5.wav" + name: "lp06a1s05" description: "Talker sitting at a table" source: ["m2_s5.wav", "m2_s11.wav"] azimuth: 240 elevation: 0 a6: - name: "G2S6.wav" + name: "lp06a1s06" description: "Talker sitting at a table" source: ["f1_s6.wav", "f1_s12.wav"] azimuth: 300 elevation: 0 b1: - name: "G2S1.wav" + name: "lp06a2s01" description: "standing talker." source: ["f1_s1.wav", "f1_s7.wav"] azimuth: 120 elevation: 35 b2: - name: "G1S2.wav" + name: "lp06a2s02" description: "standing talker." source: ["m1_s2.wav", "m1_s8.wav"] azimuth: 180 elevation: 35 b3: - name: "G6S3.wav" + name: "lp06a2s03" description: "standing talker." source: ["f3_s3.wav", "f3_s9.wav"] azimuth: 240 elevation: 35 b4: - name: "G5S4.wav" + name: "lp06a2s04" description: "standing talker." source: ["m3_s4.wav", "m3_s10.wav"] azimuth: 300 elevation: 35 b5: - name: "G4S5.wav" + name: "lp06a2s05" description: "standing talker." source: ["f2_s5.wav", "f2_s11.wav"] azimuth: 0 elevation: 35 b6: - name: "G3S6.wav" + name: "lp06a2s06" description: "standing talker."
source: ["m2_s6.wav", "m2_s12.wav"] azimuth: 60 elevation: 35 c1: - name: "G3S1.wav" + name: "lp06a3s01" description: "Smaller talker (child) walking around a table." source: ["m2_s1.wav", "m2_s7.wav"] azimuth: "0:1:360" elevation: 0 c2: - name: "G2S2.wav" + name: "lp06a3s02" description: "Smaller talker (child) walking around a table." source: ["f1_s2.wav", "f1_s8.wav"] azimuth: "60:1:60+360" elevation: 0 c3: - name: "G1S3.wav" + name: "lp06a3s03" description: "Smaller talker (child) walking around a table." source: ["m1_s3.wav", "m1_s9.wav"] azimuth: "120:1:120+360" elevation: 0 c4: - name: "G6S4.wav" + name: "lp06a3s04" description: "Smaller talker (child) walking around a table." source: ["f3_s4.wav", "f3_s10.wav"] azimuth: "180:1:180+360" elevation: 0 c5: - name: "G5S5.wav" + name: "lp06a3s05" description: "Smaller talker (child) walking around a table." source: ["m3_s5.wav", "m3_s11.wav"] azimuth: "240:1:240+360" elevation: 0 c6: - name: "G4S6.wav" + name: "lp06a3s06" description: "Smaller talker (child) walking around a table." source: ["f2_s6.wav", "f2_s12.wav"] azimuth: "300:1:300+360" elevation: 0 d1: - name: "G4S1.wav" + name: "lp06a4s01" description: "Talker walking around the table." source: ["f2_s1.wav", "f2_s7.wav"] azimuth: "0:-1:-360" elevation: 35 d2: - name: "G3S2.wav" + name: "lp06a4s02" description: "Talker walking around the table." source: ["m2_s2.wav", "m2_s8.wav"] azimuth: "60:-1:60-360" elevation: 35 d3: - name: "G2S3.wav" + name: "lp06a4s03" description: "Talker walking around the table." source: ["f1_s3.wav", "f1_s9.wav"] azimuth: "120:-1:120-360" elevation: 35 d4: - name: "G1S4.wav" + name: "lp06a4s04" description: "Talker walking around the table." source: ["m1_s4.wav", "m1_s10.wav"] azimuth: "180:-1:180-360" elevation: 35 d5: - name: "G6S5.wav" + name: "lp06a4s05" description: "Talker walking around the table."
source: ["f3_s5.wav", "f3_s11.wav"] azimuth: "240:-1:240-360" elevation: 35 d6: - name: "G5S6.wav" + name: "lp06a4s06" description: "Talker walking around the table." source: ["m3_s6.wav", "m3_s12.wav"] azimuth: "300:-1:300-360" elevation: 35 e1: - name: "G5S1.wav" + name: "lp06a5s01" description: "Elevation displacement." source: ["m3_s1.wav", "m3_s7.wav"] azimuth: 240 elevation: "-90:0.5:90" e2: - name: "G4S2.wav" + name: "lp06a5s02" description: "Elevation displacement." source: ["f2_s2.wav", "f2_s8.wav"] azimuth: 300 elevation: 0 e3: - name: "G3S3.wav" + name: "lp06a5s03" description: "Elevation displacement." source: ["m2_s3.wav", "m2_s9.wav"] azimuth: 0 elevation: "-90:0.5:90" e4: - name: "G2S4.wav" + name: "lp06a5s04" description: "Elevation displacement." source: ["f1_s4.wav", "f1_s10.wav"] azimuth: 60 elevation: "-90:0.5:90" e5: - name: "G1S5.wav" + name: "lp06a5s05" description: "Elevation displacement." source: ["m1_s5.wav", "m1_s11.wav"] azimuth: 120 elevation: "-90:0.5:90" e6: - name: "G6S6.wav" + name: "lp06a5s06" description: "Elevation displacement." source: ["f3_s6.wav", "f3_s12.wav"] azimuth: 180 elevation: "-90:0.5:90" f1: - name: "G6S1.wav" + name: "lp06a6s01" description: "Azimuth and elevation displacement." source: ["f3_s1.wav", "f3_s7.wav"] azimuth: "60:0.5:60+180" elevation: "35:-0.2:-35" f2: - name: "G5S2.wav" + name: "lp06a6s02" description: "Azimuth and elevation displacement." source: ["m3_s2.wav", "m3_s8.wav"] azimuth: "120:0.5:120+180" elevation: "35:-0.2:-35" f3: - name: "G4S3.wav" + name: "lp06a6s03" description: "Azimuth and elevation displacement." source: ["f2_s3.wav", "f2_s9.wav"] azimuth: "180:0.5:180+180" elevation: "35:-0.2:-35" f4: - name: "G3S4.wav" + name: "lp06a6s04" description: "Azimuth and elevation displacement." source: ["m2_s4.wav", "m2_s10.wav"] azimuth: "240:0.5:240+180" elevation: "35:-0.2:-35" f5: - name: "G2S5.wav" + name: "lp06a6s05" description: "Azimuth and elevation displacement." 
source: ["f1_s5.wav", "f1_s11.wav"] azimuth: "300:0.5:300+180" elevation: "35:-0.2:-35" f6: - name: "G1S6.wav" + name: "lp06a6s06" description: "Azimuth and elevation displacement." source: ["m1_s6.wav", "m1_s12.wav"] azimuth: "0:0.5:0+180" diff --git a/item_gen_configs/P800-7.yml b/item_gen_configs/P800-7.yml index db89d3f2..7b8e1bba 100644 --- a/item_gen_configs/P800-7.yml +++ b/item_gen_configs/P800-7.yml @@ -34,23 +34,32 @@ add_low_level_random_noise: true ### Scene description ################################################ -### Each scene must start with the sceneN tag +### Each scene must start with a unique tag ### Specify the mono source filename (the program will search for it in the input_path folder) ### Specify azimuth and elevation for each input source -### Specify the overlap length in seconds for each input source (negative value creates a gap) ### Note 1: use [val1, val2, ...] for multiple sources in a scene ### Note 2: use the "start:step:stop" notation for moving sources, where step will be applied in 20ms frames ### Note 3: we're using right-handed coordinate system with azi = 0 pointing from the nose to the screen ### azimuth: float, [-180,180]; positive indicates left ### elevation: float, [-90,90]; positive indicates up -### distance: float, tbd: default: 1 -### spread: float, [0,360]; spread in angles from 0 ... 360˚ -### gain: float, [0,1] + +### Naming convention for P.800 items +### The filenames of the input content samples are represented by: +### leeeayszz.wav +### The filenames of the accompanying metadata files (applicable to metadata-assisted spatial audio, object-based audio) are represented by: +### leeeayszz.met for metadata-assisted spatial audio +### leeeayszz.wav.o.csv for object-based audio +### where: +### l stands for the listening lab designator (a through d according to Table 2) +### eee stands for the experiment designator, e.g. 
p01 (see Table 1) +### a stands for audio, and y is the per experiment category according to IVAS-8a +### s stands for sample and zz is the sample number; 01, 02, 03, 04, 05, 06, 07, where 07 is the preliminary +### o stands for object number; 0, 1, 2, 3 scenes: a1: - name: "G1S1.wav" + name: "lp07a1s01" description: "Two talkers sitting at a table, at different azimuth angles with respect to the microphone, non-overlapping utterances." source: ["m1_s1.wav", "f1_s1.wav"] azimuth: [0, 50] @@ -58,7 +67,7 @@ scenes: overlap: -1.0 a2: - name: "G6S2.wav" + name: "lp07a1s02" description: "Two talkers sitting at a table, at different azimuth angles with respect to the microphone, non-overlapping utterances." source: ["f3_s8.wav", "m1_s8.wav"] azimuth: [50, 350] @@ -66,7 +75,7 @@ scenes: overlap: -1.0 a3: - name: "G5S3.wav" + name: "lp07a1s03" description: "Two talkers sitting at a table, at different azimuth angles with respect to the microphone, non-overlapping utterances." source: ["f2_s9.wav", "m3_s9.wav"] azimuth: [40, 290] @@ -74,7 +83,7 @@ scenes: overlap: -1.0 a4: - name: "G4S4.wav" + name: "lp07a1s04" description: "Two talkers sitting at a table, at different azimuth angles with respect to the microphone, non-overlapping utterances." source: ["f1_s10.wav", "m2_s10.wav"] azimuth: [30, 230] @@ -82,7 +91,7 @@ scenes: overlap: -1.0 a5: - name: "G3S5.wav" + name: "lp07a1s05" description: "Two talkers sitting at a table, at different azimuth angles with respect to the microphone, non-overlapping utterances." source: ["m3_s5.wav", "f3_s5.wav"] azimuth: [20, 170] @@ -90,7 +99,7 @@ scenes: overlap: -1.0 a6: - name: "G2S6.wav" + name: "lp07a1s06" description: "Two talkers sitting at a table, at different azimuth angles with respect to the microphone, non-overlapping utterances."
source: ["m2_s6.wav", "f2_s6.wav"] azimuth: [10, 110] @@ -98,7 +107,7 @@ scenes: overlap: -1.0 b1: - name: "G2S1.wav" + name: "lp07a2s01" description: "Two standing talkers, at different azimuth angles with respect to the microphone, ~30% overlapping utterances." source: ["m2_s1.wav", "f2_s1.wav"] azimuth: [20, 170] @@ -106,7 +115,7 @@ scenes: overlap: 1.0 b2: - name: "G1S2.wav" + name: "lp07a2s02" description: "Two standing talkers, at different azimuth angles with respect to the microphone, ~30% overlapping utterances." source: ["m1_s2.wav", "f1_s2.wav"] azimuth: [10, 110] @@ -114,7 +123,7 @@ scenes: overlap: 1.0 b3: - name: "G6S3.wav" + name: "lp07a2s03" description: "Two standing talkers, at different azimuth angles with respect to the microphone, ~30% overlapping utterances." source: ["f3_s9.wav", "m1_s9.wav"] azimuth: [0, 50] @@ -122,7 +131,7 @@ scenes: overlap: 1.0 b4: - name: "G5S4.wav" + name: "lp07a2s04" description: "Two standing talkers, at different azimuth angles with respect to the microphone, ~30% overlapping utterances." source: ["f2_s10.wav", "m3_s10.wav"] azimuth: [50, 350] @@ -130,7 +139,7 @@ scenes: overlap: 1.0 b5: - name: "G4S5.wav" + name: "lp07a2s05" description: "Two standing talkers, at different azimuth angles with respect to the microphone, ~30% overlapping utterances." source: ["f1_s11.wav", "m2_s11.wav"] azimuth: [40, 290] @@ -138,7 +147,7 @@ scenes: overlap: 1.0 b6: - name: "G3S6.wav" + name: "lp07a2s06" description: "Two standing talkers, at different azimuth angles with respect to the microphone, ~30% overlapping utterances." source: ["m3_s6.wav", "f3_s6.wav"] azimuth: [30, 230] @@ -146,7 +155,7 @@ scenes: overlap: 1.0 c1: - name: "G3S1.wav" + name: "lp07a3s01" description: "one talker sitting at a table, second talker standing beside the table, non-overlapping utterances." 
source: ["m3_s1.wav", "f3_s1.wav"] azimuth: [40, 290] @@ -154,7 +163,7 @@ scenes: overlap: -1.0 c2: - name: "G2S2.wav" + name: "lp07a3s02" description: "one talker sitting at a table, second talker standing beside the table, non-overlapping utterances." source: ["m2_s2.wav", "f2_s2.wav"] azimuth: [30, 230] @@ -162,7 +171,7 @@ scenes: overlap: -1.0 c3: - name: "G1S3.wav" + name: "lp07a3s03" description: "one talker sitting at a table, second talker standing beside the table, non-overlapping utterances." source: ["m1_s3.wav", "f1_s3.wav"] azimuth: [20, 170] @@ -170,7 +179,7 @@ scenes: overlap: -1.0 c4: - name: "G6S4.wav" + name: "lp07a3s04" description: "one talker sitting at a table, second talker standing beside the table, non-overlapping utterances." source: ["f3_s10.wav", "m1_s10.wav"] azimuth: [10, 110] @@ -178,7 +187,7 @@ scenes: overlap: -1.0 c5: - name: "G5S5.wav" + name: "lp07a3s05" description: "one talker sitting at a table, second talker standing beside the table, non-overlapping utterances." source: ["f2_s11.wav", "m3_s11.wav"] azimuth: [0, 50] @@ -186,7 +195,7 @@ scenes: overlap: -1.0 c6: - name: "G4S6.wav" + name: "lp07a3s06" description: "one talker sitting at a table, second talker standing beside the table, non-overlapping utterances." source: ["f1_s12.wav", "m2_s12.wav"] azimuth: [50, 350] @@ -194,7 +203,7 @@ scenes: overlap: -1.0 d1: - name: "G4S1.wav" + name: "lp07a4s01" description: "one talker sitting at a table, second talker walking around the table, ~30% overlapping utterances." source: ["f1_s7.wav", "m2_s7.wav"] azimuth: [50, "180:1:120 + 360"] @@ -202,7 +211,7 @@ scenes: overlap: 1.0 d2: - name: "G3S2.wav" + name: "lp07a4s02" description: "one talker sitting at a table, second talker walking around the table, ~30% overlapping utterances." 
source: ["m3_s2.wav", "f3_s2.wav"] azimuth: [300, "-70:-1:-10 - 360"] @@ -210,7 +219,7 @@ scenes: overlap: 1.0 d3: - name: "G2S3.wav" + name: "lp07a4s03" description: "one talker sitting at a table, second talker walking around the table, ~30% overlapping utterances." source: ["m2_s3.wav", "f2_s3.wav"] azimuth: [250, "-20:-1:-320"] @@ -218,7 +227,7 @@ scenes: overlap: 1.0 d4: - name: "G1S4.wav" + name: "lp07a4s04" description: "one talker sitting at a table, second talker walking around the table, ~30% overlapping utterances." source: ["m1_s4.wav", "f1_s4.wav"] azimuth: [200, "30:-1:-270"] @@ -226,7 +235,7 @@ scenes: overlap: 1.0 d5: - name: "G6S5.wav" + name: "lp07a4s05" description: "one talker sitting at a table, second talker walking around the table, ~30% overlapping utterances." source: ["f3_s11.wav", "m1_s11.wav"] azimuth: [150, "80:1:20 + 360"] @@ -234,7 +243,7 @@ scenes: overlap: 1.0 d6: - name: "G5S6.wav" + name: "lp07a4s06" description: "one talker sitting at a table, second talker walking around the table, ~30% overlapping utterances." 
source: ["f2_s12.wav", "m3_s12.wav"] azimuth: [100, "130:1:70 + 360"] @@ -242,7 +251,7 @@ scenes: overlap: 1.0 e1: - name: "G5S1.wav" + name: "lp07a5s01" description: "Two talkers walking side-by-side around the table, ~30% overlapping utterances" source: ["f2_s7.wav", "m3_s7.wav"] azimuth: ["80:1:20 + 360", "80:1:20 + 360"] @@ -250,7 +259,7 @@ scenes: overlap: 1.0 e2: - name: "G4S2.wav" + name: "lp07a5s02" description: "Two talkers walking side-by-side around the table, ~30% overlapping utterances" source: ["f1_s8.wav", "m2_s8.wav"] azimuth: ["130:1:70 + 360", "130:1:70 + 360"] @@ -258,7 +267,7 @@ scenes: overlap: 1.0 e3: - name: "G3S3.wav" + name: "lp07a5s03" description: "Two talkers walking side-by-side around the table, ~30% overlapping utterances" source: ["m3_s3.wav", "f3_s3.wav"] azimuth: ["180:1:120 + 360", "180:1:120 + 360"] @@ -266,7 +275,7 @@ scenes: overlap: 1.0 e4: - name: "G2S4.wav" + name: "lp07a5s04" description: "Two talkers walking side-by-side around the table, ~30% overlapping utterances" source: ["m2_s4.wav", "f2_s4.wav"] azimuth: ["-70:-1:-10 - 360", "-70:-1:-10 - 360"] @@ -274,7 +283,7 @@ scenes: overlap: 1.0 e5: - name: "G1S5.wav" + name: "lp07a5s05" description: "Two talkers walking side-by-side around the table, ~30% overlapping utterances" source: ["m1_s5.wav", "f1_s5.wav"] azimuth: ["-20:-1:-320", "-20:-1:-320"] @@ -282,7 +291,7 @@ scenes: overlap: 1.0 e6: - name: "G6S6.wav" + name: "lp07a5s06" description: "Two talkers walking side-by-side around the table, ~30% overlapping utterances" source: ["f3_s12.wav", "m1_s12.wav"] azimuth: ["30:-1:-270", "30:-1:-270"] @@ -290,7 +299,7 @@ scenes: overlap: 1.0 f1: - name: "G6S1.wav" + name: "lp07a6s01" description: "Two talkers walking around the table in opposite directions, non-overlapping utterances." 
source: ["f3_s7.wav", "m1_s7.wav"] azimuth: ["60:1:0 + 360", "60:-1:120 - 360"] @@ -298,7 +307,7 @@ scenes: overlap: -1.0 f2: - name: "G5S2.wav" + name: "lp07a6s02" description: "Two talkers walking around the table in opposite directions, non-overlapping utterances." source: ["f2_s8.wav", "m3_s8.wav"] azimuth: ["0:1:300", "0:-1:60 - 360"] @@ -306,7 +315,7 @@ scenes: overlap: -1.0 f3: - name: "G4S3.wav" + name: "lp07a6s03" description: "Two talkers walking around the table in opposite directions, non-overlapping utterances." source: ["f1_s9.wav", "m2_s9.wav"] azimuth: ["300:1:240 + 360", "300:-1:0"] @@ -314,7 +323,7 @@ scenes: overlap: -1.0 f4: - name: "G3S4.wav" + name: "lp07a6s04" description: "Two talkers walking around the table in opposite directions, non-overlapping utterances." source: ["m3_s4.wav", "f3_s4.wav"] azimuth: ["240:1:180 + 360", "240:-1:-60"] @@ -322,7 +331,7 @@ scenes: overlap: -1.0 f5: - name: "G2S5.wav" + name: "lp07a6s05" description: "Two talkers walking around the table in opposite directions, non-overlapping utterances." source: ["m2_s5.wav", "f2_s5.wav"] azimuth: ["180:1:120 + 360", "180:-1:-120"] @@ -330,7 +339,7 @@ scenes: overlap: -1.0 f6: - name: "G1S6.wav" + name: "lp07a6s06" description: "Two talkers walking around the table in opposite directions, non-overlapping utterances." source: ["m1_s6.wav", "f1_s6.wav"] azimuth: ["120:1:60 + 360", "120:-1:180 - 360"] -- GitLab From e897243efa886dce557ffb98c2914e9e57bc0f7b Mon Sep 17 00:00:00 2001 From: Vladimir Malenovsky Date: Tue, 30 May 2023 15:24:42 +0200 Subject: [PATCH 3/3] add free-field IRs in the P800-2 STEREO+bckgnd test (street env.) 
--- item_gen_configs/P800-2.yml | 10 +++++----- .../generation/IR/FreeField_IR_Python_AB_20cm_Pos0.wav | 3 +++ .../generation/IR/FreeField_IR_Python_AB_20cm_Pos1.wav | 3 +++ .../generation/IR/FreeField_IR_Python_AB_20cm_Pos2.wav | 3 +++ .../generation/IR/FreeField_IR_Python_AB_20cm_Pos3.wav | 3 +++ .../generation/IR/FreeField_IR_Python_AB_20cm_Pos4.wav | 3 +++ 6 files changed, 20 insertions(+), 5 deletions(-) create mode 100644 ivas_processing_scripts/generation/IR/FreeField_IR_Python_AB_20cm_Pos0.wav create mode 100644 ivas_processing_scripts/generation/IR/FreeField_IR_Python_AB_20cm_Pos1.wav create mode 100644 ivas_processing_scripts/generation/IR/FreeField_IR_Python_AB_20cm_Pos2.wav create mode 100644 ivas_processing_scripts/generation/IR/FreeField_IR_Python_AB_20cm_Pos3.wav create mode 100644 ivas_processing_scripts/generation/IR/FreeField_IR_Python_AB_20cm_Pos4.wav diff --git a/item_gen_configs/P800-2.yml b/item_gen_configs/P800-2.yml index 422eb55a..0df89d95 100644 --- a/item_gen_configs/P800-2.yml +++ b/item_gen_configs/P800-2.yml @@ -115,35 +115,35 @@ scenes: name: "lp02a2s02" description: "Car with AB microphone pickup, no overlap between the talkers, street noise." source: ["f1_s3.wav", "m1.wav"] - IR: ["", ""] + IR: ["FreeField_IR_Python_AB_20cm_Pos0.wav", "FreeField_IR_Python_AB_20cm_Pos1.wav"] overlap: -1.0 cat2_3: name: "lp02a2s03" description: "Car with AB microphone pickup, no overlap between the talkers, street noise." source: ["m2_s3.wav", "f2_s3.wav"] - IR: ["", ""] + IR: ["FreeField_IR_Python_AB_20cm_Pos2.wav", "FreeField_IR_Python_AB_20cm_Pos0.wav"] overlap: -1.0 cat2_4: name: "lp02a2s04" description: "Car with AB microphone pickup, no overlap between the talkers, street noise." source: ["f3_s4.wav", "m3_s4.wav"] - IR: ["", ""] + IR: ["FreeField_IR_Python_AB_20cm_Pos1.wav", "FreeField_IR_Python_AB_20cm_Pos3.wav"] overlap: -1.0 cat2_5: name: "lp02a2s05" description: "Car with AB microphone pickup, no overlap between the talkers, street noise." 
source: ["m1_s4.wav", "f1_s4.wav"] - IR: ["", ""] + IR: ["FreeField_IR_Python_AB_20cm_Pos4.wav", "FreeField_IR_Python_AB_20cm_Pos2.wav"] overlap: -1.0 cat2_6: name: "lp02a2s06" description: "Car with AB microphone pickup, no overlap between the talkers, street noise." source: ["f2_s4.wav", "m2_s4.wav"] - IR: ["", ""] + IR: ["FreeField_IR_Python_AB_20cm_Pos3.wav", "FreeField_IR_Python_AB_20cm_Pos4.wav"] overlap: -1.0 cat3_1: diff --git a/ivas_processing_scripts/generation/IR/FreeField_IR_Python_AB_20cm_Pos0.wav b/ivas_processing_scripts/generation/IR/FreeField_IR_Python_AB_20cm_Pos0.wav new file mode 100644 index 00000000..dab9ab5a --- /dev/null +++ b/ivas_processing_scripts/generation/IR/FreeField_IR_Python_AB_20cm_Pos0.wav @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d60467504761f1f531c84fa1d89816e34977d27494c4aec5f7ea7eefecbc8522 +size 984 diff --git a/ivas_processing_scripts/generation/IR/FreeField_IR_Python_AB_20cm_Pos1.wav b/ivas_processing_scripts/generation/IR/FreeField_IR_Python_AB_20cm_Pos1.wav new file mode 100644 index 00000000..801f97f5 --- /dev/null +++ b/ivas_processing_scripts/generation/IR/FreeField_IR_Python_AB_20cm_Pos1.wav @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0b1fe6ce5301e031574a84c4b789157a1596d41ba0b2d36320199bf1288f2b8 +size 984 diff --git a/ivas_processing_scripts/generation/IR/FreeField_IR_Python_AB_20cm_Pos2.wav b/ivas_processing_scripts/generation/IR/FreeField_IR_Python_AB_20cm_Pos2.wav new file mode 100644 index 00000000..0c5b820a --- /dev/null +++ b/ivas_processing_scripts/generation/IR/FreeField_IR_Python_AB_20cm_Pos2.wav @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34cad461f6ded9cb3bc7af0eef69b771515cb388c5d0fc263fd5a1baf86fccda +size 984 diff --git a/ivas_processing_scripts/generation/IR/FreeField_IR_Python_AB_20cm_Pos3.wav b/ivas_processing_scripts/generation/IR/FreeField_IR_Python_AB_20cm_Pos3.wav new file mode 100644 index 00000000..0c5b820a
--- /dev/null +++ b/ivas_processing_scripts/generation/IR/FreeField_IR_Python_AB_20cm_Pos3.wav @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34cad461f6ded9cb3bc7af0eef69b771515cb388c5d0fc263fd5a1baf86fccda +size 984 diff --git a/ivas_processing_scripts/generation/IR/FreeField_IR_Python_AB_20cm_Pos4.wav b/ivas_processing_scripts/generation/IR/FreeField_IR_Python_AB_20cm_Pos4.wav new file mode 100644 index 00000000..801f97f5 --- /dev/null +++ b/ivas_processing_scripts/generation/IR/FreeField_IR_Python_AB_20cm_Pos4.wav @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0b1fe6ce5301e031574a84c4b789157a1596d41ba0b2d36320199bf1288f2b8 +size 984 -- GitLab