diff --git a/.gitignore b/.gitignore index ebc9a2ed4d1758cbeebdeea0a42616d5bb75e78a..bb354bbe7ca2da5ab09fec4be60fe94316a61d70 100644 --- a/.gitignore +++ b/.gitignore @@ -11,8 +11,9 @@ venv/ *.bs *.192 mc.double -experiments/selection/*/proc_input/*.wav -experiments/selection/*/proc_input/*.pcm +experiments/selection/*/proc_input/cat*/*.wav +experiments/selection/*/proc_input/cat*/*.csv +experiments/selection/*/proc_input/cat*/*.pcm experiments/selection/*/proc_output/ experiments/selection/*/config/*cat*-lab_*.yml *~ diff --git a/item_gen_configs/P800-1.yml b/experiments/selection/P800-1/config/item_gen_P800-1.yml similarity index 89% rename from item_gen_configs/P800-1.yml rename to experiments/selection/P800-1/config/item_gen_P800-1.yml index b6e48e0e7cd1bcae7bd0692d8911a1f00d6553d3..6b89a00d969671159bf625f6780d422e7dbe68c9 100644 --- a/item_gen_configs/P800-1.yml +++ b/experiments/selection/P800-1/config/item_gen_P800-1.yml @@ -146,6 +146,13 @@ scenes: source: ["m3s02.wav", "f3s02.wav"] IR: ["IR_g_p01_a_07_00_stAB100.wav", "IR_g_p01_a_02_00_stAB100.wav"] overlap: 1.0 + + cat1_7: + name: "cat1/a1s07.wav" + description: "Preliminary: Small anechoic room with AB microphone pickup, partial overlap between the talkers." + source: ["f1s13.wav", "m1s13.wav"] + IR: ["IR_g_p01_a_01_00_stAB100.wav", "IR_g_p01_a_07_00_stAB100.wav"] + overlap: 1.0 cat2_1: name: "cat2/a2s01.wav" @@ -189,6 +196,13 @@ scenes: IR: ["IR_g_p01_c_10_00_stAB150.wav", "IR_g_p01_c_09_00_stAB150.wav"] overlap: -1.0 + cat2_7: + name: "cat2/a2s07.wav" + description: "Preliminary: Large anechoic room with AB microphone pickup, no overlap between the talkers." + source: ["m2s13.wav", "f2s13.wav"] + IR: ["IR_g_p01_c_05_00_stAB150.wav", "IR_g_p01_c_11_00_stAB150.wav"] + overlap: -1.0 + cat3_1: name: "cat3/a3s01.wav" description: "Small anechoic room with MS microphone pickup, no overlap between the talkers." 
@@ -231,6 +245,13 @@ scenes: IR: ["IR_g_p01_a_07_00_stMS100.wav", "IR_g_p01_a_02_00_stMS100.wav"] overlap: -1.0 + cat3_7: + name: "cat3/a3s07.wav" + description: "Preliminary: Small anechoic room with MS microphone pickup, no overlap between the talkers." + source: ["f3s13.wav", "m3s13.wav"] + IR: ["IR_g_p01_a_02_00_stMS100.wav", "IR_g_p01_a_06_00_stMS100.wav"] + overlap: -1.0 + cat4_1: name: "cat4/a4s01.wav" description: "Small echoic room with AB microphone pickup, partial overlap between the talkers." @@ -273,6 +294,13 @@ scenes: IR: ["IR_g_p01_b_07_00_stAB100.wav", "IR_g_p01_b_02_00_stAB100.wav"] overlap: 1.0 + cat4_7: + name: "cat4/a4s07.wav" + description: "Preliminary: Small echoic room with AB microphone pickup, partial overlap between the talkers." + source: ["m1s14.wav", "f1s14.wav"] + IR: ["IR_g_p01_b_04_00_stAB100.wav", "IR_g_p01_b_01_00_stAB100.wav"] + overlap: 1.0 + cat5_1: name: "cat5/a5s01.wav" description: "Large echoic room with AB microphone pickup, partial overlap between the talkers." @@ -315,6 +343,13 @@ scenes: IR: ["IR_g_p01_d_12_00_stAB150.wav", "IR_g_p01_d_01_00_stAB150.wav"] overlap: 1.0 + cat5_7: + name: "cat5/a5s07.wav" + description: "Preliminary: Large echoic room with AB microphone pickup, partial overlap between the talkers." + source: ["f2s14.wav", "m2s14.wav"] + IR: ["IR_g_p01_d_10_00_stAB150.wav", "IR_g_p01_d_12_00_stAB150.wav"] + overlap: 1.0 + cat6_1: name: "cat6/a6s01.wav" description: "Small echoic room with binaural microphone pickup, no overlap between the talkers." @@ -357,3 +392,9 @@ scenes: IR: ["IR_g_p01_b_07_00_stBI100.wav", "IR_g_p01_b_02_00_stBI100.wav"] overlap: -1.0 + cat6_7: + name: "cat6/a6s07.wav" + description: "Preliminary: Small echoic room with binaural microphone pickup, no overlap between the talkers." 
+ source: ["m2s14.wav", "f2s14.wav"] + IR: ["IR_g_p01_b_07_00_stBI100.wav", "IR_g_p01_b_02_00_stBI100.wav"] + overlap: -1.0 diff --git a/item_gen_configs/P800-2.yml b/experiments/selection/P800-2/config/item_gen_P800-2.yml similarity index 89% rename from item_gen_configs/P800-2.yml rename to experiments/selection/P800-2/config/item_gen_P800-2.yml index 84b0e95dd5b6de0dbe7816dc1059b4aace5d1ecc..d929ae6cf53ebdb9cfd69fc60919ee5b4071ed2b 100644 --- a/item_gen_configs/P800-2.yml +++ b/experiments/selection/P800-2/config/item_gen_P800-2.yml @@ -145,6 +145,13 @@ scenes: IR: ["Car_TalkPos3_Stereo_M5_SinSweep_2chn.wav", "Car_TalkPos2_Stereo_M5_SinSweep_2chn.wav"] overlap: -1.0 + cat1_7: + name: "cat1/a1s07.wav" + description: "Preliminary: Car with AB microphone pickup, no overlap between the talkers, car noise." + source: ["f1s13.wav", "m1s13.wav"] + IR: ["Car_TalkPos5_Stereo_M5_SinSweep_2chn.wav", "Car_TalkPos1_Stereo_M5_SinSweep_2chn.wav"] + overlap: -1.0 + cat2_1: name: "cat2/a2s01.wav" description: "Car with AB microphone pickup, no overlap between the talkers, street noise." @@ -187,6 +194,13 @@ scenes: IR: ["FreeField_IR_Python_AB_20cm_Pos3.wav", "FreeField_IR_Python_AB_20cm_Pos0.wav"] overlap: -1.0 + cat2_7: + name: "cat2/a2s07.wav" + description: "Preliminary: Street conversation with AB microphone pickup, no overlap between the talkers, street noise." + source: ["m2s13.wav", "f2s13.wav"] + IR: ["FreeField_IR_Python_AB_20cm_Pos0.wav", "FreeField_IR_Python_AB_20cm_Pos1.wav"] + overlap: -1.0 + cat3_1: name: "cat3/a3s01.wav" description: "Small echoic room with MS microphone pickup, no overlap between the talkers, office noise." @@ -229,6 +243,13 @@ scenes: IR: ["IR_g_p02_b_07_00_stMS100.wav", "IR_g_p02_b_02_00_stMS100.wav"] overlap: -1.0 + cat3_7: + name: "cat3/a3s07.wav" + description: "Preliminary: Small echoic room with MS microphone pickup, no overlap between the talkers, office noise." 
+ source: ["f3s13.wav", "m3s13.wav"] + IR: ["IR_g_p02_b_02_00_stMS100.wav", "IR_g_p02_b_06_00_stMS100.wav"] + overlap: -1.0 + cat4_1: name: "cat4/a4s01.wav" description: "Small echoic room with AB microphone pickup, partial overlap between the talkers, office noise." @@ -271,6 +292,13 @@ scenes: IR: ["IR_g_p02_b_07_00_stAB100.wav", "IR_g_p02_b_02_00_stAB100.wav"] overlap: -1.0 + cat4_7: + name: "cat4/a4s07.wav" + description: "Preliminary: Small echoic room with AB microphone pickup, partial overlap between the talkers, office noise." + source: ["f1s14.wav", "m1s14.wav"] + IR: ["IR_g_p02_b_04_00_stAB100.wav", "IR_g_p02_b_01_00_stAB100.wav"] + overlap: -1.0 + cat5_1: name: "cat5/a5s01.wav" description: "Large echoic room with AB microphone pickup, partial overlap between the talkers, office noise." @@ -313,6 +341,13 @@ scenes: IR: ["IR_g_p02_d_12_00_stAB150.wav", "IR_g_p02_d_01_00_stAB150.wav"] overlap: -1.0 + cat5_7: + name: "cat5/a5s07.wav" + description: "Preliminary: Large echoic room with AB microphone pickup, partial overlap between the talkers, office noise." + source: ["m2s14.wav", "f2s14.wav"] + IR: ["IR_g_p02_d_10_00_stAB150.wav", "IR_g_p02_d_12_00_stAB150.wav"] + overlap: -1.0 + cat6_1: name: "cat6/a6s01.wav" description: "Small echoic room with binaural microphone pickup, no overlap between the talkers, office noise." @@ -354,4 +389,11 @@ scenes: source: ["f1s12.wav", "m1s12.wav"] IR: ["IR_g_p02_b_07_00_stBI100.wav", "IR_g_p02_b_02_00_stBI100.wav"] overlap: -1.0 + + cat6_7: + name: "cat6/a6s07.wav" + description: "Preliminary: Small echoic room with binaural microphone pickup, no overlap between the talkers, office noise." 
+ source: ["f3s14.wav", "m3s14.wav"] + IR: ["IR_g_p02_b_07_00_stBI100.wav", "IR_g_p02_b_02_00_stBI100.wav"] + overlap: -1.0 \ No newline at end of file diff --git a/item_gen_configs/P800-4.yml b/experiments/selection/P800-4/config/item_gen_P800-4.yml similarity index 90% rename from item_gen_configs/P800-4.yml rename to experiments/selection/P800-4/config/item_gen_P800-4.yml index 540f7ffc4524b05c8abff323b3605d4473907b58..e2560d4669daa27cd78f09e0e9c80beb5f1cfcf5 100644 --- a/item_gen_configs/P800-4.yml +++ b/experiments/selection/P800-4/config/item_gen_P800-4.yml @@ -155,6 +155,14 @@ scenes: overlap: 0.5 format: "FOA" + cat1_7: + name: "cat1/a1s07.wav" + description: "Preliminary: " + source: ["f1s13.wav", "m1s13.wav"] + IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + overlap: 0.5 + format: "FOA" + cat2_1: name: "cat2/a2s01.wav" description: "" @@ -203,6 +211,14 @@ scenes: overlap: 0.5 format: "FOA" + cat2_7: + name: "cat2/a2s07.wav" + description: "Preliminary:" + source: ["m2s13.wav", "f2s13.wav"] + IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + overlap: 0.5 + format: "FOA" + cat3_1: name: "cat3/a3s01.wav" description: "" @@ -218,7 +234,7 @@ scenes: IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] overlap: 0.5 format: "FOA" - + cat3_3: name: "cat3/a3s03.wav" description: "" @@ -251,6 +267,14 @@ scenes: overlap: 0.5 format: "FOA" + cat3_7: + name: "cat3/a3s07.wav" + description: "Preliminary: " + source: ["f3s13.wav", "m3s13.wav"] + IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + overlap: 0.5 + format: "FOA" + cat4_1: name: "cat4/a4s01.wav" description: "" @@ -299,6 +323,14 @@ scenes: overlap: 0.5 format: "FOA" + cat4_7: + name: "cat4/a4s07.wav" + description: "Preliminary: " + source: ["m1s14.wav", "f1s14.wav"] + IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + overlap: 0.5 + format: "FOA" + cat5_1: name: "cat5/a5s01.wav" description: "" @@ -347,6 +379,14 @@ scenes: overlap: 0.5 
format: "FOA" + cat5_7: + name: "cat5/a5s07.wav" + description: "Preliminary: " + source: ["f2s14.wav", "m2s14.wav"] + IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + overlap: 0.5 + format: "FOA" + cat6_1: name: "cat6/a6s01.wav" description: "" @@ -395,4 +435,11 @@ scenes: overlap: 0.5 format: "FOA" + cat6_7: + name: "cat6/a6s07.wav" + description: "Preliminary:" + source: ["m3s14.wav", "f3s14.wav"] + IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + overlap: 0.5 + format: "FOA" diff --git a/item_gen_configs/P800-5.yml b/experiments/selection/P800-5/config/item_gen_P800-5.yml similarity index 90% rename from item_gen_configs/P800-5.yml rename to experiments/selection/P800-5/config/item_gen_P800-5.yml index 0fad95cb09354fd583e08ecf5007af9854008bc8..64d8ec8e7d49a59c880454ad51bf7c919abce09a 100644 --- a/item_gen_configs/P800-5.yml +++ b/experiments/selection/P800-5/config/item_gen_P800-5.yml @@ -155,6 +155,14 @@ scenes: overlap: 0.5 format: "FOA" + cat1_7: + name: "cat1/a1s07.wav" + description: "Preliminary: " + source: ["f1s13.wav", "m1s13.wav"] + IR: ["IR_do_p05_e_01_01_FOA.wav", "IR_do_p05_e_02_01_FOA.wav"] + overlap: 0.5 + format: "FOA" + cat2_1: name: "cat2/a2s01.wav" description: "" @@ -203,6 +211,14 @@ scenes: overlap: 0.5 format: "FOA" + cat2_7: + name: "cat2/a2s07.wav" + description: "" + source: ["m2s13.wav", "f2s13.wav"] + IR: ["IR_do_p05_e_01_01_FOA.wav", "IR_do_p05_e_02_01_FOA.wav"] + overlap: 0.5 + format: "FOA" + cat3_1: name: "cat3/a3s01.wav" description: "" @@ -251,6 +267,14 @@ scenes: overlap: 0.5 format: "FOA" + cat3_7: + name: "cat3/a3s07.wav" + description: "Preliminary: " + source: ["f3s13.wav", "m3s13.wav"] + IR: ["IR_do_p05_e_01_01_FOA.wav", "IR_do_p05_e_02_01_FOA.wav"] + overlap: 0.5 + format: "FOA" + cat4_1: name: "cat4/a4s01.wav" description: "" @@ -299,6 +323,14 @@ scenes: overlap: 0.5 format: "FOA" + cat4_7: + name: "cat4/a4s07.wav" + description: "Preliminary: " + source: ["m1s14.wav", "f1s14.wav"] + IR: 
["IR_do_p05_e_01_01_FOA.wav", "IR_do_p05_e_02_01_FOA.wav"] + overlap: 0.5 + format: "FOA" + cat5_1: name: "cat5/a5s01.wav" description: "" @@ -347,6 +379,14 @@ scenes: overlap: 0.5 format: "FOA" + cat5_7: + name: "cat5/a5s07.wav" + description: "Preliminary: " + source: ["f2s14.wav", "m2s14.wav"] + IR: ["IR_do_p05_e_01_01_FOA.wav", "IR_do_p05_e_02_01_FOA.wav"] + overlap: 0.5 + format: "FOA" + cat6_1: name: "cat6/a6s01.wav" description: "" @@ -395,4 +435,11 @@ scenes: overlap: 0.5 format: "FOA" + cat6_7: + name: "cat6/a6s07.wav" + description: "Preliminary:" + source: ["m3s14.wav", "f3s14.wav"] + IR: ["IR_do_p05_e_01_01_FOA.wav", "IR_do_p05_e_02_01_FOA.wav"] + overlap: 0.5 + format: "FOA" diff --git a/item_gen_configs/P800-6.yml b/experiments/selection/P800-6/config/item_gen_P800-6.yml similarity index 88% rename from item_gen_configs/P800-6.yml rename to experiments/selection/P800-6/config/item_gen_P800-6.yml index 2885adf12334189cc16415b625b045459c7480d5..1cddf5bc2e630ef739e6034299d79498c2b7ed9e 100644 --- a/item_gen_configs/P800-6.yml +++ b/experiments/selection/P800-6/config/item_gen_P800-6.yml @@ -134,9 +134,17 @@ scenes: elevation: 0 overlap: -1.0 + cat1_7: + name: "cat1/a1s07.wav" + description: "Preliminary: Talker sitting at a table" + source: ["f1s13.wav", "f1s14.wav"] + azimuth: 0 + elevation: 0 + overlap: -1.0 + cat2_1: name: "cat2/a2s01.wav" - description: "standing talker." + description: "Standing talker." source: ["f1s01.wav", "f1s07.wav"] azimuth: 120 elevation: 35 @@ -144,7 +152,7 @@ scenes: cat2_2: name: "cat2/a2s02.wav" - description: "standing talker." + description: "Standing talker." source: ["m1s02.wav", "m1s08.wav"] azimuth: 180 elevation: 35 @@ -152,7 +160,7 @@ scenes: cat2_3: name: "cat2/a2s03.wav" - description: "standing talker." + description: "Standing talker." source: ["f3s03.wav", "f3s09.wav"] azimuth: 240 elevation: 35 @@ -160,7 +168,7 @@ scenes: cat2_4: name: "cat2/a2s04.wav" - description: "standing talker." 
+ description: "Standing talker." source: ["m3s04.wav", "m3s10.wav"] azimuth: 300 elevation: 35 @@ -168,7 +176,7 @@ scenes: cat2_5: name: "cat2/a2s05.wav" - description: "standing talker." + description: "Standing talker." source: ["f2s05.wav", "f2s11.wav"] azimuth: 0 elevation: 35 @@ -176,12 +184,20 @@ scenes: cat2_6: name: "cat2/a2s06.wav" - description: "standing talker." + description: "Standing talker." source: ["m2s06.wav", "m2s12.wav"] azimuth: 60 elevation: 35 overlap: -1.0 + cat2_7: + name: "cat2/a2s07.wav" + description: "Preliminary: Standing talker." + source: ["m1s13.wav", "m1s14.wav"] + azimuth: 180 + elevation: 35 + overlap: -1.0 + cat3_1: name: "cat3/a3s01.wav" description: "Smaller talker (child) walking around a table." @@ -230,6 +246,14 @@ scenes: elevation: 0 overlap: -1.0 + cat3_7: + name: "cat3/a3s07.wav" + description: "Preliminary: Smaller talker (child) walking around a table." + source: ["f2s13.wav", "f2s14.wav"] + azimuth: "120:1:120+360" + elevation: 0 + overlap: -1.0 + cat4_1: name: "cat4/a4s01.wav" description: "Talker walking around the table." @@ -277,6 +301,14 @@ scenes: azimuth: "300:-1:300-360" elevation: 35 overlap: -1.0 + + cat4_7: + name: "cat4/a4s07.wav" + description: "Preliminary: Talker walking around the table." + source: ["m2s13.wav", "m2s14.wav"] + azimuth: "180:-1:180-360" + elevation: 35 + overlap: -1.0 cat5_1: name: "cat5/a5s01.wav" @@ -326,6 +358,14 @@ scenes: elevation: "-90:0.5:90" overlap: -1.0 + cat5_7: + name: "cat5/a5s07.wav" + description: "Preliminary: Elevation displacement." + source: ["f3s13.wav", "f3s14.wav"] + azimuth: 120 + elevation: "-90:0.5:90" + overlap: -1.0 + cat6_1: name: "cat6/a6s01.wav" description: "Azimuth and elevation displacement." @@ -373,4 +413,12 @@ scenes: azimuth: "0:0.5:0+180" elevation: "35:-0.2:-35" overlap: -1.0 + + cat6_7: + name: "cat6/a6s07.wav" + description: "Preliminary: Azimuth and elevation displacement." 
+ source: ["m3s13.wav", "m3s14.wav"] + azimuth: "0:0.5:0+180" + elevation: "35:-0.2:-35" + overlap: -1.0 \ No newline at end of file diff --git a/item_gen_configs/P800-7.yml b/experiments/selection/P800-7/config/item_gen_P800-7.yml similarity index 84% rename from item_gen_configs/P800-7.yml rename to experiments/selection/P800-7/config/item_gen_P800-7.yml index dc92d089b3ab22d3037193f65ed9c858442d2596..6a5f7a2ed8b7812058d7a4b5cdcda6152a9ab489 100644 --- a/item_gen_configs/P800-7.yml +++ b/experiments/selection/P800-7/config/item_gen_P800-7.yml @@ -133,6 +133,14 @@ scenes: elevation: [15, 15] overlap: -1.0 + cat1_7: + name: "cat1/a1s07.wav" + description: "Preliminary: Two talkers sitting at a table, at different azimuth angles with respect to the microphone, non-overlapping utterances." + source: ["m1s13.wav", "f1s13.wav"] + azimuth: [0, 50] + elevation: [0, 0] + overlap: -1.0 + cat2_1: name: "cat2/a2s01.wav" description: "Two standing talkers, at different azimuth angles with respect to the microphone, ~30% overlapping utterances." @@ -181,9 +189,17 @@ scenes: elevation: [60, 60] overlap: 1.0 + cat2_7: + name: "cat2/a2s07.wav" + description: "Preliminary: Two standing talkers, at different azimuth angles with respect to the microphone, ~30% overlapping utterances." + source: ["f2s13.wav", "m2s13.wav"] + azimuth: [10, 110] + elevation: [30, 30] + overlap: 1.0 + cat3_1: name: "cat3/a3s01.wav" - description: "one talker sitting at a table, second talker standing beside the table, non-overlapping utterances." + description: "One talker sitting at a table, second talker standing beside the table, non-overlapping utterances." source: ["m3s01.wav", "f3s01.wav"] azimuth: [40, 290] elevation: [0, 60] @@ -191,7 +207,7 @@ scenes: cat3_2: name: "cat3/a3s02.wav" - description: "one talker sitting at a table, second talker standing beside the table, non-overlapping utterances." 
+ description: "One talker sitting at a table, second talker standing beside the table, non-overlapping utterances." source: ["m2s02.wav", "f2s02.wav"] azimuth: [30, 230] elevation: [0, 60] @@ -199,7 +215,7 @@ scenes: cat3_3: name: "cat3/a3s03.wav" - description: "one talker sitting at a table, second talker standing beside the table, non-overlapping utterances." + description: "One talker sitting at a table, second talker standing beside the table, non-overlapping utterances." source: ["m1s03.wav", "f1s03.wav"] azimuth: [20, 170] elevation: [0, 60] @@ -207,7 +223,7 @@ scenes: cat3_4: name: "cat3/a3s04.wav" - description: "one talker sitting at a table, second talker standing beside the table, non-overlapping utterances." + description: "One talker sitting at a table, second talker standing beside the table, non-overlapping utterances." source: ["f3s10.wav", "m1s10.wav"] azimuth: [10, 110] elevation: [0, 60] @@ -215,7 +231,7 @@ scenes: cat3_5: name: "cat3/a3s05.wav" - description: "one talker sitting at a table, second talker standing beside the table, non-overlapping utterances." + description: "One talker sitting at a table, second talker standing beside the table, non-overlapping utterances." source: ["f2s11.wav", "m3s11.wav"] azimuth: [0, 50] elevation: [0, 60] @@ -223,15 +239,23 @@ scenes: cat3_6: name: "cat3/a3s06.wav" - description: "one talker sitting at a table, second talker standing beside the table, non-overlapping utterances." + description: "One talker sitting at a table, second talker standing beside the table, non-overlapping utterances." source: ["f1s12.wav", "m2s12.wav"] azimuth: [50, 350] elevation: [0, 60] overlap: -1.0 + cat3_7: + name: "cat3/a3s07.wav" + description: "Preliminary: One talker sitting at a table, second talker standing beside the table, non-overlapping utterances." 
+ source: ["m3s13.wav", "f3s13.wav"] + azimuth: [20, 170] + elevation: [0, 60] + overlap: -1.0 + cat4_1: name: "cat4/a4s01.wav" - description: "one talker sitting at a table, second talker walking around the table, ~30% overlapping utterances." + description: "One talker sitting at a table, second talker walking around the table, ~30% overlapping utterances." source: ["f1s07.wav", "m2s07.wav"] azimuth: [50, "180:1:120 + 360"] elevation: [0, 60] @@ -239,7 +263,7 @@ scenes: cat4_2: name: "cat4/a4s02.wav" - description: "one talker sitting at a table, second talker walking around the table, ~30% overlapping utterances." + description: "One talker sitting at a table, second talker walking around the table, ~30% overlapping utterances." source: ["m3s02.wav", "f3s02.wav"] azimuth: [300, "-70:-1:-10 - 360"] elevation: [0, 60] @@ -247,7 +271,7 @@ scenes: cat4_3: name: "cat4/a4s03.wav" - description: "one talker sitting at a table, second talker walking around the table, ~30% overlapping utterances." + description: "One talker sitting at a table, second talker walking around the table, ~30% overlapping utterances." source: ["m2s03.wav", "f2s03.wav"] azimuth: [250, "-20:-1:-320"] elevation: [0, 60] @@ -255,7 +279,7 @@ scenes: cat4_4: name: "cat4/a4s04.wav" - description: "one talker sitting at a table, second talker walking around the table, ~30% overlapping utterances." + description: "One talker sitting at a table, second talker walking around the table, ~30% overlapping utterances." source: ["m1s04.wav", "f1s04.wav"] azimuth: [200, "30:-1:-270"] elevation: [0, 60] @@ -263,7 +287,7 @@ scenes: cat4_5: name: "cat4/a4s05.wav" - description: "one talker sitting at a table, second talker walking around the table, ~30% overlapping utterances." + description: "One talker sitting at a table, second talker walking around the table, ~30% overlapping utterances." 
source: ["f3s11.wav", "m1s11.wav"] azimuth: [150, "80:1:20 + 360"] elevation: [0, 60] @@ -271,12 +295,20 @@ scenes: cat4_6: name: "cat4/a4s06.wav" - description: "one talker sitting at a table, second talker walking around the table, ~30% overlapping utterances." + description: "One talker sitting at a table, second talker walking around the table, ~30% overlapping utterances." source: ["f2s12.wav", "m3s12.wav"] azimuth: [100, "130:1:70 + 360"] elevation: [0, 60] overlap: 1.0 + cat4_7: + name: "cat4/a4s07.wav" + description: "Preliminary: One talker sitting at a table, second talker walking around the table, ~30% overlapping utterances." + source: ["f1s14.wav", "m1s14.wav"] + azimuth: [200, "30:-1:-270"] + elevation: [0, 60] + overlap: 1.0 + cat5_1: name: "cat5/a5s01.wav" description: "Two talkers walking side-by-side around the table, ~30% overlapping utterances" @@ -325,6 +357,14 @@ scenes: elevation: [10, 60] overlap: 1.0 + cat5_7: + name: "cat5/a5s07.wav" + description: "Preliminary: Two talkers walking side-by-side around the table, ~30% overlapping utterances" + source: ["m2s14.wav", "f2s14.wav"] + azimuth: ["-20:-1:-320", "-20:-1:-320"] + elevation: [10, 60] + overlap: 1.0 + cat6_1: name: "cat6/a6s01.wav" description: "Two talkers walking around the table in opposite directions, non-overlapping utterances." @@ -372,4 +412,12 @@ scenes: azimuth: ["120:1:60 + 360", "120:-1:180 - 360"] elevation: [20, 50] overlap: -1.0 + + cat6_7: + name: "cat6/a6s07.wav" + description: "Preliminary: Two talkers walking around the table in opposite directions, non-overlapping utterances." 
+ source: ["f3s14.wav", "m3s14.wav"] + azimuth: ["120:1:60 + 360", "120:-1:180 - 360"] + elevation: [20, 50] + overlap: -1.0 \ No newline at end of file diff --git a/item_gen_configs/P800-8.yml b/experiments/selection/P800-8/config/item_gen_P800-8.yml similarity index 72% rename from item_gen_configs/P800-8.yml rename to experiments/selection/P800-8/config/item_gen_P800-8.yml index 8916d0c21af8d650b15c3fd321cefd3fb25bd649..b13ea5d4adfa4564e00138e4bd9ffdac404d0498 100644 --- a/item_gen_configs/P800-8.yml +++ b/experiments/selection/P800-8/config/item_gen_P800-8.yml @@ -111,7 +111,7 @@ scenes: name: "cat1/a1s01.wav" description: "" source: ["f1s01.wav", "m1s01.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["IR_do_p08_e_01_01_FOA.wav", "IR_do_p08_e_02_01_FOA.wav"] overlap: 0.5 format: "FOA" @@ -119,7 +119,7 @@ scenes: name: "cat1/a1s02.wav" description: "" source: ["m2s01.wav", "f2s01.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["IR_do_p08_e_01_01_FOA.wav", "IR_do_p08_e_02_01_FOA.wav"] overlap: 0.5 format: "FOA" @@ -127,7 +127,7 @@ scenes: name: "cat1/a1s03.wav" description: "" source: ["f3s01.wav", "m3s01.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["IR_do_p08_e_01_01_FOA.wav", "IR_do_p08_e_02_01_FOA.wav"] overlap: 0.5 format: "FOA" @@ -135,7 +135,7 @@ scenes: name: "cat1/a1s04.wav" description: "" source: ["m1s02.wav", "f1s02.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["IR_do_p08_e_01_01_FOA.wav", "IR_do_p08_e_02_01_FOA.wav"] overlap: 0.5 format: "FOA" @@ -143,7 +143,7 @@ scenes: name: "cat1/a1s05.wav" description: "" source: ["f2s02.wav", "m2s02.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["IR_do_p08_e_01_01_FOA.wav", "IR_do_p08_e_02_01_FOA.wav"] overlap: 0.5 format: "FOA" @@ -151,7 +151,15 @@ scenes: name: "cat1/a1s06.wav" description: "" source: ["m3s02.wav", "f3s02.wav"] - IR: 
["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["IR_do_p08_e_01_01_FOA.wav", "IR_do_p08_e_02_01_FOA.wav"] + overlap: 0.5 + format: "FOA" + + cat1_7: + name: "cat1/a1s07.wav" + description: "Preliminary: " + source: ["f1s13.wav", "m1s13.wav"] + IR: ["IR_do_p08_e_01_01_FOA.wav", "IR_do_p08_e_02_01_FOA.wav"] overlap: 0.5 format: "FOA" @@ -203,11 +211,19 @@ scenes: overlap: 0.5 format: "HOA2" + cat2_7: + name: "cat2/a2s07.wav" + description: "Preliminary: " + source: ["m2s13.wav", "f2s13.wav"] + IR: ["Nokia_Small_Room3_TalkPos1_EigenOwnHoA2_SinSweep_9chn.wav", "Nokia_Small_Room3_TalkPos2_EigenOwnHoA2_SinSweep_9chn.wav"] + overlap: 0.5 + format: "HOA2" + cat3_1: name: "cat3/a3s01.wav" description: "" source: ["f2s05.wav", "m2s05.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["IR_do_p08_e_01_01_FOA.wav", "IR_do_p08_e_02_01_FOA.wav"] overlap: 0.5 format: "FOA" @@ -215,7 +231,7 @@ scenes: name: "cat3/a3s02.wav" description: "" source: ["m3s05.wav", "f3s05.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["IR_do_p08_e_01_01_FOA.wav", "IR_do_p08_e_02_01_FOA.wav"] overlap: 0.5 format: "FOA" @@ -223,7 +239,7 @@ scenes: name: "cat3/a3s03.wav" description: "" source: ["f1s05.wav", "m1s05.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["IR_do_p08_e_01_01_FOA.wav", "IR_do_p08_e_02_01_FOA.wav"] overlap: 0.5 format: "FOA" @@ -231,7 +247,7 @@ scenes: name: "cat3/a3s04.wav" description: "" source: ["m2s06.wav", "f2s06.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["IR_do_p08_e_01_01_FOA.wav", "IR_do_p08_e_02_01_FOA.wav"] overlap: 0.5 format: "FOA" @@ -239,7 +255,7 @@ scenes: name: "cat3/a3s05.wav" description: "" source: ["f3s06.wav", "m3s06.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["IR_do_p08_e_01_01_FOA.wav", "IR_do_p08_e_02_01_FOA.wav"] overlap: 0.5 format: "FOA" @@ -247,7 +263,15 @@ scenes: name: 
"cat3/a3s06.wav" description: "" source: ["m1s06.wav", "f1s06.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["IR_do_p08_e_01_01_FOA.wav", "IR_do_p08_e_02_01_FOA.wav"] + overlap: 0.5 + format: "FOA" + + cat3_7: + name: "cat3/a3s07.wav" + description: "Preliminary: " + source: ["f3s13.wav", "m3s13.wav"] + IR: ["IR_do_p08_e_01_01_FOA.wav", "IR_do_p08_e_02_01_FOA.wav"] overlap: 0.5 format: "FOA" @@ -255,55 +279,63 @@ scenes: name: "cat4/a4s01.wav" description: "" source: ["m1s07.wav", "f1s07.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["Nokia_Small_Room3_TalkPos1_EigenOwnHoA2_SinSweep_9chn.wav", "Nokia_Small_Room3_TalkPos2_EigenOwnHoA2_SinSweep_9chn.wav"] overlap: 0.5 - format: "FOA" + format: "HOA2" cat4_2: name: "cat4/a4s02.wav" description: "" source: ["f2s07.wav", "m2s07.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["Nokia_Small_Room3_TalkPos1_EigenOwnHoA2_SinSweep_9chn.wav", "Nokia_Small_Room3_TalkPos2_EigenOwnHoA2_SinSweep_9chn.wav"] overlap: 0.5 - format: "FOA" + format: "HOA2" cat4_3: name: "cat4/a4s03.wav" description: "" source: ["m3s07.wav", "f3s07.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["Nokia_Small_Room3_TalkPos1_EigenOwnHoA2_SinSweep_9chn.wav", "Nokia_Small_Room3_TalkPos2_EigenOwnHoA2_SinSweep_9chn.wav"] overlap: 0.5 - format: "FOA" + format: "HOA2" cat4_4: name: "cat4/a4s04.wav" description: "" source: ["f1s08.wav", "m1s08.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["Nokia_Small_Room3_TalkPos1_EigenOwnHoA2_SinSweep_9chn.wav", "Nokia_Small_Room3_TalkPos2_EigenOwnHoA2_SinSweep_9chn.wav"] overlap: 0.5 - format: "FOA" + format: "HOA2" cat4_5: name: "cat4/a4s05.wav" description: "" source: ["m2s08.wav", "f2s08.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["Nokia_Small_Room3_TalkPos1_EigenOwnHoA2_SinSweep_9chn.wav", 
"Nokia_Small_Room3_TalkPos2_EigenOwnHoA2_SinSweep_9chn.wav"] overlap: 0.5 - format: "FOA" + format: "HOA2" cat4_6: name: "cat4/a4s06.wav" description: "" source: ["f3s08.wav", "m3s08.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["Nokia_Small_Room3_TalkPos1_EigenOwnHoA2_SinSweep_9chn.wav", "Nokia_Small_Room3_TalkPos2_EigenOwnHoA2_SinSweep_9chn.wav"] overlap: 0.5 - format: "FOA" + format: "HOA2" + + cat4_7: + name: "cat4/a4s07.wav" + description: "Preliminary: " + source: ["m1s14.wav", "f1s14.wav"] + IR: ["Nokia_Small_Room3_TalkPos1_EigenOwnHoA2_SinSweep_9chn.wav", "Nokia_Small_Room3_TalkPos2_EigenOwnHoA2_SinSweep_9chn.wav"] + overlap: 0.5 + format: "HOA2" cat5_1: name: "cat5/a5s01.wav" description: "" source: ["f3s09.wav", "m3s09.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["IR_do_p08_e_01_01_FOA.wav", "IR_do_p08_e_02_01_FOA.wav"] overlap: 0.5 format: "FOA" @@ -311,7 +343,7 @@ scenes: name: "cat5/a5s02.wav" description: "" source: ["m1s09.wav", "f1s09.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["IR_do_p08_e_01_01_FOA.wav", "IR_do_p08_e_02_01_FOA.wav"] overlap: 0.5 format: "FOA" @@ -319,7 +351,7 @@ scenes: name: "cat5/a5s03.wav" description: "" source: ["f2s09.wav", "m2s09.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["IR_do_p08_e_01_01_FOA.wav", "IR_do_p08_e_02_01_FOA.wav"] overlap: 0.5 format: "FOA" @@ -327,7 +359,7 @@ scenes: name: "cat5/a5s04.wav" description: "" source: ["m3s10.wav", "f3s10.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["IR_do_p08_e_01_01_FOA.wav", "IR_do_p08_e_02_01_FOA.wav"] overlap: 0.5 format: "FOA" @@ -335,7 +367,7 @@ scenes: name: "cat5/a5s05.wav" description: "" source: ["f1s10.wav", "m1s10.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["IR_do_p08_e_01_01_FOA.wav", "IR_do_p08_e_02_01_FOA.wav"] overlap: 0.5 format: "FOA" @@ -343,7 +375,15 @@ scenes: 
name: "cat5/a5s06.wav" description: "" source: ["m2s10.wav", "f2s10.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["IR_do_p08_e_01_01_FOA.wav", "IR_do_p08_e_02_01_FOA.wav"] + overlap: 0.5 + format: "FOA" + + cat5_7: + name: "cat5/a5s07.wav" + description: "Preliminary: " + source: ["f2s14.wav", "m2s14.wav"] + IR: ["IR_do_p08_e_01_01_FOA.wav", "IR_do_p08_e_02_01_FOA.wav"] overlap: 0.5 format: "FOA" @@ -351,48 +391,55 @@ scenes: name: "cat6/a6s01.wav" description: "" source: ["m2s11.wav", "f2s11.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["Nokia_Small_Room3_TalkPos1_EigenOwnHoA2_SinSweep_9chn.wav", "Nokia_Small_Room3_TalkPos2_EigenOwnHoA2_SinSweep_9chn.wav"] overlap: 0.5 - format: "FOA" + format: "HOA2" cat6_2: name: "cat6/a6s02.wav" description: "" source: ["f3s11.wav", "m3s11.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["Nokia_Small_Room3_TalkPos1_EigenOwnHoA2_SinSweep_9chn.wav", "Nokia_Small_Room3_TalkPos2_EigenOwnHoA2_SinSweep_9chn.wav"] overlap: 0.5 - format: "FOA" + format: "HOA2" cat6_3: name: "cat6/a6s03.wav" description: "" source: ["m1s11.wav", "f1s11.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["Nokia_Small_Room3_TalkPos1_EigenOwnHoA2_SinSweep_9chn.wav", "Nokia_Small_Room3_TalkPos2_EigenOwnHoA2_SinSweep_9chn.wav"] overlap: 0.5 - format: "FOA" + format: "HOA2" cat6_4: name: "cat6/a6s04.wav" description: "" source: ["f2s12.wav", "m2s12.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["Nokia_Small_Room3_TalkPos1_EigenOwnHoA2_SinSweep_9chn.wav", "Nokia_Small_Room3_TalkPos2_EigenOwnHoA2_SinSweep_9chn.wav"] overlap: 0.5 - format: "FOA" + format: "HOA2" cat6_5: name: "cat6/a6s05.wav" description: "" source: ["m3s12.wav", "f3s12.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["Nokia_Small_Room3_TalkPos1_EigenOwnHoA2_SinSweep_9chn.wav", 
"Nokia_Small_Room3_TalkPos2_EigenOwnHoA2_SinSweep_9chn.wav"] overlap: 0.5 - format: "FOA" + format: "HOA2" cat6_6: name: "cat6/a6s06.wav" description: "" source: ["f1s12.wav", "m1s12.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["Nokia_Small_Room3_TalkPos1_EigenOwnHoA2_SinSweep_9chn.wav", "Nokia_Small_Room3_TalkPos2_EigenOwnHoA2_SinSweep_9chn.wav"] overlap: 0.5 - format: "FOA" + format: "HOA2" + cat6_7: + name: "cat6/a6s07.wav" + description: "Preliminary:" + source: ["m3s14.wav", "f3s14.wav"] + IR: ["Nokia_Small_Room3_TalkPos1_EigenOwnHoA2_SinSweep_9chn.wav", "Nokia_Small_Room3_TalkPos2_EigenOwnHoA2_SinSweep_9chn.wav"] + overlap: 0.5 + format: "HOA2" diff --git a/item_gen_configs/P800-9.yml b/experiments/selection/P800-9/config/item_gen_P800-9.yml similarity index 72% rename from item_gen_configs/P800-9.yml rename to experiments/selection/P800-9/config/item_gen_P800-9.yml index dc8121264244682fdeaf27bf6ec4668e3d21d21d..c46edb177eec281889f285512fe8324b3861283e 100644 --- a/item_gen_configs/P800-9.yml +++ b/experiments/selection/P800-9/config/item_gen_P800-9.yml @@ -111,7 +111,7 @@ scenes: name: "cat1/a1s01.wav" description: "" source: ["f1s01.wav", "m1s01.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["IR_do_p09_e_01_01_FOA.wav", "IR_do_p09_e_02_01_FOA.wav"] overlap: 0.5 format: "FOA" @@ -119,7 +119,7 @@ scenes: name: "cat1/a1s02.wav" description: "" source: ["m2s01.wav", "f2s01.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["IR_do_p09_e_01_01_FOA.wav", "IR_do_p09_e_02_01_FOA.wav"] overlap: 0.5 format: "FOA" @@ -127,7 +127,7 @@ scenes: name: "cat1/a1s03.wav" description: "" source: ["f3s01.wav", "m3s01.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["IR_do_p09_e_01_01_FOA.wav", "IR_do_p09_e_02_01_FOA.wav"] overlap: 0.5 format: "FOA" @@ -135,7 +135,7 @@ scenes: name: "cat1/a1s04.wav" description: "" source: ["m1s02.wav", "f1s02.wav"] - IR: 
["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["IR_do_p09_e_01_01_FOA.wav", "IR_do_p09_e_02_01_FOA.wav"] overlap: 0.5 format: "FOA" @@ -143,7 +143,7 @@ scenes: name: "cat1/a1s05.wav" description: "" source: ["f2s02.wav", "m2s02.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["IR_do_p09_e_01_01_FOA.wav", "IR_do_p09_e_02_01_FOA.wav"] overlap: 0.5 format: "FOA" @@ -151,7 +151,15 @@ scenes: name: "cat1/a1s06.wav" description: "" source: ["m3s02.wav", "f3s02.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["IR_do_p09_e_01_01_FOA.wav", "IR_do_p09_e_02_01_FOA.wav"] + overlap: 0.5 + format: "FOA" + + cat1_7: + name: "cat1/a1s07.wav" + description: "Preliminary: " + source: ["f1s13.wav", "m1s13.wav"] + IR: ["IR_do_p09_e_01_01_FOA.wav", "IR_do_p09_e_02_01_FOA.wav"] overlap: 0.5 format: "FOA" @@ -203,11 +211,19 @@ scenes: overlap: 0.5 format: "HOA2" + cat2_7: + name: "cat2/a2s07.wav" + description: "Preliminary: " + source: ["m2s13.wav", "f2s13.wav"] + IR: ["Nokia_Small_Room3_TalkPos1_EigenOwnHoA2_SinSweep_9chn.wav", "Nokia_Small_Room3_TalkPos2_EigenOwnHoA2_SinSweep_9chn.wav"] + overlap: 0.5 + format: "HOA2" + cat3_1: name: "cat3/a3s01.wav" description: "" source: ["f2s05.wav", "m2s05.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["IR_do_p09_e_01_01_FOA.wav", "IR_do_p09_e_02_01_FOA.wav"] overlap: 0.5 format: "FOA" @@ -215,7 +231,7 @@ scenes: name: "cat3/a3s02.wav" description: "" source: ["m3s05.wav", "f3s05.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["IR_do_p09_e_01_01_FOA.wav", "IR_do_p09_e_02_01_FOA.wav"] overlap: 0.5 format: "FOA" @@ -223,15 +239,15 @@ scenes: name: "cat3/a3s03.wav" description: "" source: ["f1s05.wav", "m1s05.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["IR_do_p09_e_01_01_FOA.wav", "IR_do_p09_e_02_01_FOA.wav"] overlap: 0.5 format: "FOA" - + cat3_4: name: "cat3/a3s04.wav" 
description: "" source: ["m2s06.wav", "f2s06.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["IR_do_p09_e_01_01_FOA.wav", "IR_do_p09_e_02_01_FOA.wav"] overlap: 0.5 format: "FOA" @@ -239,7 +255,7 @@ scenes: name: "cat3/a3s05.wav" description: "" source: ["f3s06.wav", "m3s06.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["IR_do_p09_e_01_01_FOA.wav", "IR_do_p09_e_02_01_FOA.wav"] overlap: 0.5 format: "FOA" @@ -247,7 +263,15 @@ scenes: name: "cat3/a3s06.wav" description: "" source: ["m1s06.wav", "f1s06.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["IR_do_p09_e_01_01_FOA.wav", "IR_do_p09_e_02_01_FOA.wav"] + overlap: 0.5 + format: "FOA" + + cat3_7: + name: "cat3/a3s07.wav" + description: "Preliminary: " + source: ["f3s13.wav", "m3s13.wav"] + IR: ["IR_do_p09_e_01_01_FOA.wav", "IR_do_p09_e_02_01_FOA.wav"] overlap: 0.5 format: "FOA" @@ -255,55 +279,63 @@ scenes: name: "cat4/a4s01.wav" description: "" source: ["m1s07.wav", "f1s07.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["Nokia_Small_Room3_TalkPos1_EigenOwnHoA2_SinSweep_9chn.wav", "Nokia_Small_Room3_TalkPos2_EigenOwnHoA2_SinSweep_9chn.wav"] overlap: 0.5 - format: "FOA" + format: "HOA2" cat4_2: name: "cat4/a4s02.wav" description: "" source: ["f2s07.wav", "m2s07.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["Nokia_Small_Room3_TalkPos1_EigenOwnHoA2_SinSweep_9chn.wav", "Nokia_Small_Room3_TalkPos2_EigenOwnHoA2_SinSweep_9chn.wav"] overlap: 0.5 - format: "FOA" + format: "HOA2" cat4_3: name: "cat4/a4s03.wav" description: "" source: ["m3s07.wav", "f3s07.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["Nokia_Small_Room3_TalkPos1_EigenOwnHoA2_SinSweep_9chn.wav", "Nokia_Small_Room3_TalkPos2_EigenOwnHoA2_SinSweep_9chn.wav"] overlap: 0.5 - format: "FOA" + format: "HOA2" cat4_4: name: "cat4/a4s04.wav" description: "" source: ["f1s08.wav", "m1s08.wav"] - 
IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["Nokia_Small_Room3_TalkPos1_EigenOwnHoA2_SinSweep_9chn.wav", "Nokia_Small_Room3_TalkPos2_EigenOwnHoA2_SinSweep_9chn.wav"] overlap: 0.5 - format: "FOA" + format: "HOA2" cat4_5: name: "cat4/a4s05.wav" description: "" source: ["m2s08.wav", "f2s08.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["Nokia_Small_Room3_TalkPos1_EigenOwnHoA2_SinSweep_9chn.wav", "Nokia_Small_Room3_TalkPos2_EigenOwnHoA2_SinSweep_9chn.wav"] overlap: 0.5 - format: "FOA" + format: "HOA2" cat4_6: name: "cat4/a4s06.wav" description: "" source: ["f3s08.wav", "m3s08.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["Nokia_Small_Room3_TalkPos1_EigenOwnHoA2_SinSweep_9chn.wav", "Nokia_Small_Room3_TalkPos2_EigenOwnHoA2_SinSweep_9chn.wav"] overlap: 0.5 - format: "FOA" + format: "HOA2" + + cat4_7: + name: "cat4/a4s07.wav" + description: "Preliminary: " + source: ["m1s14.wav", "f1s14.wav"] + IR: ["Nokia_Small_Room3_TalkPos1_EigenOwnHoA2_SinSweep_9chn.wav", "Nokia_Small_Room3_TalkPos2_EigenOwnHoA2_SinSweep_9chn.wav"] + overlap: 0.5 + format: "HOA2" cat5_1: name: "cat5/a5s01.wav" description: "" source: ["f3s09.wav", "m3s09.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["IR_do_p09_e_01_01_FOA.wav", "IR_do_p09_e_02_01_FOA.wav"] overlap: 0.5 format: "FOA" @@ -311,7 +343,7 @@ scenes: name: "cat5/a5s02.wav" description: "" source: ["m1s09.wav", "f1s09.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["IR_do_p09_e_01_01_FOA.wav", "IR_do_p09_e_02_01_FOA.wav"] overlap: 0.5 format: "FOA" @@ -319,7 +351,7 @@ scenes: name: "cat5/a5s03.wav" description: "" source: ["f2s09.wav", "m2s09.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["IR_do_p09_e_01_01_FOA.wav", "IR_do_p09_e_02_01_FOA.wav"] overlap: 0.5 format: "FOA" @@ -327,7 +359,7 @@ scenes: name: "cat5/a5s04.wav" description: "" source: ["m3s10.wav", 
"f3s10.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["IR_do_p09_e_01_01_FOA.wav", "IR_do_p09_e_02_01_FOA.wav"] overlap: 0.5 format: "FOA" @@ -335,7 +367,7 @@ scenes: name: "cat5/a5s05.wav" description: "" source: ["f1s10.wav", "m1s10.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["IR_do_p09_e_01_01_FOA.wav", "IR_do_p09_e_02_01_FOA.wav"] overlap: 0.5 format: "FOA" @@ -343,7 +375,15 @@ scenes: name: "cat5/a5s06.wav" description: "" source: ["m2s10.wav", "f2s10.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["IR_do_p09_e_01_01_FOA.wav", "IR_do_p09_e_02_01_FOA.wav"] + overlap: 0.5 + format: "FOA" + + cat5_7: + name: "cat5/a5s07.wav" + description: "Preliminary: " + source: ["f2s14.wav", "m2s14.wav"] + IR: ["IR_do_p09_e_01_01_FOA.wav", "IR_do_p09_e_02_01_FOA.wav"] overlap: 0.5 format: "FOA" @@ -351,48 +391,55 @@ scenes: name: "cat6/a6s01.wav" description: "" source: ["m2s11.wav", "f2s11.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["Nokia_Small_Room3_TalkPos1_EigenOwnHoA2_SinSweep_9chn.wav", "Nokia_Small_Room3_TalkPos2_EigenOwnHoA2_SinSweep_9chn.wav"] overlap: 0.5 - format: "FOA" + format: "HOA2" cat6_2: name: "cat6/a6s02.wav" description: "" source: ["f3s11.wav", "m3s11.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["Nokia_Small_Room3_TalkPos1_EigenOwnHoA2_SinSweep_9chn.wav", "Nokia_Small_Room3_TalkPos2_EigenOwnHoA2_SinSweep_9chn.wav"] overlap: 0.5 - format: "FOA" + format: "HOA2" cat6_3: name: "cat6/a6s03.wav" description: "" source: ["m1s11.wav", "f1s11.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["Nokia_Small_Room3_TalkPos1_EigenOwnHoA2_SinSweep_9chn.wav", "Nokia_Small_Room3_TalkPos2_EigenOwnHoA2_SinSweep_9chn.wav"] overlap: 0.5 - format: "FOA" + format: "HOA2" cat6_4: name: "cat6/a6s04.wav" description: "" source: ["f2s12.wav", "m2s12.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", 
"IR_do_p04_e_02_01_FOA.wav"] + IR: ["Nokia_Small_Room3_TalkPos1_EigenOwnHoA2_SinSweep_9chn.wav", "Nokia_Small_Room3_TalkPos2_EigenOwnHoA2_SinSweep_9chn.wav"] overlap: 0.5 - format: "FOA" + format: "HOA2" cat6_5: name: "cat6/a6s05.wav" description: "" source: ["m3s12.wav", "f3s12.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["Nokia_Small_Room3_TalkPos1_EigenOwnHoA2_SinSweep_9chn.wav", "Nokia_Small_Room3_TalkPos2_EigenOwnHoA2_SinSweep_9chn.wav"] overlap: 0.5 - format: "FOA" + format: "HOA2" cat6_6: name: "cat6/a6s06.wav" description: "" source: ["f1s12.wav", "m1s12.wav"] - IR: ["IR_do_p04_e_01_01_FOA.wav", "IR_do_p04_e_02_01_FOA.wav"] + IR: ["Nokia_Small_Room3_TalkPos1_EigenOwnHoA2_SinSweep_9chn.wav", "Nokia_Small_Room3_TalkPos2_EigenOwnHoA2_SinSweep_9chn.wav"] overlap: 0.5 - format: "FOA" + format: "HOA2" + cat6_7: + name: "cat6/a6s07.wav" + description: "Preliminary:" + source: ["m3s14.wav", "f3s14.wav"] + IR: ["Nokia_Small_Room3_TalkPos1_EigenOwnHoA2_SinSweep_9chn.wav", "Nokia_Small_Room3_TalkPos2_EigenOwnHoA2_SinSweep_9chn.wav"] + overlap: 0.5 + format: "HOA2" diff --git a/ivas_processing_scripts/generation/__init__.py b/ivas_processing_scripts/generation/__init__.py index 6269871a61814919b8be76638c48647a26cbfc3b..a07bd7331f193ffed3744d983257cee1dc1a42f2 100755 --- a/ivas_processing_scripts/generation/__init__.py +++ b/ivas_processing_scripts/generation/__init__.py @@ -87,25 +87,24 @@ def main(args): # set up logging logger = logging_init(args, cfg) + # make format a list + if not isinstance(cfg.format, list): + cfg.format = [cfg.format] + # generate ISM and STEREO items - if cfg.format == "ISM1": + if "ISM1" in cfg.format: # generate ISM1 items with metadata according to scene description process_ism1_items.generate_ism1_items(cfg, logger) - elif cfg.format == "ISM2": + elif "ISM2" in cfg.format: # generate ISM2 items with metadata according to scene description process_ism2_items.generate_ism2_items(cfg, logger) - elif cfg.format 
== "STEREO": + elif "STEREO" in cfg.format: # generate STEREO items according to scene description process_stereo_items.generate_stereo_items(cfg, logger) - - # make format a list - if not isinstance(cfg.format, list): - cfg.format = [cfg.format] - - if "FOA" in cfg.format or "HOA2" in cfg.format: + elif "FOA" in cfg.format or "HOA2" in cfg.format: # generate FOA/HOA2 items according to scene description process_ambi_items.generate_ambi_items(cfg, logger) # copy configuration to output directory - with open(cfg.output_path.joinpath(f"{cfg.format}.yml"), "w") as f: + with open(cfg.output_path.joinpath(f"{'_'.join(cfg.format)}.yml"), "w") as f: yaml.safe_dump(cfg._yaml_dump, f) diff --git a/ivas_processing_scripts/generation/process_ism1_items.py b/ivas_processing_scripts/generation/process_ism1_items.py index e78c9a57e641f5004ea833bdcaeecef3386a47d4..f6d14b1c44f80c2802103fe03385768fdd411205 100644 --- a/ivas_processing_scripts/generation/process_ism1_items.py +++ b/ivas_processing_scripts/generation/process_ism1_items.py @@ -299,13 +299,13 @@ def generate_ism1_scene( f"Incorrect value(s) of elevation: {ele[(ele > 90) | (ele < -90)]}" ) - # additional metadata - dist = np.ones(N_frames) # !!!! 
TBD - check what to do with these metadata + # additional metadata (default values) + radius = np.ones(N_frames) spread = np.zeros(N_frames) gain = np.ones(N_frames) # arrange all metadata fields column-wise into a matrix - y_meta = np.column_stack((azi, ele, dist, spread, gain)) + y_meta = np.column_stack((azi, ele, radius, spread, gain)) # append pre-amble and post-amble to all sources if cfg.preamble != 0.0: @@ -358,9 +358,7 @@ def generate_ism1_scene( csv_filename = os.path.join( cfg.output_path, os.path.dirname(scene["name"]), - cfg.use_output_prefix - + os.path.splitext(os.path.basename(scene["name"]))[0] - + ".0.csv", + cfg.use_output_prefix + os.path.basename(scene["name"]) + ".0.csv", ) with open( diff --git a/ivas_processing_scripts/generation/process_ism2_items.py b/ivas_processing_scripts/generation/process_ism2_items.py index ebb2725f2fcfe7025199ece8b4abbc71dc67c2e6..c1c0964533427c97320e553eec600021e6233ee7 100644 --- a/ivas_processing_scripts/generation/process_ism2_items.py +++ b/ivas_processing_scripts/generation/process_ism2_items.py @@ -274,13 +274,13 @@ def generate_ism2_scene( f"Incorrect value(s) of elevation: {ele[(ele > 90) | (ele < -90)]}" ) - # additional metadata - dist = np.ones(N_frames) # !!!! 
TBD - check what to do with these metadata + # additional metadata (default values) + radius = np.ones(N_frames) spread = np.zeros(N_frames) gain = np.ones(N_frames) # arrange all metadata fields column-wise into a matrix - x_meta = np.column_stack((azi, ele, dist, spread, gain)) + x_meta = np.column_stack((azi, ele, radius, spread, gain)) # shift the second (and all other) source files (positive shift creates overlap, negative shift creates a gap) if i > 0: @@ -422,9 +422,7 @@ def generate_ism2_scene( csv_filename = os.path.join( cfg.output_path, os.path.dirname(scene["name"]), - cfg.use_output_prefix - + os.path.splitext(os.path.basename(scene["name"]))[0] - + f".{i}.csv", + cfg.use_output_prefix + os.path.basename(scene["name"]) + f".{i}.csv", ) with open(