(Informative)
1. Audio Scene Geometry
An example of Audio Scene Geometry.
{
“BlockIndex”: 1,
“BlockStart”: 1631536788000,
“BlockEnd”: 1631536788063,
“SpeechCount”: 2,
“SpeechList”: [
{
“SpeechID”: “09859d16-3c73-4bb0-9c74-91b451e34925”,
“ChannelID”: 1,
“AzimuthDirection”: 90.0,
“ElevationDirection”: 30.0,
“Distance”: 2.0,
“DistanceFlag”: false
},
{
“SpeechID”: “3cdc2973-e95e-4125-acb7-121ad89067ef”,
“ChannelID”: 2,
“AzimuthDirection”: 180.0,
“ElevationDirection”: 30.0,
“Distance”: 1.27,
“DistanceFlag”: false
}
],
“SourceDetectionMask”: [0,1]
}
2. Damaged List
An example of a damaged list JSON file:
{
“DamagedSections”: [
{
“SegmentStart”: “00:00:01.351”,
“SegmentEnd”: “00:01:55.654”
},
{
“SegmentStart”: “00:01:55.654”,
“SegmentEnd”: “00:02:35.168”
}
]
}
3. Editing List
An example of a complete Editing List with two elements: the first relates to a reading-backwards error, whereas the second relates to speed and equalisation errors.
{
“OriginalSpeedStandard”: 15,
“OriginalEqualisationStandard”: “IEC1”,
“OriginalSampleFrequency”: 96000,
“Restorations”: [{
“RestorationID”: “09859d16-3c73-4bb0-9c74-91b451e34925”,
“PreservationAudioFileStart”: “00:00:00.000”,
“PreservationAudioFileEnd”: “00:00:05.125”,
“RestoredAudioFileURI”: “http://www.place_to_be_defined.com/restored_1”,
“ReadingBackwards”: true,
“AppliedSpeedStandard”: 15,
“AppliedSampleFrequency”: 96000,
“AppliedEqualisationStandard”: “IEC1”
},
{
“RestorationID”: “3cdc2973-e95e-4125-acb7-121ad89067ef”,
“PreservationAudioFileStart”: “00:00:05.125”,
“PreservationAudioFileEnd”: “00:00:15.230”,
“RestoredAudioFileURI”: “http://www.place_to_be_defined.com/restored_2”,
“ReadingBackwards”: false,
“AppliedSpeedStandard”: 7.5,
“AppliedSampleFrequency”: 48000,
“AppliedEqualisationStandard”: “IEC2”
}]
}
4. Irregularity File
An example of Irregularity File from Audio Analyser to Video Analyser is:
{
“Offset”: 150,
“Irregularities”: [{
“IrregularityID”: “09859d16-3c73-4bb0-9c74-91b451e34925”,
“Source”: “a”,
“TimeLabel”: “00:02:45.040”
},{
“IrregularityID”: “3cdc2973-e95e-4125-acb7-121ad89067ef”,
“Source”: “a”,
“TimeLabel”: “00:04:49.020”
}]
}
An example of Irregularity File from Video Analyser to Audio Analyser is:
{
“Irregularities”: [{
“IrregularityID”: “09859d16-3c73-4bb0-9c74-91b451e34925”,
“Source”: “v”,
“TimeLabel”: “00:02:45.040”
},{
“IrregularityID”: “3cdc2973-e95e-4125-acb7-121ad89067ef”,
“Source”: “v”,
“TimeLabel”: “00:04:49.020”
}]
}
An example of Irregularity File from Audio Analyser to Tape Irregularity Classifier is:
{
“Offset”: 150,
“Irregularities”: [{
“IrregularityID”: “09859d16-3c73-4bb0-9c74-91b451e34925”,
“Source”: “a”,
“TimeLabel”: “00:02:45.040”,
“AudioSegmentURI”: “http://www.place_to_be_defined.com/audio_segment_1”,
“IrregularityType”: “ssv”,
“IrregularityProperties”: {
“ReadingSpeedStandard”: 15,
“ReadingEqualisationStandard”: “IEC1”,
“WritingSpeedStandard”: 7.5,
“WritingEqualisationStandard”: “IEC2”
}
},{
“IrregularityID”: “3cdc2973-e95e-4125-acb7-121ad89067ef”,
“Source”: “v”,
“TimeLabel”: “00:04:49.020”,
“AudioSegmentURI”: “http://www.place_to_be_defined.com/audio_segment_2”
}]
}
An example of Irregularity File from Video Analyser to Tape Irregularity Classifier is:
{
“Offset”: 150,
“Irregularities”: [{
“IrregularityID”: “09859d16-3c73-4bb0-9c74-91b451e34925”,
“Source”: “a”,
“TimeLabel”: “00:02:45.040”,
“ImageURI”: “http://www.place_to_be_defined.com/image_1”
},{
“IrregularityID”: “3cdc2973-e95e-4125-acb7-121ad89067ef”,
“Source”: “v”,
“TimeLabel”: “00:04:49.020”,
“ImageURI”: “http://www.place_to_be_defined.com/image_2”
}]
}
An example of Irregularity File from Tape Irregularity Classifier to Tape Audio Restoration is:
{
“Irregularities”: [{
“IrregularityID”: “09859d16-3c73-4bb0-9c74-91b451e34925”,
“Source”: “a”,
“TimeLabel”: “00:02:45.040”,
“IrregularityType”: “ssv”,
“IrregularityProperties”: {
“ReadingSpeedStandard”: 15,
“ReadingEqualisationStandard”: “IEC1”,
“WritingSpeedStandard”: 7.5,
“WritingEqualisationStandard”: “IEC2”
}
},{
“IrregularityID”: “3cdc2973-e95e-4125-acb7-121ad89067ef”,
“Source”: “a”,
“TimeLabel”: “00:04:49.020”,
“IrregularityType”: “esv”,
“IrregularityProperties”: {
“ReadingSpeedStandard”: 7.5,
“ReadingEqualisationStandard”: “IEC2”,
“WritingSpeedStandard”: 7.5,
“WritingEqualisationStandard”: “IEC1”
}
}]
}
An example of Irregularity File from Tape Irregularity Classifier to Packager is:
{
“Offset”: 150,
“Irregularities”: [{
“IrregularityID”: “09859d16-3c73-4bb0-9c74-91b451e34925”,
“Source”: “v”,
“TimeLabel”: “00:02:45.040”,
“IrregularityType”: “sot”,
“ImageURI”: “http://www.place_to_be_defined.com/image_1”
},{
“IrregularityID”: “3cdc2973-e95e-4125-acb7-121ad89067ef”,
“Source”: “b”,
“TimeLabel”: “00:04:49.020”,
“IrregularityType”: “sp”,
“ImageURI”: “http://www.place_to_be_defined.com/image_2”
}]
}
5. Microphone Array Geometry
{
“MicrophoneArrayType”: 0,
“MicrophoneArrayScat”: 0,
“MicrophoneArrayFilterURI”: “https://mpai.community/standards/mpai-cae/”,
“SamplingRate”: 4,
“SampleType”: 0,
“BlockSize”: 3,
“NumberofMicrophones”: 4,
“MicrophoneList”: [
{
“xCoord”: 1.0,
“yCoord”: 2.0,
“zCoord”: 3.0,
“directivity”: 0,
“micxLookCoord”: 70.2,
“micyLookCoord”: 75.5,
“miczLookCoord”: 87.3
},
{
“xCoord”: 5.3,
“yCoord”: 5.6,
“zCoord”: 74.3,
“directivity”: 1,
“micxLookCoord”: 67.9,
“micyLookCoord”: 75.2,
“miczLookCoord”: 90.0
},
{
“xCoord”: 34.2,
“yCoord”: 65.2,
“zCoord”: 56.9,
“directivity”: 2,
“micxLookCoord”: 56.8,
“micyLookCoord”: 87.9,
“miczLookCoord”: 78.3
},
{
“xCoord”: 34.9,
“yCoord”: 29.7,
“zCoord”: 89.8,
“directivity”: 3,
“micxLookCoord”: 56.9,
“micyLookCoord”: 65.4,
“miczLookCoord”: 72.9
}
],
“MicrophoneArrayLookCoord”: [{
“xLookCoord”: 56.0,
“yLookCoord”: 90.0,
“zLookCoord”: 86.3
}]
}
6. Prosodic Speech Features
{
“intonations”: [{
“pitch”: 300,
“intensity”: 88.7,
“duration”:100.0
},{
“pitch”: 180,
“intensity”: 85.2,
“duration”:98.0
},{
“pitch”: 280,
“intensity”: 92.5,
“duration”:92.0
},{
“pitch”: 230,
“intensity”: 81.9,
“duration”:98.0
},{
“pitch”: 150,
“intensity”: 78.3,
“duration”:98.0
}],
“unit”: “phoneme”
}
7. Neural Speech Features
[
1.456,
5.1289,
0.12,
12345.54378,
12389943.2837,
58.29
]