Frame-level result specification
JSON Schema of frame-level result
The following JSON Schema (draft-04) describes the Oliver API frame-level result, schema version 1.4.3:
{
  "$schema": "http://json-schema.org/draft-04/schema#",
  "description": "Oliver API frame-level results JSON schema v1.4.3",
  "properties": {
    "frames": {
      "description": "Contains frame results",
      "items": {
        "description": "Contains results on current frame",
        "properties": {
          "aced": {
            "description": "Identification of speech",
            "type": "string"
          },
          "et": {
            "description": "The end time of the frame in the call",
            "type": "number"
          },
          "intensity": {
            "description": "The signal intensity",
            "properties": {
              "framelevel": {
                "description": "Result of current frame",
                "type": "number"
              },
              "uptonow": {
                "description": "Decision up to current frame",
                "type": "number"
              }
            },
            "type": "object"
          },
          "no": {
            "description": "The current frame counter",
            "type": "integer"
          },
          "speakers": {
            "description": "Frame results per speaker",
            "items": {
              "description": "Frame speaker results",
              "properties": {
                "age": {
                  "description": "Speaker age",
                  "properties": {
                    "framelevel": {
                      "description": "Result of current frame",
                      "type": "number"
                    },
                    "uptonow": {
                      "description": "Decision up to current frame",
                      "type": "number"
                    }
                  },
                  "type": "object"
                },
                "beep": {
                  "description": "Beep detection",
                  "properties": {
                    "framelevel": {
                      "description": "Result of current frame",
                      "type": "number"
                    },
                    "uptonow": {
                      "description": "Decision up to current frame",
                      "type": "number"
                    }
                  },
                  "type": "object"
                },
                "emotion": {
                  "description": "Speaker emotion",
                  "properties": {
                    "framelevel": {
                      "description": "Result of current frame",
                      "type": "number"
                    },
                    "uptonow": {
                      "description": "Decision up to current frame",
                      "type": "number"
                    }
                  },
                  "type": "object"
                },
                "engagement": {
                  "description": "Speaker engagement",
                  "properties": {
                    "framelevel": {
                      "description": "Result of current frame",
                      "type": "number"
                    },
                    "uptonow": {
                      "description": "Decision up to current frame",
                      "type": "number"
                    }
                  },
                  "type": "object"
                },
                "escalation": {
                  "description": "Escalation",
                  "type": "integer"
                },
                "f0": {
                  "description": "Baseline frequency",
                  "properties": {
                    "framelevel": {
                      "description": "Result of current frame",
                      "type": "number"
                    },
                    "uptonow": {
                      "description": "Decision up to current frame",
                      "type": "number"
                    }
                  },
                  "type": "object"
                },
                "gender": {
                  "description": "Speaker gender",
                  "properties": {
                    "framelevel": {
                      "description": "Result of current frame",
                      "type": "number"
                    },
                    "uptonow": {
                      "description": "Decision up to current frame",
                      "type": "number"
                    }
                  },
                  "type": "object"
                },
                "id": {
                  "description": "The speaker index",
                  "type": "integer"
                },
                "language": {
                  "description": "Speaker language",
                  "properties": {
                    "framelevel": {
                      "description": "Result of current frame",
                      "type": "number"
                    },
                    "uptonow": {
                      "description": "Decision up to current frame",
                      "type": "number"
                    }
                  },
                  "type": "object"
                },
                "politeness": {
                  "description": "Speaker politeness",
                  "properties": {
                    "framelevel": {
                      "description": "Result of current frame",
                      "type": "number"
                    },
                    "uptonow": {
                      "description": "Decision up to current frame",
                      "type": "number"
                    }
                  },
                  "type": "object"
                },
                "positivity": {
                  "description": "Speaker positivity",
                  "properties": {
                    "framelevel": {
                      "description": "Result of current frame",
                      "type": "number"
                    },
                    "uptonow": {
                      "description": "Decision up to current frame",
                      "type": "number"
                    }
                  },
                  "type": "object"
                },
                "resolution": {
                  "description": "Resolution",
                  "type": "integer"
                },
                "empathy": {
                  "description": "Speaker empathy score",
                  "type": "number"
                },
                "ring": {
                  "description": "Ring detection",
                  "properties": {
                    "framelevel": {
                      "description": "Result of current frame",
                      "type": "number"
                    },
                    "uptonow": {
                      "description": "Decision up to current frame",
                      "type": "number"
                    }
                  },
                  "type": "object"
                },
                "snr": {
                  "description": "Signal-to-noise ratio",
                  "properties": {
                    "framelevel": {
                      "description": "Result of current frame",
                      "type": "number"
                    },
                    "uptonow": {
                      "description": "Decision up to current frame",
                      "type": "number"
                    }
                  },
                  "type": "object"
                },
                "speaking_rate": {
                  "description": "Speaking rate",
                  "properties": {
                    "framelevel": {
                      "description": "Result of current frame",
                      "type": "number"
                    },
                    "uptonow": {
                      "description": "Decision up to current frame",
                      "type": "number"
                    }
                  },
                  "type": "object"
                },
                "hesitation": {
                  "description": "Hesitation",
                  "properties": {
                    "framelevel": {
                      "description": "Result of current frame",
                      "type": "number"
                    },
                    "uptonow": {
                      "description": "Decision up to current frame",
                      "type": "number"
                    }
                  },
                  "type": "object"
                },
                "strength": {
                  "description": "Speaker strength",
                  "properties": {
                    "framelevel": {
                      "description": "Result of current frame",
                      "type": "number"
                    },
                    "uptonow": {
                      "description": "Decision up to current frame",
                      "type": "number"
                    }
                  },
                  "type": "object"
                },
                "success": {
                  "description": "Call success",
                  "properties": {
                    "framelevel": {
                      "description": "Result of current frame",
                      "type": "number"
                    },
                    "uptonow": {
                      "description": "Decision up to current frame",
                      "type": "number"
                    }
                  },
                  "type": "object"
                },
                "tone_variety": {
                  "description": "Tone variety (0-5)",
                  "properties": {
                    "framelevel": {
                      "description": "Result of current frame",
                      "type": "number"
                    },
                    "uptonow": {
                      "description": "Decision up to current frame",
                      "type": "number"
                    }
                  },
                  "type": "object"
                },
                "vad": {
                  "description": "Voice activity detection",
                  "properties": {
                    "framelevel": {
                      "description": "Result of current frame",
                      "type": "number"
                    },
                    "uptonow": {
                      "description": "Decision up to current frame",
                      "type": "number"
                    }
                  },
                  "type": "object"
                }
              },
              "type": "object"
            },
            "type": "array"
          },
          "st": {
            "description": "The start time of the frame in the call",
            "type": "number"
          }
        },
        "required": ["no", "st", "et"],
        "type": "object"
      },
      "type": "array"
    }
  },
  "required": ["frames"],
  "type": "object"
}
Updated about 2 years ago