{ "hq": [ { "speaker": 0, "text": "I'm looking at a picture of a yellow minion. I like yellow minions because there are minions in yellow. I enjoy minions.", "start": 1.04, "end": 8.02 } ] }