Example of word-tree output from async real-time transcription – Voicegain

Below is a Python script that starts an async real-time transcription and polls it rapidly until the entire audio has been processed. Incremental results are saved to separate files. In those results, the wordTree field contains the tree of recognition alternatives. Each word has an id and a parentId; these can be used to construct a tree structure in your code.

import requests, time, os, json

# Credentials: paste your Voicegain JWT here; it is sent verbatim as the
# Authorization header on every request made by this script.
JWT = "<your JWT>"
headers = {"Authorization": JWT}

# Sample recording that the service is asked to fetch and transcribe.
audio_url = "https://tracker.voicegain.ai/attachments/download/363/3sec.wav"

# Polling settings for the session.
# NOTE(review): values are presumably milliseconds -- confirm against the
# Voicegain API reference.
poll_settings = {"afterlife": 60000, "persist": 5000}

# Request the word tree in both the incremental and the full results.
content_settings = {"incremental": ["word-tree"], "full": ["word-tree"]}

# The single session this script starts.
session = {
    "asyncMode": "REAL-TIME",
    "poll": poll_settings,
    "content": content_settings,
}

# Complete request payload for the async transcribe call.
body = {
    "sessions": [session],
    "audio": {"source": {"fromUrl": {"url": audio_url}}},
}

# Start the async real-time transcription session.
# The timeout keeps the script from hanging indefinitely on a stalled
# connection, and raise_for_status() reports an HTTP error (for example a
# rejected JWT) directly instead of as a confusing KeyError on the lookups below.
init_http_response = requests.post(
    "https://api.voicegain.ai/v1/asr/transcribe/async",
    json=body,
    headers=headers,
    timeout=30,
)
init_http_response.raise_for_status()
init_response = init_http_response.json()

# Exactly one session was requested, so read the first (only) entry.
session_info = init_response["sessions"][0]
session_id = session_info["sessionId"]
polling_url = session_info["poll"]["url"]

print("sessionId: {}".format(session_id))

# Directory that receives one JSON file per poll response.
output_path = "output"
# exist_ok=True makes re-runs safe and avoids the check-then-create race of
# os.path.exists() followed by os.mkdir().
os.makedirs(output_path, exist_ok=True)

# Poll for incremental results until the service marks the result as final,
# saving every poll response to its own numbered JSON file.
index = 0
while True:
    time.sleep(0.05)  # short pause between polls so intermediate results are captured
    # params= builds the query string correctly even if polling_url already
    # carries one; the timeout prevents a stalled request from blocking forever.
    poll_http_response = requests.get(
        polling_url, params={"full": "false"}, headers=headers, timeout=30
    )
    # Fail with a clear HTTP error rather than a KeyError on "result" below.
    poll_http_response.raise_for_status()
    poll_response = poll_http_response.json()

    # write poll_response to JSON
    poll_response_path = os.path.join(output_path, "{}--{}.json".format(session_id, index))
    with open(poll_response_path, 'w') as outfile:
        json.dump(poll_response, outfile)
    print("Save result to {}".format(poll_response_path))

    index += 1
    # Stop once the recognizer reports that this result is final.
    if poll_response["result"]["final"]:
        break

# Fetch the full (non-incremental) result once and save it under the next index.
# params= builds the query string correctly even if polling_url already carries
# one; the timeout prevents a stalled request from blocking forever.
final_http_response = requests.get(
    polling_url, params={"full": "true"}, headers=headers, timeout=30
)
# Fail with a clear HTTP error instead of silently saving an error payload.
final_http_response.raise_for_status()
poll_response = final_http_response.json()

# write poll_response to JSON
poll_response_path = os.path.join(output_path, "{}--{}.json".format(session_id, index))
with open(poll_response_path, 'w') as outfile:
    json.dump(poll_response, outfile)
print("Save final result to {}".format(poll_response_path))

You can generate a JWT using these instructions.

Related articles