Skip to content

Instantly share code, notes, and snippets.

@djmango
Created June 16, 2023 03:52
Show Gist options
  • Save djmango/5a23caa273bcd079c2a4f5fa89cb5ad4 to your computer and use it in GitHub Desktop.
Save djmango/5a23caa273bcd079c2a4f5fa89cb5ad4 to your computer and use it in GitHub Desktop.
Example Transcript JSON object
{
"transcription_id": "7cf094b91662b7",
"user_id": "931c215c-b6c6-4b86-96dd-193f18d8c6dc",
"created": "2023-05-03T02:40:52.006612+00:00",
"updated": "2023-05-03T02:41:46.412716+00:00",
"name": "2023-05-03 02:40:52",
"status": "complete",
"orphaned": false,
"translate": false,
"recipients": [
"all"
],
"webhooks": [],
"file_ffprobe": {
"streams": [
{
"index": 0,
"codec_name": "h264",
"codec_long_name": "H.264 / AVC / MPEG-4 AVC / MPEG-4 part 10",
"profile": "High",
"codec_type": "video",
"codec_tag_string": "avc1",
"codec_tag": "0x31637661",
"width": 1280,
"height": 534,
"coded_width": 1280,
"coded_height": 534,
"closed_captions": 0,
"film_grain": 0,
"has_b_frames": 0,
"pix_fmt": "yuv420p",
"level": 31,
"chroma_location": "left",
"field_order": "progressive",
"refs": 1,
"is_avc": "true",
"nal_length_size": "4",
"id": "0x1",
"r_frame_rate": "24/1",
"avg_frame_rate": "24/1",
"time_base": "1/48",
"start_pts": 0,
"start_time": "0:00:00.000000",
"duration_ts": 35243,
"duration": "0:12:14.229167",
"bit_rate": "1829574",
"bits_per_raw_sample": "8",
"nb_frames": "17622",
"extradata_size": 39,
"disposition": {
"default": 1,
"dub": 0,
"original": 0,
"comment": 0,
"lyrics": 0,
"karaoke": 0,
"forced": 0,
"hearing_impaired": 0,
"visual_impaired": 0,
"clean_effects": 0,
"attached_pic": 0,
"timed_thumbnails": 0,
"captions": 0,
"descriptions": 0,
"metadata": 0,
"dependent": 0,
"still_image": 0
},
"tags": {
"language": "und",
"handler_name": "VideoHandler",
"vendor_id": "[0][0][0][0]"
}
},
{
"index": 1,
"codec_name": "aac",
"codec_long_name": "AAC (Advanced Audio Coding)",
"profile": "LC",
"codec_type": "audio",
"codec_tag_string": "mp4a",
"codec_tag": "0x6134706d",
"sample_fmt": "fltp",
"sample_rate": "44100",
"channels": 2,
"channel_layout": "stereo",
"bits_per_sample": 0,
"initial_padding": 0,
"id": "0x2",
"r_frame_rate": "0/0",
"avg_frame_rate": "0/0",
"time_base": "1/44100",
"start_pts": 0,
"start_time": "0:00:00.000000",
"duration_ts": 32380928,
"duration": "0:12:14.261406",
"bit_rate": "191999",
"nb_frames": "31622",
"extradata_size": 16,
"disposition": {
"default": 1,
"dub": 0,
"original": 0,
"comment": 0,
"lyrics": 0,
"karaoke": 0,
"forced": 0,
"hearing_impaired": 0,
"visual_impaired": 0,
"clean_effects": 0,
"attached_pic": 0,
"timed_thumbnails": 0,
"captions": 0,
"descriptions": 0,
"metadata": 0,
"dependent": 0,
"still_image": 0
},
"tags": {
"creation_time": "2013-06-01T09:44:03.000000Z",
"language": "und",
"handler_name": "IsoMedia File Produced by Google, 5-11-2011",
"vendor_id": "[0][0][0][0]"
}
}
],
"format": {
"filename": "https://storage.googleapis.com/gtv-videos-bucket/sample/TearsOfSteel.mp4",
"nb_streams": 2,
"nb_programs": 0,
"format_name": "mov,mp4,m4a,3gp,3g2,mj2",
"format_long_name": "QuickTime / MOV",
"start_time": "0:00:00.000000",
"duration": "0:12:14.261406",
"size": "185765954",
"bit_rate": "2023976",
"probe_score": 100,
"tags": {
"major_brand": "mp42",
"minor_version": "0",
"compatible_brands": "isommp42",
"creation_time": "2013-06-01T09:43:52.000000Z"
}
}
},
"file_mimetype": "video/mp4",
"file_extension": "mp4",
"url": "https://storage.googleapis.com/gtv-videos-bucket/sample/TearsOfSteel.mp4",
"duration_seconds": 734.0,
"validated": true,
"uploaded": false,
"transcribed": true,
"transcription_model": "openai/whisper-large",
"transcription_backend": "openai",
"language": "en",
"text_segments": [
{
"start": 0.0,
"end": 7.0,
"text": " We have main engine start."
},
{
"start": 7.0,
"end": 14.0,
"text": " Four, three, two, one."
}
],
"text": "We have main engine start. Four, three, two, one.",
"heading_segments": [],
"summary": "The transcription describes a scene in which two characters, Tom and Celia, discuss their passions and fears. They plan to perform in some kind of show or event, but they are running out of time. They start performing, but things go wrong, causing memories to be overridden. Eventually, they learn a lesson from the experience."
}
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment