音視頻入門基礎(一)

{"type":"doc","content":[{"type":"paragraph","attrs":{"indent":1,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"本文主要介紹的是音視頻的一些概念的東西,讓大家對音視頻大概有個瞭解。"}]},{"type":"heading","attrs":{"align":null,"level":1},"content":[{"type":"text","text":"1、原始數據"}]},{"type":"paragraph","attrs":{"indent":2,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"原始數據表示的是,我們通過視頻採集卡或者拾音器採集到的數據,播放的時候也是播放原始數據。變聲、馬賽克等處理的也是原始數據。"}]},{"type":"heading","attrs":{"align":null,"level":2},"content":[{"type":"text","text":"1.1音頻"}]},{"type":"bulletedlist","content":[{"type":"listitem","content":[{"type":"paragraph","attrs":{"indent":1,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"格式"}]}]},{"type":"listitem","content":[{"type":"paragraph","attrs":{"indent":2,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"PCM"}]}]},{"type":"listitem","content":[{"type":"paragraph","attrs":{"indent":1,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"重要參數"}]}]},{"type":"listitem","content":[{"type":"paragraph","attrs":{"indent":2,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"採樣率:"}]}]}]},{"type":"paragraph","attrs":{"indent":3,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"一秒鐘內對聲音信號的採樣次數,採樣頻率越高聲音的還原就越真實。"}]},{"type":"paragraph","attrs":{"indent":3,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"常見的採樣率有 
8K、16K、22.05K、32K、44.1K、48K"}]},{"type":"bulletedlist","content":[{"type":"listitem","content":[{"type":"paragraph","attrs":{"indent":2,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"聲道數:"}]}]}]},{"type":"paragraph","attrs":{"indent":3,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"單聲道、雙聲道(立體聲)"}]},{"type":"bulletedlist","content":[{"type":"listitem","content":[{"type":"paragraph","attrs":{"indent":2,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"量化位:"}]}]}]},{"type":"paragraph","attrs":{"indent":3,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"決定了聲音的動態範圍"}]},{"type":"paragraph","attrs":{"indent":3,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"常見的有16bit、24bit、32bit"}]},{"type":"heading","attrs":{"align":null,"level":2},"content":[{"type":"text","text":"1.2視頻"}]},{"type":"bulletedlist","content":[{"type":"listitem","content":[{"type":"paragraph","attrs":{"indent":1,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"重要參數"}]}]},{"type":"listitem","content":[{"type":"paragraph","attrs":{"indent":2,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"分辨率:640*480、1280*720、1920*1080、2K、4K"}]}]},{"type":"listitem","content":[{"type":"paragraph","attrs":{"indent":2,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"像素格式:RGB、YUV"}]}]},{"type":"listitem","content":[{"type":"paragraph","attrs":{"indent":3,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"RGB:紅綠藍"}]}]},{"type":"listitem","content":[{"type":"paragraph","attrs":{"indent":4,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"常見格式:rgb8、rgb16(565)、rgb24、rgb32等"}]}]}]},{"type":"paragraph","attrs":{"indent":5,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"RGB8: 
灰度圖、調色板"}]},{"type":"paragraph","attrs":{"indent":5,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"RGB16(565):["},{"type":"text","marks":[{"type":"color","attrs":{"color":"#F5222D","name":"red"}}],"text":"rrrrr "},{"type":"text","marks":[{"type":"color","attrs":{"color":"#00B050","name":"user"}}],"text":"gggggg"},{"type":"text","text":" "},{"type":"text","marks":[{"type":"color","attrs":{"color":"#00B0F0","name":"user"}}],"text":"bbbbb"},{"type":"text","text":"]"}]},{"type":"paragraph","attrs":{"indent":5,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"RGB24:["},{"type":"text","marks":[{"type":"color","attrs":{"color":"#F5222D","name":"red"}}],"text":"R "},{"type":"text","marks":[{"type":"color","attrs":{"color":"#00B050","name":"user"}}],"text":"G"},{"type":"text","text":" "},{"type":"text","marks":[{"type":"color","attrs":{"color":"#00B0F0","name":"user"}}],"text":"B"},{"type":"text","text":"] [ "},{"type":"text","marks":[{"type":"color","attrs":{"color":"#F5222D","name":"red"}}],"text":"R "},{"type":"text","marks":[{"type":"color","attrs":{"color":"#00B050","name":"user"}}],"text":"G"},{"type":"text","text":" "},{"type":"text","marks":[{"type":"color","attrs":{"color":"#00B0F0","name":"user"}}],"text":"B"},{"type":"text","text":"] ["},{"type":"text","marks":[{"type":"color","attrs":{"color":"#F5222D","name":"red"}}],"text":"R "},{"type":"text","marks":[{"type":"color","attrs":{"color":"#00B050","name":"user"}}],"text":"G"},{"type":"text","text":" "},{"type":"text","marks":[{"type":"color","attrs":{"color":"#00B0F0","name":"user"}}],"text":"B"},{"type":"text","text":"]……"}]},{"type":"paragraph","attrs":{"indent":5,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"RGB32:["},{"type":"text","marks":[{"type":"color","attrs":{"color":"#F5222D","name":"red"}}],"text":"R "},{"type":"text","marks":[{"type":"color","attrs":{"color":"#00B050","name":"user"}}],"text":"G"},{"type":"text","text":" 
"},{"type":"text","marks":[{"type":"color","attrs":{"color":"#00B0F0","name":"user"}}],"text":"B "},{"type":"text","text":"A] ["},{"type":"text","marks":[{"type":"color","attrs":{"color":"#F5222D","name":"red"}}],"text":"R "},{"type":"text","marks":[{"type":"color","attrs":{"color":"#00B050","name":"user"}}],"text":"G"},{"type":"text","text":" "},{"type":"text","marks":[{"type":"color","attrs":{"color":"#00B0F0","name":"user"}}],"text":"B "},{"type":"text","text":"A] ["},{"type":"text","marks":[{"type":"color","attrs":{"color":"#F5222D","name":"red"}}],"text":"R "},{"type":"text","marks":[{"type":"color","attrs":{"color":"#00B050","name":"user"}}],"text":"G"},{"type":"text","text":" "},{"type":"text","marks":[{"type":"color","attrs":{"color":"#00B0F0","name":"user"}}],"text":"B "},{"type":"text","text":"A]……"}]},{"type":"bulletedlist","content":[{"type":"listitem","content":[{"type":"paragraph","attrs":{"indent":3,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"YUV :“Y”表示明亮度,“U”和“V”表示的是色度"}]}]},{"type":"listitem","content":[{"type":"paragraph","attrs":{"indent":4,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"常見格式:YV12、NV12、YUY2、I420等"}]}]},{"type":"listitem","content":[{"type":"paragraph","attrs":{"indent":4,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"分類: "}]}]}]},{"type":"paragraph","attrs":{"indent":6,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"佔字節數:YUV420、YUV422、YUV444"}]},{"type":"paragraph","attrs":{"indent":6,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"打包方式:平面( YV12 )、半打包( NV12 )、打包格式(YUY2)等"}]},{"type":"bulletedlist","content":[{"type":"listitem","content":[{"type":"paragraph","attrs":{"indent":5,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"YV12"}]}]}]},{"type":"paragraph","attrs":{"indent":6,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"[Y0 U0 V0] [Y1 U0 V0] [Y2 U1 
V1] [Y3 U1 V1] [Y4 U2 V2]…..[Y8 U0 V0]......"}]},{"type":"image","attrs":{"src":"https://static001.geekbang.org/infoq/0b/0b35ac5c983890d8f510abd744d0f8e4.png","alt":null,"title":null,"style":null,"href":null,"fromPaste":true,"pastePass":true}},{"type":"bulletedlist","content":[{"type":"listitem","content":[{"type":"paragraph","attrs":{"indent":4,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"NV12"}]}]}]},{"type":"paragraph","attrs":{"indent":5,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"[Y0 U0 V0] [Y1 U0 V0] [Y2 U1 V1] [Y3 U1 V1] [Y4 U2 V2]…..[Y8 U0 V0]......"}]},{"type":"image","attrs":{"src":"https://static001.geekbang.org/infoq/9a/9aea3a6cb07c8df282643c677dd6b07d.png","alt":null,"title":null,"style":null,"href":null,"fromPaste":true,"pastePass":true}},{"type":"bulletedlist","content":[{"type":"listitem","content":[{"type":"paragraph","attrs":{"indent":4,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"YUY2"}]}]}]},{"type":"paragraph","attrs":{"indent":5,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"[Y0 U0 V0] [Y1 U0 V0] [Y2 U1 V1] [Y3 U1 V1] [Y4 U2 
V2]….."}]},{"type":"image","attrs":{"src":"https://static001.geekbang.org/infoq/6e/6e3cd04702ffdb41f31e5be20ab3870c.png","alt":null,"title":null,"style":null,"href":null,"fromPaste":true,"pastePass":true}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"heading","attrs":{"align":null,"level":1},"content":[{"type":"text","text":"2.編碼"}]},{"type":"heading","attrs":{"align":null,"level":2},"content":[{"type":"text","text":"2.1音頻編碼"}]},{"type":"bulletedlist","content":[{"type":"listitem","content":[{"type":"paragraph","attrs":{"indent":1,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"編碼格式"}]}]},{"type":"listitem","content":[{"type":"paragraph","attrs":{"indent":2,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"G711、G722、G726、G729、Mpeg1-layer3(mp3)、AAC、OPUS、speex等"}]}]},{"type":"listitem","content":[{"type":"paragraph","attrs":{"indent":1,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"重要參數"}]}]},{"type":"listitem","content":[{"type":"paragraph","attrs":{"indent":2,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"採樣率"}]}]},{"type":"listitem","content":[{"type":"paragraph","attrs":{"indent":2,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"聲道數"}]}]},{"type":"listitem","content":[{"type":"paragraph","attrs":{"indent":2,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"量化位"}]}]},{"type":"listitem","content":[{"type":"paragraph","attrs":{"indent":2,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"碼率"}]}]},{"type":"listitem","content":[{"type":"paragraph","attrs":{"indent":1,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"例子:"}]}]}]},{"type":"paragraph","attrs":{"indent":2,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"以AAC編碼爲例,AAC編碼包括頭部分和數據部分,AAC的頭有兩種:ADTS和ADIF,通常我們見到的都是ADTS,ADTS由兩部分組成,固定頭信息和可變頭信息。下圖爲一幀AAC編碼幀數據。"}]},
{"type":"image","attrs":{"src":"https://static001.geekbang.org/infoq/85/8558c4937c14e634219f30716ada498d.png","alt":null,"title":null,"style":null,"href":null,"fromPaste":true,"pastePass":true}},{"type":"heading","attrs":{"align":null,"level":2},"content":[{"type":"text","text":"2.2視頻編碼"}]},{"type":"bulletedlist","content":[{"type":"listitem","content":[{"type":"paragraph","attrs":{"indent":1,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"編碼格式"}]}]},{"type":"listitem","content":[{"type":"paragraph","attrs":{"indent":2,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"mpeg-1、mpeg-2、mpeg-4、vp8、vp9、H264、h265、AV1、AVS系列、H.266、MPEG5等"}]}]},{"type":"listitem","content":[{"type":"paragraph","attrs":{"indent":1,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"重要參數"}]}]},{"type":"listitem","content":[{"type":"paragraph","attrs":{"indent":2,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"分辨率"}]}]},{"type":"listitem","content":[{"type":"paragraph","attrs":{"indent":2,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"幀率"}]}]},{"type":"listitem","content":[{"type":"paragraph","attrs":{"indent":2,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"碼率"}]}]},{"type":"listitem","content":[{"type":"paragraph","attrs":{"indent":1,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"例子:"}]}]}]},{"type":"paragraph","attrs":{"indent":2,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"以H264編碼爲例,H264編碼幀類型包括 SPS、PPS、IDR、P frame、B 
frame等。下圖爲一幀H264編碼幀(包含了SPS、PPS、IDR)。"}]},{"type":"image","attrs":{"src":"https://static001.geekbang.org/infoq/f8/f80fbf9d0a840a95bfedf70af6f831a0.png","alt":null,"title":null,"style":null,"href":null,"fromPaste":true,"pastePass":true}},{"type":"heading","attrs":{"align":null,"level":1},"content":[{"type":"text","text":"3.文件格式"}]},{"type":"bulletedlist","content":[{"type":"listitem","content":[{"type":"paragraph","attrs":{"indent":1,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"文件格式是一種容器,好比杯子,而音視頻數據好比水。杯子是用來裝水的。"}]}]},{"type":"listitem","content":[{"type":"paragraph","attrs":{"indent":1,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"常見格式 "}]}]}]},{"type":"paragraph","attrs":{"indent":2,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"MP3、MOV、AVI、RMVB、MP4、FLV、TS、FMP4、MKV等。"}]},{"type":"bulletedlist","content":[{"type":"listitem","content":[{"type":"paragraph","attrs":{"indent":1,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"文件格式分兩種:一種是帶索引的,比如AVI、MP4等;另一種是不帶索引的,比如FLV、TS等"}]}]},{"type":"listitem","content":[{"type":"paragraph","attrs":{"indent":1,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"文件格式一般由三部分組成:文件頭+音視頻數據+索引,但是有些沒有索引比如flv,有些沒有文件頭和索引比如TS。"}]}]},{"type":"listitem","content":[{"type":"paragraph","attrs":{"indent":1,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"例子:"}]}]}]},{"type":"paragraph","attrs":{"indent":2,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"以FLV文件爲例,音視頻是如何封裝成FLV的。文件頭後續跟着一幀幀的音視頻數據。每幀數據以flvtag打包,這裏就不具體詳解了,有興趣的可以網上查一下flv 
tag的結構。"}]},{"type":"image","attrs":{"src":"https://static001.geekbang.org/infoq/9a/9a48fb75d0fb18d52c482f201765aa21.png","alt":null,"title":null,"style":null,"href":null,"fromPaste":true,"pastePass":true}},{"type":"heading","attrs":{"align":null,"level":1},"content":[{"type":"text","text":"4.總結"}]},{"type":"paragraph","attrs":{"indent":1,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"這一章節我們主要講了三個內容:原始數據、音視頻編碼、文件格式,都是一些基本概念。其中原始數據格式要記住,變聲、馬賽克等音視頻處理都是對原始數據進行的,編碼過的數據需要解碼後才能處理。下一章節我們講講如何編碼以及這些編碼參數有什麼作用。"}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"作者:北京華宇信息技術有限公司-研究院-多媒體實驗室"}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"image","attrs":{"src":"https://static001.geekbang.org/infoq/33/33069c7080ad2b01be584bd800f860c6.png","alt":null,"title":"","style":[{"key":"width","value":"100%"},{"key":"bordertype","value":"none"}],"href":"","fromPaste":false,"pastePass":false}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}}]}
發表評論
所有評論
還沒有人評論,想成為第一個評論的人麼? 請在上方評論欄輸入並且點擊發布.
相關文章