// RTP Payload Format for VP9 Video draft-ietf-payload-vp9-03 #include "rtp-packet.h" #include "rtp-profile.h" #include "rtp-payload-internal.h" #include #include #include #include // Timestamp: The RTP timestamp indicates the time when the input frame was sampled, at a clock rate of 90 kHz #define KHz 90 // 90000Hz #define N_VP9_HEADER 1 struct rtp_encode_vp9_t { struct rtp_packet_t pkt; struct rtp_payload_t handler; void* cbparam; int size; }; static void* rtp_vp9_pack_create(int size, uint8_t pt, uint16_t seq, uint32_t ssrc, struct rtp_payload_t *handler, void* cbparam) { struct rtp_encode_vp9_t *packer; packer = (struct rtp_encode_vp9_t *)calloc(1, sizeof(*packer)); if (!packer) return NULL; memcpy(&packer->handler, handler, sizeof(packer->handler)); packer->cbparam = cbparam; packer->size = size; packer->pkt.rtp.v = RTP_VERSION; packer->pkt.rtp.pt = pt; packer->pkt.rtp.seq = seq; packer->pkt.rtp.ssrc = ssrc; return packer; } static void rtp_vp9_pack_destroy(void* pack) { struct rtp_encode_vp9_t *packer; packer = (struct rtp_encode_vp9_t *)pack; #if defined(_DEBUG) || defined(DEBUG) memset(packer, 0xCC, sizeof(*packer)); #endif free(packer); } static void rtp_vp9_pack_get_info(void* pack, uint16_t* seq, uint32_t* timestamp) { struct rtp_encode_vp9_t *packer; packer = (struct rtp_encode_vp9_t *)pack; *seq = (uint16_t)packer->pkt.rtp.seq; *timestamp = packer->pkt.rtp.timestamp; } static int rtp_vp9_pack_input(void* pack, const void* data, int bytes, uint32_t timestamp) { int r, n; uint8_t *rtp; uint8_t vp9_payload_descriptor[1]; const uint8_t *ptr; struct rtp_encode_vp9_t *packer; packer = (struct rtp_encode_vp9_t *)pack; packer->pkt.rtp.timestamp = timestamp; r = 0; ptr = (const uint8_t *)data; //In non-flexible mode (with the F bit below set to 0), for (vp9_payload_descriptor[0] = 0x08 /*Start of a layer frame*/; 0 == r && bytes > 0; ++packer->pkt.rtp.seq) { packer->pkt.payload = ptr; packer->pkt.payloadlen = (bytes + N_VP9_HEADER + RTP_FIXED_HEADER) < packer->size ? bytes : (packer->size - N_VP9_HEADER - RTP_FIXED_HEADER); ptr += packer->pkt.payloadlen; bytes -= packer->pkt.payloadlen; n = RTP_FIXED_HEADER + N_VP9_HEADER + packer->pkt.payloadlen; rtp = (uint8_t*)packer->handler.alloc(packer->cbparam, n); if (!rtp) return -ENOMEM; // Marker bit (M): MUST be set to 1 for the final packet of the highest // spatial layer frame (the final packet of the super frame), and 0 // otherwise. Unless spatial scalability is in use for this super // frame, this will have the same value as the E bit described below. // Note this bit MUST be set to 1 for the target spatial layer frame // if a stream is being rewritten to remove higher spatial layers. packer->pkt.rtp.m = (0 == bytes) ? 1 : 0; vp9_payload_descriptor[0] |= (0 == bytes) ? 0x04 : 0; // End of a layer frame. n = rtp_packet_serialize_header(&packer->pkt, rtp, n); if (n != RTP_FIXED_HEADER) { assert(0); return -1; } memcpy(rtp + n, vp9_payload_descriptor, N_VP9_HEADER); memcpy(rtp + n + N_VP9_HEADER, packer->pkt.payload, packer->pkt.payloadlen); r = packer->handler.packet(packer->cbparam, rtp, n + N_VP9_HEADER + packer->pkt.payloadlen, packer->pkt.rtp.timestamp, 0); packer->handler.free(packer->cbparam, rtp); vp9_payload_descriptor[0] &= ~0x08; } return r; } struct rtp_payload_encode_t *rtp_vp9_encode() { static struct rtp_payload_encode_t encode = { rtp_vp9_pack_create, rtp_vp9_pack_destroy, rtp_vp9_pack_get_info, rtp_vp9_pack_input, }; return &encode; }