package core import ( "context" "errors" "fmt" "net" "net/url" "strings" "sync" "time" "github.com/aler9/gortsplib" "github.com/aler9/gortsplib/pkg/aac" "github.com/aler9/gortsplib/pkg/h264" "github.com/aler9/gortsplib/pkg/ringbuffer" "github.com/aler9/gortsplib/pkg/rtpaac" "github.com/aler9/gortsplib/pkg/rtph264" "github.com/notedit/rtmp/format/flv/flvio" "github.com/aler9/rtsp-simple-server/internal/conf" "github.com/aler9/rtsp-simple-server/internal/externalcmd" "github.com/aler9/rtsp-simple-server/internal/logger" "github.com/aler9/rtsp-simple-server/internal/rtmp" "github.com/aler9/rtsp-simple-server/internal/rtmp/h264conf" "github.com/aler9/rtsp-simple-server/internal/rtmp/message" ) const ( rtmpConnPauseAfterAuthError = 2 * time.Second ) func pathNameAndQuery(inURL *url.URL) (string, url.Values, string) { // remove leading and trailing slashes inserted by OBS and some other clients tmp := strings.TrimRight(inURL.String(), "/") ur, _ := url.Parse(tmp) pathName := strings.TrimLeft(ur.Path, "/") return pathName, ur.Query(), ur.RawQuery } type rtmpConnState int const ( rtmpConnStateIdle rtmpConnState = iota //nolint:deadcode,varcheck rtmpConnStateRead rtmpConnStatePublish ) type rtmpConnPathManager interface { readerSetupPlay(req pathReaderSetupPlayReq) pathReaderSetupPlayRes publisherAnnounce(req pathPublisherAnnounceReq) pathPublisherAnnounceRes } type rtmpConnParent interface { log(logger.Level, string, ...interface{}) connClose(*rtmpConn) } type rtmpConn struct { id string externalAuthenticationURL string rtspAddress string readTimeout conf.StringDuration writeTimeout conf.StringDuration readBufferCount int runOnConnect string runOnConnectRestart bool wg *sync.WaitGroup conn *rtmp.Conn nconn net.Conn externalCmdPool *externalcmd.Pool pathManager rtmpConnPathManager parent rtmpConnParent ctx context.Context ctxCancel func() created time.Time path *path ringBuffer *ringbuffer.RingBuffer // read state rtmpConnState stateMutex sync.Mutex } func newRTMPConn( parentCtx context.Context, id string, externalAuthenticationURL string, rtspAddress string, readTimeout conf.StringDuration, writeTimeout conf.StringDuration, readBufferCount int, runOnConnect string, runOnConnectRestart bool, wg *sync.WaitGroup, nconn net.Conn, externalCmdPool *externalcmd.Pool, pathManager rtmpConnPathManager, parent rtmpConnParent, ) *rtmpConn { ctx, ctxCancel := context.WithCancel(parentCtx) c := &rtmpConn{ id: id, externalAuthenticationURL: externalAuthenticationURL, rtspAddress: rtspAddress, readTimeout: readTimeout, writeTimeout: writeTimeout, readBufferCount: readBufferCount, runOnConnect: runOnConnect, runOnConnectRestart: runOnConnectRestart, wg: wg, conn: rtmp.NewConn(nconn), nconn: nconn, externalCmdPool: externalCmdPool, pathManager: pathManager, parent: parent, ctx: ctx, ctxCancel: ctxCancel, created: time.Now(), } c.log(logger.Info, "opened") c.wg.Add(1) go c.run() return c } func (c *rtmpConn) close() { c.ctxCancel() } func (c *rtmpConn) remoteAddr() net.Addr { return c.nconn.RemoteAddr() } func (c *rtmpConn) log(level logger.Level, format string, args ...interface{}) { c.parent.log(level, "[conn %v] "+format, append([]interface{}{c.nconn.RemoteAddr()}, args...)...) } func (c *rtmpConn) ip() net.IP { return c.nconn.RemoteAddr().(*net.TCPAddr).IP } func (c *rtmpConn) safeState() rtmpConnState { c.stateMutex.Lock() defer c.stateMutex.Unlock() return c.state } func (c *rtmpConn) run() { defer c.wg.Done() err := func() error { if c.runOnConnect != "" { c.log(logger.Info, "runOnConnect command started") _, port, _ := net.SplitHostPort(c.rtspAddress) onConnectCmd := externalcmd.NewCmd( c.externalCmdPool, c.runOnConnect, c.runOnConnectRestart, externalcmd.Environment{ "RTSP_PATH": "", "RTSP_PORT": port, }, func(co int) { c.log(logger.Info, "runOnConnect command exited with code %d", co) }) defer func() { onConnectCmd.Close() c.log(logger.Info, "runOnConnect command stopped") }() } ctx, cancel := context.WithCancel(c.ctx) runErr := make(chan error) go func() { runErr <- c.runInner(ctx) }() select { case err := <-runErr: cancel() return err case <-c.ctx.Done(): cancel() <-runErr return errors.New("terminated") } }() c.ctxCancel() c.parent.connClose(c) c.log(logger.Info, "closed (%v)", err) } func (c *rtmpConn) runInner(ctx context.Context) error { go func() { <-ctx.Done() c.nconn.Close() }() c.nconn.SetReadDeadline(time.Now().Add(time.Duration(c.readTimeout))) c.nconn.SetWriteDeadline(time.Now().Add(time.Duration(c.writeTimeout))) u, isReading, err := c.conn.InitializeServer() if err != nil { return err } if isReading { return c.runRead(ctx, u) } return c.runPublish(ctx, u) } func (c *rtmpConn) runRead(ctx context.Context, u *url.URL) error { pathName, query, rawQuery := pathNameAndQuery(u) res := c.pathManager.readerSetupPlay(pathReaderSetupPlayReq{ author: c, pathName: pathName, authenticate: func( pathIPs []fmt.Stringer, pathUser conf.Credential, pathPass conf.Credential, ) error { return c.authenticate(pathName, pathIPs, pathUser, pathPass, "read", query, rawQuery) }, }) if res.err != nil { if terr, ok := res.err.(pathErrAuthCritical); ok { // wait some seconds to stop brute force attacks <-time.After(rtmpConnPauseAfterAuthError) return errors.New(terr.message) } return res.err } c.path = res.path defer func() { c.path.readerRemove(pathReaderRemoveReq{author: c}) }() c.stateMutex.Lock() c.state = rtmpConnStateRead c.stateMutex.Unlock() var videoTrack *gortsplib.TrackH264 videoTrackID := -1 var audioTrack *gortsplib.TrackAAC audioTrackID := -1 var aacDecoder *rtpaac.Decoder for i, track := range res.stream.tracks() { switch tt := track.(type) { case *gortsplib.TrackH264: if videoTrack != nil { return fmt.Errorf("can't read track %d with RTMP: too many tracks", i+1) } videoTrack = tt videoTrackID = i case *gortsplib.TrackAAC: if audioTrack != nil { return fmt.Errorf("can't read track %d with RTMP: too many tracks", i+1) } audioTrack = tt audioTrackID = i aacDecoder = &rtpaac.Decoder{ SampleRate: tt.Config.SampleRate, SizeLength: tt.SizeLength, IndexLength: tt.IndexLength, IndexDeltaLength: tt.IndexDeltaLength, } aacDecoder.Init() } } if videoTrack == nil && audioTrack == nil { return fmt.Errorf("the stream doesn't contain an H264 track or an AAC track") } c.nconn.SetWriteDeadline(time.Now().Add(time.Duration(c.writeTimeout))) err := c.conn.WriteTracks(videoTrack, audioTrack) if err != nil { return err } c.ringBuffer, _ = ringbuffer.New(uint64(c.readBufferCount)) go func() { <-ctx.Done() c.ringBuffer.Close() }() c.path.readerPlay(pathReaderPlayReq{ author: c, }) if c.path.Conf().RunOnRead != "" { c.log(logger.Info, "runOnRead command started") onReadCmd := externalcmd.NewCmd( c.externalCmdPool, c.path.Conf().RunOnRead, c.path.Conf().RunOnReadRestart, c.path.externalCmdEnv(), func(co int) { c.log(logger.Info, "runOnRead command exited with code %d", co) }) defer func() { onReadCmd.Close() c.log(logger.Info, "runOnRead command stopped") }() } // disable read deadline c.nconn.SetReadDeadline(time.Time{}) var videoInitialPTS *time.Duration videoFirstIDRFound := false var videoStartDTS time.Duration var videoDTSExtractor *h264.DTSExtractor for { item, ok := c.ringBuffer.Pull() if !ok { return fmt.Errorf("terminated") } data := item.(*data) if videoTrack != nil && data.trackID == videoTrackID { if data.h264NALUs == nil { continue } // video is decoded in another routine, // while audio is decoded in this routine: // we have to sync their PTS. if videoInitialPTS == nil { v := data.h264PTS videoInitialPTS = &v } pts := data.h264PTS - *videoInitialPTS idrPresent := false nonIDRPresent := false for _, nalu := range data.h264NALUs { typ := h264.NALUType(nalu[0] & 0x1F) switch typ { case h264.NALUTypeIDR: idrPresent = true case h264.NALUTypeNonIDR: nonIDRPresent = true } } var dts time.Duration // wait until we receive an IDR if !videoFirstIDRFound { if !idrPresent { continue } videoFirstIDRFound = true videoDTSExtractor = h264.NewDTSExtractor() var err error dts, err = videoDTSExtractor.Extract(data.h264NALUs, pts) if err != nil { return err } videoStartDTS = dts dts = 0 pts -= videoStartDTS } else { if !idrPresent && !nonIDRPresent { continue } var err error dts, err = videoDTSExtractor.Extract(data.h264NALUs, pts) if err != nil { return err } dts -= videoStartDTS pts -= videoStartDTS } // insert a H264DecoderConfig before every IDR if idrPresent { sps := videoTrack.SafeSPS() pps := videoTrack.SafePPS() buf, _ := h264conf.Conf{ SPS: sps, PPS: pps, }.Marshal() err = c.conn.WriteMessage(&message.MsgVideo{ ChunkStreamID: 6, MessageStreamID: 1, IsKeyFrame: true, H264Type: flvio.AVC_SEQHDR, Payload: buf, }) if err != nil { return err } } avcc, err := h264.AVCCMarshal(data.h264NALUs) if err != nil { return err } c.nconn.SetWriteDeadline(time.Now().Add(time.Duration(c.writeTimeout))) err = c.conn.WriteMessage(&message.MsgVideo{ ChunkStreamID: 6, MessageStreamID: 1, IsKeyFrame: idrPresent, H264Type: flvio.AVC_NALU, Payload: avcc, DTS: dts, PTSDelta: pts - dts, }) if err != nil { return err } } else if audioTrack != nil && data.trackID == audioTrackID { aus, pts, err := aacDecoder.Decode(data.rtp) if err != nil { if err != rtpaac.ErrMorePacketsNeeded { c.log(logger.Warn, "unable to decode audio track: %v", err) } continue } if videoTrack != nil && !videoFirstIDRFound { continue } pts -= videoStartDTS if pts < 0 { continue } for i, au := range aus { c.nconn.SetWriteDeadline(time.Now().Add(time.Duration(c.writeTimeout))) err := c.conn.WriteMessage(&message.MsgAudio{ ChunkStreamID: 4, MessageStreamID: 1, Rate: flvio.SOUND_44Khz, Depth: flvio.SOUND_16BIT, Channels: flvio.SOUND_STEREO, AACType: flvio.AAC_RAW, Payload: au, DTS: pts + time.Duration(i)*aac.SamplesPerAccessUnit*time.Second/time.Duration(audioTrack.ClockRate()), }) if err != nil { return err } } } } } func (c *rtmpConn) runPublish(ctx context.Context, u *url.URL) error { c.nconn.SetReadDeadline(time.Now().Add(time.Duration(c.readTimeout))) videoTrack, audioTrack, err := c.conn.ReadTracks() if err != nil { return err } var tracks gortsplib.Tracks videoTrackID := -1 audioTrackID := -1 var h264Encoder *rtph264.Encoder if videoTrack != nil { h264Encoder = &rtph264.Encoder{PayloadType: 96} h264Encoder.Init() videoTrackID = len(tracks) tracks = append(tracks, videoTrack) } var aacEncoder *rtpaac.Encoder if audioTrack != nil { aacEncoder = &rtpaac.Encoder{ PayloadType: 96, SampleRate: audioTrack.ClockRate(), SizeLength: 13, IndexLength: 3, IndexDeltaLength: 3, } aacEncoder.Init() audioTrackID = len(tracks) tracks = append(tracks, audioTrack) } pathName, query, rawQuery := pathNameAndQuery(u) res := c.pathManager.publisherAnnounce(pathPublisherAnnounceReq{ author: c, pathName: pathName, authenticate: func( pathIPs []fmt.Stringer, pathUser conf.Credential, pathPass conf.Credential, ) error { return c.authenticate(pathName, pathIPs, pathUser, pathPass, "publish", query, rawQuery) }, }) if res.err != nil { if terr, ok := res.err.(pathErrAuthCritical); ok { // wait some seconds to stop brute force attacks <-time.After(rtmpConnPauseAfterAuthError) return errors.New(terr.message) } return res.err } c.path = res.path defer func() { c.path.publisherRemove(pathPublisherRemoveReq{author: c}) }() c.stateMutex.Lock() c.state = rtmpConnStatePublish c.stateMutex.Unlock() // disable write deadline c.nconn.SetWriteDeadline(time.Time{}) rres := c.path.publisherRecord(pathPublisherRecordReq{ author: c, tracks: tracks, }) if rres.err != nil { return rres.err } for { c.nconn.SetReadDeadline(time.Now().Add(time.Duration(c.readTimeout))) msg, err := c.conn.ReadMessage() if err != nil { return err } switch tmsg := msg.(type) { case *message.MsgVideo: if tmsg.H264Type == flvio.AVC_SEQHDR { var conf h264conf.Conf err = conf.Unmarshal(tmsg.Payload) if err != nil { return fmt.Errorf("unable to parse H264 config: %v", err) } pts := tmsg.DTS + tmsg.PTSDelta nalus := [][]byte{ conf.SPS, conf.PPS, } pkts, err := h264Encoder.Encode(nalus, pts) if err != nil { return fmt.Errorf("error while encoding H264: %v", err) } lastPkt := len(pkts) - 1 for i, pkt := range pkts { if i != lastPkt { rres.stream.writeData(&data{ trackID: videoTrackID, rtp: pkt, ptsEqualsDTS: false, }) } else { rres.stream.writeData(&data{ trackID: videoTrackID, rtp: pkt, ptsEqualsDTS: false, h264NALUs: nalus, h264PTS: pts, }) } } } else if tmsg.H264Type == flvio.AVC_NALU { if videoTrack == nil { return fmt.Errorf("received an H264 packet, but track is not set up") } nalus, err := h264.AVCCUnmarshal(tmsg.Payload) if err != nil { return fmt.Errorf("unable to decode AVCC: %v", err) } // skip invalid NALUs sent by DJI n := 0 for _, nalu := range nalus { if len(nalu) != 0 { n++ } } if n == 0 { continue } validNALUs := make([][]byte, n) pos := 0 for _, nalu := range nalus { if len(nalu) != 0 { validNALUs[pos] = nalu pos++ } } pts := tmsg.DTS + tmsg.PTSDelta pkts, err := h264Encoder.Encode(validNALUs, pts) if err != nil { return fmt.Errorf("error while encoding H264: %v", err) } lastPkt := len(pkts) - 1 for i, pkt := range pkts { if i != lastPkt { rres.stream.writeData(&data{ trackID: videoTrackID, rtp: pkt, ptsEqualsDTS: false, }) } else { rres.stream.writeData(&data{ trackID: videoTrackID, rtp: pkt, ptsEqualsDTS: h264.IDRPresent(validNALUs), h264NALUs: validNALUs, h264PTS: pts, }) } } } case *message.MsgAudio: if tmsg.AACType == flvio.AAC_RAW { if audioTrack == nil { return fmt.Errorf("received an AAC packet, but track is not set up") } pkts, err := aacEncoder.Encode([][]byte{tmsg.Payload}, tmsg.DTS) if err != nil { return fmt.Errorf("error while encoding AAC: %v", err) } for _, pkt := range pkts { rres.stream.writeData(&data{ trackID: audioTrackID, rtp: pkt, ptsEqualsDTS: true, }) } } } } } func (c *rtmpConn) authenticate( pathName string, pathIPs []fmt.Stringer, pathUser conf.Credential, pathPass conf.Credential, action string, query url.Values, rawQuery string, ) error { if c.externalAuthenticationURL != "" { err := externalAuth( c.externalAuthenticationURL, c.ip().String(), query.Get("user"), query.Get("pass"), pathName, action, rawQuery) if err != nil { return pathErrAuthCritical{ message: fmt.Sprintf("external authentication failed: %s", err), } } } if pathIPs != nil { ip := c.ip() if !ipEqualOrInRange(ip, pathIPs) { return pathErrAuthCritical{ message: fmt.Sprintf("IP '%s' not allowed", ip), } } } if pathUser != "" { if query.Get("user") != string(pathUser) || query.Get("pass") != string(pathPass) { return pathErrAuthCritical{ message: "invalid credentials", } } } return nil } // onReaderAccepted implements reader. func (c *rtmpConn) onReaderAccepted() { c.log(logger.Info, "is reading from path '%s'", c.path.Name()) } // onReaderData implements reader. func (c *rtmpConn) onReaderData(data *data) { c.ringBuffer.Push(data) } // apiReaderDescribe implements reader. func (c *rtmpConn) apiReaderDescribe() interface{} { return struct { Type string `json:"type"` ID string `json:"id"` }{"rtmpConn", c.id} } // apiSourceDescribe implements source. func (c *rtmpConn) apiSourceDescribe() interface{} { return struct { Type string `json:"type"` ID string `json:"id"` }{"rtmpConn", c.id} } // onPublisherAccepted implements publisher. func (c *rtmpConn) onPublisherAccepted(tracksLen int) { c.log(logger.Info, "is publishing to path '%s', %d %s", c.path.Name(), tracksLen, func() string { if tracksLen == 1 { return "track" } return "tracks" }()) }